[
  {
    "path": ".github/workflows/ci.yml",
    "content": "name: CI Pipeline\n\non:\n  push:\n    branches: [master]\n  pull_request:\n\nenv:\n  REGISTRY: ghcr.io\n  IMAGE_NAME: ${{ github.repository }}\n\njobs:\n  test-and-build-stats:\n    runs-on: ubuntu-latest\n    permissions:\n      contents: read\n      packages: write\n\n    steps:\n    - name: Checkout repository\n      uses: actions/checkout@v4\n\n    - name: Set up QEMU\n      uses: docker/setup-qemu-action@v3\n\n    - name: Set up Docker Buildx\n      uses: docker/setup-buildx-action@v3\n\n    - name: Log in to Container Registry\n      uses: docker/login-action@v3\n      with:\n        registry: ${{ env.REGISTRY }}\n        username: ${{ github.actor }}\n        password: ${{ secrets.GITHUB_TOKEN }}\n\n    - name: Extract metadata for stats image\n      id: meta-stats\n      uses: docker/metadata-action@v5\n      with:\n        images: ${{ env.REGISTRY }}/${{ env.IMAGE_NAME }}/stats\n        tags: |\n          type=ref,event=branch\n          type=ref,event=pr\n          type=sha\n          type=raw,value=latest,enable={{is_default_branch}}\n\n    - name: Build stats Docker image\n      uses: docker/build-push-action@v5\n      with:\n        context: .\n        file: ./stats.Dockerfile\n        load: true\n        platforms: linux/amd64\n        tags: |\n          ${{ env.REGISTRY }}/${{ env.IMAGE_NAME }}/stats:${{ github.sha }}\n\n    - name: Run unit tests\n      run: |\n        docker run --rm \\\n          -v ${{ github.workspace }}/tests:/app/tests \\\n          ${{ env.REGISTRY }}/${{ env.IMAGE_NAME }}/stats:${{ github.sha }} \\\n          python -m pytest -s tests/\n\n    - name: Push stats Docker image\n      if: |\n        success() && (\n          github.event_name == 'push' && github.ref == 'refs/heads/master' ||\n          github.event_name == 'pull_request' && github.event.pull_request.head.repo.full_name == github.repository\n        )\n      uses: docker/build-push-action@v5\n      with:\n        context: .\n        file: 
./stats.Dockerfile\n        push: true\n        platforms: linux/amd64,linux/arm64\n        tags: ${{ steps.meta-stats.outputs.tags }}\n        labels: ${{ steps.meta-stats.outputs.labels }}\n\n  build-site:\n    runs-on: ubuntu-latest\n    permissions:\n      contents: read\n      packages: write\n\n    steps:\n    - name: Checkout repository\n      uses: actions/checkout@v4\n\n    - name: Log in to Container Registry\n      uses: docker/login-action@v3\n      with:\n        registry: ${{ env.REGISTRY }}\n        username: ${{ github.actor }}\n        password: ${{ secrets.GITHUB_TOKEN }}\n\n    - name: Extract metadata for site image\n      id: meta-site\n      uses: docker/metadata-action@v5\n      with:\n        images: ${{ env.REGISTRY }}/${{ env.IMAGE_NAME }}/site\n        tags: |\n          type=ref,event=branch\n          type=ref,event=pr\n          type=sha\n          type=raw,value=latest,enable={{is_default_branch}}\n\n    - name: Build and push site Docker image\n      uses: docker/build-push-action@v5\n      with:\n        context: .\n        file: ./site.Dockerfile\n        push: ${{ github.event.pull_request.head.repo.full_name == github.repository }}\n        tags: ${{ steps.meta-site.outputs.tags }}\n        labels: ${{ steps.meta-site.outputs.labels }}\n"
  },
  {
    "path": ".gitignore",
    "content": "# Byte-compiled / optimized / DLL files\n__pycache__/\n*.py[cod]\n*$py.class\n\n# C extensions\n*.so\n\n# Distribution / packaging\n.Python\nenv/\nbuild/\ndevelop-eggs/\ndist/\ndownloads/\neggs/\n.eggs/\nlib/\nlib64/\nparts/\nsdist/\nvar/\n*.egg-info/\n.installed.cfg\n*.egg\n\n# PyInstaller\n#  Usually these files are written by a python script from a template\n#  before PyInstaller builds the exe, so as to inject date/other infos into it.\n*.manifest\n*.spec\n\n# Installer logs\npip-log.txt\npip-delete-this-directory.txt\n\n# Unit test / coverage reports\nhtmlcov/\n.tox/\n.coverage\n.coverage.*\n.cache\nnosetests.xml\ncoverage.xml\n*,cover\n.hypothesis/\n\n# Translations\n*.mo\n*.pot\n\n# Django stuff:\n*.log\nlocal_settings.py\n\n# Flask stuff:\ninstance/\n.webassets-cache\n\n# Scrapy stuff:\n.scrapy\n\n# Sphinx documentation\ndocs/_build/\n\n# PyBuilder\ntarget/\n\n# IPython Notebook\n.ipynb_checkpoints\n\n# pyenv\n.python-version\n\n# celery beat schedule file\ncelerybeat-schedule\n\n# dotenv\n.env\n\n# virtualenv\nvenv/\nENV/\n\n# Spyder project settings\n.spyderproject\n\n# Rope project settings\n.ropeproject\n\n# Eclipse PyDev\n.project\n.pydevproject\n.settings/\n\n# Jekyll files to run github-pages locally\n_site\n.sass-cache\n.jekyll-metadata\nGemfile\nGemfile.lock\nassets\n_includes\n_sass\njs\nvendor/\n.bundle/\nthemes/\n\n# crawl statistics files\nstats/*.gz\nstats/crawls.txt\nstats/excerpt/\n\n# generated CSV data\ndata/\n\n# macOS Desktop Services Store\n.DS_Store\n"
  },
  {
    "path": "LICENSE",
    "content": "                                 Apache License\n                           Version 2.0, January 2004\n                        http://www.apache.org/licenses/\n\n   TERMS AND CONDITIONS FOR USE, REPRODUCTION, AND DISTRIBUTION\n\n   1. Definitions.\n\n      \"License\" shall mean the terms and conditions for use, reproduction,\n      and distribution as defined by Sections 1 through 9 of this document.\n\n      \"Licensor\" shall mean the copyright owner or entity authorized by\n      the copyright owner that is granting the License.\n\n      \"Legal Entity\" shall mean the union of the acting entity and all\n      other entities that control, are controlled by, or are under common\n      control with that entity. For the purposes of this definition,\n      \"control\" means (i) the power, direct or indirect, to cause the\n      direction or management of such entity, whether by contract or\n      otherwise, or (ii) ownership of fifty percent (50%) or more of the\n      outstanding shares, or (iii) beneficial ownership of such entity.\n\n      \"You\" (or \"Your\") shall mean an individual or Legal Entity\n      exercising permissions granted by this License.\n\n      \"Source\" form shall mean the preferred form for making modifications,\n      including but not limited to software source code, documentation\n      source, and configuration files.\n\n      \"Object\" form shall mean any form resulting from mechanical\n      transformation or translation of a Source form, including but\n      not limited to compiled object code, generated documentation,\n      and conversions to other media types.\n\n      \"Work\" shall mean the work of authorship, whether in Source or\n      Object form, made available under the License, as indicated by a\n      copyright notice that is included in or attached to the work\n      (an example is provided in the Appendix below).\n\n      \"Derivative Works\" shall mean any work, whether in Source or Object\n      
form, that is based on (or derived from) the Work and for which the\n      editorial revisions, annotations, elaborations, or other modifications\n      represent, as a whole, an original work of authorship. For the purposes\n      of this License, Derivative Works shall not include works that remain\n      separable from, or merely link (or bind by name) to the interfaces of,\n      the Work and Derivative Works thereof.\n\n      \"Contribution\" shall mean any work of authorship, including\n      the original version of the Work and any modifications or additions\n      to that Work or Derivative Works thereof, that is intentionally\n      submitted to Licensor for inclusion in the Work by the copyright owner\n      or by an individual or Legal Entity authorized to submit on behalf of\n      the copyright owner. For the purposes of this definition, \"submitted\"\n      means any form of electronic, verbal, or written communication sent\n      to the Licensor or its representatives, including but not limited to\n      communication on electronic mailing lists, source code control systems,\n      and issue tracking systems that are managed by, or on behalf of, the\n      Licensor for the purpose of discussing and improving the Work, but\n      excluding communication that is conspicuously marked or otherwise\n      designated in writing by the copyright owner as \"Not a Contribution.\"\n\n      \"Contributor\" shall mean Licensor and any individual or Legal Entity\n      on behalf of whom a Contribution has been received by Licensor and\n      subsequently incorporated within the Work.\n\n   2. Grant of Copyright License. 
Subject to the terms and conditions of\n      this License, each Contributor hereby grants to You a perpetual,\n      worldwide, non-exclusive, no-charge, royalty-free, irrevocable\n      copyright license to reproduce, prepare Derivative Works of,\n      publicly display, publicly perform, sublicense, and distribute the\n      Work and such Derivative Works in Source or Object form.\n\n   3. Grant of Patent License. Subject to the terms and conditions of\n      this License, each Contributor hereby grants to You a perpetual,\n      worldwide, non-exclusive, no-charge, royalty-free, irrevocable\n      (except as stated in this section) patent license to make, have made,\n      use, offer to sell, sell, import, and otherwise transfer the Work,\n      where such license applies only to those patent claims licensable\n      by such Contributor that are necessarily infringed by their\n      Contribution(s) alone or by combination of their Contribution(s)\n      with the Work to which such Contribution(s) was submitted. If You\n      institute patent litigation against any entity (including a\n      cross-claim or counterclaim in a lawsuit) alleging that the Work\n      or a Contribution incorporated within the Work constitutes direct\n      or contributory patent infringement, then any patent licenses\n      granted to You under this License for that Work shall terminate\n      as of the date such litigation is filed.\n\n   4. Redistribution. 
You may reproduce and distribute copies of the\n      Work or Derivative Works thereof in any medium, with or without\n      modifications, and in Source or Object form, provided that You\n      meet the following conditions:\n\n      (a) You must give any other recipients of the Work or\n          Derivative Works a copy of this License; and\n\n      (b) You must cause any modified files to carry prominent notices\n          stating that You changed the files; and\n\n      (c) You must retain, in the Source form of any Derivative Works\n          that You distribute, all copyright, patent, trademark, and\n          attribution notices from the Source form of the Work,\n          excluding those notices that do not pertain to any part of\n          the Derivative Works; and\n\n      (d) If the Work includes a \"NOTICE\" text file as part of its\n          distribution, then any Derivative Works that You distribute must\n          include a readable copy of the attribution notices contained\n          within such NOTICE file, excluding those notices that do not\n          pertain to any part of the Derivative Works, in at least one\n          of the following places: within a NOTICE text file distributed\n          as part of the Derivative Works; within the Source form or\n          documentation, if provided along with the Derivative Works; or,\n          within a display generated by the Derivative Works, if and\n          wherever such third-party notices normally appear. The contents\n          of the NOTICE file are for informational purposes only and\n          do not modify the License. 
You may add Your own attribution\n          notices within Derivative Works that You distribute, alongside\n          or as an addendum to the NOTICE text from the Work, provided\n          that such additional attribution notices cannot be construed\n          as modifying the License.\n\n      You may add Your own copyright statement to Your modifications and\n      may provide additional or different license terms and conditions\n      for use, reproduction, or distribution of Your modifications, or\n      for any such Derivative Works as a whole, provided Your use,\n      reproduction, and distribution of the Work otherwise complies with\n      the conditions stated in this License.\n\n   5. Submission of Contributions. Unless You explicitly state otherwise,\n      any Contribution intentionally submitted for inclusion in the Work\n      by You to the Licensor shall be under the terms and conditions of\n      this License, without any additional terms or conditions.\n      Notwithstanding the above, nothing herein shall supersede or modify\n      the terms of any separate license agreement you may have executed\n      with Licensor regarding such Contributions.\n\n   6. Trademarks. This License does not grant permission to use the trade\n      names, trademarks, service marks, or product names of the Licensor,\n      except as required for reasonable and customary use in describing the\n      origin of the Work and reproducing the content of the NOTICE file.\n\n   7. Disclaimer of Warranty. Unless required by applicable law or\n      agreed to in writing, Licensor provides the Work (and each\n      Contributor provides its Contributions) on an \"AS IS\" BASIS,\n      WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or\n      implied, including, without limitation, any warranties or conditions\n      of TITLE, NON-INFRINGEMENT, MERCHANTABILITY, or FITNESS FOR A\n      PARTICULAR PURPOSE. 
You are solely responsible for determining the\n      appropriateness of using or redistributing the Work and assume any\n      risks associated with Your exercise of permissions under this License.\n\n   8. Limitation of Liability. In no event and under no legal theory,\n      whether in tort (including negligence), contract, or otherwise,\n      unless required by applicable law (such as deliberate and grossly\n      negligent acts) or agreed to in writing, shall any Contributor be\n      liable to You for damages, including any direct, indirect, special,\n      incidental, or consequential damages of any character arising as a\n      result of this License or out of the use or inability to use the\n      Work (including but not limited to damages for loss of goodwill,\n      work stoppage, computer failure or malfunction, or any and all\n      other commercial damages or losses), even if such Contributor\n      has been advised of the possibility of such damages.\n\n   9. Accepting Warranty or Additional Liability. While redistributing\n      the Work or Derivative Works thereof, You may choose to offer,\n      and charge a fee for, acceptance of support, warranty, indemnity,\n      or other liability obligations and/or rights consistent with this\n      License. However, in accepting such obligations, You may act only\n      on Your own behalf and on Your sole responsibility, not on behalf\n      of any other Contributor, and only if You agree to indemnify,\n      defend, and hold each Contributor harmless for any liability\n      incurred by, or claims asserted against, such Contributor by reason\n      of your accepting any such warranty or additional liability.\n\n   END OF TERMS AND CONDITIONS\n\n   APPENDIX: How to apply the Apache License to your work.\n\n      To apply the Apache License to your work, attach the following\n      boilerplate notice, with the fields enclosed by brackets \"{}\"\n      replaced with your own identifying information. 
(Don't include\n      the brackets!)  The text should be enclosed in the appropriate\n      comment syntax for the file format. We also recommend that a\n      file or class name and description of purpose be included on the\n      same \"printed page\" as the copyright notice for easier\n      identification within third-party archives.\n\n   Copyright {yyyy} {name of copyright owner}\n\n   Licensed under the Apache License, Version 2.0 (the \"License\");\n   you may not use this file except in compliance with the License.\n   You may obtain a copy of the License at\n\n       http://www.apache.org/licenses/LICENSE-2.0\n\n   Unless required by applicable law or agreed to in writing, software\n   distributed under the License is distributed on an \"AS IS\" BASIS,\n   WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.\n   See the License for the specific language governing permissions and\n   limitations under the License.\n"
  },
  {
    "path": "README.md",
    "content": "Basic Statistics of Common Crawl Monthly Archives\n=================================================\n\nAnalyze the [Common Crawl](https://commoncrawl.org/) data to get metrics about the monthly crawl archives:\n* size of the monthly crawls, number of\n  * fetched pages\n  * unique URLs\n  * unique documents (by content digest)\n  * number of different hosts, domains, top-level domains\n* distribution of pages/URLs on hosts, domains, top-level domains\n* and ...\n  * mime types\n  * protocols / schemes (http vs. https)\n  * content languages (since summer 2018)\n\nThis is a description of how to generate the statistics from the Common Crawl URL index files.\n\nThe results are presented on https://commoncrawl.github.io/cc-crawl-statistics/.\n\n\nStep 1: Count Items\n-------------------\n\nThe items (URLs, hosts, domains, etc.) are counted using the Common Crawl index files\non AWS S3 `s3://commoncrawl/cc-index/collections/*/indexes/cdx-*.gz`.\n\n1. define a pattern of cdx files to process - usually from one monthly crawl (here: `CC-MAIN-2016-26`)\n   - either a smaller set of local files for testing\n   ```\n   INPUT=\"test/cdx/cdx-0000[0-3].gz\"\n   ```\n   - or one monthly crawl to be accessed via Hadoop on AWS S3:\n   ```\n   INPUT=\"s3a://commoncrawl/cc-index/collections/CC-MAIN-2016-26/indexes/cdx-*.gz\"\n   ```\n\n2. 
run `crawlstats.py --job=count` to process the cdx files and count the items:\n   ```\n   python3 crawlstats.py --job=count --no-exact-counts \\\n        --no-output --output-dir .../count/ $INPUT\n   ```\n\nHelp on command-line parameters (including [mrjob](https://pypi.org/project/mrjob/) options) is shown by\n`python3 crawlstats.py --help`.\nThe option `--no-exact-counts` is recommended (and is the default) to save storage space and computation time\nwhen counting URLs and content digests.\n\n\nStep 2: Aggregate Counts\n------------------------\n\nRun `crawlstats.py --job=stats` on the output of step 1:\n```\npython3 crawlstats.py --job=stats --max-top-hosts-domains=500 \\\n     --no-output --output-dir .../stats/ .../count/\n```\nThe max. number of most frequent hosts and domains contained in the output is set by the option\n`--max-top-hosts-domains=N`.\n\n\nStep 3: Download the Data\n-------------------------\n\nIn order to prepare the plots, the output of step 2 must be downloaded to local disk.\nSimplest, the data is fetched from the Common Crawl Public Data Set bucket on AWS S3:\n```sh\nwhile read crawl; do\n    aws s3 cp s3://commoncrawl/crawl-analysis/$crawl/stats/part-00000.gz ./stats/$crawl.gz\ndone <<EOF\nCC-MAIN-2008-2009\n...\nEOF\n```\n\nOne aggregated, gzip-compressed statistics file is about 1 MiB in size. So you could just run\n[get_stats.sh](get_stats.sh) to download the data files for all released monthly crawls.\n\nAlso the output of step 1 is provided on `s3://commoncrawl/`. The counts for every crawl are held\nin 10 bzip2-compressed files, together 1 GiB per crawl on average. 
To download the counts for one crawl:\n- if you're on AWS and [AWS CLI](https://aws.amazon.com/cli/) is installed and configured\n  ```sh\n  CRAWL=CC-MAIN-2022-05\n  aws s3 cp --recursive s3://commoncrawl/crawl-analysis/$CRAWL/count stats/count/$CRAWL\n  ```\n- otherwise\n  ```sh\n  CRAWL=CC-MAIN-2022-05\n  mkdir -p stats/count/$CRAWL\n  for i in $(seq 0 9); do\n    curl https://data.commoncrawl.org/crawl-analysis/$CRAWL/count/part-0000$i.bz2 \\\n      >stats/count/$CRAWL/part-0000$i.bz2\n  done\n  ```\n\n\nStep 4: Plot the Data\n---------------------\n\nTo prepare the plots using the downloaded aggregated data:\n```\ngzip -dc stats/CC-MAIN-*.gz | python3 plot/crawl_size.py\n```\nThe full list of commands to prepare all plots is found in [plot.sh](plot.sh). Don't forget to install the Python\nmodules [required for plotting](requirements_plot.txt).\n\n\nStep 5: Local Site Preview\n--------------------------\n\nThe [crawl statistics site](https://commoncrawl.github.io/cc-crawl-statistics/) is hosted by [GitHub Pages](https://pages.github.com/). The site is updated as soon as plots or description texts are updated, committed and pushed to the GitHub repository.\n\nTo preview local changes, it's possible to serve the site locally:\n1. build the Docker image with Ruby, Jekyll and the content to be served\n   ```\n   docker build -f site.Dockerfile -t cc-crawl-statistics-site:latest .\n   ```\n2. run a Docker container to serve the site preview\n   ```\n   docker run --network=host --rm -ti cc-crawl-statistics-site:latest\n   ```\n   The site should be served on localhost, port 4000 (http://127.0.0.1:4000).\n   If not, the correct location is shown in the output of the `docker run` command.\n\n   If running this on a Mac, you may find that the loopback interface (127.0.0.1) within the container is not accessible, so you can change the line in the [Dockerfile](site.Dockerfile) to:\n\n   ```\n   CMD bundle exec jekyll serve --host 0.0.0.0\n   ```\n\n   ... 
and then the site will be served on http://0.0.0.0:4000 instead.  (You will of course need to rebuild the Docker image after updating the Dockerfile.)\n\n\nRun via Container\n-----------------\n\nThe whole workflow can be run as a container (docker or podman) including downloading stats files from Common Crawl's S3 bucket and generating new plots.\n\n```bash\n# clone the repository (to have the latest crawl IDs)\ngit clone https://github.com/commoncrawl/cc-crawl-statistics.git\ncd cc-crawl-statistics\n\n# download stats and generate plots\n# SSH, AWS keys, and stats and plots directories must be mounted into the container\npodman run --rm -v ~/.aws:/root/.aws:ro -v $(pwd -P)/stats:/app/stats -v $(pwd -P)/plots:/app/plots ghcr.io/commoncrawl/cc-crawl-statistics/stats:latest \n\n# if needed you can manually build the container image\npodman build -f stats.Dockerfile -t ghcr.io/commoncrawl/cc-crawl-statistics/stats:latest\n\n# for development it is recommended to mount the whole repository into the container\npodman run -it -v ~/.aws:/root/.aws:ro -v $(pwd -P):/app ghcr.io/commoncrawl/cc-crawl-statistics/stats:latest /bin/bash\n\n```\n\n\nRelated Projects\n----------------\n\nThe [columnar index](https://commoncrawl.org/2018/03/index-to-warc-files-and-urls-in-columnar-format/)\nsimplifies counting and analytics a lot - easier to maintain, more transparent, reproducible and\nextensible than running two MapReduce jobs, see the list of example\n- [SQL queries](https://github.com/commoncrawl/cc-index-table#query-the-table-in-amazon-athena) and\n- [Jupyter notebooks](https://github.com/commoncrawl/cc-notebooks)\n\n"
  },
  {
    "path": "_config.yml",
    "content": "title: Statistics of Common Crawl Monthly Archives\ndescription: Number of pages, distribution of top-level domains, crawl overlaps, etc. - basic metrics about Common Crawl Monthly Crawl Archives\nrepository: commoncrawl/cc-crawl-statistics\nlatest_crawl: CC-MAIN-2026-17\n\nshow_navigation: True\nnavlist:\n - title: Home\n   url: /\n - title: Size of crawls\n   url: /plots/crawlsize\n - title: Top-level domains\n   url: /plots/tlds\n - title: Registered domains\n   url: /plots/domains\n - title: Crawler metrics\n   url: /plots/crawlermetrics\n - title: Crawl overlaps\n   url: /plots/crawloverlap\n - title: Media types\n   url: /plots/mimetypes\n - title: Character sets\n   url: /plots/charsets\n - title: Languages\n   url: /plots/languages\n\ntheme: jekyll-theme-minimal\n"
  },
  {
    "path": "_layouts/default.html",
    "content": "<!doctype html>\n<html lang=\"{{ site.lang | default: \"en-US\" }}\">\n  <head>\n    <meta charset=\"utf-8\">\n    <meta http-equiv=\"X-UA-Compatible\" content=\"chrome=1\">\n    <title>{{ site.title | default: site.github.repository_name }} by {{ site.github.owner_name }}</title>\n\n    <link rel=\"stylesheet\" href=\"{{ '/assets/css/style.css?v=' | append: site.github.build_revision | relative_url }}\">\n    <meta name=\"viewport\" content=\"width=device-width\">\n    <!--[if lt IE 9]>\n    <script src=\"//html5shiv.googlecode.com/svn/trunk/html5.js\"></script>\n    <![endif]-->\n  </head>\n  <body>\n    <div class=\"wrapper\">\n      <header>\n        <h1>{{ site.title | default: site.github.repository_name }}</h1>\n        <p>{{ site.description | default: site.github.project_tagline }}\n        <br>Latest crawl: {{site.latest_crawl}}\n        </p>\n\n        {% if site.show_navigation %}\n          <nav>\n            <p>\n            {% for node in site.navlist %}\n              <a href=\"{{ site.baseurl }}{{ node.url }}\">{{ node.title }}</a><br/>\n            {% endfor %}\n            </p>\n          </nav>\n        {% endif %}\n\n      </header>\n      <section>\n\n      {{ content }}\n\n      </section>\n      <footer>\n        {% if site.github.is_project_page %}\n          <p class=\"view\"><a href=\"{{ site.github.repository_url }}\">View the Project on GitHub <small>{{ github_name }}</small></a></p>\n        {% endif %}\n        {% if site.github.is_project_page %}\n        <p>This project is maintained by <a href=\"{{ site.github.owner_url }}\">{{ site.github.owner_name }}</a></p>\n        {% endif %}\n        <p><small>Hosted on GitHub Pages &mdash; Theme by <a href=\"https://github.com/orderedlist\">orderedlist</a></small></p>\n      </footer>\n    </div>\n    <script src=\"{{ '/assets/js/scale.fix.js' | relative_url }}\"></script>\n\n  </body>\n</html>\n<!--\n Based on:\n  https://github.com/pages-themes/minimal\n  
https://github.com/orderedlist/minimal\n-->"
  },
  {
    "path": "_layouts/table.html",
    "content": "<!doctype html>\n<html lang=\"{{ site.lang | default: \"en-US\" }}\">\n  <head>\n    <meta charset=\"utf-8\">\n    <meta http-equiv=\"X-UA-Compatible\" content=\"chrome=1\">\n    <title>{{ site.title | default: site.github.repository_name }} by {{ site.github.owner_name }}</title>\n\n    <link rel=\"stylesheet\" href=\"{{ '/assets/css/style.css?v=' | append: site.github.build_revision | relative_url }}\">\n    <meta name=\"viewport\" content=\"width=device-width\">\n    <!--[if lt IE 9]>\n    <script src=\"//html5shiv.googlecode.com/svn/trunk/html5.js\"></script>\n    <![endif]-->\n    <script src=\"{{ '/assets/js/jquery-3.7.1.min.js?v=' | append: site.github.build_revision | relative_url }}\"></script>\n    <script src=\"{{ '/assets/js/jquery.tablesorter.min.js?v=' | append: site.github.build_revision | relative_url }}\"></script>\n    <script type=\"text/javascript\">\n      $(document).ready(function() {\n        $(\".tablesorter\").tablesorter({{ page.table_sortlist }});\n        $(\"table.iso639-3-language tbody tr th\").each(function() {\n          $(this).html(\"<a href='https://en.wikipedia.org/wiki/ISO_639:\" + $(this).html() + \"'>\" + $(this).html() + \"</a>\");\n        });\n\t    $(\"#search\").on(\"keyup\", function() {\n    \t  var value = $(this).val().toLowerCase();\n          $(\".tablesearcher tbody tr\").filter(function() {\n            $(this).toggle($(this).children('th').text().indexOf(value) > -1);\n          });\n        });\n      });\n    </script>\n    <style>\n      table.tablepercentage { table-layout: auto; }\n      table.tablepercentage thead tr:first-child th {\n          hyphens: auto; font-size: small;\n      }\n      table.tablepercentage td { min-width: 60px; }\n      table.tablepercentage tbody th { max-width: 200px; hyphens: auto; }\n      table.tablepercentage thead tr:last-child .header:not(:first-child):before {\n        content: \"%\";\n      }\n      table.matrix tbody tr th {\n        font-weight: bold;\n 
     }\n      table.tablesorter thead tr:last-child .header {\n        background-image: url({{ '/assets/img/bg.gif?v=' | append: site.github.build_revision | relative_url }});\n        background-repeat: no-repeat;\n        background-position: center right;\n        cursor: pointer;\n      }\n      table.tablesorter thead tr:last-child .headerSortUp {\n        background-image: url({{ '/assets/img/asc.gif?v=' | append: site.github.build_revision | relative_url }});\n      }\n      table.tablesorter thead tr:last-child .headerSortDown {\n        background-image: url({{ '/assets/img/desc.gif?v=' | append: site.github.build_revision | relative_url }});\n      }\n      table tbody th { font-weight: normal; }\n      table tbody td { text-align: right; }\n    </style>\n\n  </head>\n  <body>\n    <div class=\"wrapper\">\n      <header>\n        <h1>{{ site.title | default: site.github.repository_name }}</h1>\n        <p>{{ site.description | default: site.github.project_tagline }}\n        <br>Latest crawl: {{site.latest_crawl}}\n        </p>\n\n        {% if site.show_navigation %}\n          <nav>\n            <p>\n            {% for node in site.navlist %}\n              <a href=\"{{ site.baseurl }}{{ node.url }}\">{{ node.title }}</a><br/>\n            {% endfor %}\n            </p>\n          </nav>\n        {% endif %}\n\n        {% if site.github.is_project_page %}\n          <p class=\"view\"><a href=\"{{ site.github.repository_url }}\">View the Project on GitHub <small>{{ github_name }}</small></a></p>\n        {% endif %}\n\n      </header>\n      <section>\n\n      {{ content }}\n\n      {% if page.table_searcher %}\n      <p><input type=\"text\" id=\"search\" placeholder=\"{{ page.table_searcher }}\"></p>\n      {% endif %}\n\n      {% for table in page.table_include %}\n      {% include_relative {{ table }} %}\n      <br>\n      {% endfor %}\n\n      </section>\n      <footer>\n        {% if site.github.is_project_page %}\n        <p>This project is 
maintained by <a href=\"{{ site.github.owner_url }}\">{{ site.github.owner_name }}</a></p>\n        {% endif %}\n        <p><small>Hosted on GitHub Pages &mdash; Theme by <a href=\"https://github.com/orderedlist\">orderedlist</a></small></p>\n      </footer>\n    </div>\n    <script src=\"{{ '/assets/js/scale.fix.js' | relative_url }}\"></script>\n\n  </body>\n</html>\n<!--\n Based on:\n  https://github.com/pages-themes/minimal\n  https://github.com/orderedlist/minimal\n  http://tablesorter.com/\n-->"
  },
  {
    "path": "crawlplot.py",
    "content": "\"\"\"\nBase plotting module for Common Crawl statistics visualization.\n\nThis module provides the CrawlPlot base class which handles:\n- Plot library selection (matplotlib, rpy2/ggplot2, or legacy ggplot)\n- Common plot styling to match ggplot2 aesthetics\n- Data input from stdin or files\n- Output directory management\n\nThe plot library is controlled by the PLOTLIB environment variable:\n- 'matplotlib' (recommended)\n- 'rpy2.ggplot2' (requires R and rpy2)\n- 'ggplot' (deprecated)\n\nThe output directory is controlled by PLOTDIR (defaults to 'plots/').\n\"\"\"\n\nimport json\nimport logging\nimport os\nimport os.path\nimport sys\nfrom typing import Literal\n\nimport fsspec\nimport numpy as np\n\n\n# Supported plot library backends\nPlotLibType = Literal[\"rpy2.ggplot2\", \"ggplot\", \"matplotlib\"]\n\n\nclass CrawlPlot:\n    \"\"\"\n    Base class for Common Crawl statistics plots.\n\n    Provides common functionality for all plot types including:\n    - Plot library initialization and configuration\n    - Data reading from stdin or gzipped files\n    - Line plot generation with consistent styling\n    - Output directory management\n\n    Subclasses should implement:\n    - add(key, val): Process a single data record\n    - plot(): Generate the specific visualization\n\n    Attributes:\n        PLOTLIB: The plotting library to use ('matplotlib', 'rpy2.ggplot2', or 'ggplot')\n        PLOTDIR: Directory for saving plot output files\n        DEFAULT_FIGSIZE: Default figure size in inches (7 = 2100px at 300 DPI)\n        DEFAULT_DPI: Default resolution for saved figures\n    \"\"\"\n\n    GGPLOT2_THEME = None\n    GGPLOT2_THEME_KWARGS = None\n\n    # figure with square aspect ratio : 7 inches * 300 DPI = 2100 pixels\n    DEFAULT_FIGSIZE = 7\n    DEFAULT_DPI = 300\n\n    title_fontsize = 15\n    title_pad = 20\n    title_fontweight = \"normal\"\n    title_loc = \"left\"\n    xlabel_fontsize = 12\n    ylabel_fontsize = 12\n    ticks_fontsize = 10\n    
ticks_color = \"#E6E6E6\"\n    ticks_length = 8\n    ticks_width = 1.0\n    bar_width = 0.8\n    legend_fontsize = 10\n    legend_title_fontsize = 11\n    line_width = 0.75\n    marker_size = 4\n    grid_major_linewidth = 1.0\n    grid_minor_linewidth = 0.5\n    grid_major_color = \"#E6E6E6\"\n    grid_minor_color = \"#E6E6E6\"\n    tight_layout_pad = 0.5\n    savefig_facecolor = \"white\"\n    savefig_bbox_inches = None\n\n    # -------------------------------------------------------------------------\n    # Matplotlib helper methods for reducing code duplication\n    # -------------------------------------------------------------------------\n\n    def create_figure(self, ratio=1.0):\n        \"\"\"Create a matplotlib figure with consistent sizing.\n\n        Args:\n            ratio: Height ratio relative to width (default: 1.0 for square)\n\n        Returns:\n            Tuple of (fig, ax)\n        \"\"\"\n        import matplotlib.pyplot as plt\n        return plt.subplots(figsize=(self.DEFAULT_FIGSIZE, self.DEFAULT_FIGSIZE * ratio))\n\n    def set_title(self, ax, title):\n        \"\"\"Apply consistent title styling to an axes.\n\n        Args:\n            ax: matplotlib Axes object\n            title: Title text\n        \"\"\"\n        ax.set_title(\n            title,\n            fontsize=self.title_fontsize,\n            fontweight=self.title_fontweight,\n            pad=self.title_pad,\n            loc=self.title_loc,\n        )\n\n    def apply_ggplot2_style(self, ax, show_grid=True, grid_axis='both'):\n        \"\"\"Apply ggplot2-like minimal styling to an axes.\n\n        Removes spines, adds grid lines, and sets axes below plot elements.\n\n        Args:\n            ax: matplotlib Axes object\n            show_grid: Whether to show grid lines (default: True)\n            grid_axis: Which axis to show grid on ('both', 'x', or 'y')\n        \"\"\"\n        # Remove all spines\n        for spine in ['top', 'right', 'left', 'bottom']:\n            
ax.spines[spine].set_visible(False)\n\n        # Add grid\n        if show_grid:\n            ax.grid(True, which='major', linewidth=self.grid_major_linewidth,\n                    color=self.grid_major_color, zorder=0, axis=grid_axis)\n\n        ax.set_axisbelow(True)\n\n    def set_tick_labels_black(self, ax):\n        \"\"\"Set all tick labels to black color.\n\n        Args:\n            ax: matplotlib Axes object\n        \"\"\"\n        for label in ax.get_xticklabels() + ax.get_yticklabels():\n            label.set_color('black')\n\n    def apply_nice_ticks(self, ax, axis='y', use_scientific=True):\n        \"\"\"Apply nice tick spacing using the nice_tick_step calculation.\n\n        Sets minor and major ticks at 'nice' intervals (multiples of 1, 2, or 5).\n        Optionally applies scientific notation for large values.\n\n        Args:\n            ax: matplotlib Axes object\n            axis: Which axis to apply to ('x' or 'y')\n            use_scientific: Whether to use scientific notation for large values\n        \"\"\"\n        from matplotlib.ticker import MultipleLocator, FormatStrFormatter\n\n        if axis == 'y':\n            vmin, vmax = ax.get_ylim()\n            axis_obj = ax.yaxis\n        else:\n            vmin, vmax = ax.get_xlim()\n            axis_obj = ax.xaxis\n\n        minor = self.nice_tick_step(vmin, vmax, n=8)\n        major = 2 * minor\n\n        axis_obj.set_minor_locator(MultipleLocator(minor))\n        axis_obj.set_major_locator(MultipleLocator(major))\n\n        if use_scientific and vmax > 1e4:\n            axis_obj.set_major_formatter(FormatStrFormatter('%.0e'))\n\n    def save_figure(self, fig, img_path):\n        \"\"\"Save figure with consistent settings and close it.\n\n        Args:\n            fig: matplotlib Figure object\n            img_path: Output file path\n\n        Returns:\n            The figure object (for chaining)\n        \"\"\"\n        import matplotlib.pyplot as plt\n        
plt.tight_layout(pad=self.tight_layout_pad)\n        plt.savefig(img_path, dpi=self.DEFAULT_DPI,\n                    bbox_inches=self.savefig_bbox_inches,\n                    facecolor=self.savefig_facecolor)\n        plt.close()\n        return fig\n\n    def hide_tick_marks(self, ax, tick_color='#FFFFFF'):\n        \"\"\"Hide tick marks by setting them to a background color.\n\n        The tick labels remain visible but the tick marks themselves are hidden.\n\n        Args:\n            ax: matplotlib Axes object\n            tick_color: Color to set ticks to (default: white)\n        \"\"\"\n        ax.tick_params(axis='both', which='both', colors=tick_color,\n                       length=self.ticks_length, width=self.ticks_width)\n\n    def __init__(self):\n        \"\"\"Initialize the plot with library selection and output directory setup.\"\"\"\n        # Settings defined via environment variables\n        self.PLOTLIB: PlotLibType = os.environ.get('PLOTLIB', 'matplotlib')\n        self.PLOTDIR = os.environ.get('PLOTDIR', 'plots')\n\n        if self.PLOTLIB == 'ggplot':\n            # nothing to do here\n            pass\n        elif self.PLOTLIB == 'rpy2.ggplot2':\n            from rpy2.robjects.lib import ggplot2\n            from rpy2.robjects import pandas2ri\n            pandas2ri.activate()\n            # use minimal theme with white background set in plot constructor\n            # https://ggplot2.tidyverse.org/reference/ggtheme.html\n            self.GGPLOT2_THEME = ggplot2.theme_minimal(base_size=12, base_family=\"Helvetica\")\n\n            self.GGPLOT2_THEME_KWARGS = {\n                'panel.background': ggplot2.element_rect(fill='white', color='white'),\n                'plot.background': ggplot2.element_rect(fill='white', color='white')\n            }\n\n        elif self.PLOTLIB == \"matplotlib\":\n            import matplotlib.pyplot as plt\n\n            # ggplot2-inspired color palette\n            ggplot_colors = [\n                
\"#F8766D\", \"#00BE67\", \"#00A9FF\", \"#CD9600\", \"#7CAE00\",\n                \"#00BFC4\", \"#C77CFF\", \"#FF61CC\",\n            ]\n\n            # Set up ggplot2-like minimal theme with larger fonts\n            plt.style.use('default')\n            plt.rcParams.update({\n                'font.family': 'sans-serif',\n                'font.sans-serif': ['Liberation Sans', 'Arial', 'DejaVu Sans'],\n                'font.size': 20,  # Much larger base font size\n                'axes.linewidth': 1.5,\n                'axes.spines.left': True,\n                'axes.spines.bottom': True,\n                'axes.spines.top': False,\n                'axes.spines.right': False,\n                'axes.axisbelow': True,\n                'axes.grid': True,\n                'axes.grid.axis': 'both',\n                'grid.linewidth': 1.0,\n                'grid.color': '#E6E6E6',  # Gray grid lines\n                'axes.facecolor': 'white',  # White background\n                'figure.facecolor': 'white',\n                'xtick.bottom': True,\n                'xtick.top': False,\n                'ytick.left': True,\n                'ytick.right': False,\n                'xtick.direction': 'out',\n                'ytick.direction': 'out',\n                'axes.prop_cycle':  plt.cycler(color=ggplot_colors),\n            })\n\n        else:\n            raise ValueError(\"Invalid PLOTLIB defined\")\n\n        # Make sure output directories exists\n        os.makedirs(os.path.join(self.PLOTDIR, \"crawler\"), exist_ok=True)\n        os.makedirs(os.path.join(self.PLOTDIR, \"crawloverlap\"), exist_ok=True)\n        os.makedirs(os.path.join(self.PLOTDIR, \"crawlsize\"), exist_ok=True)\n        os.makedirs(os.path.join(self.PLOTDIR, \"tld\"), exist_ok=True)\n\n\n    def read_from_stdin_or_file(self):\n        \"\"\"Read statistics data from a file argument or stdin.\n\n        If a file path is provided as the first command line argument,\n        reads from that file 
(supports gzip compression). Otherwise,\n        reads from stdin.\n        \"\"\"\n        if len(sys.argv) > 1:\n            # File provided as argument\n            fp = sys.argv[1]\n            compression = (\"gzip\" if fp.endswith(\".gz\") else None)\n\n            with fsspec.open(fp, 'r', compression=compression) as f:\n                self.read_data(f)\n        else:\n            # No argument, use stdin\n            self.read_data(sys.stdin)\n\n    def read_data(self, stream):\n        \"\"\"Parse tab-separated JSON key-value pairs from a stream.\n\n        Args:\n            stream: Input stream containing lines of tab-separated JSON data.\n                   Each line should have format: JSON_KEY<tab>JSON_VALUE\n        \"\"\"\n        for line in stream:\n            keyval = line.split('\\t')\n            if len(keyval) == 2:\n                key = json.loads(keyval[0])\n                val = json.loads(keyval[1])\n                self.add(key, val)\n            else:\n                logging.error(\"Not a key-value pair: {}\".format(line))\n\n    def line_plot_with_ggplot(\n        self,\n        data,\n        title,\n        ylabel,\n        img_path,\n        x=\"date\",\n        y=\"size\",\n        c=\"type\",\n        clabel=\"\",\n        ratio=1.0,\n    ):\n        \"\"\"Generate a line plot using the legacy ggplot library (deprecated).\"\"\"\n        from ggplot import ggplot, aes, ggtitle, ylab, xlab, scale_x_date, date_breaks, geom_line, geom_point\n\n        date_label = \"%Y\\n%W\"  # year + week number\n        p = (\n            ggplot(data, aes(x=x, y=y, color=c))\n            + ggtitle(title)\n            + ylab(ylabel)\n            + xlab(\" \")\n            + scale_x_date(breaks=date_breaks(\"3 months\"), labels=date_label)\n            + geom_line()\n            + geom_point()\n        )\n        p.save(img_path)\n        return p\n\n    def line_plot_with_rpy2_ggplot2(\n        self,\n        data,\n        title,\n        
ylabel,\n        img_path,\n        x=\"date\",\n        y=\"size\",\n        c=\"type\",\n        clabel=\"\",\n        ratio=1.0,\n    ):\n        \"\"\"Generate a line plot using R's ggplot2 via rpy2.\"\"\"\n        from rpy2.robjects.lib import ggplot2\n\n        # Convert y axis to float because R uses 32-bit signed integers\n        # and values >= 2 billion (2^31) will overflow\n        data[y] = data[y].astype(float)\n        if y != \"size\" and \"size\" in data.columns:\n            data[\"size\"] = data[\"size\"].astype(float)\n        p = (\n            ggplot2.ggplot(data)\n            + ggplot2.aes_string(x=x, y=y, color=c)\n            + ggplot2.geom_line(linewidth=0.5)\n            + ggplot2.geom_point()\n            + self.GGPLOT2_THEME\n            + ggplot2.theme(\n                **{\n                    \"legend.position\": \"bottom\",\n                    \"aspect.ratio\": ratio,\n                    **self.GGPLOT2_THEME_KWARGS,\n                }\n            )\n            + ggplot2.labs(title=title, x=\"\", y=ylabel, color=clabel)\n        )\n\n        p.save(img_path)\n\n        return p\n\n    @staticmethod\n    def nice_tick_step(vmin, vmax, n=5):\n        \"\"\"Calculate a 'nice' tick step for axis labels.\n\n        Returns a tick step value that is a multiple of 1, 2, or 5 times\n        a power of 10, which produces clean, readable axis labels.\n\n        Args:\n            vmin: Minimum value of the axis range\n            vmax: Maximum value of the axis range\n            n: Approximate number of tick intervals desired (default: 5)\n\n        Returns:\n            A 'nice' tick step value (1/2/5 * 10^k)\n        \"\"\"\n        span = abs(vmax - vmin)\n        if span == 0:\n            return 1.0\n        raw = span / n\n        exp = np.floor(np.log10(raw))\n        frac = raw / (10**exp)\n        nice_frac = 1 if frac <= 1 else 2 if frac <= 2 else 5 if frac <= 5 else 10\n        return nice_frac * 10**exp\n    \n    
@staticmethod\n    def center_legend_title(fig, ax, leg_items, leg_title, x_axes=0.1):\n        \"\"\"Center the legend title vertically with respect to legend items.\"\"\"\n        fig.canvas.draw()\n        r = fig.canvas.get_renderer()\n        bb = leg_items.get_window_extent(r)\n        y = fig.transFigure.inverted().transform((0, (bb.y0+bb.y1)/2))[1]\n        x = fig.transFigure.inverted().transform(ax.transAxes.transform((x_axes, 0)))[0]\n        leg_title.set_bbox_to_anchor((x, y), transform=fig.transFigure)\n\n    def line_plot_with_matplotlib(\n        self,\n        data,\n        title,\n        ylabel,\n        img_path,\n        x=\"date\",\n        y=\"size\",\n        c=\"type\",\n        clabel=\"\",\n        ratio=1.0,\n    ):\n        \"\"\"Generate a line plot using matplotlib with ggplot2-like styling.\n\n        Creates a multi-series line plot with markers, styled to match\n        ggplot2's minimal theme aesthetic.\n\n        Args:\n            data: pandas DataFrame containing the plot data\n            title: Plot title\n            ylabel: Y-axis label\n            img_path: Output file path for the saved image\n            x: Column name for x-axis values (default: 'date')\n            y: Column name for y-axis values (default: 'size')\n            c: Column name for grouping/color (default: 'type')\n            clabel: Legend title (default: '')\n            ratio: Aspect ratio for the plot (default: 1.0)\n\n        Returns:\n            matplotlib Figure object\n        \"\"\"\n        from matplotlib.ticker import AutoMinorLocator\n        from matplotlib.dates import YearLocator, DateFormatter\n\n        # Convert y axis to float for consistency with large values\n        data[y] = data[y].astype(float)\n        if y != \"size\" and \"size\" in data.columns:\n            data[\"size\"] = data[\"size\"].astype(float)\n\n        fig, ax = self.create_figure()\n        groups = data.groupby(c)\n\n        # Use ggplot2 default colors for 
small group counts\n        colors = [\"#F8766D\", \"#00BA38\", \"#619CFF\"] if len(groups) <= 3 else None\n\n        for i, (group_key, group_df) in enumerate(groups):\n            group_color = colors[i] if colors is not None else None\n            ax.plot(\n                group_df[x], group_df[y], \"o-\",\n                color=group_color, label=group_key,\n                linewidth=self.line_width, markersize=self.marker_size,\n            )\n\n        self.set_title(ax, title)\n        ax.set_xlabel(\"\")\n        ax.set_ylabel(ylabel, fontsize=self.ylabel_fontsize)\n\n        # Apply nice y-axis ticks\n        self.apply_nice_ticks(ax, axis='y')\n\n        # Axes ratio\n        axes_aspect_ratio = 1 / ax.get_data_ratio() * ratio\n        if axes_aspect_ratio < 1:\n            ax.set_aspect(axes_aspect_ratio)\n\n        # Date formatting for x-axis\n        ax.xaxis.set_major_formatter(DateFormatter(\"%Y\"))\n        ax.xaxis.set_major_locator(YearLocator(base=5))\n        ax.xaxis.set_minor_locator(AutoMinorLocator(2))\n\n        ax.tick_params(axis=\"both\", labelsize=self.ticks_fontsize)\n\n        # Grid with both major and minor lines\n        ax.grid(True, which=\"major\", linewidth=self.grid_major_linewidth,\n                color=self.grid_major_color, zorder=0)\n        ax.grid(True, which=\"minor\", linewidth=self.grid_minor_linewidth,\n                color=self.grid_minor_color, zorder=0)\n        ax.set_axisbelow(True)\n\n        # Apply ggplot2 style (remove spines)\n        for spine in ['top', 'right', 'left', 'bottom']:\n            ax.spines[spine].set_visible(False)\n\n        # Hide tick marks but keep labels black\n        self.hide_tick_marks(ax)\n        self.set_tick_labels_black(ax)\n\n        # Legend setup\n        num_legend_items = len(groups)\n        ncol = 5 if num_legend_items == 5 else 4\n\n        if clabel:\n            leg_items = ax.legend(\n                loc=\"upper center\", ncol=ncol, bbox_to_anchor=(0.6, -0.1),\n   
             frameon=False, fontsize=self.legend_fontsize,\n            )\n            ax.legend(\n                [], [], title=clabel, loc=\"upper center\",\n                bbox_to_anchor=(0.2, -0.075), frameon=False,\n                title_fontsize=self.legend_title_fontsize,\n            )\n            ax.add_artist(leg_items)\n        else:\n            ax.legend(\n                loc=\"upper center\", bbox_to_anchor=(0.5, -0.1),\n                ncol=ncol, frameon=False, fontsize=self.legend_fontsize,\n            )\n\n        return self.save_figure(fig, img_path)\n\n    def line_plot(\n        self,\n        data,\n        title,\n        ylabel,\n        img_file,\n        x=\"date\",\n        y=\"size\",\n        c=\"type\",\n        clabel=\"\",\n        ratio=1.0,\n    ):\n        \"\"\"Generate a line plot using the configured plotting library.\n\n        This is the main entry point for creating line plots. It delegates\n        to the appropriate backend based on the PLOTLIB setting.\n\n        Args:\n            data: pandas DataFrame containing the plot data\n            title: Plot title\n            ylabel: Y-axis label\n            img_file: Output filename relative to PLOTDIR\n            x: Column name for x-axis values (default: 'date')\n            y: Column name for y-axis values (default: 'size')\n            c: Column name for grouping/color (default: 'type')\n            clabel: Legend title (default: '')\n            ratio: Aspect ratio for the plot (default: 1.0)\n\n        Returns:\n            Plot object (type depends on backend)\n        \"\"\"\n        img_path = os.path.join(self.PLOTDIR, img_file)\n\n        if self.PLOTLIB == \"ggplot\":\n            return self.line_plot_with_ggplot(\n                data=data,\n                title=title,\n                ylabel=ylabel,\n                img_path=img_path,\n                x=x,\n                y=y,\n                c=c,\n                clabel=clabel,\n                
ratio=ratio,\n            )\n\n        elif self.PLOTLIB == \"rpy2.ggplot2\":\n            return self.line_plot_with_rpy2_ggplot2(\n                data=data,\n                title=title,\n                ylabel=ylabel,\n                img_path=img_path,\n                x=x,\n                y=y,\n                c=c,\n                clabel=clabel,\n                ratio=ratio,\n            )\n\n        elif self.PLOTLIB == \"matplotlib\":\n            return self.line_plot_with_matplotlib(\n                data=data,\n                title=title,\n                ylabel=ylabel,\n                img_path=img_path,\n                x=x,\n                y=y,\n                c=c,\n                clabel=clabel,\n                ratio=ratio,\n            )\n"
  },
  {
    "path": "crawlstats.py",
    "content": "import heapq\nimport json\nimport logging\nimport os\nimport re\n\nfrom collections import defaultdict, Counter\nfrom datetime import date\nfrom enum import Enum\nfrom urllib.parse import urlparse\n\nimport mrjob.util\nimport tldextract\nimport ujson\n\nfrom hyperloglog import HyperLogLog\nfrom isoweek import Week\nfrom mrjob.job import MRJob, MRStep\nfrom mrjob.protocol import JSONProtocol, RawValueProtocol\n\n\nHYPERLOGLOG_ERROR = .01\n\n# threshold when to add a HyperLogLog for SURT domains\nMIN_SURT_HLL_SIZE = 50000\n\nLOGGING_FORMAT = '%(asctime)s: [%(levelname)s]: %(message)s'\nLOGGING_LEVEL = logging.INFO\nLOG = logging.getLogger('CCStatsJob')\nmrjob.util.log_to_stream(format=LOGGING_FORMAT,\n                         level=LOGGING_LEVEL,\n                         name='CCStatsJob')\n\n\nclass MonthlyCrawl:\n    \"\"\"Enumeration of monthly crawl archives\"\"\"\n\n    by_name = {\n               'CC-MAIN-2008-2009': 88,\n               'CC-MAIN-2009-2010': 89,\n               'CC-MAIN-2012': 90,\n               'CC-MAIN-2013-20': 91,\n               'CC-MAIN-2013-48': 92,\n               'CC-MAIN-2014-10': 93,\n               'CC-MAIN-2014-15': 94,\n               'CC-MAIN-2014-23': 95,\n               'CC-MAIN-2014-35': 96,\n               'CC-MAIN-2014-41': 97,\n               'CC-MAIN-2014-42': 98,\n               'CC-MAIN-2014-49': 99,\n               'CC-MAIN-2014-52': 0,\n               'CC-MAIN-2015-06': 1,\n               'CC-MAIN-2015-11': 2,\n               'CC-MAIN-2015-14': 3,\n               'CC-MAIN-2015-18': 4,\n               'CC-MAIN-2015-22': 5,\n               'CC-MAIN-2015-27': 6,\n               'CC-MAIN-2015-32': 7,\n               'CC-MAIN-2015-35': 8,\n               'CC-MAIN-2015-40': 9,\n               'CC-MAIN-2015-48': 10,\n               'CC-MAIN-2016-07': 11,\n               'CC-MAIN-2016-18': 12,\n               'CC-MAIN-2016-22': 13,\n               'CC-MAIN-2016-26': 14,\n               'CC-MAIN-2016-30': 15,\n 
              'CC-MAIN-2016-36': 16,\n               'CC-MAIN-2016-40': 17,\n               'CC-MAIN-2016-44': 18,\n               'CC-MAIN-2016-50': 19,\n               'CC-MAIN-2017-04': 20,\n               'CC-MAIN-2017-09': 21,\n               'CC-MAIN-2017-13': 22,\n               'CC-MAIN-2017-17': 23,\n               'CC-MAIN-2017-22': 24,\n               'CC-MAIN-2017-26': 25,\n               'CC-MAIN-2017-30': 26,\n               'CC-MAIN-2017-34': 27,\n               'CC-MAIN-2017-39': 28,\n               'CC-MAIN-2017-43': 29,\n               'CC-MAIN-2017-47': 30,\n               'CC-MAIN-2017-51': 31,\n               'CC-MAIN-2018-05': 32,\n               'CC-MAIN-2018-09': 33,\n               'CC-MAIN-2018-13': 34,\n               'CC-MAIN-2018-17': 35,\n               'CC-MAIN-2018-22': 36,\n               'CC-MAIN-2018-26': 37,\n               'CC-MAIN-2018-30': 38,\n               'CC-MAIN-2018-34': 39,\n               'CC-MAIN-2018-39': 40,\n               'CC-MAIN-2018-43': 41,\n               'CC-MAIN-2018-47': 42,\n               'CC-MAIN-2018-51': 43,\n               'CC-MAIN-2019-04': 44,\n               'CC-MAIN-2019-09': 45,\n               'CC-MAIN-2019-13': 46,\n               'CC-MAIN-2019-18': 47,\n               'CC-MAIN-2019-22': 48,\n               'CC-MAIN-2019-26': 49,\n               'CC-MAIN-2019-30': 50,\n               'CC-MAIN-2019-35': 51,\n               'CC-MAIN-2019-39': 52,\n               'CC-MAIN-2019-43': 53,\n               'CC-MAIN-2019-47': 54,\n               'CC-MAIN-2019-51': 55,\n               'CC-MAIN-2020-05': 56,\n               'CC-MAIN-2020-10': 57,\n               'CC-MAIN-2020-16': 58,\n               'CC-MAIN-2020-24': 59,\n               'CC-MAIN-2020-29': 60,\n               'CC-MAIN-2020-34': 61,\n               'CC-MAIN-2020-40': 62,\n               'CC-MAIN-2020-45': 63,\n               'CC-MAIN-2020-50': 64,\n               'CC-MAIN-2021-04': 65,\n               'CC-MAIN-2021-10': 66,\n            
   'CC-MAIN-2021-17': 67,\n               'CC-MAIN-2021-21': 68,\n               'CC-MAIN-2021-25': 69,\n               'CC-MAIN-2021-31': 70,\n               'CC-MAIN-2021-39': 71,\n               'CC-MAIN-2021-43': 72,\n               'CC-MAIN-2021-49': 73,\n               'CC-MAIN-2022-05': 74,\n               'CC-MAIN-2022-21': 75,\n               'CC-MAIN-2022-27': 76,\n               'CC-MAIN-2022-33': 77,\n               'CC-MAIN-2022-40': 78,\n               'CC-MAIN-2022-49': 79,\n               'CC-MAIN-2023-06': 80,\n               'CC-MAIN-2023-14': 81,\n               'CC-MAIN-2023-23': 82,\n               'CC-MAIN-2023-40': 83,\n               'CC-MAIN-2023-50': 84,\n               'CC-MAIN-2024-10': 85,\n               'CC-MAIN-2024-18': 86,\n               'CC-MAIN-2024-22': 87,\n               'CC-MAIN-2024-26': 100,\n               'CC-MAIN-2024-30': 101,\n               'CC-MAIN-2024-33': 102,\n               'CC-MAIN-2024-38': 103,\n               'CC-MAIN-2024-42': 104,\n               'CC-MAIN-2024-46': 105,\n               'CC-MAIN-2024-51': 106,\n               'CC-MAIN-2025-05': 107,\n               'CC-MAIN-2025-08': 108,\n               'CC-MAIN-2025-13': 109,\n               'CC-MAIN-2025-18': 110,\n               'CC-MAIN-2025-21': 111,\n               'CC-MAIN-2025-26': 112,\n               'CC-MAIN-2025-30': 113,\n               'CC-MAIN-2025-33': 114,\n               'CC-MAIN-2025-38': 115,\n               'CC-MAIN-2025-43': 116,\n               'CC-MAIN-2025-47': 117,\n               'CC-MAIN-2025-51': 118,\n               'CC-MAIN-2026-04': 119,\n               'CC-MAIN-2026-08': 120,\n               'CC-MAIN-2026-12': 121,\n               'CC-MAIN-2026-17': 122,\n               'CC-MAIN-2026-21': 123,\n    }\n\n    by_id = dict(map(reversed, by_name.items()))\n\n    @staticmethod\n    def get_by_name(name):\n        return MonthlyCrawl.by_name[name]\n\n    @staticmethod\n    def to_name(crawl):\n        return 
MonthlyCrawl.by_id[crawl]\n\n    @staticmethod\n    def to_bit_mask(crawl):\n        return (1 << crawl)\n\n    @staticmethod\n    def date_of(crawl):\n        if crawl == 'CC-MAIN-2008-2009':\n            return date(2009, 1, 12)\n        if crawl == 'CC-MAIN-2009-2010':\n            return date(2010, 9, 25)\n        if crawl == 'CC-MAIN-2012':\n            return date(2012, 11, 2)\n        [_, _, year, week] = crawl.split('-')\n        return Week(int(year), int(week)).monday()\n\n    @staticmethod\n    def year_of(crawl):\n        return MonthlyCrawl.date_of(crawl).year\n\n    @staticmethod\n    def short_name(name):\n        return name.replace('CC-MAIN-', '')\n\n    @staticmethod\n    def get_latest(n):\n        return sorted(MonthlyCrawl.by_name.keys())[-n:]\n\n\nclass MonthlyCrawlSet:\n    \"\"\"Dense representation of a list of monthly crawls.\n    Represent in which crawls a given item (URL, but also\n    domain, host, digest) occurs.\n    \"\"\"\n\n    def __init__(self, crawls=0):\n        self.bits = crawls\n\n    def add(self, crawl):\n        self.bits |= MonthlyCrawl.to_bit_mask(crawl)\n\n    def update(self, *others):\n        for other in others:\n            self.bits |= other.get_bits()\n\n    def clear(self):\n        self.bits = 0\n\n    def discard(self, crawl):\n        self.bits &= ~MonthlyCrawl.to_bit_mask(crawl)\n\n    def __contains__(self, crawl):\n        return (self.bits & MonthlyCrawl.to_bit_mask(crawl)) != 0\n\n    def __len__(self):\n        \"\"\"popcount of a 32 bit integer.\"\"\"\n        i = self.bits\n        i = i - ((i >> 1) & 0x55555555)\n        i = (i & 0x33333333) + ((i >> 2) & 0x33333333)\n        return (((i + (i >> 4) & 0xF0F0F0F) * 0x1010101) & 0xffffffff) >> 24\n\n    def get_bits(self):\n        return self.bits\n\n    def get_crawls(self):\n        i = self.bits\n        r = 0\n        while (i):\n            if (i & 1):\n                yield r\n            r += 1\n            i >>= 1\n\n    def is_new(self, 
crawl):\n        \"\"\"True if there are no older crawls in set (no lower id)\"\"\"\n        if (self.bits == 0):\n            return True\n        i = self.bits\n        i = (i ^ (i - 1)) >> 1  # set trailing 0s to 1s and zero rest\n        r = 0\n        while (i):\n            if r == crawl:\n                return True\n            r += 1\n            i >>= 1\n        if (r < crawl):\n            return False\n        return True\n\n    def is_newest(self, crawl):\n        \"\"\"True if crawl is the newest crawl in set (highest id)\"\"\"\n        # i = self.bits\n        # j = MonthlyCrawl.to_bit_mask(crawl)\n        # return (i & ~j) < j\n        return self.bits.bit_length() == (crawl + 1)\n\n\nclass CST(Enum):\n    \"\"\"Enum for crawl statistics types.\n    Every line (key-value pair) has a marker which indicates the type\n    of the count / frequency:\n    - pages, URLs, hosts, etc.\n    - size (number of unique items), histograms, etc.\n    The type marker (the first element in the key tuple) determines\n    the format of the line (key-value pair):\n      <<type, key_params...>, <values...>>\n    The format may vary for different steps (job, mapper, reducer).\n    The count job (CCCountJob) uses the numeric types to reduce\n    the data size, while CCStatsJob outputs the type names for better\n    readability.\n    Types of countable items\n    #   <<type, item, crawl>, <count(s)>>\n    # For hosts, domains, etc. 
MultiCount is used to hold two counts -\n    # the number of pages and URLs per item.\"\"\"\n    url = 0\n    \"\"\"(unique) URL\"\"\"\n    digest = 1\n    \"\"\"(unique) content digest (MD5)\"\"\"\n    host = 2\n    \"\"\"hostname (\"www.commoncrawl.org\")\"\"\"\n    domain = 3\n    \"\"\"pay-level domain or private domain (\"commoncrawl.org\")\"\"\"\n    tld = 4\n    \"\"\"public suffix (\"org\" or \"co.uk\")\n    - not necessarily a TLD / \"top-level domain\" according to\n      https://github.com/google/guava/wiki/InternetDomainNameExplained\n    - here following https://github.com/john-kurkowski/tldextract\"\"\"\n    surt_domain = 5\n    \"\"\"surt_domain :- SURT domain (\"org,commoncrawl\")\n    - Sort-friendly URI Reordering Transform, cf.\n      http://crawler.archive.org/articles/user_manual/glossary.html#surt\"\"\"\n    scheme = 6\n    \"\"\"URI scheme (\"http\", \"https\")\n    see https://en.wikipedia.org/wiki/Uniform_Resource_Identifier#Syntax\"\"\"\n    mimetype = 7\n    \"\"\"MIME type / media type / content type\n    - as sent by the server as \"Content-Type\" in the HTTP header,\n      weakly normalized, not verified\"\"\"\n    mimetype_detected = 77\n    \"\"\"MIME type detected based on content, URL and HTTP Content-Type\"\"\"\n    page = 8\n    \"\"\"number of successfully fetched pages (HTTP status 200),\n    including URL-level and content-level duplicates\"\"\"\n    fetch = 9\n    \"\"\"number of fetches, including 404s, redirects, robots.txt, etc.\n    - since CC-MAIN-2016-50\"\"\"\n    http_status = 10\n    \"\"\"number of HTTP status codes (200, 404, etc.)\n    - since CC-MAIN-2016-50\"\"\"\n    charset = 11\n    \"\"\"detected charset\n    - since CC-MAIN-2018-34\"\"\"\n    languages = 12\n    \"\"\"detected languages or combination of languages\n    - since CC-MAIN-2018-34\n    NOTE: since gld2 identifies 160 languages and up to 3 languages,\n    the number of possible combinations is too high (4 millions) and\n    only the more common ones are preserved\"\"\"\n    primary_language = 13\n    \"\"\"primary language of the document (first of the detected languages)\n    - since CC-MAIN-2018-34\"\"\"\n    crawl_status = 55\n    \"\"\"crawl status (successful fetches, 404s, exceptions, etc.)\n    - following Nutch CrawlDatum status codes\n    - similar to HTTP status but less fine-grained\n    - includes crawler-specific statuses (e.g., \"denied by robots.txt\")\"\"\"\n    robotstxt_status = 56\n    \"\"\"HTTP status of robots.txt responses\"\"\"\n    size = 90\n    \"\"\"size of a crawl (number of unique items):\n    - pages,\n    - URLs (one URL may be fetched multiple times),\n    - content digests,\n    - domains, hosts, top-level domains\n    - mime types\n    - etc.\n    format:\n      <<size, item_type, crawl>, number_of_unique_items>\"\"\"\n    size_estimate = 91\n    \"\"\"estimates for unique URLs and content digests\n    - estimates by HyperLogLog probabilistic counters\"\"\"\n    size_estimate_for = 92\n    \"\"\"estimates per large-sized item\n    (domains, hosts, TLDs, SURT domains)\n    - aimed to estimate domain coverage over time / multiple crawls\n    - CC-MAIN-2016-44 adds HyperLogLogs for SURT domain (>=50,000 URLs)\n    format:\n     <<size_estimate_for, per_item_type, per_item, item_type, crawl>, hll>\"\"\"\n    size_robotstxt = 93\n    \"\"\"number of robots.txt fetches\"\"\"\n    new_items = 95\n    \"\"\"new items (URLs, content digests) for a given crawl\n    - first seen in this crawl, not observed in previous crawls\n    - only with exact counts for all crawls\n    - could be estimated by HyperLogLog set operations otherwise\"\"\"\n    histogram = 96\n    \"\"\"frequency of item counts per page or URL\n    format:\n      <<type, item_type, crawl, counted_per, count>, frequency>\"\"\"\n\n\nclass MultiCount(defaultdict):\n    \"\"\"Dictionary with multiple counters for the same key\"\"\"\n\n    def __init__(self, size):\n        self.default_factory = lambda: [0]*size\n       
 self.size = size\n\n    def incr(self, key, *counts):\n        for i in range(0, self.size):\n            self[key][i] += counts[i]\n\n    @staticmethod\n    def compress(size, counts):\n        compress_from = size-1\n        last_val = counts[compress_from]\n        while compress_from > 0 and last_val == counts[compress_from-1]:\n            compress_from -= 1\n        if compress_from == 0:\n            return counts[0]\n        else:\n            return counts[0:compress_from+1]\n\n    def get_compressed(self, key):\n        return MultiCount.compress(self.size, self.get(key))\n\n    @staticmethod\n    def get_count(index, value):\n        if isinstance(value, int):\n            return value\n        if len(value) <= index:\n            return value[-1]\n        return value[index]\n\n    @staticmethod\n    def sum_values(values, compress=True):\n        counts = [0]\n        size = 1\n        for val in values:\n            if isinstance(val, int):\n                # compressed count, one unique count\n                for i in range(0, size):\n                    counts[i] += val\n            else:\n                if len(val) >= size:\n                    # enlarge counts array\n                    base_count = counts[-1]\n                    for j in range(size, len(val)):\n                        counts.append(base_count)\n                    size = len(val)\n                for i in range(0, len(val)):\n                    counts[i] += val[i]\n                if len(val) < size:\n                    for j in range(i+1, size):\n                        # add compressed counts\n                        counts[j] += val[i]\n        if compress:\n            return MultiCount.compress(size, counts)\n        else:\n            return counts\n\n\nclass CrawlStatsJSONEncoder(json.JSONEncoder):\n\n    def default(self, o):\n        if isinstance(o, MonthlyCrawlSet):\n            return o.get_bits()\n        if isinstance(o, HyperLogLog):\n            return 
CrawlStatsJSONEncoder.json_encode_hyperloglog(o)\n        return json.JSONEncoder.default(self, o)\n\n    @staticmethod\n    def json_encode_hyperloglog(o):\n        return {'__type__': 'HyperLogLog',\n                'card': o.card(),\n                'p': o.p, 'M': o.M, 'm': o.m, 'alpha': o.alpha}\n\n\nclass CrawlStatsJSONDecoder(json.JSONDecoder):\n\n    def __init__(self, *args, **kargs):\n        json.JSONDecoder.__init__(self, object_hook=self.dict_to_object,\n                                  *args, **kargs)\n\n    def dict_to_object(self, dic):\n        if '__type__' not in dic:\n            return dic\n        if dic['__type__'] == 'HyperLogLog':\n            try:\n                return CrawlStatsJSONDecoder.json_decode_hyperloglog(dic)\n            except Exception as e:\n                LOG.error('Cannot decode object of type {0}'.format(\n                    dic['__type__']))\n                raise e\n        return dic\n\n    @staticmethod\n    def json_decode_hyperloglog(dic):\n        hll = HyperLogLog(HYPERLOGLOG_ERROR)\n        hll.p = dic['p']\n        hll.m = dic['m']\n        hll.alpha = dic['alpha']\n        hll.M = dic['M']\n        return hll\n\n\nclass HostDomainCount:\n    \"\"\"Counts requiring URL parsing (host, domain, TLD, scheme).\n    For each item both total pages and unique URLs are counted.\n    \"\"\"\n\n    IPpattern = re.compile(r'^\\d{1,3}.\\d{1,3}.\\d{1,3}.\\d{1,3}$')\n\n    def __init__(self):\n        self.hosts = MultiCount(2)\n        self.schemes = MultiCount(2)\n\n    def add(self, url, count):\n        uri = urlparse(url)\n        host = uri.hostname\n        if host is not None:\n            host = host.lower().strip('.')\n            self.hosts.incr(host, count, 1)\n        self.schemes.incr(uri.scheme, count, 1)\n\n    def output(self, crawl):\n        domains = MultiCount(3)  # pages, URLs, hosts\n        tlds = MultiCount(4)     # pages, URLs, hosts, domains\n        for scheme, counts in self.schemes.items():\n   
         yield (CST.scheme.value, scheme, crawl), counts\n        for host, counts in self.hosts.items():\n            yield (CST.host.value, host, crawl), counts\n            try:\n                parsedhost = tldextract.extract(host)\n                hosttld = parsedhost.suffix\n            except TypeError as e:\n                LOG.error('Failed to parse host {}: {}'.format(host, e))\n                hosttld = None\n            if hosttld is None:\n                hostdomain = '(invalid)'\n            elif hosttld == '':\n                hostdomain = parsedhost.domain\n                if self.IPpattern.match(host):\n                    hosttld = '(ip address)'\n            else:\n                hostdomain = '.'.join([parsedhost.domain, parsedhost.suffix])\n            domains.incr((hostdomain, hosttld),\n                         counts[0], counts[1], 1)\n        for dom, counts in domains.items():\n            tlds.incr(dom[1], counts[0], counts[1], counts[2], 1)\n            yield (CST.domain.value, dom[0], crawl), counts\n        for tld, counts in tlds.items():\n            yield (CST.tld.value, tld, crawl), counts\n\n\nclass SurtDomainCount:\n    \"\"\"Counters for one single SURT prefix/domain.\"\"\"\n\n    robots_txt_warc_pattern = re.compile(r'/robotstxt/')\n\n    def __init__(self, surt_domain):\n        self.surt_domain = surt_domain\n        self.pages = 0\n        self.url = defaultdict(int)\n        self.digest = defaultdict(lambda: [0, 0])\n        self.mime = defaultdict(lambda: [0, 0])\n        self.mime_detected = defaultdict(lambda: [0, 0])\n        self.charset = defaultdict(lambda: [0, 0])\n        self.languages = defaultdict(lambda: [0, 0])\n        self.http_status = defaultdict(int)\n        self.robotstxt_status = defaultdict(lambda: [0, 0])\n        self.robotstxt_url = defaultdict(int)\n\n    def add(self, _path, metadata):\n        status = -1\n        if 'status' in metadata:\n            status = int(metadata['status'])\n        if 
self.robots_txt_warc_pattern.search(metadata['filename']):\n            self.robotstxt_status[status][0] += 1\n            if metadata['url'] not in self.robotstxt_url:\n                self.robotstxt_status[status][1] += 1\n            self.robotstxt_url[metadata['url']] += 1\n            # do not count robots.txt responses as \"ordinary\" pages\n            return\n        self.http_status[status] += 1\n        if status != 200:\n            # skip content-related metrics for non-200 responses\n            return\n        self.pages += 1\n        mime = 'unk'\n        if 'mime' in metadata:\n            mime = metadata['mime']\n        self.mime[mime][0] += 1\n        mime_detected = None\n        if 'mime-detected' in metadata:\n            mime_detected = metadata['mime-detected']\n            self.mime_detected[mime_detected][0] += 1\n        charset = None\n        if 'charset' in metadata:\n            charset = metadata['charset']\n            self.charset[charset][0] += 1\n        languages = None\n        if 'languages' in metadata:\n            languages = metadata['languages']\n            self.languages[languages][0] += 1\n        digest = None\n        if 'digest' in metadata:\n            digest = metadata['digest']\n            self.digest[digest][0] += 1\n        if metadata['url'] not in self.url:\n            if digest:\n                self.digest[digest][1] += 1\n            self.mime[mime][1] += 1\n            if mime_detected:\n                self.mime_detected[mime_detected][1] += 1\n            if languages:\n                self.languages[languages][1] += 1\n            if charset:\n                self.charset[charset][1] += 1\n        self.url[metadata['url']] += 1\n\n    def unique_urls(self):\n        return len(self.url)\n\n    def output(self, crawl, exact_count=True, min_surt_hll_size=50000):\n        counts = (self.pages, self.unique_urls())\n        host_domain_count = HostDomainCount()\n        surt_hll = None\n        if 
self.unique_urls() >= min_surt_hll_size:\n            surt_hll = HyperLogLog(HYPERLOGLOG_ERROR)\n        for url, count in self.url.items():\n            host_domain_count.add(url, count)\n            if exact_count:\n                yield (CST.url.value, self.surt_domain, url), (crawl, count)\n            if surt_hll is not None:\n                surt_hll.add(url)\n        if exact_count:\n            for digest, counts in self.digest.items():\n                yield (CST.digest.value, digest), (crawl, counts)\n        for mime, counts in self.mime.items():\n            yield (CST.mimetype.value, mime, crawl), counts\n        for mime, counts in self.mime_detected.items():\n            yield (CST.mimetype_detected.value, mime, crawl), counts\n        for charset, counts in self.charset.items():\n            yield (CST.charset.value, charset, crawl), counts\n        for languages, counts in self.languages.items():\n            yield (CST.languages.value, languages, crawl), counts\n            # yield primary language\n            prim_l = languages.split(',')[0]\n            yield (CST.primary_language.value, prim_l, crawl), counts\n        for key, val in host_domain_count.output(crawl):\n            yield key, val\n        yield((CST.surt_domain.value, self.surt_domain, crawl),\n              (self.pages, self.unique_urls(), len(host_domain_count.hosts)))\n        if surt_hll is not None:\n            yield((CST.size_estimate_for.value, CST.surt_domain.value,\n                   self.surt_domain, CST.url.value, crawl),\n                  (self.unique_urls(),\n                   CrawlStatsJSONEncoder.json_encode_hyperloglog(surt_hll)))\n        for status, counts in self.http_status.items():\n            yield (CST.http_status.value, status, crawl), counts\n        for url, count in self.robotstxt_url.items():\n            yield (CST.size_robotstxt.value, CST.url.value, crawl), 1\n            yield (CST.size_robotstxt.value, CST.page.value, crawl), count\n        
for status, counts in self.robotstxt_status.items():\n            yield (CST.robotstxt_status.value, status, crawl), counts\n\n\nclass UnhandledTypeError(Exception):\n    def __init__(self, outputType):\n        self.message = 'Unhandled type {}\\n'.format(outputType)\n\n\nclass InputError(Exception):\n    def __init__(self, message):\n        self.message = message\n\n\nclass CCStatsJob(MRJob):\n    '''Job to get crawl statistics from Common Crawl index\n       --job=count\n            run count job (first step) to get counts\n            from Common Crawl index files (cdx-*.gz)\n       --job=stats\n            run statistics job (second step) on output\n            from count job'''\n\n    OUTPUT_PROTOCOL = JSONProtocol\n\n    JOBCONF = {\n        'mapreduce.task.timeout': '9600000',\n        'mapreduce.map.speculative': 'false',\n        'mapreduce.reduce.speculative': 'false',\n        'mapreduce.job.jvm.numtasks': '-1',\n    }\n\n    s3pattern = re.compile(r'^s3://([^/]+)/(.+)')\n    gzpattern = re.compile(r'\\.gz$')\n    crawlpattern = re.compile(r'(CC-MAIN-2\\d{3}-\\d{2})')\n\n    def configure_args(self):\n        \"\"\"Custom command line options for common crawl index statistics\"\"\"\n        super(CCStatsJob, self).configure_args()\n        self.add_passthru_arg(\n            '--job', dest='job_to_run',\n            default='', choices=['count', 'stats', ''],\n            help='''Job(s) to run (\"count\", \"stats\", or empty to run both)''')\n        self.add_passthru_arg(\n            '--exact-counts', dest='exact_counts',\n            action='store_true', default=None,\n            help='''Exact counts for URLs and content digests,\n                    this increases the output size significantly''')\n        self.add_passthru_arg(\n            '--no-exact-counts', dest='exact_counts',\n            action='store_false', default=None,\n            help='''No exact counts for URLs and content digests\n                    to save storage space and 
computation time''')\n        self.add_passthru_arg(\n            '--max-top-hosts-domains', dest='max_hosts',\n            type=int, default=200,\n            help='''Max. number of most frequent hosts or domains shown\n                    in final statistics (cf. --min-urls-top-host-domain)''')\n        self.add_passthru_arg(\n            '--min-urls-top-host-domain', dest='min_domain_frequency',\n            type=int, default=1,\n            help='''Min. number of URLs required per host or domain shown\n                    in final statistics (cf. --max-top-hosts-domains).''')\n        self.add_passthru_arg(\n            '--min-lang-comb-freq', dest='min_lang_comb_freq',\n            type=int, default=1,\n            help='''Min. number of pages required for a combination of detected\n                    languages to be shown in final statistics.''')\n        self.add_passthru_arg(\n            '--crawl', dest='crawl', default=None,\n            help='''ID/name of the crawl analyzed (if not given detected\n                    from input path)''')\n\n    def input_protocol(self):\n        if self.options.job_to_run != 'stats':\n            LOG.debug('Reading text input from cdx files')\n            return RawValueProtocol()\n        LOG.debug('Reading JSON input from count job')\n        return JSONProtocol()\n\n    def hadoop_input_format(self):\n        input_format = self.HADOOP_INPUT_FORMAT\n        if self.options.job_to_run != 'stats':\n            input_format = 'org.apache.hadoop.mapred.TextInputFormat'\n        LOG.info(\"Setting input format for {} job: {}\".format(\n            self.options.job_to_run, input_format))\n        return input_format\n\n    def count_mapper_init(self):\n        \"\"\"Because cdx.gz files cannot be split and\n        mapreduce.input.fileinputformat.split.minsize is set to a value larger\n        than any cdx.gz file, the mapper is guaranteed to process the content\n        of a single cdx file. 
Input lines of a cdx file are sorted by SURT URL\n        which allows to aggregate URL counts for one SURT domain in memory.\n        It may happen that one SURT domain spans over multiple cdx files.\n        In this case (and without --exact-counts) the count of unique URLs\n        and the URL histograms may be slightly off in case the same URL occurs\n        also in a second cdx file. However, this problem is negligible because\n        there are only 300 cdx files.\"\"\"\n        self.counters = Counter()\n        self.cdx_path = os.environ['mapreduce_map_input_file']\n        LOG.info('Reading {0}'.format(self.cdx_path))\n        self.crawl_name = None\n        self.crawl = None\n        if self.options.crawl is not None:\n            self.crawl_name = self.options.crawl\n        else:\n            crawl_name_match = self.crawlpattern.search(self.cdx_path)\n            if crawl_name_match is not None:\n                self.crawl_name = crawl_name_match.group(1)\n            else:\n                raise InputError(\n                    \"Cannot determine ID of monthly crawl from input path {}\"\n                    .format(self.cdx_path))\n        if self.crawl_name is None:\n            raise InputError(\"Name of crawl not given\")\n        self.crawl = MonthlyCrawl.get_by_name(self.crawl_name)\n        self.fetches_total = 0\n        self.pages_total = 0\n        self.urls_total = 0\n        self.urls_hll = HyperLogLog(HYPERLOGLOG_ERROR)\n        self.digest_hll = HyperLogLog(HYPERLOGLOG_ERROR)\n        self.url_histogram = Counter()\n        self.count = None\n        # first and last SURT may continue in previous/next cdx\n        self.min_surt_hll_size = 1\n        self.increment_counter('cdx-stats', 'cdx files processed', 1)\n\n    def count_mapper(self, _, line):\n        self.fetches_total += 1\n        if (self.fetches_total % 1000) == 0:\n            self.increment_counter('cdx-stats', 'cdx lines read', 1000)\n            if (self.fetches_total % 
100000) == 0:\n                LOG.info('Read {0} cdx lines'.format(self.fetches_total))\n            else:\n                LOG.debug('Read {0} cdx lines'.format(self.fetches_total))\n        parts = line.split(' ')\n        [surt_domain, path] = parts[0].split(')', 1)\n        if self.count is None:\n            self.count = SurtDomainCount(surt_domain)\n        if surt_domain != self.count.surt_domain:\n            # output accumulated statistics for one SURT domain\n            for pair in self.count.output(self.crawl,\n                                          self.options.exact_counts,\n                                          self.min_surt_hll_size):\n                yield pair\n            self.urls_total += self.count.unique_urls()\n            for url, cnt in self.count.url.items():\n                self.urls_hll.add(url)\n                self.url_histogram[cnt] += 1\n            for digest in self.count.digest:\n                self.digest_hll.add(digest)\n            self.pages_total += self.count.pages\n            self.count = SurtDomainCount(surt_domain)\n            self.min_surt_hll_size = MIN_SURT_HLL_SIZE\n        json_string = ' '.join(parts[2:])\n        try:\n            metadata = ujson.loads(json_string)\n            self.count.add(path, metadata)\n        except ValueError as e:\n            LOG.error('Failed to parse json: {0} - {1}'.format(\n                e, json_string))\n\n    def count_mapper_final(self):\n        self.increment_counter('cdx-stats',\n                               'cdx lines read', self.fetches_total % 1000)\n        if self.count is None:\n            return\n        for pair in self.count.output(self.crawl, self.options.exact_counts, 1):\n            yield pair\n        self.urls_total += self.count.unique_urls()\n        for url, cnt in self.count.url.items():\n            self.urls_hll.add(url)\n            self.url_histogram[cnt] += 1\n        for digest in self.count.digest:\n            
self.digest_hll.add(digest)\n        self.pages_total += self.count.pages\n        if not self.options.exact_counts:\n            for count, frequency in self.url_histogram.items():\n                yield((CST.histogram.value, CST.url.value, self.crawl,\n                       CST.page.value, count), frequency)\n        yield (CST.size.value, CST.page.value, self.crawl), self.pages_total\n        yield (CST.size.value, CST.fetch.value, self.crawl), self.fetches_total\n        if not self.options.exact_counts:\n            yield (CST.size.value, CST.url.value, self.crawl), self.urls_total\n        yield((CST.size_estimate.value, CST.url.value, self.crawl),\n              CrawlStatsJSONEncoder.json_encode_hyperloglog(self.urls_hll))\n        yield((CST.size_estimate.value, CST.digest.value, self.crawl),\n              CrawlStatsJSONEncoder.json_encode_hyperloglog(self.digest_hll))\n        self.increment_counter('cdx-stats', 'cdx files finished', 1)\n\n    def reducer_init(self):\n        self.counters = Counter()\n        self.mostfrequent = defaultdict(list)\n\n    def count_reducer(self, key, values):\n        outputType = key[0]\n        if outputType in (CST.size.value, CST.size_robotstxt.value):\n            yield key, sum(values)\n        elif outputType == CST.histogram.value:\n            yield key, sum(values)\n        elif outputType in (CST.url.value, CST.digest.value):\n            # only with --exact-counts\n            crawls = MonthlyCrawlSet()\n            new_crawls = set()\n            page_count = MultiCount(2)\n            for val in values:\n                if type(val) is list:\n                    if (outputType == CST.url.value):\n                        (crawl, pages) = val\n                        page_count.incr(crawl, pages, 1)\n                    else:  # digest\n                        (crawl, (pages, urls)) = val\n                        page_count.incr(crawl, pages, urls)\n                    crawls.add(crawl)\n                    
new_crawls.add(crawl)\n                else:\n                    # crawl set bit mask\n                    crawls.update(val)\n            yield key, crawls.get_bits()\n            for new_crawl in new_crawls:\n                if crawls.is_new(new_crawl):\n                    self.counters[(CST.new_items.value,\n                                   outputType, new_crawl)] += 1\n            # url/digest duplicate histograms\n            for crawl, counts in page_count.items():\n                items = (1+counts[0]-counts[1])\n                self.counters[(CST.histogram.value, outputType,\n                               crawl, CST.page.value, items)] += 1\n            # size in terms of unique URLs and unique content digests\n            for crawl, counts in page_count.items():\n                self.counters[(CST.size.value, outputType, crawl)] += 1\n        elif outputType in (CST.mimetype.value,\n                            CST.mimetype_detected.value,\n                            CST.charset.value,\n                            CST.languages.value,\n                            CST.primary_language.value,\n                            CST.scheme.value,\n                            CST.tld.value,\n                            CST.domain.value,\n                            CST.surt_domain.value,\n                            CST.host.value,\n                            CST.http_status.value,\n                            CST.robotstxt_status.value):\n            yield key, MultiCount.sum_values(values)\n        elif outputType == CST.size_estimate.value:\n            hll = HyperLogLog(HYPERLOGLOG_ERROR)\n            for val in values:\n                hll.update(\n                    CrawlStatsJSONDecoder.json_decode_hyperloglog(val))\n            yield(key,\n                  CrawlStatsJSONEncoder.json_encode_hyperloglog(hll))\n        elif outputType == CST.size_estimate_for.value:\n            res = None\n            hll = None\n            cnt = 0\n            for val 
in values:\n                if res:\n                    if hll is None:\n                        cnt = res[0]\n                        hll = CrawlStatsJSONDecoder.json_decode_hyperloglog(res[1])\n                    cnt += val[0]\n                    hll.update(CrawlStatsJSONDecoder.json_decode_hyperloglog(val[1]))\n                else:\n                    res = val\n            if hll is not None and cnt >= MIN_SURT_HLL_SIZE:\n                yield(key, (cnt, CrawlStatsJSONEncoder.json_encode_hyperloglog(hll)))\n            elif res[0] >= MIN_SURT_HLL_SIZE:\n                yield(key, res)\n        else:\n            raise UnhandledTypeError(outputType)\n\n    def stats_mapper_init(self):\n        self.counters = Counter()\n\n    def stats_mapper(self, key, value):\n        if key[0] in (CST.url.value, CST.digest.value,\n                      CST.size_estimate_for.value):\n            return\n        if ((self.options.min_domain_frequency > 1) and\n            (key[0] in (CST.host.value, CST.domain.value,\n                        CST.surt_domain.value))):\n            # quick skip of infrequent host and domains,\n            # significantly limits amount of tuples processed in reducer\n            page_count = MultiCount.get_count(0, value)\n            url_count = MultiCount.get_count(1, value)\n            self.counters[(CST.size.value, key[0], key[2])] += 1\n            self.counters[(CST.histogram.value, key[0],\n                           key[2], CST.page.value, page_count)] += 1\n            self.counters[(CST.histogram.value, key[0],\n                           key[2], CST.url.value, url_count)] += 1\n            if key[0] in (CST.domain.value, CST.surt_domain.value):\n                host_count = MultiCount.get_count(2, value)\n                self.counters[(CST.histogram.value, key[0],\n                               key[2], CST.host.value, host_count)] += 1\n            if url_count < self.options.min_domain_frequency:\n                return\n        
if key[0] == CST.languages.value:\n            # yield only frequent language combinations (if configured)\n            page_count = MultiCount.get_count(0, value)\n            if ((self.options.min_lang_comb_freq > 1) and\n                    (page_count < self.options.min_lang_comb_freq) and\n                    (',' in key[1])):\n                return\n        yield key, value\n\n    def stats_mapper_final(self):\n        for (counter, count) in self.counters.items():\n            yield counter, count\n\n    def stats_reducer(self, key, values):\n        outputType = CST(key[0])\n        item = key[1]\n        crawl = MonthlyCrawl.to_name(key[2])\n        if outputType in (CST.size, CST.new_items,\n                          CST.size_estimate, CST.size_robotstxt):\n            verbose_key = (outputType.name, CST(item).name, crawl)\n            if outputType in (CST.size, CST.size_robotstxt):\n                val = sum(values)\n            elif outputType == CST.new_items:\n                val = MultiCount.sum_values(values)\n            elif outputType == CST.size_estimate:\n                # already \"reduced\" in count job\n                for val in values:\n                    break\n            yield verbose_key, val\n        elif outputType == CST.histogram:\n            yield((outputType.name, CST(item).name, crawl,\n                   CST(key[3]).name, key[4]), sum(values))\n        elif outputType in (CST.mimetype, CST.mimetype_detected, CST.charset,\n                            CST.languages, CST.primary_language, CST.scheme,\n                            CST.surt_domain, CST.tld, CST.domain, CST.host,\n                            CST.http_status, CST.robotstxt_status):\n            item = key[1]\n            for counts in values:\n                page_count = MultiCount.get_count(0, counts)\n                url_count = MultiCount.get_count(1, counts)\n                if outputType in (CST.domain, CST.surt_domain, CST.tld):\n                    
host_count = MultiCount.get_count(2, counts)\n                if (self.options.min_domain_frequency <= 1 or\n                    outputType not in (CST.host, CST.domain,\n                                       CST.surt_domain)):\n                    self.counters[(CST.size.name, outputType.name, crawl)] += 1\n                    self.counters[(CST.histogram.name, outputType.name,\n                                   crawl, CST.page.name, page_count)] += 1\n                    self.counters[(CST.histogram.name, outputType.name,\n                                   crawl, CST.url.name, url_count)] += 1\n                    if outputType in (CST.domain, CST.surt_domain, CST.tld):\n                        self.counters[(CST.histogram.name, outputType.name,\n                                       crawl, CST.host.name, host_count)] += 1\n                if outputType == CST.tld:\n                    domain_count = MultiCount.get_count(3, counts)\n                    self.counters[(CST.histogram.name, outputType.name,\n                                   crawl, CST.domain.name, domain_count)] += 1\n                if outputType in (CST.domain, CST.host, CST.surt_domain):\n                    outKey = (outputType.name, crawl)\n                    outVal = (page_count, url_count, item)\n                    if outputType in (CST.domain, CST.surt_domain):\n                        outVal = (page_count, url_count, host_count, item)\n                    # take most common\n                    if len(self.mostfrequent[outKey]) < self.options.max_hosts:\n                        heapq.heappush(self.mostfrequent[outKey], outVal)\n                    else:\n                        heapq.heappushpop(self.mostfrequent[outKey], outVal)\n                else:\n                    yield((outputType.name, item, crawl), counts)\n        else:\n            raise UnhandledTypeError(outputType)\n\n    def reducer_final(self):\n        for (counter, count) in self.counters.items():\n            
yield counter, count\n        for key, mostfrequent in self.mostfrequent.items():\n            (outputType, crawl) = key\n            if outputType in (CST.domain.name, CST.surt_domain.name):\n                for (pages, urls, hosts, item) in mostfrequent:\n                    yield((outputType, item, crawl),\n                          MultiCount.compress(3, [pages, urls, hosts]))\n            else:\n                for (pages, urls, item) in mostfrequent:\n                    yield((outputType, item, crawl),\n                          MultiCount.compress(2, [pages, urls]))\n\n    def steps(self):\n        reduces = 10\n        cdxminsplitsize = 2**32  # do not split cdx map input files\n        if self.options.exact_counts:\n            # with exact counts need many reducers to aggregate the counts\n            # in reasonable time and to get not too large partitions\n            reduces = 200\n        count_job = \\\n            MRStep(mapper_init=self.count_mapper_init,\n                   mapper=self.count_mapper,\n                   mapper_final=self.count_mapper_final,\n                   reducer_init=self.reducer_init,\n                   reducer=self.count_reducer,\n                   reducer_final=self.reducer_final,\n                   jobconf={'mapreduce.job.reduces': reduces,\n                            'mapreduce.input.fileinputformat.split.minsize':\n                                cdxminsplitsize,\n                            'mapreduce.output.fileoutputformat.compress':\n                                \"true\",\n                            'mapreduce.output.fileoutputformat.compress.codec':\n                                'org.apache.hadoop.io.compress.BZip2Codec'})\n        stats_job = \\\n            MRStep(mapper_init=self.stats_mapper_init,\n                   mapper=self.stats_mapper,\n                   mapper_final=self.stats_mapper_final,\n                   reducer_init=self.reducer_init,\n                   reducer=self.stats_reducer,\n 
                  reducer_final=self.reducer_final,\n                   jobconf={'mapreduce.job.reduces': 1,\n                            'mapreduce.output.fileoutputformat.compress':\n                                \"true\",\n                            'mapreduce.output.fileoutputformat.compress.codec':\n                                'org.apache.hadoop.io.compress.GzipCodec'})\n        if self.options.job_to_run == 'count':\n            return [count_job]\n        if self.options.job_to_run == 'stats':\n            return [stats_job]\n        return [count_job, stats_job]\n\n\nif __name__ == '__main__':\n    CCStatsJob.run()\n"
  },
  {
    "path": "get_stats.sh",
    "content": "#!/bin/bash\n\nset -o pipefail\n\nif aws s3 ls s3://commoncrawl/crawl-analysis/ | sed -E 's@.* @@; s@/$@@' >./stats/crawls.txt; then\n    ON_AWS=true;\n    echo \"Running on AWS (AWS CLI configured for authenticated access)\"\nelse\n    echo \"Downloading from https://data.commoncrawl.org/ using curl\"\n    # list of crawls enumerated in crawlstats.py\n    python3 -c 'from crawlstats import MonthlyCrawl; [print(c) for c in sorted(MonthlyCrawl.by_name.keys())]' >./stats/crawls.txt\n    ON_AWS=false\nfi\n\nwhile read crawl; do\n    echo $crawl\n    if [ -e stats/$crawl.gz ]; then\n        echo \"  ... exists\"\n        continue\n    fi\n    if $ON_AWS; then\n        aws s3 cp s3://commoncrawl/crawl-analysis/$crawl/stats/part-00000.gz ./stats/$crawl.gz\n    else\n        curl --silent https://data.commoncrawl.org/crawl-analysis/$crawl/stats/part-00000.gz >./stats/$crawl.gz\n    fi\ndone <./stats/crawls.txt\n"
  },
  {
    "path": "get_stats_and_plot.sh",
    "content": "#!/bin/bash\nset -e\n\necho \"Starting ...\"\n\n./get_stats.sh\n\n# make sure plot directories exist\nmkdir -p plots/crawler\nmkdir -p plots/crawloverlap\nmkdir -p plots/crawlsize\nmkdir -p plots/throughput\nmkdir -p plots/tld\n\n./plot.sh\n\necho \"Done.\""
  },
  {
    "path": "index.md",
    "content": "Statistics of Common Crawl Monthly Archives\n===========================================\n\nStatistics of [Common Crawl](https://commoncrawl.org/)'s [web archives](https://commoncrawl.org/the-data/get-started/) released on a monthly basis:\n\n* [size of the crawls](plots/crawlsize) - number of pages, unique URLs, hosts, domains, top-level domains (public suffixes), cumulative growth of crawled data over time\n* [top-level domains](plots/tlds) - distribution and comparison\n* [top-500 registered domains](plots/domains.md)\n* [crawler-related metrics](plots/crawlermetrics) - fetch status, etc.\n* [overlaps between monthly crawls](plots/crawloverlap)\n* distribution of\n    - [media types (MIME)](plots/mimetypes)\n    - [character encodings](plots/charsets.md)\n    - [languages](plots/languages.md)\n\nAll metrics presented here are generated from [Common Crawl's URL index](https://index.commoncrawl.org/) data using the code of the [cc-crawl-statistics project](https://github.com/commoncrawl/cc-crawl-statistics). Inspired by Sebastian Spiegler's [Statistics of the Common Crawl Corpus 2012](https://commoncrawl.org/2013/08/a-look-inside-common-crawls-210tb-2012-web-corpus/).\n\nSee also our [Web Graph statistics](https://commoncrawl.github.io/cc-webgraph-statistics/).\n\n"
  },
  {
    "path": "plot/charset.py",
    "content": "import sys\n\nfrom plot.table import TabularStats\nfrom crawlstats import CST, MonthlyCrawl\n\n\nclass CharsetStats(TabularStats):\n\n    MIN_AVERAGE_COUNT = 500\n    MAX_CHARSETS = 100\n\n    def __init__(self):\n        super().__init__()\n        self.MAX_TYPE_VALUES = CharsetStats.MAX_CHARSETS\n\n    def add(self, key, val):\n        self.add_check_type(key, val, CST.charset)\n\n\nif __name__ == '__main__':\n    plot_crawls = sys.argv[1:]\n    plot_name = 'charsets'\n    column_header = 'charset'\n    if len(plot_crawls) == 0:\n        plot_crawls = MonthlyCrawl.get_latest(3)\n        print(plot_crawls)\n    else:\n        plot_name += '-' + '-'.join(plot_crawls)\n    plot = CharsetStats()\n    plot.read_from_stdin_or_file()\n    plot.transform_data(CharsetStats.MAX_CHARSETS,\n                        CharsetStats.MIN_AVERAGE_COUNT,\n                        None)\n    plot.save_data_percentage(plot_name, dir_name='plots', type_name='charset')\n    plot.plot(plot_crawls, plot_name, column_header)\n"
  },
  {
    "path": "plot/crawl_size.py",
    "content": "\"\"\"\nPlot crawl size metrics over time.\n\nThis module generates visualizations of crawl size statistics including:\n- Monthly crawl sizes (pages, URLs, content digests)\n- Cumulative sizes over time\n- New URLs per crawl\n- URL status by year (new, revisit, duplicate)\n- Domain/host/TLD counts\n\nThe plots show the growth and evolution of the Common Crawl archive.\n\"\"\"\n\nimport os\nimport re\nimport types\nfrom collections import defaultdict\n\nimport pandas\nfrom hyperloglog import HyperLogLog\n\nfrom crawlplot import CrawlPlot\nfrom crawlstats import CST, CrawlStatsJSONDecoder, HYPERLOGLOG_ERROR, MonthlyCrawl\n\n\nclass CrawlSizePlot(CrawlPlot):\n    \"\"\"Generate plots showing crawl size metrics over time.\n\n    Tracks various size metrics including page counts, unique URLs,\n    unique content digests, and cumulative statistics across crawls.\n    Uses HyperLogLog for efficient cardinality estimation.\n    \"\"\"\n\n    def __init__(self):\n        super().__init__()\n\n        self.size = defaultdict(dict)\n        self.size_by_type = defaultdict(dict)\n        self.type_index = defaultdict(dict)\n        self.crawls = {}\n        self.ncrawls = 0\n        self.hll = defaultdict(dict)\n        self.N = 0\n        self.sum_counts = False\n\n    def add(self, key, val):\n        \"\"\"Process a size or size_estimate record from statistics data.\"\"\"\n        cst = CST[key[0]]\n        if cst not in (CST.size, CST.size_estimate):\n            return\n        item_type = key[1]\n        crawl = key[2]\n        count = 0\n        if cst == CST.size_estimate:\n            item_type = ' '.join([item_type, 'estim.'])\n            hll = CrawlStatsJSONDecoder.json_decode_hyperloglog(val)\n            count = len(hll)\n            self.hll[item_type][crawl] = hll\n        elif cst == CST.size:\n            count = val\n        self.add_by_type(crawl, item_type, count)\n\n    def add_by_type(self, crawl, item_type, count):\n        \"\"\"Add a 
count for a specific crawl and item type combination.\"\"\"\n        if crawl not in self.crawls:\n            self.crawls[crawl] = self.ncrawls\n            self.size['crawl'][self.ncrawls] = crawl\n            date = pandas.Timestamp(MonthlyCrawl.date_of(crawl))\n            self.size['date'][self.ncrawls] = date\n            self.ncrawls += 1\n        else:\n            date = self.size['date'][self.crawls[crawl]]\n        if item_type in self.size and \\\n                self.crawls[crawl] in self.size[item_type]:\n            # add count to existing record?\n            if self.sum_counts:\n                count += self.size[item_type][self.crawls[crawl]]\n                self.size[item_type][self.crawls[crawl]] = count\n                _N = self.type_index[item_type][self.crawls[crawl]]\n                self.size_by_type['size'][_N] = count\n            return\n        self.size[item_type][self.crawls[crawl]] = count\n        self.size_by_type['crawl'][self.N] = crawl\n        self.size_by_type['date'][self.N] = date\n        self.size_by_type['type'][self.N] = item_type\n        self.size_by_type['size'][self.N] = count\n        self.type_index[item_type][self.crawls[crawl]] = self.N\n        self.N += 1\n\n    def cumulative_size(self):\n        \"\"\"Calculate cumulative sizes across crawls using HyperLogLog unions.\"\"\"\n        latest_n_crawls_cumul = [2, 3, 4, 6, 9, 12]\n        total_pages = 0\n        sorted_crawls = sorted(self.crawls)\n        for crawl in sorted_crawls:\n            total_pages += self.size['page'][self.crawls[crawl]]\n            self.add_by_type(crawl, 'page cumul.', total_pages)\n        urls_cumul = defaultdict(dict)\n        for item_type in self.hll.keys():\n            item_type_cumul = ' '.join([item_type, 'cumul.'])\n            item_type_new = ' '.join([item_type, 'new'])\n            cumul_hll = HyperLogLog(HYPERLOGLOG_ERROR)\n            n = 0\n            hlls = []\n            for crawl in 
sorted(self.hll[item_type]):\n                n += 1\n                hll = self.hll[item_type][crawl]\n                last_cumul_hll_len = len(cumul_hll)\n                cumul_hll.update(hll)\n                # cumulative size\n                self.add_by_type(crawl, item_type_cumul, len(cumul_hll))\n                # new unseen items this crawl (since the first analyzed crawl)\n                unseen = (len(cumul_hll) - last_cumul_hll_len)\n                if unseen > len(hll):\n                    # 1% error rate for cumulative HLLs is large in comparison\n                    # to crawl size, adjust to size of items in this crawl\n                    # (there can be no more new items than the size of the crawl)\n                    unseen = len(hll)\n                self.add_by_type(crawl, item_type_new, unseen)\n                hlls.append(hll)\n                # cumulative size for last N crawls\n                for n_crawls in latest_n_crawls_cumul:\n                    item_type_n_crawls = '{} cumul. last {} crawls'.format(\n                        item_type, n_crawls)\n                    if n_crawls <= len(hlls):\n                        cum_hll = HyperLogLog(HYPERLOGLOG_ERROR)\n                        for i in range(1, (n_crawls+1)):\n                            if i > len(hlls):\n                                break\n                            cum_hll.update(hlls[-i])\n                        size_last_n = len(cum_hll)\n                        if item_type == 'url estim.':\n                            urls_cumul[crawl][str(n_crawls)] = size_last_n\n                    else:\n                        size_last_n = 'nan'\n                    self.add_by_type(crawl, item_type_n_crawls, size_last_n)\n        for n, crawl in enumerate(sorted_crawls):\n            for n_crawls in latest_n_crawls_cumul:\n                if n_crawls > (n+1):\n                    self.add_by_type(crawl,\n                                     'page cumul. 
last {} crawls'.format(n_crawls),\n                                     'nan')\n                    continue\n                cumul_pages = 0\n                for c in sorted_crawls[(1+n-n_crawls):(n+1)]:\n                    cumul_pages += self.size['page'][self.crawls[c]]\n                self.add_by_type(crawl,\n                                 'page cumul. last {} crawls'.format(n_crawls),\n                                 cumul_pages)\n                urls_cumul[crawl][str(n_crawls)] = urls_cumul[crawl][str(n_crawls)]/cumul_pages\n        for crawl in urls_cumul:\n            for n_crawls in urls_cumul[crawl]:\n                self.add_by_type(crawl,\n                                 'URLs/pages last {} crawls'.format(n_crawls),\n                                 urls_cumul[crawl][n_crawls])\n\n    def transform_data(self):\n        \"\"\"Convert internal dictionaries to pandas DataFrames.\"\"\"\n        self.size = pandas.DataFrame(self.size)\n        self.size_by_type = pandas.DataFrame(self.size_by_type)\n\n    def save_data(self):\n        \"\"\"Save size data to CSV files.\"\"\"\n        self.size.to_csv('data/crawlsize.csv')\n        self.size_by_type.to_csv('data/crawlsizebytype.csv')\n\n    def duplicate_ratio(self):\n        \"\"\"Calculate and save URL and content duplicate ratios per crawl.\"\"\"\n        data = self.size[['crawl', 'page', 'url', 'digest estim.']]\n        data['1-(urls/pages)'] = 100 * (1.0 - (data['url'] / data['page']))\n        data['1-(digests/pages)'] = \\\n            100 * (1.0 - (data['digest estim.'] / data['page']))\n        floatf = '{0:.1f}%'.format\n        print(data.to_string(formatters={'1-(urls/pages)': floatf,\n                                         '1-(digests/pages)': floatf}),\n              file=open('data/crawlduplicates.txt', 'w'))\n\n    def plot(self):\n        \"\"\"Generate all crawl size plots.\"\"\"\n        # Size per crawl (pages, URL and content digest)\n        row_types = ['page', 'url', 'digest 
estim.']\n        self.size_plot(self.size_by_type, row_types, '',\n                       'Crawl Size', 'Pages / Unique Items',\n                       'crawlsize/monthly.png',\n                       data_export_csv='crawlsize/monthly.csv')\n        # -- cumulative size\n        row_types = ['page cumul.', 'url estim. cumul.',\n                     'digest estim. cumul.']\n        self.size_plot(self.size_by_type, row_types, r' cumul\\.$',\n                       'Crawl Size Cumulative',\n                       'Pages / Unique Items Cumulative',\n                       'crawlsize/cumulative.png',\n                       data_export_csv='crawlsize/cumulative.csv')\n        # -- new URLs per crawl\n        row_types = ['url estim. new']\n        self.size_plot(self.size_by_type, row_types, '',\n                       'New URLs per Crawl (not observed in prior crawls)',\n                       'New URLs', 'crawlsize/monthly_new.png',\n                       data_export_csv='crawlsize/monthly_new.csv')\n        # -- cumulative URLs over last N crawls (this and preceding N-1 crawls)\n        row_types = ['url', '1 crawl',  # 'url' replaced by '1 crawl'\n                     'url estim. cumul. last 2 crawls',\n                     'url estim. cumul. last 3 crawls',\n                     'url estim. cumul. last 4 crawls',\n                     'url estim. cumul. last 6 crawls',\n                     'url estim. cumul. last 9 crawls',\n                     'url estim. cumul. last 12 crawls']\n        data = self.size_by_type\n        data = data[data['type'].isin(row_types)]\n        data.replace(to_replace='url', value='1 crawl', inplace=True)\n        self.size_plot(data, row_types, r'^url estim\\. cumul\\. 
last | crawls?$',\n                       'URLs Cumulative Over Last N Crawls',\n                       'Unique URLs cumulative',\n                       'crawlsize/url_last_n_crawls.png',\n                       clabel='n crawls',\n                       data_export_csv='crawlsize/url_last_n_crawls.csv')\n        # -- ratio unique URLs by total page captures over last N crawls (this and preceding N-1 crawls)\n        row_types = ['URLs/pages last 2 crawls',\n                     'URLs/pages last 3 crawls',\n                     'URLs/pages last 4 crawls',\n                     'URLs/pages last 6 crawls',\n                     'URLs/pages last 9 crawls',\n                     'URLs/pages last 12 crawls']\n        data = self.size_by_type\n        data = data[data['type'].isin(row_types)]\n        data.replace(to_replace='url', value='1 crawl', inplace=True)\n        self.size_plot(data, row_types, r'^URLs/pages last | crawls?$',\n                       'Ratio Unique URLs / Total Pages Captured Over Last N Crawls',\n                       'URLs/Pages',\n                       'crawlsize/url_page_ratio_last_n_crawls.png',\n                       clabel='n crawls',\n                       data_export_csv='crawlsize/url_page_ratio_last_n_crawls.csv')\n        # -- cumul. digests over last N crawls (this and preceding N-1 crawls)\n        row_types = ['digest estim.', '1 crawl',  # 'url' replaced by '1 crawl'\n                     'digest estim. cumul. last 2 crawls',\n                     'digest estim. cumul. last 3 crawls',\n                     'digest estim. cumul. last 6 crawls',\n                     'digest estim. cumul. last 12 crawls']\n        data = self.size_by_type\n        data = data[data['type'].isin(row_types)]\n        data.replace(to_replace='digest estim.', value='1 crawl', inplace=True)\n        self.size_plot(data, row_types,\n                       r'^digest estim\\. cumul\\. 
last | crawls?$',\n                       'Content Digest Cumulative Over Last N Crawls',\n                       'Unique content digests cumulative',\n                       'crawlsize/digest_last_n_crawls.png',\n                       clabel='n crawls')\n        # -- URLs, hosts, domains, tlds (normalized)\n        data = self.size_by_type\n        row_types = ['url', 'tld', 'domain', 'host']\n        data = data[data['type'].isin(row_types)]\n        self.export_csv(data, 'crawlsize/domain.csv')\n        # --- domains only (not yet normalized)\n        self.size_plot(data[data['type'].isin(['domain'])], '', '',\n                       'Unique Domains per Crawl',\n                       '', 'crawlsize/registered-domains.png')\n        # normalize scale (exponent) of counts so that they fit on one plot\n        size_norm = data['size'] / 1000.0\n        data['size'] = size_norm.where(data['type'] == 'tld',\n                                       other=data['size'])\n        data.replace(to_replace='tld', value='tld e+04', inplace=True)\n        size_norm = size_norm / 10000.0\n        data['size'] = size_norm.where(data['type'] == 'host',\n                                       other=data['size'])\n        data.replace(to_replace='host', value='host e+07', inplace=True)\n        data['size'] = size_norm.where(data['type'] == 'domain',\n                                       other=data['size'])\n        data.replace(to_replace='domain', value='domain e+07', inplace=True)\n        size_norm = size_norm / 100.0\n        data['size'] = size_norm.where(data.type == 'url',\n                                       other=data['size'])\n        data.replace(to_replace='url', value='url e+09', inplace=True)\n        self.size_plot(data, '', '',\n                       'URLs / Hosts / Domains / TLDs per Crawl',\n                       'Unique Items', 'crawlsize/domain.png')\n        # -- URL status by year:\n        # --   duplicates (pages - URLs), known URLs (URLs - new), 
new URLs\n        data = self.size[['crawl', 'page', 'url', 'url estim. new']]\n        data['year'] = data['crawl'].apply(lambda c: int(MonthlyCrawl.year_of(c)))\n        by_year = data[['year', 'page', 'url', 'url estim. new']] \\\n            .groupby('year').agg(sum).reset_index()\n        by_year['revisit'] = by_year['url'] - by_year['url estim. new']\n        by_year['duplicate'] = by_year['page'] - by_year['url']\n        by_year['new'] = by_year['url estim. new']\n        print('URL status by year:')\n        print(by_year)\n        by_year_by_type = by_year[['year', 'new', 'revisit', 'duplicate', 'page']].melt(\n            id_vars=['year', 'page'],\n            value_vars=['new', 'revisit', 'duplicate'],\n            var_name='url_status', value_name='page_captures')\n        by_year_by_type['ratio'] = by_year_by_type['page_captures'] / by_year_by_type['page']\n        by_year_by_type['perc'] = by_year_by_type['ratio'].apply(lambda x: round((100.0*x), 1)).astype(str) + '%'\n        by_year_by_type['year'] = pandas.Categorical(by_year_by_type['year'], ordered=True)\n        by_year_by_type['url_status'] = pandas.Categorical(by_year_by_type['url_status'],\n                                                           ordered=True,\n                                                           categories=['duplicate',\n                                                                       'revisit', 'new'])\n        by_year_by_type['page_captures'] = by_year_by_type['page_captures'].astype(float)\n\n        # url_status_by_year\n        img_path = os.path.join(self.PLOTDIR, 'crawlsize', 'url_status_by_year.png')\n\n        if self.PLOTLIB == \"rpy2.ggplot2\":\n            return self.plot_with_rpy2_ggplot2(by_year_by_type, img_path)\n        elif self.PLOTLIB == \"matplotlib\":\n            return self.plot_with_matplotlib(by_year_by_type, img_path)\n        else:\n            raise ValueError(\"Invalid PLOTLIB\")\n        \n    def plot_with_rpy2_ggplot2(self, 
by_year_by_type, img_path):\n        \"\"\"Generate URL status by year stacked bar chart using rpy2/ggplot2.\"\"\"\n        from rpy2.robjects.lib import ggplot2\n        from rpy2 import robjects\n        from rpy2.robjects import pandas2ri\n        pandas2ri.activate()\n\n        p = ggplot2.ggplot(by_year_by_type) \\\n            + ggplot2.aes_string(x='year', y='page_captures', fill='url_status', label='perc') \\\n            + ggplot2.geom_bar(stat='identity', position='stack') \\\n            + ggplot2.geom_text(\n                data=by_year_by_type[\n                    by_year_by_type['url_status'].isin(['new'])\n                    & ~by_year_by_type['year'].isin(by_year_by_type['year'].tolist()[0:3])],\n                color='black', size=2,\n                position=ggplot2.position_dodge(width=.5)) \\\n            + self.GGPLOT2_THEME \\\n            + ggplot2.scale_fill_manual(values=robjects.r('c(\"duplicate\"=\"#00BA38\", \"revisit\"=\"#619CFF\", \"new\"=\"#F8766D\")')) \\\n            + ggplot2.theme(**{'legend.position': 'right',\n                            'aspect.ratio': .7,\n                            **self.GGPLOT2_THEME_KWARGS},\n                            **{'axis.text.x':\n                            ggplot2.element_text(angle=45, size=10,\n                                                    vjust=1, hjust=1)}) \\\n            + ggplot2.labs(title='Number of Page Captures', x='', y='', fill='URL status')\n        p.save(img_path)\n\n        return p\n\n\n    def plot_with_matplotlib(self, by_year_by_type, img_path):\n        \"\"\"Generate URL status by year stacked bar chart using matplotlib.\"\"\"\n        import numpy as np\n\n        aspect_ratio = 0.7\n        bar_label_fontsize = 5\n        title = 'Number of Page Captures'\n\n        fig, ax = self.create_figure()\n\n        # Prepare data for stacked bar chart\n        years = by_year_by_type['year'].unique()\n        url_statuses = ['new', 'revisit', 'duplicate']\n        colors 
= {'duplicate': '#00BA38', 'revisit': '#619CFF', 'new': '#F8766D'}\n\n        # Create stacked bars\n        bottoms = np.zeros(len(years))\n        bars = {}\n\n        for status in url_statuses:\n            status_data = by_year_by_type[by_year_by_type['url_status'] == status]\n            values = []\n            labels = []\n\n            for year in years:\n                year_data = status_data[status_data['year'] == year]\n                if len(year_data) > 0:\n                    values.append(year_data['page_captures'].iloc[0])\n                    labels.append(year_data['perc'].iloc[0])\n                else:\n                    values.append(0)\n                    labels.append('')\n\n            bars[status] = ax.bar(range(len(years)), values, bottom=bottoms,\n                                  color=colors[status], label=status, width=self.bar_width)\n\n            # Add text labels only for 'new' status, excluding first 3 years\n            if status == 'new':\n                for i, (bar, label) in enumerate(zip(bars[status], labels)):\n                    if i >= 3 and label:\n                        height = bar.get_height()\n                        ax.text(bar.get_x() + bar.get_width() / 2.,\n                                bottoms[i] + height, label,\n                                ha='center', va='top', color='black',\n                                fontsize=bar_label_fontsize)\n\n            bottoms += values\n\n        self.set_title(ax, title)\n        ax.set_xlabel('')\n        ax.set_ylabel('')\n\n        # Format x-axis\n        ax.set_xticks(range(len(years)))\n        ax.set_xticklabels(years, rotation=45, ha='right', va='top',\n                          fontsize=self.ticks_fontsize)\n        ax.set_xlim(-0.5, len(years) - 0.5)\n\n        # Axes ratio\n        ax.set_aspect(1 / ax.get_data_ratio() * aspect_ratio)\n\n        # Apply nice y-axis ticks\n        self.apply_nice_ticks(ax, axis='y')\n\n        # Grid styling\n        
ax.grid(True, which='minor', linewidth=self.grid_minor_linewidth,\n                color=self.grid_minor_color, zorder=0, axis='both')\n        ax.grid(True, which='major', linewidth=self.grid_major_linewidth,\n                color=self.grid_major_color, zorder=0, axis='both')\n        ax.set_axisbelow(True)\n\n        # Apply ggplot2 style\n        self.apply_ggplot2_style(ax, show_grid=False)\n\n        # Set tick colors\n        ax.tick_params(axis='y', which='both', colors='#FFFFFF',\n                       length=self.ticks_length, width=self.grid_major_linewidth,\n                       labelsize=self.ticks_fontsize)\n        ax.tick_params(axis='x', which='both', colors='#E6E6E6',\n                       length=self.ticks_length, width=self.grid_major_linewidth,\n                       labelsize=self.ticks_fontsize)\n        self.set_tick_labels_black(ax)\n\n        # Position legend on right side with reversed order\n        handles, labels = ax.get_legend_handles_labels()\n        legend = ax.legend(handles[::-1], labels[::-1], loc='center left',\n                          bbox_to_anchor=(1.0, 0.5), frameon=False,\n                          fontsize=self.legend_fontsize, title='URL status',\n                          title_fontsize=self.legend_title_fontsize)\n        legend._legend_box.align = 'left'\n\n        return self.save_figure(fig, img_path)\n\n\n    def export_csv(self, data, csv):\n        \"\"\"Export pivot table data to CSV file.\"\"\"\n        if csv is not None:\n            data.reset_index().pivot(index='crawl',\n                                     columns='type', values='size').to_csv(\n                                         os.path.join(self.PLOTDIR, csv))\n\n    def norm_data(self, data, row_filter, type_name_norm):\n        \"\"\"Filter and normalize type names in the data for plotting.\"\"\"\n        if len(row_filter) > 0:\n            data = data[data['type'].isin(row_filter)]\n        if type_name_norm != '':\n            for 
value in row_filter:\n                replacement = value\n                if isinstance(type_name_norm, str):\n                    if re.search(type_name_norm, value):\n                        while re.search(type_name_norm, replacement):\n                            replacement = re.sub(type_name_norm,\n                                                 '', replacement)\n                elif isinstance(type_name_norm, types.FunctionType):\n                    replacement = type_name_norm(value)\n                if replacement != value:\n                    data.replace(to_replace=value, value=replacement,\n                                 inplace=True)\n        return data\n\n    def size_plot(self, data, row_filter, type_name_norm,\n                  title, ylabel, img_file, clabel='', data_export_csv=None,\n                  x='date', y='size', c='type'):\n        \"\"\"Generate a size plot with filtering and normalization.\n\n        Args:\n            data: DataFrame containing the size data\n            row_filter: List of type values to include\n            type_name_norm: Regex pattern or function to normalize type names\n            title: Plot title\n            ylabel: Y-axis label\n            img_file: Output filename\n            clabel: Legend title\n            data_export_csv: Optional CSV export path\n            x, y, c: Column names for x-axis, y-axis, and color grouping\n        \"\"\"\n        data = self.norm_data(data, row_filter, type_name_norm)\n        self.export_csv(data, data_export_csv)\n        return self.line_plot(data, title, ylabel, img_file,\n                              x=x, y=y, c=c, clabel=clabel, ratio=.9)\n\n\nif __name__ == '__main__':\n    plot = CrawlSizePlot()\n    plot.read_from_stdin_or_file()\n    plot.cumulative_size()\n    plot.transform_data()\n    plot.save_data()\n    plot.duplicate_ratio()\n    plot.plot()\n"
  },
  {
    "path": "plot/crawler_metrics.py",
    "content": "\"\"\"\nPlot crawler performance metrics.\n\nThis module generates visualizations of crawler metrics including:\n- Fetch status breakdown (success, redirect, denied, failed, skipped)\n- CrawlDb status counts\n- HTTP vs HTTPS URL distribution\n\nThese metrics help monitor crawler health and performance over time.\n\"\"\"\n\nimport logging\nimport os\nimport re\n\nimport pandas\n\nfrom crawlstats import CST, MultiCount\nfrom crawl_size import CrawlSizePlot\n\n\nLOGGING_LEVEL = logging.INFO\nlogging.basicConfig(level=LOGGING_LEVEL)\n\n\nclass CrawlerMetrics(CrawlSizePlot):\n    \"\"\"Generate plots showing crawler performance metrics.\n\n    Tracks fetch statuses, CrawlDb sizes, and URL protocol distribution\n    across crawls.\n    \"\"\"\n\n    metrics_map = {\n        'fetcher:aggr:redirect': ('fetcher:temp_moved', 'fetcher:moved',\n                                  'fetcher:redirect_count_exceeded',\n                                  'fetcher:redirect_deduplicated',\n                                  # new counter names (NUTCH-3132)\n                                  # unchanged: 'fetcher:temp_moved', 'fetcher:moved',\n                                  'fetcher:redirect_count_exceeded_total',\n                                  'fetcher:redirect_deduplicated_total',\n                                  'fetcher:redirect_not_created_total'),\n        'fetcher:aggr:denied':   ('fetcher:access_denied',\n                                  'fetcher:robots_denied',\n                                  'fetcher:robots_denied_maxcrawldelay',\n                                  'fetcher:robots_defer_visits_dropped',\n                                  'fetcher:filter_denied',\n                                  # new counter names (NUTCH-3132)\n                                  # unchanged: 'fetcher:access_denied',\n                                  'fetcher:robots_denied_total',\n                                  'fetcher:robots_denied_maxcrawldelay_total',\n       
                           'fetcher:robots_defer_visits_dropped_total'),\n        'fetcher:aggr:failed':   ('fetcher:gone', 'fetcher:notfound',\n                                  'fetcher:exception',\n                                  # (no) new counter names (NUTCH-3132)\n                                  ),\n        'fetcher:aggr:skipped':  ('fetcher:hitByThrougputThreshold',\n                                  'fetcher:hitByTimeLimit',\n                                  'fetcher:AboveExceptionThresholdInQueue',\n                                  'fetcher:filtered',\n                                  # new counter names (NUTCH-3132)\n                                  'fetcher:hit_by_throughput_threshold_total',\n                                  'fetcher:hit_by_timelimit_total',\n                                  'fetcher:above_exception_threshold_total',\n                                  'fetcher:hit_by_timeout_total',\n                                  'fetcher:filtered_total')\n    }\n\n    def __init__(self):\n        super().__init__()\n        self.sum_counts = True\n\n    def add(self, key, val):\n        \"\"\"Process crawl status, size, and scheme records.\"\"\"\n        cst = CST[key[0]]\n        item_type = key[1]\n        crawl = key[2]\n        if not (cst == CST.crawl_status or\n                (cst == CST.size and item_type in ('page', 'url'))\n                or cst == CST.scheme):\n            return\n        if cst == CST.scheme:\n            item_type = 'scheme:' + item_type\n            val = MultiCount.get_count(1, val)\n        self.add_by_type(crawl, item_type, val)\n        for metric in self.metrics_map:\n            if item_type in self.metrics_map[metric]:\n                logging.debug('Adding metric %s for <%s, %s> = %s', metric, crawl, item_type, val)\n                self.add_by_type(crawl, metric, val)\n\n    def save_data(self):\n        \"\"\"Save crawler metrics data to CSV files.\"\"\"\n        self.size.sort_values(['crawl'], 
inplace=True)\n        self.size.to_csv('data/crawlmetrics.csv')\n        self.size_by_type.to_csv('data/crawlmetricsbytype.csv')\n\n    def add_percent(self):\n        \"\"\"Calculate percentage values for fetch statuses and schemes.\"\"\"\n        for crawl in self.crawls:\n            if self.crawls[crawl] not in self.size['fetcher:total']:\n                logging.debug('Crawl %s not found in fetch status data', crawl)\n                continue\n            total = self.size['fetcher:total'][self.crawls[crawl]]\n            for item_type in self.type_index:\n                if self.crawls[crawl] not in self.size[item_type]:\n                    continue\n                count = self.size[item_type][self.crawls[crawl]]\n                _N = self.type_index[item_type][self.crawls[crawl]]\n                if (item_type.startswith('fetcher:') and\n                    item_type != 'fetcher:total'):\n                    self.size_by_type['percentage'][_N] = 100.0*count/total\n                elif item_type.startswith('scheme:'):\n                    total = self.size['url'][self.crawls[crawl]]\n                    self.size_by_type['percentage'][_N] = 100.0*count/total\n\n    @staticmethod\n    def row2title(row):\n        \"\"\"Convert metric row name to human-readable title.\"\"\"\n        row = re.sub('(?<=^fetch)er(?::aggr)?|^generator:', '', row)\n        row = re.sub('[:_]', ' ', row)\n        if row == 'page':\n            row = 'pages released'\n        return row\n\n    def plot(self):\n        \"\"\"Generate all crawler metrics plots.\"\"\"\n        row_types = ['generator:fetch_list',\n                     'fetcher:success', 'fetcher:total',\n                     'fetcher:aggr:redirect', 'fetcher:notmodified',\n                     'fetcher:aggr:failed', 'fetcher:aggr:denied',\n                     'fetcher:aggr:skipped', 'page']\n        self.size_plot(self.size_by_type, row_types, CrawlerMetrics.row2title,\n                       'Crawler Metrics', 
'Pages',\n                       'crawler/metrics.png')\n        # -- stacked bar plot\n        row_types = ['fetcher:success', 'fetcher:notmodified',\n                     'fetcher:aggr:redirect', 'fetcher:aggr:failed',\n                     'fetcher:aggr:denied', 'fetcher:aggr:skipped']\n        ratio = 0.1 + self.ncrawls * .05\n        self.plot_fetch_status(self.size_by_type, row_types,\n                               'crawler/fetch_status_percentage.png',\n                               ratio=ratio)\n        # -- status of pages in CrawlDb\n        row_types = ['crawldb:status:db_fetched',\n                     'crawldb:status:db_notmodified',\n                     'crawldb:status:db_redir_perm',\n                     'crawldb:status:db_redir_temp',\n                     'crawldb:status:db_duplicate',\n                     'crawldb:status:db_gone',\n                     'crawldb:status:db_unfetched',\n                     'crawldb:status:db_orphan']\n        self.plot_crawldb_status(self.size_by_type, row_types,\n                                 'crawler/crawldb_status.png',\n                                 ratio=ratio)\n        # successfully fetched http:// vs https:// URLs\n        self.size_plot(self.size_by_type, ['scheme:http', 'scheme:https'], lambda x: x.split(':')[1],\n                       'HTTP vs HTTPS URLs', 'Successfully fetched URLs',\n                       'crawler/url_protocols.png')\n        self.size_plot(self.size_by_type, ['scheme:http', 'scheme:https'], lambda x: x.split(':')[1],\n                       'Percentage of HTTP vs HTTPS URLs', 'Percentage of successfully fetched URLs',\n                       'crawler/url_protocols_percentage.png', y='percentage')\n\n    def plot_fetch_status_with_rpy2_ggplot2(self, data, img_path, ratio):\n        \"\"\"Generate fetch status stacked bar chart using rpy2/ggplot2.\"\"\"\n        from rpy2.robjects.lib import ggplot2\n\n        p = ggplot2.ggplot(data) \\\n            + 
ggplot2.aes_string(x='crawl', y='percentage', fill='type') \\\n            + ggplot2.geom_bar(stat='identity', position='stack', width=.9) \\\n            + ggplot2.coord_flip() \\\n            + ggplot2.scale_fill_brewer(palette='RdYlGn', type='sequential',\n                                        guide=ggplot2.guide_legend(reverse=True)) \\\n            + self.GGPLOT2_THEME \\\n            + ggplot2.theme(**{'legend.position': 'bottom',\n                            'aspect.ratio': ratio,\n                            **self.GGPLOT2_THEME_KWARGS}) \\\n            + ggplot2.labs(title='Percentage of Fetch Status',\n                        x='', y='', fill='')\n\n        p.save(img_path, height = int(7 * ratio), width = 7)\n\n        return p\n\n    def plot_fetch_status_with_matplotlib(self, data, categories, img_path, ratio):\n        \"\"\"Generate fetch status stacked bar chart using matplotlib.\"\"\"\n        import numpy as np\n        from matplotlib.ticker import MaxNLocator\n\n        crawls = data['crawl'].unique()\n        n_crawls = len(crawls)\n\n        # Define colors from dark green (success) to dark red (denied)\n        status_order = ['success', 'skipped', 'redirect', 'notmodified', 'failed', 'denied']\n        status_colors = {\n            'success': '#1A9850', 'skipped': '#91CF60', 'redirect': '#D9EF8B',\n            'notmodified': '#FEE08B', 'failed': '#FC8D59', 'denied': '#D73027'\n        }\n        categories_ordered = [cat for cat in status_order if cat in categories]\n\n        fig, ax = self.create_figure(ratio=ratio)\n\n        # Prepare data for horizontal stacked bar chart\n        bar_positions = np.arange(n_crawls)\n        lefts = np.zeros(n_crawls)\n\n        for category in categories_ordered:\n            category_data = data[data['type'] == category]\n            values = [\n                category_data[category_data['crawl'] == crawl]['percentage'].iloc[0]\n                if len(category_data[category_data['crawl'] == crawl]) 
> 0 else 0\n                for crawl in crawls\n            ]\n            ax.barh(bar_positions, values, left=lefts, height=self.bar_width,\n                    color=status_colors[category], label=category)\n            lefts += values\n\n        self.set_title(ax, 'Percentage of Fetch Status')\n        ax.set_xlabel('')\n        ax.set_ylabel('')\n\n        # Format y-axis (crawl names)\n        ax.set_yticks(bar_positions)\n        ax.set_yticklabels(crawls, fontsize=self.ticks_fontsize)\n        ax.set_ylim(-0.5, n_crawls - 0.5)\n\n        # Format x-axis (percentage)\n        max_value = lefts.max()\n        ax.set_xlim(0, max_value * 1.02)\n        ax.xaxis.set_major_locator(MaxNLocator(nbins=5))\n\n        # Apply ggplot2-like styling\n        self.apply_ggplot2_style(ax, grid_axis='x')\n\n        # Set tick colors\n        ax.tick_params(axis='y', which='both', colors='#E6E6E6', length=20,\n                       width=1.5, labelsize=self.ticks_fontsize)\n        ax.tick_params(axis='x', which='both', colors='#E6E6E6', length=4,\n                       width=1.5, labelsize=self.ticks_fontsize)\n        self.set_tick_labels_black(ax)\n\n        # Position legend at bottom\n        handles, labels = ax.get_legend_handles_labels()\n        ax.legend(handles, labels, loc='upper center', bbox_to_anchor=(0.5, -0.05),\n                  ncol=min(3, len(categories)), frameon=False,\n                  fontsize=self.legend_fontsize, title='')\n\n        return self.save_figure(fig, img_path)\n\n    def plot_fetch_status(self, data, row_filter, img_file, ratio=1.0):\n        \"\"\"Generate fetch status percentage stacked bar chart.\"\"\"\n        if row_filter:\n            data = data[data['type'].isin(row_filter)]\n        data = data[['crawl', 'percentage', 'type']]\n        categories = []\n        for value in row_filter:\n            if re.search('^fetcher:(?:aggr:)?', value):\n                replacement = re.sub('^fetcher:(?:aggr:)?', '', value)\n            
    categories.append(replacement)\n                data.replace(to_replace=value, value=replacement, inplace=True)\n        data['type'] = pandas.Categorical(data['type'], ordered=True,\n                                          categories=categories.reverse())\n        ratio = 0.1 + len(data['crawl'].unique()) * .03\n        img_path = os.path.join(self.PLOTDIR, img_file)\n\n        if self.PLOTLIB == \"rpy2.ggplot2\":\n            return self.plot_fetch_status_with_rpy2_ggplot2(data=data, img_path=img_path, ratio=ratio)\n        elif self.PLOTLIB == \"matplotlib\":\n            return self.plot_fetch_status_with_matplotlib(data=data, categories=categories, img_path=img_path, ratio=ratio)\n        else:\n            raise ValueError(\"Invalid PLOTLIB\")\n\n    def plot_crawldb_status_with_rpy2_ggplot2(self, data, img_path, ratio):\n        \"\"\"Generate CrawlDb status stacked bar chart using rpy2/ggplot2.\"\"\"\n        from rpy2.robjects.lib import ggplot2\n\n        p = ggplot2.ggplot(data) \\\n            + ggplot2.aes_string(x='crawl', y='size', fill='type') \\\n            + ggplot2.geom_bar(stat='identity', position='stack', width=.9) \\\n            + ggplot2.coord_flip() \\\n            + ggplot2.scale_fill_brewer(palette='Pastel1', type='sequential',\n                                        guide=ggplot2.guide_legend(reverse=False)) \\\n            + self.GGPLOT2_THEME \\\n            + ggplot2.theme(**{'legend.position': 'bottom',\n                            'aspect.ratio': ratio,\n                            **self.GGPLOT2_THEME_KWARGS}) \\\n            + ggplot2.labs(title='CrawlDb Size and Status Counts',\n                        x='', y='', fill='')\n\n        p.save(img_path, height = int(7 * ratio), width = 7)\n        return p\n\n    def plot_crawldb_status_with_matplotlib(self, data, img_path, ratio):\n        \"\"\"Generate CrawlDb status stacked bar chart using matplotlib.\"\"\"\n        import numpy as np\n\n        crawls = 
data['crawl'].unique()\n        n_crawls = len(crawls)\n\n        # Pastel1 palette colors\n        pastel1_colors = ['#FDDAEC', '#E5D8BD', '#FFFFCC', '#FED9A6',\n                          '#DECBE4', '#CCEBC5', '#B3CDE3', '#FBB4AE', '#F2F2F2']\n        categories_ordered = ['unfetched', 'redir_temp', 'redir_perm', 'orphan',\n                              'notmodified', 'gone', 'fetched', 'duplicate']\n\n        fig, ax = self.create_figure(ratio=ratio)\n\n        bar_positions = np.arange(n_crawls)\n        lefts = np.zeros(n_crawls)\n\n        for i, category in enumerate(categories_ordered):\n            category_data = data[data['type'] == category]\n            values = [\n                category_data[category_data['crawl'] == crawl]['size'].iloc[0]\n                if len(category_data[category_data['crawl'] == crawl]) > 0 else 0\n                for crawl in crawls\n            ]\n            color = pastel1_colors[i % len(pastel1_colors)]\n            ax.barh(bar_positions, values, left=lefts, height=self.bar_width,\n                    color=color, label=category)\n            lefts += values\n\n        self.set_title(ax, 'CrawlDb Size and Status Counts')\n        ax.set_xlabel('')\n        ax.set_ylabel('')\n\n        # Format y-axis (crawl names)\n        ax.set_yticks(bar_positions)\n        ax.set_yticklabels(crawls, fontsize=self.ticks_fontsize)\n        ax.set_ylim(-0.5, n_crawls - 0.5)\n\n        # Format x-axis (size counts)\n        max_value = lefts.max()\n        ax.set_xlim(0, max_value * 1.02)\n\n        # Axes ratio\n        ax.set_aspect(1 / ax.get_data_ratio() * ratio)\n\n        # Apply nice x-axis ticks\n        self.apply_nice_ticks(ax, axis='x')\n\n        # Apply ggplot2-like styling with x-axis grid\n        ax.grid(True, which='both', linewidth=self.grid_major_linewidth,\n                color=self.grid_major_color, zorder=0, axis='x')\n        ax.set_axisbelow(True)\n        self.apply_ggplot2_style(ax, show_grid=False)\n\n        # 
Set tick colors\n        ax.tick_params(axis='both', which='both', colors=self.ticks_color,\n                       length=self.ticks_length, width=0.8,\n                       labelsize=self.ticks_fontsize)\n        self.set_tick_labels_black(ax)\n\n        # Position legend at bottom with reversed order\n        handles, labels = ax.get_legend_handles_labels()\n        ax.legend(handles[::-1], labels[::-1], loc='upper center',\n                  bbox_to_anchor=(0.5, -0.05), ncol=min(4, len(categories_ordered)),\n                  frameon=False, fontsize=self.legend_fontsize, title='')\n\n        return self.save_figure(fig, img_path)\n\n    def plot_crawldb_status(self, data, row_filter, img_file, ratio=1.0):\n        \"\"\"Generate CrawlDb status stacked bar chart.\"\"\"\n        if row_filter:\n            data = data[data['type'].isin(row_filter)]\n        categories = []\n        for value in row_filter:\n            if re.search('^crawldb:status:db_', value):\n                replacement = re.sub('^crawldb:status:db_', '', value)\n                categories.append(replacement)\n                data.replace(to_replace=value, value=replacement, inplace=True)\n        data['type'] = pandas.Categorical(data['type'], ordered=True,\n                                          categories=categories.reverse())\n        data['size'] = data['size'].astype(float)\n        ratio = 0.1 + len(data['crawl'].unique()) * .03\n        img_path = os.path.join(self.PLOTDIR, img_file)\n\n        if self.PLOTLIB == \"rpy2.ggplot2\":\n            return self.plot_crawldb_status_with_rpy2_ggplot2(\n                data=data, img_path=img_path, ratio=ratio\n            )\n\n        elif self.PLOTLIB == \"matplotlib\":\n            return self.plot_crawldb_status_with_matplotlib(\n                data=data, img_path=img_path, ratio=ratio\n            )\n\n        else:\n            raise ValueError(\"Invalid PLOTLIB\")\n\n\nif __name__ == '__main__':\n    plot = CrawlerMetrics()\n    
plot.read_from_stdin_or_file()\n    plot.add_percent()\n    plot.transform_data()\n    plot.save_data()\n    plot.plot()\n"
  },
  {
    "path": "plot/domain.py",
    "content": "import sys\n\nimport pandas\n\nfrom crawlstats import CST, MonthlyCrawl, MultiCount\nfrom plot.table import TabularStats\n\n\nclass DomainStats(TabularStats):\n\n    # defined via crawlstats command-line option --max-top-hosts-domains\n    MAX_TOP_DOMAINS = 500\n\n    def __init__(self, crawl):\n        super().__init__()\n        self.crawl = crawl\n        self.N = 0\n\n    def add(self, key, val):\n        cst = CST[key[0]]\n        if cst not in (CST.size, CST.domain):\n            return\n        typeval = key[1]\n        crawl = key[2]\n        if crawl != self.crawl:\n            return\n        if cst == CST.size:\n            self.size[typeval] = val\n            return\n        self.type_stats['domain'][self.N] = typeval \n        self.type_stats['pages'][self.N] = MultiCount.get_count(0, val)\n        self.type_stats['urls'][self.N] = MultiCount.get_count(1, val)\n        self.type_stats['hosts'][self.N] = MultiCount.get_count(2, val)\n        # self.type_stats['crawl'][self.N] = crawl\n        self.N += 1\n\n    def transform_data(self):\n        data = pandas.DataFrame(self.type_stats)\n        for cnt in ['pages', 'urls']:\n            total = self.size[cnt[:-1]]\n            data['%' + cnt] = 100.0 * data[cnt] / total\n        data.sort_values(ascending=False, inplace=True, by='pages')\n        print(data)\n        self.type_stats = data\n\n    def save_data(self, name, dir_name='data/'):\n        self.type_stats.to_csv('{}/{}-top-{}.csv'.format(self.PLOTDIR, name, self.MAX_TOP_DOMAINS),\n                               float_format='%.6f', index=None)\n\n    def plot(self, name):\n        data = self.type_stats\n        css_classes = ['tablesorter', 'tablesearcher']\n        data = data.set_index('domain')\n        data.columns.name = 'domain'\n        data.index.name = None\n        print(data.to_html('{}/{}-top-{}.html'.format(\n                            self.PLOTDIR, name, self.MAX_TOP_DOMAINS),\n                           
float_format='%.6f',\n                           classes=css_classes, index='domain'))\n\nif __name__ == '__main__':\n    plot_crawls = sys.argv[1:]\n    if len(plot_crawls) == 0:\n        plot_crawls = MonthlyCrawl.get_latest(1)\n        print(plot_crawls)\n    latest_crawl = plot_crawls[-1]\n    plot_name = 'domains'\n    plot = DomainStats(latest_crawl)\n    plot.read_from_stdin_or_file()\n    plot.transform_data()\n    plot.save_data(plot_name, dir_name=plot.PLOTDIR)\n    plot.plot(plot_name)\n"
  },
  {
    "path": "plot/histogram.py",
    "content": "\"\"\"\nPlot histogram distributions for crawl statistics.\n\nThis module generates histogram visualizations showing distributions of:\n- Pages per URL (URL-level duplicates)\n- URLs per host/domain/TLD\n- Cumulative URL coverage by domain\n\nThese histograms help understand the distribution patterns in crawl data.\n\"\"\"\n\nimport os.path\nimport sys\nfrom collections import defaultdict\n\nimport pandas\n\nfrom crawlplot import CrawlPlot\nfrom crawlstats import CST\n\n\nclass CrawlHistogram(CrawlPlot):\n    \"\"\"Generate histogram plots for crawl statistics.\n\n    Produces histograms showing frequency distributions of various metrics\n    like duplicate rates, coverage per domain, etc.\n    \"\"\"\n\n    PSEUDO_LOG_BINS = [0, 1, 2, 5, 10, 20, 50, 100, 200, 500, 1000, 2000, 5000,\n                       10000, 20000, 50000, 100000, 200000, 500000, 1000000,\n                       2*10**6, 5*10**6, 10**7, 2*10**7, 5*10**7, 10**8,\n                       2*10**8, 5*10**8, 10**9]\n\n    def __init__(self):\n        super().__init__()\n        self.histogr = defaultdict(dict)\n        self.N = 0\n\n    def add(self, key, frequency):\n        \"\"\"Process a histogram record from statistics data.\"\"\"\n        cst = CST[key[0]]\n        if cst != CST.histogram:\n            return\n        item_type = key[1]\n        if item_type == 'surt_domain':\n            return\n        crawl = key[2]\n        type_counted = key[3]\n        count = key[4]\n        self.histogr['crawl'][self.N] = crawl\n        self.histogr['type'][self.N] = item_type\n        self.histogr['type_counted'][self.N] = type_counted\n        self.histogr['count'][self.N] = count\n        self.histogr['frequency'][self.N] = frequency\n        self.N += 1\n\n    def transform_data(self):\n        \"\"\"Convert internal dictionary to pandas DataFrame.\"\"\"\n        self.histogr = pandas.DataFrame(self.histogr)\n\n    def save_data(self):\n        \"\"\"Save histogram data to CSV 
file.\"\"\"\n        self.histogr.to_csv('data/crawlhistogr.csv')\n\n    def plot_dupl_url(self):\n        \"\"\"Plot histogram of pages per URL (URL-level duplicates).\"\"\"\n        from rpy2.robjects.lib import ggplot2\n\n        row_filter = ['url']\n        data = self.histogr\n        data = data[data['type'].isin(row_filter)]\n        title = 'Pages per URL (URL-level duplicates)'\n        p = ggplot2.ggplot(data) \\\n            + ggplot2.aes_string(x='count', y='frequency') \\\n            + ggplot2.geom_jitter() \\\n            + ggplot2.facet_wrap('crawl', ncol=5) \\\n            + ggplot2.labs(title=title, x='(duplicate) pages per URL',\n                           y='log(frequency)') \\\n            + ggplot2.scale_y_log10()\n        # + ggplot2.scale_x_log10()  # could use log-log scale\n        img_path = os.path.join(self.PLOTDIR, 'crawler/histogr_url_dupl.png')\n        p.save(img_path)\n        # data.to_csv(img_path + '.csv')\n        return p\n\n    def plot_host_domain_tld(self):\n        \"\"\"Plot histogram of URLs per host/domain/TLD.\"\"\"\n        from rpy2.robjects.lib import ggplot2\n\n        data = self.histogr\n        data = data[data['type'].isin(['host', 'domain', 'tld'])]\n        data = data[data['type_counted'].isin(['url'])]\n        img_path = os.path.join(self.PLOTDIR,\n                                'crawler/histogr_host_domain_tld.png')\n        # data.to_csv(img_path + '.csv')\n        title = 'URLs per Host / Domain / TLD'\n        p = ggplot2.ggplot(data) \\\n            + ggplot2.aes_string(x='count', weight='frequency', color='type') \\\n            + ggplot2.geom_freqpoly(bins=20) \\\n            + ggplot2.facet_wrap('crawl', ncol=4) \\\n            + ggplot2.labs(title='', x=title,\n                           y='Frequency') \\\n            + ggplot2.scale_y_log10() \\\n            + ggplot2.scale_x_log10()\n        p.save(img_path)\n        return p\n\n    def plot_domain_cumul_with_rpy2_ggplot2(self, data, title, 
img_path):\n        \"\"\"Generate cumulative domain coverage plot using rpy2/ggplot2.\"\"\"\n        from rpy2.robjects.lib import ggplot2\n\n        p = ggplot2.ggplot(data) \\\n            + ggplot2.aes_string(x='cum_domains', y='cum_urls') \\\n            + ggplot2.geom_line() + ggplot2.geom_point() \\\n            + self.GGPLOT2_THEME \\\n            + ggplot2.theme(**self.GGPLOT2_THEME_KWARGS) \\\n            + ggplot2.labs(title=title, x='domains cumulative',\n                            y='URLs cumulative') \\\n            + ggplot2.scale_y_log10() \\\n            + ggplot2.scale_x_log10()\n        p.save(img_path)\n    \n        return p\n    \n    def plot_domain_cumul(self, crawl):\n        \"\"\"Plot cumulative URL coverage by domain for a specific crawl.\"\"\"\n        data = self.histogr\n        data = data[data['type'].isin(['domain'])]\n        data = data[data['crawl'] == crawl]\n        data = data[data['type_counted'].isin(['url'])]\n        data['urls'] = data['count']*data['frequency']\n        print(data)\n        data = data[['urls', 'count', 'frequency']]\n        data = data.sort_values(['count'], ascending=0)\n        data['cum_domains'] = data['frequency'].cumsum()\n        data['cum_urls'] = data['urls'].cumsum()\n        data_perc = data.apply(lambda x: round(100.0*x/float(x.sum()), 1))\n        data['%domains'] = data_perc['frequency']\n        data['%urls'] = data_perc['urls']\n        data['%cum_domains'] = data['cum_domains'].apply(\n            lambda x: round(100.0*x/float(data['frequency'].sum()), 1))\n        data['%cum_urls'] = data['cum_urls'].apply(\n            lambda x: round(100.0*x/float(data['urls'].sum()), 1))\n\n        img_path = os.path.join(self.PLOTDIR,\n                                'crawler/histogr_domain_cumul.png')\n        # data.to_csv(img_path + '.csv')\n        title = 'Cumulative URLs for Top Domains'\n\n        if self.PLOTLIB == \"rpy2.ggplot2\":\n            return 
self.plot_domain_cumul_with_rpy2_ggplot2(data=data, title=title, img_path=img_path)\n        \n        elif self.PLOTLIB == \"matplotlib\":\n            # this plot is currently not used\n            raise NotImplementedError\n        \n        else:\n            raise ValueError(\"Invalid PLOTLIB\")\n\n\n\nif __name__ == '__main__':\n    latest_crawl = sys.argv[-1]\n    plot = CrawlHistogram()\n    plot.read_from_stdin_or_file()\n    plot.transform_data()\n    plot.save_data()\n    plot.plot_dupl_url()\n    plot.plot_host_domain_tld()\n    plot.plot_domain_cumul(latest_crawl)\n"
  },
  {
    "path": "plot/language.py",
    "content": "import string\nimport sys\n\nfrom plot.table import TabularStats\nfrom crawlstats import CST, MonthlyCrawl\n\n\nclass LanguageStats(TabularStats):\n\n    MIN_AVERAGE_COUNT = 1\n    MAX_LANGUAGES = 200\n\n    def __init__(self):\n        super().__init__()\n        self.MAX_TYPE_VALUES = LanguageStats.MAX_LANGUAGES\n\n    def add(self, key, val):\n        self.add_check_type(key, val, CST.primary_language)\n\n\nif __name__ == '__main__':\n    plot_crawls = sys.argv[1:]\n    plot_name = 'languages'\n    column_header = 'language'\n    if len(plot_crawls) == 0:\n        plot_crawls = MonthlyCrawl.get_latest(3)\n        print(plot_crawls)\n    else:\n        plot_name += '-' + '-'.join(plot_crawls)\n    plot = LanguageStats()\n    plot.read_from_stdin_or_file()\n    plot.transform_data(LanguageStats.MAX_LANGUAGES,\n                        LanguageStats.MIN_AVERAGE_COUNT,\n                        None)\n    plot.save_data_percentage(plot_name, dir_name='plots', type_name='primary_language')\n    plot.plot(plot_crawls, plot_name, column_header,\n              ['iso639-3-language'])\n"
  },
  {
    "path": "plot/mimetype.py",
    "content": "import re\nimport sys\n\nfrom plot.table import TabularStats\nfrom crawlstats import CST, MonthlyCrawl\n\n\nclass MimeTypeStats(TabularStats):\n\n    MIN_AVERAGE_COUNT = 500\n    MAX_MIME_TYPES = 100\n\n    # see https://en.wikipedia.org/wiki/Media_type#Naming\n    mime_pattern_str = \\\n        r'(?:x-)?[a-z]+/[a-z0-9]+' \\\n        r'(?:[.-](?:c\\+\\+[a-z]*|[a-z0-9]+))*(?:\\+[a-z0-9]+)?'\n    mime_pattern = re.compile(r'^'+mime_pattern_str+r'$')\n    mime_extract_pattern = re.compile(r'^\\s*(?:content\\s*=\\s*)?[\"\\']?\\s*(' +\n                                      mime_pattern_str +\n                                      r')(?:\\s*[;,].*)?\\s*[\"\\']?\\s*$')\n\n    def __init__(self):\n        super().__init__()\n        self.MAX_TYPE_VALUES = MimeTypeStats.MAX_MIME_TYPES\n\n    def norm_value(self, mimetype):\n        if type(mimetype) is str:\n            mimetype = mimetype.lower()\n            m = MimeTypeStats.mime_extract_pattern.match(mimetype)\n            if m:\n                return m.group(1)\n            return mimetype.strip('\"\\', \\t')\n        return \"\"\n\n    def add(self, key, val):\n        self.add_check_type(key, val, CST.mimetype)\n\n\nif __name__ == '__main__':\n    plot_crawls = sys.argv[1:]\n    plot_name = 'mimetypes'\n    column_header = 'mimetype'\n    if len(plot_crawls) == 0:\n        plot_crawls = MonthlyCrawl.get_latest(3)\n        print(plot_crawls)\n    else:\n        plot_name += '-' + '-'.join(plot_crawls)\n    plot = MimeTypeStats()\n    plot.read_from_stdin_or_file()\n    plot.transform_data(MimeTypeStats.MAX_MIME_TYPES,\n                        MimeTypeStats.MIN_AVERAGE_COUNT,\n                        MimeTypeStats.mime_pattern)\n    plot.save_data_percentage(plot_name, dir_name='plots', type_name='mimetype')\n    plot.plot(plot_crawls, plot_name, column_header, ['tablesearcher'])\n"
  },
  {
    "path": "plot/mimetype_detected.py",
    "content": "import sys\n\nfrom plot.mimetype import MimeTypeStats\nfrom crawlstats import CST, MonthlyCrawl\n\n\nclass MimeTypeDetectedStats(MimeTypeStats):\n\n    def __init__(self):\n        super().__init__()\n        self.MAX_TYPE_VALUES = MimeTypeStats.MAX_MIME_TYPES\n\n    def norm_value(self, mimetype):\n        return mimetype\n\n    def add(self, key, val):\n        self.add_check_type(key, val, CST.mimetype_detected)\n\n\nif __name__ == '__main__':\n    plot_crawls = sys.argv[1:]\n    plot_name = 'mimetypes_detected'\n    column_header = 'mimetype_detected'\n    if len(plot_crawls) == 0:\n        plot_crawls = MonthlyCrawl.get_latest(3)\n        print(plot_crawls)\n    else:\n        plot_name += '-' + '-'.join(plot_crawls)\n    plot = MimeTypeDetectedStats()\n    plot.read_from_stdin_or_file()\n    plot.transform_data(MimeTypeStats.MAX_MIME_TYPES,\n                        MimeTypeStats.MIN_AVERAGE_COUNT,\n                        None)\n    plot.save_data_percentage(plot_name, dir_name='plots', type_name='mimetype_detected')\n    plot.plot(plot_crawls, plot_name, column_header, ['tablesearcher'])\n"
  },
  {
    "path": "plot/overlap.py",
    "content": "\"\"\"\nPlot crawl overlap and similarity metrics.\n\nThis module generates visualizations showing the overlap between different\ncrawls based on URL or content digest similarities. Uses Jaccard similarity\nto measure the intersection over union of items between crawls.\n\"\"\"\n\nimport copy\nimport os.path\nfrom collections import defaultdict\n\nimport pandas\nimport pygraphviz\n\nfrom crawlplot import CrawlPlot\nfrom crawlstats import CST, CrawlStatsJSONDecoder, MonthlyCrawl\n\n\nclass CrawlOverlap(CrawlPlot):\n    \"\"\"Generate overlap and similarity visualizations between crawls.\n\n    Calculates and visualizes the Jaccard similarity between crawls\n    based on unique URLs or content digests using HyperLogLog cardinality\n    estimation.\n    \"\"\"\n\n    MAX_MATRIX_SIZE = 30\n\n    def __init__(self):\n        super().__init__()\n\n        self.crawl_size = defaultdict(dict)\n        self.overlap = defaultdict(dict)\n        self.similarity = defaultdict(dict)  # Jaccard index\n\n    def add(self, key, val):\n        \"\"\"Process a size_estimate record and store HyperLogLog for overlap calculation.\"\"\"\n        cst = CST[key[0]]\n        if cst != CST.size_estimate:\n            return\n        item_type = key[1]\n        crawl = key[2]\n        hll = CrawlStatsJSONDecoder.json_decode_hyperloglog(val)\n        self.crawl_size[item_type][crawl] = hll\n\n    def fill_overlap_matrix(self):\n        \"\"\"Calculate pairwise overlap and Jaccard similarity between all crawls.\"\"\"\n        for item_type in self.crawl_size:\n            for crawl1 in self.crawl_size[item_type]:\n                hll1 = self.crawl_size[item_type][crawl1]\n                size1 = len(hll1)\n                self.overlap[item_type][crawl1] = defaultdict(list)\n                self.similarity[item_type][crawl1] = defaultdict(float)\n                for crawl2 in self.crawl_size[item_type]:\n                    if crawl1 >= crawl2:\n                        
continue\n                    hll2 = self.crawl_size[item_type][crawl2]\n                    size2 = len(hll2)\n                    union_hll = copy.deepcopy(hll1)\n                    union_hll.update(hll2)\n                    union = len(union_hll)\n                    intersection = size1 + size2 - union\n                    jaccard_sim = intersection / union\n                    self.overlap[item_type][crawl1][crawl2] \\\n                        = [intersection, union, size1, size2,\n                           (intersection/size2), jaccard_sim]\n                    self.similarity[item_type][crawl1][crawl2] = jaccard_sim\n\n    def save_overlap_matrix(self):\n        \"\"\"Save overlap and similarity matrices to CSV files.\"\"\"\n        for item_type in self.overlap:\n            data = pandas.DataFrame(self.similarity[item_type])\n            data.to_csv('data/crawlsimilarity_' + item_type + '.csv')\n            data = pandas.DataFrame(self.overlap[item_type])\n            data.to_csv('data/crawloverlap_' + item_type + '.csv')\n\n    def plot_similarity_graph(self, show_edges=False):\n        \"\"\"Visualize similarity as a graph using GraphViz (experimental).\"\"\"\n        g = pygraphviz.AGraph(directed=False, overlap='scale', splines=True)\n        g.node_attr['shape'] = 'plaintext'\n        g.node_attr['fontsize'] = '12'\n        if show_edges:\n            g.edge_attr['color'] = 'lightgrey'\n            g.edge_attr['fontcolor'] = 'grey'\n            g.edge_attr['fontsize'] = '8'\n        else:\n            g.edge_attr['style'] = 'invis'\n        for crawl1 in sorted(self.similarity['url']):\n            for crawl2 in sorted(self.similarity['url'][crawl1]):\n                similarity = self.similarity['url'][crawl1][crawl2]\n                distance = 1.0 - similarity\n                g.add_edge(MonthlyCrawl.short_name(crawl1),\n                           MonthlyCrawl.short_name(crawl2),\n                           len=(distance),\n                      
     label='{0:.2f}'.format(distance))\n        g.write(os.path.join(self.PLOTDIR, 'crawlsimilarity_url.dot'))\n        g.draw(os.path.join(self.PLOTDIR, 'crawlsimilarity_url.svg'), prog='fdp')\n\n    def plot_similarity_matrix_with_rpy2_ggplot2(self, data, midpoint, title, textsize, img_path):\n        \"\"\"Generate similarity heatmap using rpy2/ggplot2.\"\"\"\n        from rpy2.robjects.lib import ggplot2\n\n        p = ggplot2.ggplot(data) \\\n            + ggplot2.aes_string(x='crawl2', y='crawl1',\n                                fill='similarity', label='sim_rounded') \\\n            + ggplot2.geom_tile(color=\"white\") \\\n            + ggplot2.scale_fill_gradient2(low=\"red\", high=\"blue\", mid=\"white\",\n                                        midpoint=midpoint, space=\"Lab\") \\\n            + self.GGPLOT2_THEME \\\n            + ggplot2.coord_fixed() \\\n            + ggplot2.theme(**{'axis.text.x':\n                            ggplot2.element_text(angle=45,\n                                                    vjust=1, hjust=1),\n                            **self.GGPLOT2_THEME_KWARGS}) \\\n            + ggplot2.labs(title=title, x='', y='') \\\n            + ggplot2.geom_text(color='black', size=textsize)\n\n        p.save(img_path)\n        return p\n    \n    def plot_similarity_matrix_with_matplotlib(self, data, decimals, title, cell_textsize, img_path):\n        \"\"\"Generate similarity heatmap using matplotlib.\n\n        Creates a color-coded matrix showing Jaccard similarity between crawls,\n        with color ranging from red (low) through white to blue (high).\n        \"\"\"\n        import matplotlib.pyplot as plt\n        import numpy as np\n        from matplotlib.colors import LinearSegmentedColormap, Normalize\n\n        # Pivot data to create matrix\n        pivot_data = data.pivot(index='crawl1', columns='crawl2', values='similarity')\n        pivot_data_rounded = pivot_data.round(decimals)\n\n        fig, ax = 
self.create_figure()\n\n        # Create color map: red (low) -> white (mid) -> blue (high)\n        vmin = pivot_data_rounded.min().min()\n        vmax = pivot_data_rounded.max().max()\n\n        if vmin < 0:\n            colors = ['#ff0801', '#ff6b48', '#ffa388', '#ffd2c4', '#fff4ef',\n                      '#FFFFFF', '#eadaff', '#c6a5ff', '#a073ff', '#6e43ff',\n                      '#4020ff', '#1306ff']\n        else:\n            colors = ['#fff4ef', '#FFFFFF', '#eadaff', '#c6a5ff', '#a073ff',\n                      '#6e43ff', '#4020ff', '#1306ff']\n\n        cmap = LinearSegmentedColormap.from_list('red_white_blue', colors, N=256)\n        norm = Normalize(vmin=vmin, vmax=vmax)\n\n        # Add grey grid lines behind everything\n        ax.set_axisbelow(True)\n        ax.grid(True, which='major', linewidth=0.8, color='#E6E6E6', zorder=-1)\n\n        # Create heatmap with origin='lower' to match ggplot2 (bottom-up)\n        im = ax.imshow(pivot_data_rounded.values, cmap=cmap, norm=norm,\n                       aspect='equal', origin='lower', zorder=1)\n\n        # Add text annotations\n        for i in range(len(pivot_data.index)):\n            for j in range(len(pivot_data.columns)):\n                similarity = pivot_data.iloc[i, j]\n                if pandas.isna(similarity):\n                    continue\n\n                # Draw white rectangle border around each cell\n                rect = plt.Rectangle((j - 0.5, i - 0.5), 1, 1,\n                                      fill=False, edgecolor='white',\n                                      linewidth=0.5, zorder=1)\n                ax.add_patch(rect)\n\n                # Get the rounded text for this cell\n                matching_rows = data[(data['crawl1'] == pivot_data.index[i]) &\n                                     (data['crawl2'] == pivot_data.columns[j])]\n                if len(matching_rows) > 0:\n                    text_val = matching_rows['sim_rounded'].iloc[0]\n                    ax.text(j, 
i, text_val, ha='center', va='center',\n                            color='black', fontsize=cell_textsize, zorder=2)\n\n        # Set ticks and labels\n        ax.set_xticks(np.arange(len(pivot_data.columns)))\n        ax.set_yticks(np.arange(len(pivot_data.index)))\n        ax.set_xticklabels(pivot_data.columns, fontsize=10)\n        ax.set_yticklabels(pivot_data.index, fontsize=10)\n\n        # Hide tick marks but keep labels black\n        ax.tick_params(axis='both', which='both', colors='#FFFFFF', zorder=0)\n        self.set_tick_labels_black(ax)\n\n        # Rotate x-axis labels\n        plt.setp(ax.get_xticklabels(), rotation=45, ha='right', va='top')\n\n        self.set_title(ax, title)\n        ax.set_xlabel('')\n        ax.set_ylabel('')\n\n        # Add colorbar\n        cbar = plt.colorbar(im, ax=ax, aspect=5, pad=0.04, shrink=0.2)\n        cbar.ax.set_title('similarity', fontsize=10, pad=10, loc=\"left\")\n        cbar.ax.tick_params(labelsize=8)\n        cbar.outline.set_visible(False)\n\n        # Apply ggplot2-like styling\n        self.apply_ggplot2_style(ax, show_grid=False)\n\n        return self.save_figure(fig, img_path)\n\n\n    def plot_similarity_matrix(self, item_type, image_file, title):\n        \"\"\"Plot similarities of crawls as a heatmap matrix.\n\n        Args:\n            item_type: Type of items to compare ('url' or 'digest')\n            image_file: Output filename relative to PLOTDIR\n            title: Plot title\n        \"\"\"\n        data = defaultdict(dict)\n        n = 1\n        for crawl1 in self.similarity[item_type]:\n            for crawl2 in self.similarity[item_type][crawl1]:\n                similarity = self.similarity[item_type][crawl1][crawl2]\n                data['crawl1'][n] = MonthlyCrawl.short_name(crawl1)\n                data['crawl2'][n] = MonthlyCrawl.short_name(crawl2)\n                data['similarity'][n] = similarity\n                data['sim_rounded'][n] = similarity  # to be rounded\n             
   n += 1\n        data = pandas.DataFrame(data)\n        print(data)\n        # select median of similarity values as midpoint of similarity scale\n        midpoint = data['similarity'].median()\n        decimals = 3\n        textsize = 2\n        minshown = .0005\n        cell_textsize = 6\n\n        if (data['similarity'].max()-data['similarity'].min()) > .2:\n            decimals = 2\n            textsize = 2.8\n            minshown = .005\n            cell_textsize = 8\n\n        data['sim_rounded'] = data['sim_rounded'].apply(\n            lambda x: ('{0:.'+str(decimals)+'f}').format(x).lstrip('0')\n            if x >= minshown else '0')\n        print('Median of similarities for', item_type, '=', midpoint)\n        matrix_size = len(self.similarity[item_type])\n        if matrix_size > self.MAX_MATRIX_SIZE:\n            n = 0\n            for crawl1 in sorted(self.similarity[item_type], reverse=True):\n                short_name = MonthlyCrawl.short_name(crawl1)\n                if n > self.MAX_MATRIX_SIZE:\n                    data = data[data['crawl1'] != short_name]\n                    data = data[data['crawl2'] != short_name]\n                n += 1\n\n        img_path = os.path.join(self.PLOTDIR, image_file)\n\n        if self.PLOTLIB == \"rpy2.ggplot2\":\n            return self.plot_similarity_matrix_with_rpy2_ggplot2(data=data, midpoint=midpoint, title=title, textsize=textsize, img_path=img_path)\n        \n        elif self.PLOTLIB == \"matplotlib\":\n            return self.plot_similarity_matrix_with_matplotlib(data=data, decimals=decimals, title=title, cell_textsize=cell_textsize, img_path=img_path)\n        \n        else:\n            raise ValueError(\"Invalid PLOTLIB\")\n\n\nif __name__ == '__main__':\n    plot = CrawlOverlap()\n    plot.read_from_stdin_or_file()\n    plot.fill_overlap_matrix()\n    plot.save_overlap_matrix()\n    # plot.plot_similarity_graph()\n    plot.plot_similarity_matrix(\n        'url', 
'crawloverlap/crawlsimilarity_matrix_url.png',\n        'URL overlap between crawls (Jaccard similarity)')\n    plot.plot_similarity_matrix(\n        'digest', 'crawloverlap/crawlsimilarity_matrix_digest.png',\n        'Content overlap between crawls (Jaccard similarity on digest)')\n"
  },
  {
    "path": "plot/table.py",
    "content": "import heapq\n\nimport numpy\nimport pandas\n\nfrom collections import defaultdict, Counter\n\nfrom crawlplot import CrawlPlot\nfrom crawlstats import CST, MultiCount\n\n\nclass TabularStats(CrawlPlot):\n    \"\"\"Collect counts of type values per crawl and export them as tables.\"\"\"\n\n    def __init__(self):\n        super().__init__()\n\n        self.crawls = set()\n        self.types = defaultdict(dict)\n        self.type_stats = defaultdict(dict)\n        self.types_total = Counter()\n        self.size = defaultdict(dict)\n        self.N = 0\n\n    def norm_value(self, typeval):\n        \"\"\"Normalize a type value (the base implementation returns it unchanged).\"\"\"\n        return typeval\n\n    def add_check_type(self, key, val, requ_type_cst):\n        \"\"\"Add one record if it is of type `requ_type_cst` or a size record.\n\n        `key` holds the CST name, the type value and the crawl (in this order).\n        Size records are stored in `self.size`, all other accepted records\n        are summed up per type value and crawl in `self.types`.\n        \"\"\"\n        cst = CST[key[0]]\n        if cst != requ_type_cst and cst != CST.size:\n            return\n        typeval = key[1]\n        crawl = key[2]\n        self.crawls.add(crawl)\n        typeval = self.norm_value(typeval)\n        if cst == CST.size:\n            self.size[crawl][typeval] = int(val)\n            return\n        if crawl in self.types[typeval]:\n            self.types[typeval][crawl] = \\\n                MultiCount.sum_values([val, self.types[typeval][crawl]])\n        else:\n            self.types[typeval][crawl] = val\n        npages = MultiCount.get_count(0, val)\n        self.types_total[typeval] += npages\n        if 'known_values' not in self.size[crawl]:\n            self.size[crawl]['known_values'] = 0\n        self.size[crawl]['known_values'] += npages\n\n    def transform_data(self, top_n, min_avg_count, check_pattern=None):\n        \"\"\"Reduce the collected type values and convert them into a DataFrame.\n\n        Keeps at most `top_n` type values whose average page count per crawl\n        is at least `min_avg_count` (and which match `check_pattern`, if given).\n        All other type values are summed up as '<other>', pages without\n        a known value are counted as '<unknown>'. Finally, `self.type_stats`\n        is replaced by a pandas DataFrame.\n        \"\"\"\n        print(\"Number of different values after first normalization: {}\"\n              .format(len(self.types)))\n        typevals_for_deletion = set()\n        typevals_mostfrequent = []\n        for typeval in self.types:\n            total_count = self.types_total[typeval]\n            average_count = int(total_count / len(self.crawls))\n            if average_count >= min_avg_count:\n                if not check_pattern or check_pattern.match(typeval):\n                    print('{}\\t{}\\t{}'.format(typeval,\n                                              average_count, total_count))\n                    fval = (total_count, typeval)\n                    if len(typevals_mostfrequent) < top_n:\n                        heapq.heappush(typevals_mostfrequent, fval)\n                    else:\n                        heapq.heappushpop(typevals_mostfrequent, fval)\n                    continue  # ok, keep this type value\n                else:\n                    print('Type value frequent but invalid: <{}> (avg. count = {})'\n                          .format(typeval, average_count))\n            elif average_count >= (min_avg_count/10):\n                if not check_pattern or check_pattern.match(typeval):\n                    print('Skipped type value because of low frequency: <{}> (avg. count = {}, min. = {})'\n                          .format(typeval, average_count, (min_avg_count/10)))\n            typevals_for_deletion.add(typeval)\n        # map low frequency or invalid type values to empty type\n        keep_typevals = set()\n        for (_, typeval) in typevals_mostfrequent:\n            keep_typevals.add(typeval)\n        for typeval in self.types:\n            if (typeval not in keep_typevals and\n                    typeval not in typevals_for_deletion):\n                print('Skipped type value because not in top {}: <{}> (avg. count = {})'\n                      .format(top_n, typeval,\n                              int(self.types_total[typeval]/len(self.crawls))))\n                typevals_for_deletion.add(typeval)\n        typevals_other = dict()\n        for typeval in typevals_for_deletion:\n            for crawl in self.types[typeval]:\n                if crawl in typevals_other:\n                    val = typevals_other[crawl]\n                else:\n                    val = 0\n                typevals_other[crawl] = \\\n                    MultiCount.sum_values([val, self.types[typeval][crawl]])\n            self.types.pop(typeval, None)\n        self.types['<other>'] = typevals_other\n        print('Number of different type values after cleaning and'\n              ' removal of low frequency types: {}'\n              .format(len(self.types)))\n        # unknown values\n        for crawl in self.crawls:\n            known_values = 0\n            if 'known_values' in self.size[crawl]:\n                known_values = self.size[crawl]['known_values']\n            unknown = (self.size[crawl]['page'] - known_values)\n            if unknown > 0:\n                print(\"{} unknown values in {}\".format(unknown, crawl))\n                self.types['<unknown>'][crawl] = unknown\n        for typeval in self.types:\n            for crawl in self.types[typeval]:\n                self.type_stats['type'][self.N] = typeval\n                self.type_stats['crawl'][self.N] = crawl\n                value = self.types[typeval][crawl]\n                n_pages = MultiCount.get_count(0, value)\n                self.type_stats['pages'][self.N] = n_pages\n                n_urls = MultiCount.get_count(1, value)\n                self.type_stats['urls'][self.N] = n_urls\n                self.N += 1\n        self.type_stats = pandas.DataFrame(self.type_stats)\n\n    def save_data(self, base_name, dir_name='data/'):\n        \"\"\"Write the type statistics as CSV file `base_name`.csv into `dir_name`.\"\"\"\n        # accept directory names without trailing slash,\n        # consistent with save_data_percentage\n        if dir_name and dir_name[-1] != '/':\n            dir_name += '/'\n        self.type_stats.to_csv(dir_name + base_name + '.csv')\n\n    def save_data_percentage(self, base_name, dir_name='data/', type_name='type'):\n        \"\"\"Write page and URL counts per crawl and type value as CSV,\n        including the percentage of pages per crawl.\n\n        The column 'type' is renamed to `type_name` in the output.\n        \"\"\"\n        # an empty directory name means the current directory\n        if dir_name and dir_name[-1] != '/':\n            dir_name += '/'\n        data = self.type_stats\n        data = data[['crawl', 'type', 'pages', 'urls']]\n        sum_data = data.groupby(['crawl']).aggregate({'pages':'sum'}).add_suffix('_sum').reset_index()\n        # use the aggregation name: passing numpy.sum is deprecated by pandas\n        data = data.groupby(['crawl', 'type']).aggregate('sum').reset_index()\n        data = pandas.merge(data, sum_data)\n        data['%pages/crawl'] = 100.0 * data['pages'] / data['pages_sum']\n        data.drop(['pages_sum'], inplace=True, axis=1)\n        data = data.rename(columns={'type': type_name})\n        data.to_csv(dir_name + base_name + '.csv', float_format='%.4f', index=None)\n\n    def plot(self, crawls, name, column_header, xtra_css_classes=[]):\n        \"\"\"Print and save (as HTML table) the percentage of pages\n        per type value for the selected crawls.\n\n        `column_header` is used as header of the type value column,\n        `xtra_css_classes` are added to the CSS classes of the HTML table.\n        \"\"\"\n        # stats comparison for selected crawls\n        field_percentage_formatter = '{0:,.4f}'.format\n        data = self.type_stats\n        # copy the selection: a column is added below and this must not be\n        # a chained assignment on a slice of self.type_stats\n        data = data[data['crawl'].isin(crawls)].copy()\n        if data.size == 0:\n            print(\"No data points in table for selected crawls ({})\"\n                  .format(crawls))\n            return\n        data[column_header] = data['type']\n        data = data[['crawl', column_header, 'pages']]\n        data = data.groupby(['crawl', column_header]).agg({'pages': 'sum'})\n        data = data.groupby(level=0, as_index=False).apply(lambda x: 100.0*x/float(x.sum()))\n        data = data.reset_index().pivot(index=column_header,\n                                        columns='crawl', values='pages')\n        print(\"\\n-----\\n\")\n        formatters = {c: field_percentage_formatter for c in crawls}\n        print(data.to_string(formatters=formatters))\n        css_classes = ['tablesorter', 'tablepercentage']\n        css_classes.extend(xtra_css_classes)\n        data.to_html('{}/{}-top-{}.html'.format(\n                     self.PLOTDIR, name, self.MAX_TYPE_VALUES),\n                     formatters=formatters,\n                     classes=css_classes)\n\n"
  },
  {
    "path": "plot/tld.py",
    "content": "import sys\n\nfrom collections import defaultdict\n\nimport pandas\n\nfrom crawlplot import CrawlPlot\nfrom crawlstats import CST, MonthlyCrawl, MultiCount\nfrom top_level_domain import TopLevelDomain\nfrom stats.tld_alexa_top_1m import alexa_top_1m_tlds\nfrom stats.tld_cisco_umbrella_top_1m import cisco_umbrella_top_1m_tlds\nfrom stats.tld_majestic_top_1m import majestic_top_1m_tlds\n\n# min. share of URLs for a TLD to be shown in metrics\nmin_urls_percentage = .05\n\n\nclass TldStats(CrawlPlot):\n    \"\"\"Statistics, tables and plots about top-level domains per crawl.\"\"\"\n\n    def __init__(self):\n        super().__init__()\n\n        self.tlds = defaultdict(dict)\n        self.tld_stats = defaultdict(dict)\n        self.N = 0\n\n    def add(self, key, val):\n        \"\"\"Store the counts of one TLD record, records of other types are ignored.\n\n        `key` holds the CST name, the TLD and the crawl (in this order).\n        \"\"\"\n        cst = CST[key[0]]\n        if cst != CST.tld:\n            return\n        tld = key[1]\n        crawl = key[2]\n        self.tlds[tld][crawl] = val\n\n    def transform_data(self):\n        \"\"\"Convert the collected TLD counts into a pandas DataFrame.\n\n        Empty TLDs, IP addresses and TLDs not accepted by TopLevelDomain\n        are skipped. Host and domain counts are removed for crawls which\n        do not provide them.\n        \"\"\"\n        crawl_has_host_domain_counts = {}\n        for tld in self.tlds:\n            tld_repr = tld\n            tld_obj = None\n            if tld in ('', '(ip address)'):\n                continue\n            else:\n                try:\n                    tld_obj = TopLevelDomain(tld)\n                    tld_repr = tld_obj.tld\n                except Exception:\n                    # skip this TLD, but do not swallow\n                    # KeyboardInterrupt or SystemExit\n                    print('error', tld)\n                    continue\n            for crawl in self.tlds[tld]:\n                self.tld_stats['suffix'][self.N] = tld_repr\n                self.tld_stats['crawl'][self.N] = crawl\n                date = pandas.Timestamp(MonthlyCrawl.date_of(crawl))\n                self.tld_stats['date'][self.N] = date\n                if tld_obj:\n                    self.tld_stats['type'][self.N] \\\n                        = TopLevelDomain.short_type(tld_obj.tld_type)\n                    self.tld_stats['subtype'][self.N] = tld_obj.sub_type\n                    self.tld_stats['tld'][self.N] = tld_obj.first_level\n                else:\n                    self.tld_stats['type'][self.N] = ''\n                    self.tld_stats['subtype'][self.N] = ''\n                    self.tld_stats['tld'][self.N] = ''\n                value = self.tlds[tld][crawl]\n                n_pages = MultiCount.get_count(0, value)\n                self.tld_stats['pages'][self.N] = n_pages\n                n_urls = MultiCount.get_count(1, value)\n                self.tld_stats['urls'][self.N] = n_urls\n                n_hosts = MultiCount.get_count(2, value)\n                self.tld_stats['hosts'][self.N] = n_hosts\n                n_domains = MultiCount.get_count(3, value)\n                self.tld_stats['domains'][self.N] = n_domains\n                if n_urls != n_hosts:\n                    # multi counts including host counts are not (yet)\n                    # available for all crawls\n                    crawl_has_host_domain_counts[crawl] = True\n                elif crawl not in crawl_has_host_domain_counts:\n                    crawl_has_host_domain_counts[crawl] = False\n                self.N += 1\n        for crawl in crawl_has_host_domain_counts:\n            if not crawl_has_host_domain_counts[crawl]:\n                print('No host and domain counts for', crawl)\n                for n in self.tld_stats['crawl']:\n                    if self.tld_stats['crawl'][n] == crawl:\n                        del(self.tld_stats['hosts'][n])\n                        del(self.tld_stats['domains'][n])\n        self.tld_stats = pandas.DataFrame(self.tld_stats)\n\n    @staticmethod\n    def field_percentage_formatter(precision=2, nan='-'):\n        \"\"\"Return a function formatting a number with `precision` decimals\n        and thousands separators, missing values are shown as `nan`.\"\"\"\n        f = '{0:,.' + str(precision) + 'f}'\n        return lambda x: nan if pandas.isna(x) else f.format(x)\n\n\n    def save_data(self):\n        \"\"\"Write the TLD statistics to data/tlds.csv.\"\"\"\n        self.tld_stats.to_csv('data/tlds.csv')\n\n    def percent_agg(self, data, column, index, values, aggregate):\n        \"\"\"Aggregate `values` by `column` and `index` and convert the result\n        into percentages relative to the sum per `column` value.\"\"\"\n        data = data[[column, index, values]]\n        data = data.groupby([column, index]).agg(aggregate)\n        data = data.groupby(level=0, as_index=False).apply(lambda x: 100.0*x/float(x.sum()))\n        # print(\"\\n-----\\n\")\n        # print(data.to_string(formatters={'urls': TldStats.field_percentage_formatter()}))\n        return data\n\n    def pivot_percentage(self, data, column, index, values, aggregate):\n        \"\"\"Same as percent_agg but pivoted: one row per `index` value\n        and one column per `column` value.\"\"\"\n        data = self.percent_agg(data, column, index, values, aggregate)\n        return data.reset_index().pivot(index=index,\n                                        columns=[column], values=values)\n\n    def plot_groups(self):\n        \"\"\"Print and save the percentage of URLs per TLD group and crawl\n        and plot the percentage per group over time.\"\"\"\n        title = 'Groups of Top-Level Domains'\n        ylabel = 'URLs %'\n        clabel = ''\n        img_file = 'tld/groups.png'\n        data = self.pivot_percentage(self.tld_stats, 'crawl', 'type',\n                                     'urls', {'urls': 'sum'})\n        data = data.transpose()\n        print(\"\\n-----\\n\")\n        types = set(self.tld_stats['type'].tolist())\n        formatters = {c: TldStats.field_percentage_formatter() for c in types}\n        print(data.to_string(formatters=formatters))\n        data.to_html('{}/tld/groups-percentage.html'.format(self.PLOTDIR),\n                     formatters=formatters,\n                     classes=['tablesorter', 'tablepercentage'])\n        data = self.percent_agg(self.tld_stats, 'date', 'type',\n                                'urls', {'urls': 'sum'}).reset_index()\n        return self.line_plot(data, title, ylabel, img_file,\n                              x='date', y='urls', c='type', clabel=clabel)\n\n    def plot(self, crawls, latest_crawl):\n        \"\"\"Print TLD statistics for the selected `crawls`.\n\n        HTML tables are written for `latest_crawl` (counts per group and TLD)\n        and for the comparison of the URL percentages of all selected crawls.\n        \"\"\"\n        field_formatters = {c: '{:,.0f}'.format\n                            for c in ['pages', 'urls', 'hosts', 'domains']}\n        for c in ['%urls', '%hosts', '%domains']:\n            field_formatters[c] = TldStats.field_percentage_formatter()\n        data = self.tld_stats\n        data = data[data['crawl'].isin(crawls)]\n        crawl_data = data\n        top_tlds = []\n        # stats per crawl\n        for crawl in crawls:\n            print(\"\\n-----\\n{}\\n\".format(crawl))\n            for aggr_type in ('type', 'tld'):\n                data = crawl_data\n                data = data[data['crawl'].isin([crawl])]\n                data = data[[aggr_type, 'pages', 'urls', 'hosts', 'domains']]\n                data = data.set_index([aggr_type])\n                data = data.groupby(level=0).sum().sort_values(\n                    by=['urls'], ascending=False)\n                for count in ('urls', 'hosts', 'domains'):\n                    data['%'+count] = 100.0 * data[count] / data[count].sum()\n                if aggr_type == 'tld':\n                    # skip less frequent TLDs\n                    data = data[data['%urls'] >= min_urls_percentage]\n                    for tld in data.index.values:\n                        top_tlds.append(tld)\n                print(data.to_string(formatters=field_formatters))\n                print()\n                if crawl == latest_crawl:\n                    # latest crawl by convention\n                    type_name = aggr_type\n                    if aggr_type == 'type':\n                        type_name = 'group'\n                    path = '{}/tld/latest-crawl-{}s.html'.format(\n                        self.PLOTDIR, type_name)\n                    data.to_html(path,\n                                 formatters=field_formatters,\n                                 classes=['tablesorter', 'tablesearcher'])\n        # stats comparison for selected crawls\n        for aggr_type in ('type', 'tld'):\n            data = crawl_data\n            if aggr_type == 'tld':\n                data = data[data['tld'].isin(top_tlds)]\n            data = self.pivot_percentage(data, 'crawl', aggr_type,\n                                         'urls', {'urls': 'sum'})\n            print(\"\\n----- {}\\n\".format(aggr_type))\n            print(data.to_string(formatters={c: TldStats.field_percentage_formatter()\n                                             for c in crawls}))\n            if aggr_type == 'tld':\n                # save as HTML table\n                path = '{}/tld/selected-crawls-percentage.html'.format(\n                                    self.PLOTDIR)\n                data.to_html(path,\n                             float_format=TldStats.field_percentage_formatter(4),\n                             classes=['tablesorter', 'tablepercentage',\n                                      'tablesearcher'])\n\n    def plot_comparison(self, crawl, name, topNlimit=None, method='spearman'):\n        \"\"\"Compare the TLD distribution of `crawl` with the Alexa,\n        Cisco Umbrella and Majestic top-1M lists.\n\n        Correlation matrices (computed by `method`) are printed and saved\n        as HTML: for all TLDs and, if `topNlimit` is given, also for the\n        TLDs covering at least `topNlimit` percent of the URLs.\n        \"\"\"\n        print()\n        print('Comparison for', crawl, '-', name, '-', method)\n        data = self.tld_stats\n        data = data[data['crawl'].isin([crawl])]\n        if topNlimit is not None:\n            # NOTE(review): compares absolute URL counts (not percentages)\n            # with the limit - confirm whether this filter is intended\n            data = data[data['urls'] >= topNlimit]\n        data = data.set_index(['tld'], drop=False)\n        # DataFrame.sum(level=...) has been removed in pandas 2.0,\n        # only the numeric count columns can be summed up\n        data = data.groupby(level='tld').sum(numeric_only=True)\n        print(data)\n        data['alexa'] = pandas.Series(alexa_top_1m_tlds)\n        data['cisco'] = pandas.Series(cisco_umbrella_top_1m_tlds)\n        data['majestic'] = pandas.Series(majestic_top_1m_tlds)\n        fields = ('pages', 'urls', 'hosts', 'domains',\n                  'alexa', 'cisco', 'majestic')\n        formatters = {c: '{0:,.3f}'.format for c in fields}\n        # relative frequency (percent)\n        for count in fields:\n            data[count] = 100.0 * data[count] / data[count].sum()\n        # Spearman's rank correlation for all TLDs\n        corr = data.corr(method=method, min_periods=1)\n        print(corr.to_string(formatters=formatters))\n        corr.to_html('{}/tld/{}-comparison-{}-all-tlds.html'\n                     .format(self.PLOTDIR, name, method),\n                     formatters=formatters,\n                     classes=['matrix'])\n        if topNlimit is None:\n            return\n        # Spearman's rank correlation for TLDs covering\n        # at least topNlimit % of urls\n        data = data[data['urls'] >= topNlimit]\n        print()\n        print('Top', len(data), 'TLDs (>= ', topNlimit, '%)')\n        print(data)\n        data.to_html('{}/tld/{}-comparison.html'.format(self.PLOTDIR, name),\n                     formatters=formatters,\n                     classes=['tablesorter', 'tablepercentage'])\n        print()\n        corr = data.corr(method=method, min_periods=1)\n        print(corr.to_string(formatters=formatters))\n        corr.to_html('{}/tld/{}-comparison-{}-frequent-tlds.html'\n                     .format(self.PLOTDIR, name, method),\n                     formatters=formatters,\n                     classes=['matrix'])\n        print()\n\n    def plot_comparison_groups(self):\n        \"\"\"Print the TLD groups of the Alexa, Cisco Umbrella\n        and Majestic top-1M lists.\"\"\"\n        # Alexa, Cisco and Majestic types/groups:\n        for (name, data) in [('Alexa', alexa_top_1m_tlds),\n                             ('Cisco', cisco_umbrella_top_1m_tlds),\n                             ('Majestic', majestic_top_1m_tlds)]:\n            compare_types = defaultdict(int)\n            for tld in data:\n                compare_types[TopLevelDomain(tld).tld_type] += data[tld]\n            print(name, 'TLD groups:')\n            for tld in compare_types:\n                c = compare_types[tld]\n                print(' {:6d}\\t{:4.1f}\\t{}'.format(c, (100.0*c/1000000), tld))\n            print()\n\n\nif __name__ == '__main__':\n    plot_crawls = sys.argv[1:]\n    if len(plot_crawls) == 0:\n        print(sys.argv[0], 'crawl-id...')\n        print()\n        print('Distribution of top-level domains for (selected) monthly crawls')\n        print()\n        print('Example:')\n        print('', sys.argv[0], '[options]', 'CC-MAIN-2014-52', 'CC-MAIN-2016-50')\n        print()\n        print('Last argument is considered to be the latest crawl')\n        print()\n        print('Options:')\n        print()\n        sys.exit(1)\n    # must come after the usage check: indexing an empty argument list\n    # would fail before the usage message is shown\n    latest_crawl = plot_crawls[-1]\n    plot = TldStats()\n    plot.read_data(sys.stdin)\n    plot.transform_data()\n    plot.save_data()\n    plot.plot_groups()\n    plot.plot(plot_crawls, latest_crawl)\n    if latest_crawl == 'CC-MAIN-2019-09':\n        # plot comparison only for crawl of similar date as benchmark data\n        plot.plot_comparison(latest_crawl, 'selected-crawl',\n                             min_urls_percentage)\n#         plot.plot_comparison(latest_crawl, 'selected-crawl',\n#                              min_urls_percentage, 'pearson')\n    plot.plot_comparison_groups()\n"
  },
  {
    "path": "plot/tld_by_continent.py",
    "content": "\"\"\"\nPlot TLD distributions by continent.\n\nThis module generates visualizations showing how TLDs are distributed\nacross geographic continents and major TLD groups (com/net, org, edu, gov/mil).\nMaps country-code TLDs to their respective continents using ISO country codes.\n\"\"\"\n\nimport json\nimport os.path\nimport sys\nfrom collections import Counter, defaultdict\n\nimport fsspec\nimport matplotlib.pyplot as plt\nimport pandas\nfrom matplotlib.ticker import MaxNLocator\n\nfrom crawlplot import CrawlPlot\nfrom crawlstats import MonthlyCrawl, MultiCount\nfrom top_level_domain import TopLevelDomain\n\n\ntld_counts = defaultdict(lambda: Counter())\n\n# mapping of country-code TLDs to continents\ncontinent_cc_tlds = {\n    'Africa': {'ao', 'bf', 'bi', 'bj', 'bw', 'cd', 'cf', 'cg', 'ci', 'cm', 'cv',\n               'dj', 'dz', 'eg', 'eh', 'er', 'et', 'ga', 'gh', 'gm', 'gn', 'gq',\n               'gw', 'ke', 'km', 'lr', 'ls', 'ly', 'ma', 'mg', 'ml', 'mr', 'mu',\n               'mw', 'mz', 'na', 'ne', 'ng', 're', 'rw', 'sc', 'sd', 'sh', 'sl',\n               'sn', 'so', 'ss', 'st', 'sz', 'td', 'tg', 'tn', 'tz', 'ug', 'yt',\n               'za', 'zm', 'zw'},\n    'Antarctica': {'aq'},\n    'Asia': {'ae', 'af', 'am', 'az', 'bd', 'bh', 'bn', 'bt', 'cc', 'cn', 'cx',\n             'ge', 'hk', 'id', 'il', 'in', 'io', 'iq', 'ir', 'jo', 'jp', 'kg',\n             'kh', 'kp', 'kr', 'kw', 'kz', 'la', 'lb', 'lk', 'mm', 'mn', 'mo',\n             'mv', 'my', 'np', 'om', 'ph', 'pk', 'ps', 'qa', 'sa', 'sg', 'sy',\n             'th', 'tj', 'tm', 'tr', 'tw', 'uz', 'vn', 'ye',\n             'tp' # Timor-Leste: deleted in favor of .tl in 2015\n             },\n    'Europe': {'ad', 'al', 'at', 'ba', 'be', 'bg', 'by', 'ch', 'cy', 'cz',\n               'de', 'dk', 'ee', 'es', 'fi', 'fo', 'fr', 'gg', 'gi', 'gr',\n               'hr', 'hu', 'ie', 'im', 'is', 'it', 'je', 'li', 'lt', 'lu', 'lv',\n               'mc', 'md', 'me', 'mk', 'mt', 'nl', 'no',\n               'pl', 
'pt', 'ro', 'rs', 'ru', 'se', 'si', 'sj', 'sk', 'sm',\n               'ua', 'uk', 'va',\n               'xk',  # https://en.wikipedia.org/wiki/.xk\n               'bv', # Bouvet Island (inactive, uninhabited Norwegian territory, South Atlantic Ocean)\n               'gb' # Great Britain (reserved)\n               },\n    'North America': {'ag', 'ai', 'an', 'aw', 'bb', 'bm', 'bs', 'bz',\n                      'ca', 'cr', 'cu', 'cw', 'dm', 'do', 'gd', 'gl', 'gp', 'gt',\n                      'hn', 'ht', 'jm', 'kn', 'ky', 'lc', 'mq',     'ms', 'mx', 'ni',\n                      'pa', 'pm', 'pr', 'sv', 'sx', 'tc', 'tt',\n                      'us', 'vc', 'vg', 'vi',\n                      'bl', # Saint Barthélemy (unused)\n                      'bq', # Bonaire, Sint Eustatius and Saba (reserved)\n                      'mf', # Saint Martin (unassigned)\n                      },\n    'Oceania': {'as', 'au', 'ck', 'fj', 'fm', 'gu', 'ki', 'mh', 'mp',\n                'nc', 'nf', 'nr', 'nu', 'nz', 'pf', 'pg', 'pn', 'pw',\n                'sb', 'tk', 'tl', 'to', 'tv', 'vu', 'wf', 'ws'\n                },\n    'South America': {'ar', 'bo', 'br', 'cl', 'co', 'ec', 'fk', 'gf', 'gy',\n                      'pe', 'py', 'sr', 'uy', 've'},\n}\n\n# Geographic TLDs mapped to continents\n# https://en.wikipedia.org/wiki/List_of_Internet_top-level_domains#Geographic_top-level_domains\ncontinent_geographic_tlds = {\n    'Africa': {'africa', 'capetown', 'durban', 'joburg'},\n    'Asia': {'abudhabi', 'arab', 'asia', 'doha', 'dubai', 'krd', 'kyoto',\n             'nagoya', 'okinawa', 'osaka', 'ryukyu', 'taipei', 'tokyo', 'yokohama',\n             # https://en.wikipedia.org/wiki/List_of_Internet_top-level_domains#Internationalized_geographic_top-level_domains\n             'xn--1qqw23a', '佛山', # Foshan, China\n             'xn--xhq521b', '广东', # Guangdong, China\n             'xn--80adxhks', 'москва', # Moscow, Russia\n             'xn--p1acf', 'рус', # Russian language and culture - 
https://en.wikipedia.org/wiki/.%D1%80%D1%83%D1%81\n             'xn--mgbca7dzdo', 'ابوظبي', # Abu Dhabi\n             'xn--ngbrx', 'عرب', # Arab\n             },\n    'Europe': {\n        # France\n        'alsace', 'bzh', 'corsica', 'eus', 'paris',\n        # Spain\n        'bcn', 'barcelona', 'cat', 'eus', 'gal', 'madrid',\n        # Germany\n        'bayern', 'berlin', 'cologne', 'koeln', 'hamburg', 'nrw', 'ruhr', 'saarland',\n        # other\n        'eu', 'amsterdam', 'bar', 'brussels', 'cymru', 'wales', 'frl', 'gent', 'helsinki', 'irish', 'ist', 'istanbul', 'london', 'moscow', 'scot', 'stockholm', 'swiss', 'tatar', 'tirol', 'vlaanderen', 'wien', 'zuerich', 'su',\n        # https://en.wikipedia.org/wiki/.ax\n        'ax'\n    },\n    'North America': {'boston', 'miami', 'nyc', 'quebec', 'vegas'},\n    'Oceania': {'kiwi', 'melbourne', 'sydney'},\n    'South America': {'lat', 'rio'}\n}\n\n# list of \"continents\" to be shown in the output\ncontinents = ['(other)', 'com,net', 'org', 'edu', 'gov,mil', 'North America', 'South America', 'Oceania', 'Africa', 'Asia', 'Europe']\n\n# lookup tables TLD -> continent\ntld_continent = {\n    'gov': 'gov,mil', 'mil': 'gov,mil',\n    'com': 'com,net', 'net': 'com,net',\n    'org': 'org', 'edu': 'edu'\n}\n\n# frequency counts of TLDs that cannot be mapped to a continent\ntld_unmapped = Counter()\n\n# fill the lookup table with TLD -> continent mappings\nfor continent in continent_cc_tlds:\n    for tld in continent_cc_tlds[continent]:\n        tld_continent[tld] = continent\n\nfor continent in continent_geographic_tlds:\n    for tld in continent_geographic_tlds[continent]:\n        tld_continent[tld] = continent\n\nfor icctld in TopLevelDomain.tld_ccs:\n    if TopLevelDomain.tld_ccs[icctld] in tld_continent:\n        tld_continent[icctld] = tld_continent[TopLevelDomain.tld_ccs[icctld]]\n\ndef tld2continent(tld):\n    \"\"\"Map a TLD to its corresponding continent.\"\"\"\n    continent = '(other)'\n    tld = tld.lower()\n    if 
tld in tld_continent and tld_continent[tld] != 'Antarctica':\n        continent = tld_continent[tld]\n    return continent\n\n\ndef get_data(f):\n    \"\"\"Parse TLD statistics and aggregate by year and crawl.\n\n    Returns two dictionaries: one aggregated by year, one by crawl name.\n    \"\"\"\n    d = defaultdict(lambda: defaultdict(list))\n    dd = defaultdict(lambda: defaultdict(list))\n\n    for line in f:\n        keyval = line.split('\\t')\n        if len(keyval) == 2:\n            [_, suffix, crawl] = json.loads(keyval[0])\n            year = MonthlyCrawl.year_of(crawl)\n            val = json.loads(keyval[1])\n            tld = suffix.split('.')[-1].lower()\n            tld_cnt = tld2continent(tld)\n            if tld_cnt == '(other)':\n                tld_unmapped[tld] += MultiCount.get_count(0, val)\n            if tld:\n                # print(tld)\n                tld_counts['(any)'][tld] += MultiCount.get_count(0, val)\n                tld_counts[str(year)][tld] += MultiCount.get_count(0, val)\n            d[str(year)][tld_cnt].append(val)\n            dd[MonthlyCrawl.short_name(crawl)][tld_cnt].append(val)\n\n    return d, dd\n\n\nclass TLDByContinentPlot(CrawlPlot):\n    \"\"\"Generate TLD distribution by continent visualizations.\"\"\"\n\n    def __init__(self):\n        super().__init__()\n\n    def plot(self):\n        \"\"\"Generate TLD by continent/year plots and save data tables.\"\"\"\n        # Read from file path or stdin\n        if len(sys.argv) > 1 and os.path.exists(sys.argv[-1]):\n            with fsspec.open(sys.argv[-1], compression=\"gzip\", mode=\"rt\") as f:\n                d, dd = get_data(f)\n        else:\n            d, dd = get_data(sys.stdin)\n\n        print(\"\\nyear\\t{}\".format(\"\\t\".join(continents)))\n        continent_percentages = dict()\n        for year in d:\n            pages = dict()\n            total = 0\n            values = []\n            for tld in continents:\n                
d[year][tld].append([0,0,0,0])\n                val = MultiCount.sum_values(d[year][tld], False)\n                total += val[0]\n                values.append(val[0])\n                # print(\"{}\\t{}\\t{}\\t{}\\t{}\\t{}\".format(year, tld, *val))\n            percentages = [100*val/total for val in values]\n            print(\"{}\\t{}\".format(year, \"\\t\".join(\n                map(lambda x: '{:.2f}'.format(x), percentages))))\n            continent_percentages[year] = percentages\n        continent_percentages = pandas.DataFrame.from_dict(continent_percentages,\n                                                        orient='index',\n                                                        columns=continents)\n        continent_percentages.index.name = 'year'\n        print(continent_percentages)\n\n        top_tlds = tld_counts['(any)'].most_common(16)\n        #print(\"\\n\", top_tlds)\n\n        top_tlds_by_year = defaultdict(list)\n        print(\"\\nyear\\t{}\".format(\"\\t\".join([x[0] for x in top_tlds])))\n        for year in tld_counts:\n            total = sum(tld_counts[year].values())\n            sys.stdout.write(year)\n            for tld in top_tlds:\n                perc = 100*tld_counts[year][tld[0]]/total\n                sys.stdout.write('\\t{:.2f}'.format(perc))\n                top_tlds_by_year[year].append(perc)\n            sys.stdout.write('\\n')\n\n        # table TLDs by year\n        selected_tlds = pandas.DataFrame.from_dict(\n            top_tlds_by_year,\n            orient='index',\n            columns=map(lambda tld: tld[0], top_tlds)\n        )\n        selected_tlds.index.name = 'year'\n        selected_tlds.to_csv(\n            os.path.join(self.PLOTDIR, 'tld', 'selected-tlds-by-year.csv'),\n            index=True)\n        css_classes = ['tablepercentage', 'tablesorter']\n        selected_tlds.to_html(\n            os.path.join(self.PLOTDIR, 'tld', 'selected-tlds-by-year.html'),\n            float_format='%.2f',\n           
 classes=css_classes,\n            index_names=True)\n\n        print(\"\\ncrawl\\t{}\".format(\"\\t\".join(continents)))\n        for crawl in dd:\n            pages = dict()\n            total = 0\n            values = []\n            for tld in continents:\n                dd[crawl][tld].append([0,0,0,0])\n                val = MultiCount.sum_values(dd[crawl][tld], False)\n                total += val[0]\n                values.append(val[0])\n                # print(\"{}\\t{}\\t{}\\t{}\\t{}\\t{}\".format(year, tld, *val))\n            print(\"{}\\t{}\".format(crawl, \"\\t\".join(['{:.2f}'.format(100*val/total) for val in values])))\n\n        # print unmapped TLDs to verify whether there are any TLDs\n        # that need to be added to the mapping\n        print(\"\\n\", len(tld_unmapped), \" unmapped TLDs: \", str(tld_unmapped), \"\\n\\n\")\n\n\n        data = continent_percentages.melt(id_vars=[], var_name='continent',\n                                        value_name='perc', ignore_index=False)\n        data['continent'] = pandas.Categorical(data['continent'],\n                                            ordered=True,\n                                            categories=continents.reverse())\n        \n        if self.PLOTLIB == \"rpy2.ggplot2\":\n            self.plot_with_rpy2_ggplot2(data=data)\n\n        elif self.PLOTLIB == \"matplotlib\":\n            self.plot_with_matplotlib(data=data)\n\n        else:\n            raise ValueError(\"Invalid PLOTLIB\")\n        \n\n        ### plot and table for print publication\n        #plot = plot + ggplot2.labs(title='',\n        #                           x='', y='', fill='TLD / Continent') \\\n        #            + ggplot2.theme()\n        #plot.save(os.path.join(PLOTDIR, 'tld', 'tlds-by-year-and-continent.pdf'))\n        #print(continent_percentages.to_latex(index=True, float_format='%.2f'))\n        continent_percentages.to_csv(\n            os.path.join(self.PLOTDIR, 'tld', 
'tlds-by-year-and-continent.csv'),\n            index=True)\n        css_classes = ['tablepercentage', 'tablesorter']\n        continent_percentages.to_html(\n            os.path.join(self.PLOTDIR, 'tld', 'tlds-by-year-and-continent.html'),\n            float_format='%.2f',\n            classes=css_classes)\n\n    def plot_with_rpy2_ggplot2(self, data):\n        \"\"\"Generate TLD by continent stacked bar chart using rpy2/ggplot2.\"\"\"\n        from rpy2.robjects.lib import ggplot2\n\n        plot = ggplot2.ggplot(data.reset_index()) \\\n                + ggplot2.aes_string(x='year', y='perc', fill='continent', label='perc') \\\n                + ggplot2.geom_bar(stat='identity', position='stack') \\\n                + self.GGPLOT2_THEME + ggplot2.scale_fill_hue() \\\n                + ggplot2.labs(title='Percentage of Page Captures per TLD / Continent',\n                            x='', y='Percentage', fill='TLD / Continent') \\\n                + ggplot2.theme(**{'legend.position': 'right',\n                                'aspect.ratio': .7,\n                                **self.GGPLOT2_THEME_KWARGS,\n                                'axis.text.x':\n                                    ggplot2.element_text(angle=45,\n                                                        vjust=1, hjust=1)})\n        plot.save(os.path.join(self.PLOTDIR, 'tld', 'tlds-by-year-and-continent.png'))\n\n        return plot\n\n\n    def plot_with_matplotlib(self, data):\n        \"\"\"Generate TLD by continent stacked bar chart using matplotlib.\"\"\"\n        aspect_ratio = 0.7\n        title = 'Percentage of Page Captures per TLD / Continent'\n\n        fig, ax = self.create_figure()\n\n        # Colorblind-safe palette (Paul Tol's scheme)\n        colors = ['#4477AA', '#EE6677', '#228833', '#CCBB44', '#AA3377',\n                  '#66CCEE', '#EE8866', '#44AA99', '#BBBBBB', '#99CC66', '#CC99BB']\n\n        years = sorted(data.reset_index()['year'].unique())\n        bottoms = [0] * 
len(years)\n        sorted_continents = sorted(continents)[::-1]\n\n        for i, continent in enumerate(sorted_continents):\n            values = []\n            for year in years:\n                year_data = data.loc[year]\n                continent_data = year_data[year_data['continent'] == continent]\n                values.append(continent_data['perc'].values[0] if len(continent_data) > 0 else 0)\n\n            ax.bar(range(len(years)), values, bottom=bottoms, label=continent,\n                   color=colors[i % len(colors)], width=self.bar_width)\n            bottoms = [b + v for b, v in zip(bottoms, values)]\n\n        # Axes ratio\n        ax.set_aspect(1 / ax.get_data_ratio() * aspect_ratio)\n\n        self.set_title(ax, title)\n        ax.set_xlabel('')\n        ax.set_ylabel('Percentage', fontsize=self.ylabel_fontsize)\n\n        # Set x-axis ticks and labels\n        ax.set_xticks(range(len(years)))\n        ax.set_xticklabels(years, rotation=45, ha='right', fontsize=self.ticks_fontsize)\n        ax.set_xlim(-0.5, len(years) - 0.5)\n\n        # Set y-axis formatting\n        ax.yaxis.set_major_locator(MaxNLocator(nbins=6))\n        ax.set_ylim(0, 100)\n        ax.tick_params(axis='y', labelsize=self.ticks_fontsize)\n\n        # Apply ggplot2-like styling with y-axis grid\n        ax.grid(True, which='major', linewidth=1.0, color='#E6E6E6', zorder=0, axis='y')\n        ax.set_axisbelow(True)\n\n        # Custom spine styling (thin borders at top/bottom)\n        ax.spines['top'].set_visible(True)\n        ax.spines['top'].set_linewidth(1.0)\n        ax.spines['top'].set_color('#E6E6E6')\n        ax.spines['right'].set_visible(False)\n        ax.spines['left'].set_visible(False)\n        ax.spines['bottom'].set_visible(True)\n        ax.spines['bottom'].set_linewidth(1.0)\n        ax.spines['bottom'].set_color('#E6E6E6')\n\n        # Set tick colors\n        ax.tick_params(axis='both', which='both', colors=self.ticks_color,\n                       
length=self.ticks_length, width=1.0)\n        self.set_tick_labels_black(ax)\n\n        # Position legend on right side with reversed order\n        handles, labels = ax.get_legend_handles_labels()\n        legend = ax.legend(handles[::-1], labels[::-1], loc='center left',\n                          bbox_to_anchor=(1.0, 0.5), frameon=False,\n                          fontsize=self.legend_fontsize, title='TLD / Continent',\n                          title_fontsize=self.legend_title_fontsize)\n        legend._legend_box.align = 'left'\n\n        img_path = os.path.join(self.PLOTDIR, 'tld', 'tlds-by-year-and-continent.png')\n        return self.save_figure(fig, img_path)\n\n\nif __name__ == '__main__':\n    plot = TLDByContinentPlot()\n    plot.plot()\n"
  },
  {
    "path": "plot.sh",
    "content": "#!/bin/bash\n\nN_CRAWLS=$(python3 -c 'from crawlstats import MonthlyCrawl; print(len(MonthlyCrawl.by_name))')\nLATEST_CRAWL=$(python3 -c 'from crawlstats import MonthlyCrawl; print(sorted(MonthlyCrawl.by_name.keys())[-1])')\n\n# verify that all stats files are downloaded, cf. get_stats.sh\nN_CRAWLS_STATS_FILES=$(ls stats/CC-MAIN-*.gz | wc -l)\nif [[ $N_CRAWLS -ne $N_CRAWLS_STATS_FILES ]]; then\n    echo \"Number of crawls registered in crawlstats.py ($N_CRAWLS) and\"\n    echo \"the number of statistics files in stats/ ($N_CRAWLS_STATS_FILES) are not equal.\"\n    echo \"Exiting!\"\n    exit 1\nfi\n\necho \"Plotting crawl statistics for $N_CRAWLS crawls\"\necho \"Latest crawl is: $LATEST_CRAWL\"\necho\n\n\n# fail on any kind of error\nset -exo pipefail\n\n\n# register the latest crawl in the website configuration\nsed -i 's@^latest_crawl:.*@latest_crawl: '$LATEST_CRAWL'@' _config.yml\n\n\nfunction update_excerpt() {\n    regex=\"$1\"\n    excerpt=\"$2\"\n    if [ -e \"$excerpt\" ]; then\n        # short-cut for monthy update plots: only add data from latest crawl\n        if ! zgrep -qF \"$LATEST_CRAWL\" $excerpt; then\n            echo \"Updating excerpt $excerpt with latest crawl $LATEST_CRAWL\"\n            zgrep -Eh \"$regex\" stats/$LATEST_CRAWL.gz | gzip >>$excerpt\n        fi\n        # sanity check: are all crawls excerpted?\n        N_CRAWLS_EXCERPTED=$(zcat $excerpt | cut -f1 | jq -r '.[2]' | uniq | sort -u | wc -l)\n        if [[ $N_CRAWLS_EXCERPTED -eq $N_CRAWLS ]]; then\n            echo \"Excerpt $excerpt includes $N_CRAWLS crawls as expected.\"\n        else\n            echo \"Number of crawls excerpted in $excerpt ($N_CRAWLS_EXCERPTED) does not equal $N_CRAWLS\"\n            echo \"Removing excerpt $excerpt\"\n            rm $excerpt\n        fi\n    fi\n    if ! 
[ -e \"$excerpt\" ]; then\n        echo \"Rebuilding excerpt $excerpt\"\n        zcat stats/CC-MAIN-*.gz | grep -Eh \"$regex\" | gzip  >$excerpt\n    fi\n}\n\n# filter data to speed-up reading while plotting\nmkdir -p stats/excerpt\nupdate_excerpt '^\\[\"size'                               stats/excerpt/size.json.gz\nupdate_excerpt '^\\[\"histogram\"'                         stats/excerpt/histogram.json.gz\nupdate_excerpt '^\\[\"tld\"'                               stats/excerpt/tld.json.gz\nupdate_excerpt '^\\[\"(size|domain)\"'                     stats/excerpt/domain.json.gz\nupdate_excerpt '^\\[\"(size\", *\"page|mimetype)\"'          stats/excerpt/mimetype.json.gz\nupdate_excerpt '^\\[\"(size\", *\"page|mimetype_detected)\"' stats/excerpt/mimetype_detected.json.gz\nupdate_excerpt '^\\[\"(size\", *\"page|charset)\"'           stats/excerpt/charset.json.gz\nupdate_excerpt '^\\[\"(size\", *\"page|primary_language|languages)\"' stats/excerpt/language.json.gz\nupdate_excerpt '^\\[\"scheme\"'                            stats/excerpt/url_protocol.json.gz\n\nmkdir -p data\n\nzcat stats/excerpt/size.json.gz \\\n     | python3 plot/crawl_size.py\n\nzcat stats/excerpt/size.json.gz \\\n     | python3 plot/overlap.py\n\n# zcat stats/excerpt/histogram.json.gz \\\n#     | python3 plot/histogram.py \"$LATEST_CRAWL\"\n\n(cat stats/crawler/CC-MAIN-*.json;\n zcat stats/excerpt/size.json.gz | grep '^\\[\"size\"';\n zcat stats/excerpt/url_protocol.json.gz) \\\n\t| python3 plot/crawler_metrics.py\n\nzcat stats/excerpt/tld.json.gz \\\n    | python3 plot/tld.py CC-MAIN-2008-2009 CC-MAIN-2012 CC-MAIN-2014-10 \\\n              CC-MAIN-2016-30 CC-MAIN-2019-09 CC-MAIN-2022-49 $LATEST_CRAWL\nzcat stats/excerpt/tld.json.gz \\\n    | python3 plot/tld_by_continent.py\n\nzcat stats/excerpt/mimetype.json.gz \\\n    | python3 plot/mimetype.py\n\nzcat stats/excerpt/mimetype_detected.json.gz \\\n    | python3 plot/mimetype_detected.py\n\nzcat stats/excerpt/charset.json.gz \\\n    | python3 
plot/charset.py\n\nzcat stats/excerpt/language.json.gz \\\n    | python3 plot/language.py\n\nzcat stats/excerpt/domain.json.gz \\\n    | python3 plot/domain.py\n\necho -e \"\\n\\nAll crawl statistics plotted\\n\""
  },
  {
    "path": "plots/README.md",
    "content": "Plots about Common Crawl Monthly Archives\n=========================================\n\n* [size of the crawls](crawlsize.md) - number of pages, unique URLs, hosts, domains, TLDs\n* [top-level domains](tlds.md) - distribution and comparison\n* [crawler-related metrics](crawlermetrics.md) - fetch status, etc.\n* [overlaps between monthly crawls](crawloverlap.md)\n* distribution of\n\t- [media types (MIME)](mimetypes.md)\n\t- [character sets](charsets.md)\n\t- [languages](languages.md)\n\t- [registered domains](domains.md)\n\t"
  },
  {
    "path": "plots/charsets-top-100.html",
    "content": "<table border=\"1\" class=\"dataframe tablesorter tablepercentage\">\n  <thead>\n    <tr style=\"text-align: right;\">\n      <th>crawl</th>\n      <th>CC-MAIN-2026-08</th>\n      <th>CC-MAIN-2026-12</th>\n      <th>CC-MAIN-2026-17</th>\n    </tr>\n    <tr>\n      <th>charset</th>\n      <th></th>\n      <th></th>\n      <th></th>\n    </tr>\n  </thead>\n  <tbody>\n    <tr>\n      <th>&lt;other&gt;</th>\n      <td>0.0001</td>\n      <td>0.0001</td>\n      <td>0.0001</td>\n    </tr>\n    <tr>\n      <th>&lt;unknown&gt;</th>\n      <td>1.8164</td>\n      <td>1.8232</td>\n      <td>1.8918</td>\n    </tr>\n    <tr>\n      <th>Big5</th>\n      <td>0.0219</td>\n      <td>0.0198</td>\n      <td>0.0298</td>\n    </tr>\n    <tr>\n      <th>Big5-HKSCS</th>\n      <td>0.0000</td>\n      <td>0.0000</td>\n      <td>0.0000</td>\n    </tr>\n    <tr>\n      <th>EUC-JP</th>\n      <td>0.1311</td>\n      <td>0.1340</td>\n      <td>0.1266</td>\n    </tr>\n    <tr>\n      <th>EUC-KR</th>\n      <td>0.0785</td>\n      <td>0.0819</td>\n      <td>0.0771</td>\n    </tr>\n    <tr>\n      <th>GB18030</th>\n      <td>0.0149</td>\n      <td>0.0165</td>\n      <td>0.0150</td>\n    </tr>\n    <tr>\n      <th>GB2312</th>\n      <td>0.2307</td>\n      <td>0.2388</td>\n      <td>0.2011</td>\n    </tr>\n    <tr>\n      <th>GBK</th>\n      <td>0.1013</td>\n      <td>0.1000</td>\n      <td>0.0934</td>\n    </tr>\n    <tr>\n      <th>IBM420</th>\n      <td>0.0051</td>\n      <td>0.0049</td>\n      <td>0.0051</td>\n    </tr>\n    <tr>\n      <th>IBM424</th>\n      <td>0.0023</td>\n      <td>0.0021</td>\n      <td>0.0011</td>\n    </tr>\n    <tr>\n      <th>IBM500</th>\n      <td>0.0011</td>\n      <td>0.0011</td>\n      <td>0.0008</td>\n    </tr>\n    <tr>\n      <th>IBM855</th>\n      <td>NaN</td>\n      <td>0.0000</td>\n      <td>NaN</td>\n    </tr>\n    <tr>\n      <th>IBM866</th>\n      <td>0.0003</td>\n      <td>0.0002</td>\n      <td>0.0001</td>\n    </tr>\n    <tr>\n      
<th>ISO-2022-JP</th>\n      <td>0.0010</td>\n      <td>0.0012</td>\n      <td>0.0010</td>\n    </tr>\n    <tr>\n      <th>ISO-8859-1</th>\n      <td>6.6472</td>\n      <td>3.3383</td>\n      <td>2.7125</td>\n    </tr>\n    <tr>\n      <th>ISO-8859-13</th>\n      <td>0.0000</td>\n      <td>0.0000</td>\n      <td>0.0000</td>\n    </tr>\n    <tr>\n      <th>ISO-8859-15</th>\n      <td>0.0466</td>\n      <td>0.0478</td>\n      <td>0.0444</td>\n    </tr>\n    <tr>\n      <th>ISO-8859-16</th>\n      <td>0.0002</td>\n      <td>0.0003</td>\n      <td>0.0003</td>\n    </tr>\n    <tr>\n      <th>ISO-8859-2</th>\n      <td>0.0906</td>\n      <td>0.0882</td>\n      <td>0.0817</td>\n    </tr>\n    <tr>\n      <th>ISO-8859-3</th>\n      <td>0.0002</td>\n      <td>0.0003</td>\n      <td>0.0003</td>\n    </tr>\n    <tr>\n      <th>ISO-8859-4</th>\n      <td>0.0006</td>\n      <td>0.0007</td>\n      <td>0.0007</td>\n    </tr>\n    <tr>\n      <th>ISO-8859-5</th>\n      <td>0.0016</td>\n      <td>0.0015</td>\n      <td>0.0008</td>\n    </tr>\n    <tr>\n      <th>ISO-8859-6</th>\n      <td>0.0000</td>\n      <td>0.0000</td>\n      <td>0.0000</td>\n    </tr>\n    <tr>\n      <th>ISO-8859-7</th>\n      <td>0.0043</td>\n      <td>0.0043</td>\n      <td>0.0040</td>\n    </tr>\n    <tr>\n      <th>ISO-8859-8</th>\n      <td>0.0007</td>\n      <td>0.0008</td>\n      <td>0.0007</td>\n    </tr>\n    <tr>\n      <th>ISO-8859-9</th>\n      <td>0.0196</td>\n      <td>0.0201</td>\n      <td>0.0235</td>\n    </tr>\n    <tr>\n      <th>KOI8-R</th>\n      <td>0.0067</td>\n      <td>0.0066</td>\n      <td>0.0076</td>\n    </tr>\n    <tr>\n      <th>KOI8-U</th>\n      <td>0.0001</td>\n      <td>0.0001</td>\n      <td>0.0001</td>\n    </tr>\n    <tr>\n      <th>Shift_JIS</th>\n      <td>0.1749</td>\n      <td>0.1813</td>\n      <td>0.1479</td>\n    </tr>\n    <tr>\n      <th>TIS-620</th>\n      <td>0.0038</td>\n      <td>0.0038</td>\n      <td>0.0036</td>\n    </tr>\n    <tr>\n      
<th>US-ASCII</th>\n      <td>0.0189</td>\n      <td>0.0200</td>\n      <td>0.0203</td>\n    </tr>\n    <tr>\n      <th>UTF-16</th>\n      <td>0.0027</td>\n      <td>0.0023</td>\n      <td>0.0022</td>\n    </tr>\n    <tr>\n      <th>UTF-16BE</th>\n      <td>0.0002</td>\n      <td>0.0002</td>\n      <td>0.0003</td>\n    </tr>\n    <tr>\n      <th>UTF-16LE</th>\n      <td>0.0015</td>\n      <td>0.0015</td>\n      <td>0.0039</td>\n    </tr>\n    <tr>\n      <th>UTF-32</th>\n      <td>0.0001</td>\n      <td>0.0001</td>\n      <td>0.0000</td>\n    </tr>\n    <tr>\n      <th>UTF-32LE</th>\n      <td>0.0002</td>\n      <td>0.0002</td>\n      <td>0.0002</td>\n    </tr>\n    <tr>\n      <th>UTF-8</th>\n      <td>89.8190</td>\n      <td>93.0693</td>\n      <td>93.7434</td>\n    </tr>\n    <tr>\n      <th>windows-1250</th>\n      <td>0.0681</td>\n      <td>0.0689</td>\n      <td>0.0666</td>\n    </tr>\n    <tr>\n      <th>windows-1251</th>\n      <td>0.4820</td>\n      <td>0.5023</td>\n      <td>0.4838</td>\n    </tr>\n    <tr>\n      <th>windows-1252</th>\n      <td>0.1433</td>\n      <td>0.1557</td>\n      <td>0.1526</td>\n    </tr>\n    <tr>\n      <th>windows-1253</th>\n      <td>0.0019</td>\n      <td>0.0024</td>\n      <td>0.0024</td>\n    </tr>\n    <tr>\n      <th>windows-1254</th>\n      <td>0.0104</td>\n      <td>0.0129</td>\n      <td>0.0123</td>\n    </tr>\n    <tr>\n      <th>windows-1255</th>\n      <td>0.0059</td>\n      <td>0.0059</td>\n      <td>0.0053</td>\n    </tr>\n    <tr>\n      <th>windows-1256</th>\n      <td>0.0303</td>\n      <td>0.0276</td>\n      <td>0.0240</td>\n    </tr>\n    <tr>\n      <th>windows-1257</th>\n      <td>0.0062</td>\n      <td>0.0059</td>\n      <td>0.0053</td>\n    </tr>\n    <tr>\n      <th>windows-31j</th>\n      <td>0.0004</td>\n      <td>0.0004</td>\n      <td>0.0004</td>\n    </tr>\n    <tr>\n      <th>x-iso-8859-11</th>\n      <td>0.0001</td>\n      <td>0.0001</td>\n      <td>0.0000</td>\n    </tr>\n    <tr>\n      
<th>x-windows-874</th>\n      <td>0.0072</td>\n      <td>0.0067</td>\n      <td>0.0057</td>\n    </tr>\n    <tr>\n      <th>x-windows-949</th>\n      <td>0.0000</td>\n      <td>0.0000</td>\n      <td>0.0000</td>\n    </tr>\n  </tbody>\n</table>"
  },
  {
    "path": "plots/charsets.csv",
    "content": "crawl,charset,pages,urls,%pages/crawl\nCC-MAIN-2008-2009,<unknown>,1798158091,1798158091,100.0000\nCC-MAIN-2009-2010,<unknown>,2863495211,2863495211,100.0000\nCC-MAIN-2012,<unknown>,3828539877,3828539877,100.0000\nCC-MAIN-2013-20,<unknown>,1796098643,1796098643,100.0000\nCC-MAIN-2013-48,<unknown>,2245773667,2245773667,100.0000\nCC-MAIN-2014-10,<unknown>,2301223474,2301223474,100.0000\nCC-MAIN-2014-15,<unknown>,2641371316,2641371316,100.0000\nCC-MAIN-2014-23,<unknown>,3608720876,3608720876,100.0000\nCC-MAIN-2014-35,<unknown>,2870692423,2870692423,100.0000\nCC-MAIN-2014-41,<unknown>,2979743543,2979743543,100.0000\nCC-MAIN-2014-42,<unknown>,3722131678,3722131678,100.0000\nCC-MAIN-2014-49,<unknown>,1948510433,1948510433,100.0000\nCC-MAIN-2014-52,<unknown>,2085977207,2085977207,100.0000\nCC-MAIN-2015-06,<unknown>,1826024103,1826024103,100.0000\nCC-MAIN-2015-11,<unknown>,1837196089,1837196089,100.0000\nCC-MAIN-2015-14,<unknown>,1646697534,1646697534,100.0000\nCC-MAIN-2015-18,<unknown>,2115818059,2115818059,100.0000\nCC-MAIN-2015-22,<unknown>,2015461448,2015461448,100.0000\nCC-MAIN-2015-27,<unknown>,1675619098,1675619098,100.0000\nCC-MAIN-2015-32,<unknown>,1815492409,1815492409,100.0000\nCC-MAIN-2015-35,<unknown>,1848022475,1848022475,100.0000\nCC-MAIN-2015-40,<unknown>,1321987379,1321987379,100.0000\nCC-MAIN-2015-48,<unknown>,1824170527,1824170527,100.0000\nCC-MAIN-2016-07,<unknown>,1733285122,1733285122,100.0000\nCC-MAIN-2016-18,<unknown>,1335046923,1335046923,100.0000\nCC-MAIN-2016-22,<unknown>,1466220798,1466220798,100.0000\nCC-MAIN-2016-26,<unknown>,1236815660,1236815660,100.0000\nCC-MAIN-2016-30,<unknown>,1737322304,1737322304,100.0000\nCC-MAIN-2016-36,<unknown>,1611613090,1611613090,100.0000\nCC-MAIN-2016-40,<unknown>,1722656393,1722656393,100.0000\nCC-MAIN-2016-44,<unknown>,3254976731,3254976731,100.0000\nCC-MAIN-2016-50,<unknown>,2866282390,2866282390,100.0000\nCC-MAIN-2017-04,<unknown>,3146498026,3146498026,100.0000\nCC-MAIN-2017-09,<unknown>,3084
366662,3084366662,100.0000\nCC-MAIN-2017-13,<unknown>,3070720576,3070720576,100.0000\nCC-MAIN-2017-17,<unknown>,2942930482,2942930482,100.0000\nCC-MAIN-2017-22,<unknown>,2967293699,2967293699,100.0000\nCC-MAIN-2017-26,<unknown>,3165214086,3165214086,100.0000\nCC-MAIN-2017-30,<unknown>,2892213652,2892213652,100.0000\nCC-MAIN-2017-34,<unknown>,3280080910,3280080910,100.0000\nCC-MAIN-2017-39,<unknown>,3017180563,3017180563,100.0000\nCC-MAIN-2017-43,<unknown>,3650430218,3650430218,100.0000\nCC-MAIN-2017-47,<unknown>,3204943573,3204943573,100.0000\nCC-MAIN-2017-51,<unknown>,2914004423,2914004423,100.0000\nCC-MAIN-2018-05,<unknown>,3464537205,3464537205,100.0000\nCC-MAIN-2018-09,<unknown>,3488463319,3488463319,100.0000\nCC-MAIN-2018-13,<unknown>,3232738018,3232738018,100.0000\nCC-MAIN-2018-17,<unknown>,3101353989,3101353989,100.0000\nCC-MAIN-2018-22,<unknown>,2788388007,2788388007,100.0000\nCC-MAIN-2018-26,<unknown>,3069414247,3069414247,100.0000\nCC-MAIN-2018-30,<unknown>,3263958200,3263958200,100.0000\nCC-MAIN-2018-34,<other>,5012,4994,0.0002\nCC-MAIN-2018-34,<unknown>,126685829,126685829,4.7160\nCC-MAIN-2018-34,Big5,2474270,2469758,0.0921\nCC-MAIN-2018-34,Big5-HKSCS,6275,6268,0.0002\nCC-MAIN-2018-34,EUC-JP,11086532,10975050,0.4127\nCC-MAIN-2018-34,EUC-KR,3797614,3791178,0.1414\nCC-MAIN-2018-34,GB18030,993684,985878,0.0370\nCC-MAIN-2018-34,GB2312,22121572,22053200,0.8235\nCC-MAIN-2018-34,GBK,11105945,11067218,0.4134\nCC-MAIN-2018-34,IBM500,10,10,0.0000\nCC-MAIN-2018-34,IBM855,5494,5471,0.0002\nCC-MAIN-2018-34,IBM866,13767,13710,0.0005\nCC-MAIN-2018-34,ISO-2022-JP,30712,30609,0.0011\nCC-MAIN-2018-34,ISO-8859-1,137890410,136570574,5.1331\nCC-MAIN-2018-34,ISO-8859-13,10267,10260,0.0004\nCC-MAIN-2018-34,ISO-8859-15,8241896,8180044,0.3068\nCC-MAIN-2018-34,ISO-8859-2,7697233,7657364,0.2865\nCC-MAIN-2018-34,ISO-8859-3,10214,10188,0.0004\nCC-MAIN-2018-34,ISO-8859-4,35155,34111,0.0013\nCC-MAIN-2018-34,ISO-8859-5,56781,56633,0.0021\nCC-MAIN-2018-34,ISO-8859-6,6189,6120,0.0002\nCC
-MAIN-2018-34,ISO-8859-7,516140,513946,0.0192\nCC-MAIN-2018-34,ISO-8859-8,29612,29412,0.0011\nCC-MAIN-2018-34,ISO-8859-9,1600600,1591195,0.0596\nCC-MAIN-2018-34,KOI8-R,516307,515283,0.0192\nCC-MAIN-2018-34,KOI8-U,8171,8159,0.0003\nCC-MAIN-2018-34,Shift_JIS,15113141,15006500,0.5626\nCC-MAIN-2018-34,TIS-620,462808,461498,0.0172\nCC-MAIN-2018-34,US-ASCII,664916,661952,0.0248\nCC-MAIN-2018-34,UTF-16,74862,74122,0.0028\nCC-MAIN-2018-34,UTF-16BE,757,751,0.0000\nCC-MAIN-2018-34,UTF-16LE,35484,35162,0.0013\nCC-MAIN-2018-34,UTF-32,2025,2022,0.0001\nCC-MAIN-2018-34,UTF-32LE,3,3,0.0000\nCC-MAIN-2018-34,UTF-8,2245149161,2214841881,83.5770\nCC-MAIN-2018-34,windows-1250,4453222,4423609,0.1658\nCC-MAIN-2018-34,windows-1251,54700823,54499743,2.0363\nCC-MAIN-2018-34,windows-1252,23888187,23694774,0.8893\nCC-MAIN-2018-34,windows-1253,149093,148298,0.0056\nCC-MAIN-2018-34,windows-1254,1012798,1008111,0.0377\nCC-MAIN-2018-34,windows-1255,494373,492428,0.0184\nCC-MAIN-2018-34,windows-1256,4247513,4234585,0.1581\nCC-MAIN-2018-34,windows-1257,274234,273851,0.0102\nCC-MAIN-2018-34,windows-31j,41773,41406,0.0016\nCC-MAIN-2018-34,x-MacCyrillic,179572,179216,0.0067\nCC-MAIN-2018-34,x-iso-8859-11,972,966,0.0000\nCC-MAIN-2018-34,x-windows-874,430806,428450,0.0160\nCC-MAIN-2018-34,x-windows-949,1144,1141,0.0000\nCC-MAIN-2018-39,<other>,4683,4666,0.0002\nCC-MAIN-2018-39,<unknown>,23862059,23862059,0.8399\nCC-MAIN-2018-39,Big5,3451547,3441194,0.1215\nCC-MAIN-2018-39,Big5-HKSCS,6592,6590,0.0002\nCC-MAIN-2018-39,EUC-JP,11497088,11433031,0.4047\nCC-MAIN-2018-39,EUC-KR,4725181,4717238,0.1663\nCC-MAIN-2018-39,GB18030,1141514,1137313,0.0402\nCC-MAIN-2018-39,GB2312,26072133,25990314,0.9176\nCC-MAIN-2018-39,GBK,12556679,12514383,0.4420\nCC-MAIN-2018-39,IBM500,15,15,0.0000\nCC-MAIN-2018-39,IBM855,8617,8560,0.0003\nCC-MAIN-2018-39,IBM866,47335,41032,0.0017\nCC-MAIN-2018-39,ISO-2022-JP,37644,37511,0.0013\nCC-MAIN-2018-39,ISO-8859-1,164053172,162780277,5.7741\nCC-MAIN-2018-39,ISO-8859-13,14805,14798,0.0005\nC
C-MAIN-2018-39,ISO-8859-15,10390418,10313410,0.3657\nCC-MAIN-2018-39,ISO-8859-2,9017868,8977554,0.3174\nCC-MAIN-2018-39,ISO-8859-3,13282,13269,0.0005\nCC-MAIN-2018-39,ISO-8859-4,36811,36045,0.0013\nCC-MAIN-2018-39,ISO-8859-5,58407,58310,0.0021\nCC-MAIN-2018-39,ISO-8859-6,9417,9344,0.0003\nCC-MAIN-2018-39,ISO-8859-7,605312,603475,0.0213\nCC-MAIN-2018-39,ISO-8859-8,30856,30670,0.0011\nCC-MAIN-2018-39,ISO-8859-9,1904783,1893599,0.0670\nCC-MAIN-2018-39,KOI8-R,630791,629721,0.0222\nCC-MAIN-2018-39,KOI8-U,10599,10590,0.0004\nCC-MAIN-2018-39,Shift_JIS,17122561,17024399,0.6027\nCC-MAIN-2018-39,TIS-620,524196,522599,0.0184\nCC-MAIN-2018-39,US-ASCII,759595,756252,0.0267\nCC-MAIN-2018-39,UTF-16,84550,84087,0.0030\nCC-MAIN-2018-39,UTF-16BE,1564,1558,0.0001\nCC-MAIN-2018-39,UTF-16LE,37707,37412,0.0013\nCC-MAIN-2018-39,UTF-32,2593,2542,0.0001\nCC-MAIN-2018-39,UTF-32LE,1,1,0.0000\nCC-MAIN-2018-39,UTF-8,2448086775,2418414906,86.1640\nCC-MAIN-2018-39,windows-1250,5128943,5099392,0.1805\nCC-MAIN-2018-39,windows-1251,61579907,61378188,2.1674\nCC-MAIN-2018-39,windows-1252,28990309,28793137,1.0204\nCC-MAIN-2018-39,windows-1253,177019,176329,0.0062\nCC-MAIN-2018-39,windows-1254,1190656,1183178,0.0419\nCC-MAIN-2018-39,windows-1255,611859,609164,0.0215\nCC-MAIN-2018-39,windows-1256,5596430,5564137,0.1970\nCC-MAIN-2018-39,windows-1257,330945,329350,0.0116\nCC-MAIN-2018-39,windows-31j,60073,59683,0.0021\nCC-MAIN-2018-39,x-MacCyrillic,232230,231077,0.0082\nCC-MAIN-2018-39,x-iso-8859-11,1716,1713,0.0001\nCC-MAIN-2018-39,x-windows-874,486694,484494,0.0171\nCC-MAIN-2018-39,x-windows-949,898,895,0.0000\nCC-MAIN-2018-43,<other>,5833,5795,0.0002\nCC-MAIN-2018-43,<unknown>,106829314,106829314,3.5121\nCC-MAIN-2018-43,Big5,3351549,3338282,0.1102\nCC-MAIN-2018-43,Big5-HKSCS,7975,7969,0.0003\nCC-MAIN-2018-43,EUC-JP,12025602,11938754,0.3953\nCC-MAIN-2018-43,EUC-KR,4665198,4649622,0.1534\nCC-MAIN-2018-43,GB18030,1820725,1816034,0.0599\nCC-MAIN-2018-43,GB2312,34044482,33957414,1.1192\nCC-MAIN-2018-43,GBK,1
6667691,16605605,0.5480\nCC-MAIN-2018-43,IBM500,11,11,0.0000\nCC-MAIN-2018-43,IBM855,5896,5874,0.0002\nCC-MAIN-2018-43,IBM866,14241,14189,0.0005\nCC-MAIN-2018-43,ISO-2022-JP,37525,37350,0.0012\nCC-MAIN-2018-43,ISO-8859-1,155559333,154280588,5.1141\nCC-MAIN-2018-43,ISO-8859-13,14116,14106,0.0005\nCC-MAIN-2018-43,ISO-8859-15,9983041,9885418,0.3282\nCC-MAIN-2018-43,ISO-8859-2,8932817,8880316,0.2937\nCC-MAIN-2018-43,ISO-8859-3,14719,13056,0.0005\nCC-MAIN-2018-43,ISO-8859-4,32996,32626,0.0011\nCC-MAIN-2018-43,ISO-8859-5,66051,65863,0.0022\nCC-MAIN-2018-43,ISO-8859-6,6148,6001,0.0002\nCC-MAIN-2018-43,ISO-8859-7,653768,651391,0.0215\nCC-MAIN-2018-43,ISO-8859-8,33295,33011,0.0011\nCC-MAIN-2018-43,ISO-8859-9,1910576,1891561,0.0628\nCC-MAIN-2018-43,KOI8-R,613107,611294,0.0202\nCC-MAIN-2018-43,KOI8-U,10718,10684,0.0004\nCC-MAIN-2018-43,Shift_JIS,17004646,16867151,0.5590\nCC-MAIN-2018-43,TIS-620,521696,519774,0.0172\nCC-MAIN-2018-43,US-ASCII,908489,903803,0.0299\nCC-MAIN-2018-43,UTF-16,94184,93528,0.0031\nCC-MAIN-2018-43,UTF-16BE,1066,1058,0.0000\nCC-MAIN-2018-43,UTF-16LE,55051,54654,0.0018\nCC-MAIN-2018-43,UTF-32,3065,2857,0.0001\nCC-MAIN-2018-43,UTF-32LE,1,1,0.0000\nCC-MAIN-2018-43,UTF-8,2561682128,2531944964,84.2164\nCC-MAIN-2018-43,windows-1250,5025383,4988293,0.1652\nCC-MAIN-2018-43,windows-1251,63017227,62744099,2.0717\nCC-MAIN-2018-43,windows-1252,27484876,27129540,0.9036\nCC-MAIN-2018-43,windows-1253,157717,155235,0.0052\nCC-MAIN-2018-43,windows-1254,1151708,1143715,0.0379\nCC-MAIN-2018-43,windows-1255,513551,511398,0.0169\nCC-MAIN-2018-43,windows-1256,5778327,5762054,0.1900\nCC-MAIN-2018-43,windows-1257,328551,327105,0.0108\nCC-MAIN-2018-43,windows-31j,124992,124269,0.0041\nCC-MAIN-2018-43,x-MacCyrillic,153785,153249,0.0051\nCC-MAIN-2018-43,x-iso-8859-11,1246,1239,0.0000\nCC-MAIN-2018-43,x-windows-874,467192,465066,0.0154\nCC-MAIN-2018-43,x-windows-949,2915,2903,0.0001\nCC-MAIN-2018-47,<other>,6127,6089,0.0002\nCC-MAIN-2018-47,<unknown>,55767519,55767519,2.1072\nCC-MAI
N-2018-47,Big5,2790341,2778870,0.1054\nCC-MAIN-2018-47,Big5-HKSCS,7554,7549,0.0003\nCC-MAIN-2018-47,EUC-JP,9774292,9707913,0.3693\nCC-MAIN-2018-47,EUC-KR,3977836,3966968,0.1503\nCC-MAIN-2018-47,GB18030,1801683,1796763,0.0681\nCC-MAIN-2018-47,GB2312,27965419,27879814,1.0567\nCC-MAIN-2018-47,GBK,12112024,11991049,0.4577\nCC-MAIN-2018-47,IBM500,13,13,0.0000\nCC-MAIN-2018-47,IBM855,7254,7237,0.0003\nCC-MAIN-2018-47,IBM866,39087,39014,0.0015\nCC-MAIN-2018-47,ISO-2022-JP,48184,47996,0.0018\nCC-MAIN-2018-47,ISO-8859-1,142054924,140845987,5.3675\nCC-MAIN-2018-47,ISO-8859-13,8277,8264,0.0003\nCC-MAIN-2018-47,ISO-8859-15,6899189,6835127,0.2607\nCC-MAIN-2018-47,ISO-8859-2,8017077,7978512,0.3029\nCC-MAIN-2018-47,ISO-8859-3,8018,7806,0.0003\nCC-MAIN-2018-47,ISO-8859-4,26626,26357,0.0010\nCC-MAIN-2018-47,ISO-8859-5,48637,48474,0.0018\nCC-MAIN-2018-47,ISO-8859-6,3883,3788,0.0001\nCC-MAIN-2018-47,ISO-8859-7,577015,574581,0.0218\nCC-MAIN-2018-47,ISO-8859-8,37380,37042,0.0014\nCC-MAIN-2018-47,ISO-8859-9,1668202,1654680,0.0630\nCC-MAIN-2018-47,KOI8-R,527750,526308,0.0199\nCC-MAIN-2018-47,KOI8-U,5822,5805,0.0002\nCC-MAIN-2018-47,Shift_JIS,17775853,17651965,0.6717\nCC-MAIN-2018-47,TIS-620,494862,493188,0.0187\nCC-MAIN-2018-47,US-ASCII,976406,972169,0.0369\nCC-MAIN-2018-47,UTF-16,101666,101006,0.0038\nCC-MAIN-2018-47,UTF-16BE,3016,2998,0.0001\nCC-MAIN-2018-47,UTF-16LE,124453,123860,0.0047\nCC-MAIN-2018-47,UTF-32,1659,1655,0.0001\nCC-MAIN-2018-47,UTF-32LE,4,4,0.0000\nCC-MAIN-2018-47,UTF-8,2254096587,2223908358,85.1705\nCC-MAIN-2018-47,windows-1250,4792766,4762591,0.1811\nCC-MAIN-2018-47,windows-1251,56380684,56131078,2.1303\nCC-MAIN-2018-47,windows-1252,30279903,30038880,1.1441\nCC-MAIN-2018-47,windows-1253,185084,184226,0.0070\nCC-MAIN-2018-47,windows-1254,1054047,1044938,0.0398\nCC-MAIN-2018-47,windows-1255,548488,545486,0.0207\nCC-MAIN-2018-47,windows-1256,4592998,4579351,0.1735\nCC-MAIN-2018-47,windows-1257,306603,305627,0.0116\nCC-MAIN-2018-47,windows-31j,40270,39887,0.0015\nCC-MAIN-
2018-47,x-MacCyrillic,155965,155501,0.0059\nCC-MAIN-2018-47,x-iso-8859-11,1046,1042,0.0000\nCC-MAIN-2018-47,x-windows-874,474844,472732,0.0179\nCC-MAIN-2018-47,x-windows-949,1207,1204,0.0000\nCC-MAIN-2018-51,<other>,5434,5310,0.0002\nCC-MAIN-2018-51,<unknown>,67918443,67918443,2.1464\nCC-MAIN-2018-51,Big5,3198731,3192058,0.1011\nCC-MAIN-2018-51,Big5-HKSCS,7420,7413,0.0002\nCC-MAIN-2018-51,EUC-JP,11510303,11444574,0.3638\nCC-MAIN-2018-51,EUC-KR,5156694,5145873,0.1630\nCC-MAIN-2018-51,GB18030,2108204,2100620,0.0666\nCC-MAIN-2018-51,GB2312,34060489,33961559,1.0764\nCC-MAIN-2018-51,GBK,14267277,14133734,0.4509\nCC-MAIN-2018-51,IBM500,14,14,0.0000\nCC-MAIN-2018-51,IBM855,8790,8749,0.0003\nCC-MAIN-2018-51,IBM866,21650,21558,0.0007\nCC-MAIN-2018-51,ISO-2022-JP,54514,54198,0.0017\nCC-MAIN-2018-51,ISO-8859-1,165450495,164209215,5.2287\nCC-MAIN-2018-51,ISO-8859-13,11879,11863,0.0004\nCC-MAIN-2018-51,ISO-8859-15,7416805,7356975,0.2344\nCC-MAIN-2018-51,ISO-8859-2,9324792,9288112,0.2947\nCC-MAIN-2018-51,ISO-8859-3,8774,8519,0.0003\nCC-MAIN-2018-51,ISO-8859-4,38938,38465,0.0012\nCC-MAIN-2018-51,ISO-8859-5,70744,70595,0.0022\nCC-MAIN-2018-51,ISO-8859-6,5659,5583,0.0002\nCC-MAIN-2018-51,ISO-8859-7,685186,682886,0.0217\nCC-MAIN-2018-51,ISO-8859-8,38166,37985,0.0012\nCC-MAIN-2018-51,ISO-8859-9,1930121,1919080,0.0610\nCC-MAIN-2018-51,KOI8-R,537503,535927,0.0170\nCC-MAIN-2018-51,KOI8-U,11745,11733,0.0004\nCC-MAIN-2018-51,Shift_JIS,19098046,18951922,0.6036\nCC-MAIN-2018-51,TIS-620,534131,530719,0.0169\nCC-MAIN-2018-51,US-ASCII,1189365,1184488,0.0376\nCC-MAIN-2018-51,UTF-16,104806,103897,0.0033\nCC-MAIN-2018-51,UTF-16BE,2022,2006,0.0001\nCC-MAIN-2018-51,UTF-16LE,89907,89319,0.0028\nCC-MAIN-2018-51,UTF-32,3001,2973,0.0001\nCC-MAIN-2018-51,UTF-32LE,3,3,0.0000\nCC-MAIN-2018-51,UTF-8,2709480994,2675024546,85.6280\nCC-MAIN-2018-51,windows-1250,5520909,5484030,0.1745\nCC-MAIN-2018-51,windows-1251,63095858,62861645,1.9940\nCC-MAIN-2018-51,windows-1252,32645988,32373077,1.0317\nCC-MAIN-2018-51,w
indows-1253,200227,199112,0.0063\nCC-MAIN-2018-51,windows-1254,1170301,1162882,0.0370\nCC-MAIN-2018-51,windows-1255,571370,568689,0.0181\nCC-MAIN-2018-51,windows-1256,5537481,5526621,0.1750\nCC-MAIN-2018-51,windows-1257,362375,361109,0.0115\nCC-MAIN-2018-51,windows-31j,52007,51652,0.0016\nCC-MAIN-2018-51,x-MacCyrillic,183894,183394,0.0058\nCC-MAIN-2018-51,x-iso-8859-11,1976,1971,0.0001\nCC-MAIN-2018-51,x-windows-874,553449,551004,0.0175\nCC-MAIN-2018-51,x-windows-949,755,752,0.0000\nCC-MAIN-2019-04,<other>,3120,3082,0.0001\nCC-MAIN-2019-04,<unknown>,56503746,56503746,1.9553\nCC-MAIN-2019-04,Big5,2878045,2871541,0.0996\nCC-MAIN-2019-04,Big5-HKSCS,7104,7100,0.0002\nCC-MAIN-2019-04,EUC-JP,10508300,10442940,0.3636\nCC-MAIN-2019-04,EUC-KR,4795172,4786966,0.1659\nCC-MAIN-2019-04,GB18030,1680438,1675010,0.0582\nCC-MAIN-2019-04,GB2312,27128941,27048116,0.9388\nCC-MAIN-2019-04,GBK,13403477,13249104,0.4638\nCC-MAIN-2019-04,IBM500,16,16,0.0000\nCC-MAIN-2019-04,IBM855,6424,6409,0.0002\nCC-MAIN-2019-04,IBM866,28380,28250,0.0010\nCC-MAIN-2019-04,ISO-2022-JP,29239,29129,0.0010\nCC-MAIN-2019-04,ISO-8859-1,136386399,135497182,4.7197\nCC-MAIN-2019-04,ISO-8859-13,10370,10364,0.0004\nCC-MAIN-2019-04,ISO-8859-15,6704567,6663103,0.2320\nCC-MAIN-2019-04,ISO-8859-2,8600526,8572722,0.2976\nCC-MAIN-2019-04,ISO-8859-3,7482,7454,0.0003\nCC-MAIN-2019-04,ISO-8859-4,31424,31155,0.0011\nCC-MAIN-2019-04,ISO-8859-5,52251,52151,0.0018\nCC-MAIN-2019-04,ISO-8859-6,5390,5333,0.0002\nCC-MAIN-2019-04,ISO-8859-7,612931,611640,0.0212\nCC-MAIN-2019-04,ISO-8859-8,33345,33179,0.0012\nCC-MAIN-2019-04,ISO-8859-9,1762983,1750864,0.0610\nCC-MAIN-2019-04,KOI8-R,462591,461567,0.0160\nCC-MAIN-2019-04,KOI8-U,6379,6366,0.0002\nCC-MAIN-2019-04,Shift_JIS,13894174,13782816,0.4808\nCC-MAIN-2019-04,TIS-620,497731,495783,0.0172\nCC-MAIN-2019-04,US-ASCII,911526,908432,0.0315\nCC-MAIN-2019-04,UTF-16,96192,95614,0.0033\nCC-MAIN-2019-04,UTF-16BE,3482,3470,0.0001\nCC-MAIN-2019-04,UTF-16LE,78727,78283,0.0027\nCC-MAIN-2019-04,UTF-3
2,1752,1747,0.0001\nCC-MAIN-2019-04,UTF-32LE,2,2,0.0000\nCC-MAIN-2019-04,UTF-8,2513543714,2488208780,86.9821\nCC-MAIN-2019-04,windows-1250,4940236,4902965,0.1710\nCC-MAIN-2019-04,windows-1251,52540303,52361966,1.8182\nCC-MAIN-2019-04,windows-1252,23687194,23512000,0.8197\nCC-MAIN-2019-04,windows-1253,160253,159449,0.0055\nCC-MAIN-2019-04,windows-1254,1056744,1048268,0.0366\nCC-MAIN-2019-04,windows-1255,577473,573752,0.0200\nCC-MAIN-2019-04,windows-1256,5091584,5084020,0.1762\nCC-MAIN-2019-04,windows-1257,313376,312112,0.0108\nCC-MAIN-2019-04,windows-31j,34902,34751,0.0012\nCC-MAIN-2019-04,x-MacCyrillic,155159,154951,0.0054\nCC-MAIN-2019-04,x-iso-8859-11,1823,1818,0.0001\nCC-MAIN-2019-04,x-windows-874,489725,488206,0.0169\nCC-MAIN-2019-04,x-windows-949,1530,1527,0.0001\nCC-MAIN-2019-09,<other>,5224,5204,0.0002\nCC-MAIN-2019-09,<unknown>,73070673,73070673,2.5078\nCC-MAIN-2019-09,Big5,2309155,2304493,0.0793\nCC-MAIN-2019-09,Big5-HKSCS,10904,10902,0.0004\nCC-MAIN-2019-09,EUC-JP,10037847,9987065,0.3445\nCC-MAIN-2019-09,EUC-KR,5151976,5144548,0.1768\nCC-MAIN-2019-09,GB18030,2492998,2487624,0.0856\nCC-MAIN-2019-09,GB2312,31674710,31561548,1.0871\nCC-MAIN-2019-09,GBK,14497541,14438247,0.4976\nCC-MAIN-2019-09,IBM500,12,12,0.0000\nCC-MAIN-2019-09,IBM855,8107,8090,0.0003\nCC-MAIN-2019-09,IBM866,38197,38113,0.0013\nCC-MAIN-2019-09,ISO-2022-JP,52718,52570,0.0018\nCC-MAIN-2019-09,ISO-8859-1,138321842,137383366,4.7472\nCC-MAIN-2019-09,ISO-8859-13,12181,12173,0.0004\nCC-MAIN-2019-09,ISO-8859-15,5747873,5699996,0.1973\nCC-MAIN-2019-09,ISO-8859-2,6815550,6787862,0.2339\nCC-MAIN-2019-09,ISO-8859-3,7879,7861,0.0003\nCC-MAIN-2019-09,ISO-8859-4,36292,36120,0.0012\nCC-MAIN-2019-09,ISO-8859-5,39640,39473,0.0014\nCC-MAIN-2019-09,ISO-8859-6,7344,7289,0.0003\nCC-MAIN-2019-09,ISO-8859-7,478358,476736,0.0164\nCC-MAIN-2019-09,ISO-8859-8,40576,40433,0.0014\nCC-MAIN-2019-09,ISO-8859-9,1736351,1728776,0.0596\nCC-MAIN-2019-09,KOI8-R,444018,442834,0.0152\nCC-MAIN-2019-09,KOI8-U,9516,9466,0.0003\nCC-M
AIN-2019-09,Shift_JIS,16108058,16021754,0.5528\nCC-MAIN-2019-09,TIS-620,508480,504974,0.0175\nCC-MAIN-2019-09,US-ASCII,1346025,1341118,0.0462\nCC-MAIN-2019-09,UTF-16,88134,87577,0.0030\nCC-MAIN-2019-09,UTF-16BE,1883,1871,0.0001\nCC-MAIN-2019-09,UTF-16LE,72702,71939,0.0025\nCC-MAIN-2019-09,UTF-32,2404,2399,0.0001\nCC-MAIN-2019-09,UTF-32LE,5,5,0.0000\nCC-MAIN-2019-09,UTF-8,2509946310,2483068828,86.1419\nCC-MAIN-2019-09,windows-1250,5160717,5124276,0.1771\nCC-MAIN-2019-09,windows-1251,53727061,53506185,1.8439\nCC-MAIN-2019-09,windows-1252,26780002,26613572,0.9191\nCC-MAIN-2019-09,windows-1253,201865,201148,0.0069\nCC-MAIN-2019-09,windows-1254,1108301,1103985,0.0380\nCC-MAIN-2019-09,windows-1255,589639,587888,0.0202\nCC-MAIN-2019-09,windows-1256,3915782,3904965,0.1344\nCC-MAIN-2019-09,windows-1257,311587,310223,0.0107\nCC-MAIN-2019-09,windows-31j,37304,37078,0.0013\nCC-MAIN-2019-09,x-MacCyrillic,171504,171205,0.0059\nCC-MAIN-2019-09,x-iso-8859-11,1665,1661,0.0001\nCC-MAIN-2019-09,x-windows-874,605446,603414,0.0208\nCC-MAIN-2019-09,x-windows-949,1066,1065,0.0000\nCC-MAIN-2019-13,<other>,4750,4726,0.0002\nCC-MAIN-2019-13,<unknown>,51039369,51039369,1.9862\nCC-MAIN-2019-13,Big5,2275470,2270015,0.0886\nCC-MAIN-2019-13,Big5-HKSCS,9866,9855,0.0004\nCC-MAIN-2019-13,EUC-JP,8374619,8328170,0.3259\nCC-MAIN-2019-13,EUC-KR,4121011,4115401,0.1604\nCC-MAIN-2019-13,GB18030,1690480,1681689,0.0658\nCC-MAIN-2019-13,GB2312,29370741,29115261,1.1430\nCC-MAIN-2019-13,GBK,15298597,15210826,0.5953\nCC-MAIN-2019-13,IBM500,14,14,0.0000\nCC-MAIN-2019-13,IBM855,7419,7402,0.0003\nCC-MAIN-2019-13,IBM866,23682,23623,0.0009\nCC-MAIN-2019-13,ISO-2022-JP,57461,57321,0.0022\nCC-MAIN-2019-13,ISO-8859-1,121960972,121028763,4.7462\nCC-MAIN-2019-13,ISO-8859-13,9299,9285,0.0004\nCC-MAIN-2019-13,ISO-8859-15,4314702,4271842,0.1679\nCC-MAIN-2019-13,ISO-8859-2,5778135,5751412,0.2249\nCC-MAIN-2019-13,ISO-8859-3,7298,7274,0.0003\nCC-MAIN-2019-13,ISO-8859-4,25136,24935,0.0010\nCC-MAIN-2019-13,ISO-8859-5,42243,42083,
0.0016\nCC-MAIN-2019-13,ISO-8859-6,6892,6844,0.0003\nCC-MAIN-2019-13,ISO-8859-7,396305,395256,0.0154\nCC-MAIN-2019-13,ISO-8859-8,28807,28593,0.0011\nCC-MAIN-2019-13,ISO-8859-9,1385891,1378977,0.0539\nCC-MAIN-2019-13,KOI8-R,418342,410410,0.0163\nCC-MAIN-2019-13,KOI8-U,6506,6487,0.0003\nCC-MAIN-2019-13,Shift_JIS,14498097,14418204,0.5642\nCC-MAIN-2019-13,TIS-620,403444,400940,0.0157\nCC-MAIN-2019-13,US-ASCII,1353350,1347901,0.0527\nCC-MAIN-2019-13,UTF-16,88761,88351,0.0035\nCC-MAIN-2019-13,UTF-16BE,2728,2638,0.0001\nCC-MAIN-2019-13,UTF-16LE,74555,74146,0.0029\nCC-MAIN-2019-13,UTF-32,1648,1642,0.0001\nCC-MAIN-2019-13,UTF-32LE,7,6,0.0000\nCC-MAIN-2019-13,UTF-8,2229318573,2204827915,86.7547\nCC-MAIN-2019-13,windows-1250,4367320,4342789,0.1700\nCC-MAIN-2019-13,windows-1251,42941566,42731991,1.6711\nCC-MAIN-2019-13,windows-1252,24382413,24184972,0.9488\nCC-MAIN-2019-13,windows-1253,177777,176871,0.0069\nCC-MAIN-2019-13,windows-1254,957525,951762,0.0373\nCC-MAIN-2019-13,windows-1255,537691,535663,0.0209\nCC-MAIN-2019-13,windows-1256,2975271,2965100,0.1158\nCC-MAIN-2019-13,windows-1257,224432,223975,0.0087\nCC-MAIN-2019-13,windows-31j,34861,34462,0.0014\nCC-MAIN-2019-13,x-MacCyrillic,138577,137548,0.0054\nCC-MAIN-2019-13,x-iso-8859-11,2548,2544,0.0001\nCC-MAIN-2019-13,x-windows-874,545751,543828,0.0212\nCC-MAIN-2019-13,x-windows-949,943,940,0.0000\nCC-MAIN-2019-18,<other>,5286,5260,0.0002\nCC-MAIN-2019-18,<unknown>,39545403,39545403,1.5832\nCC-MAIN-2019-18,Big5,1858154,1852213,0.0744\nCC-MAIN-2019-18,Big5-HKSCS,10541,10538,0.0004\nCC-MAIN-2019-18,EUC-JP,7416122,7373920,0.2969\nCC-MAIN-2019-18,EUC-KR,3389591,3384933,0.1357\nCC-MAIN-2019-18,GB18030,1466651,1455015,0.0587\nCC-MAIN-2019-18,GB2312,26847400,26636899,1.0748\nCC-MAIN-2019-18,GBK,13691300,13527396,0.5481\nCC-MAIN-2019-18,IBM500,13,13,0.0000\nCC-MAIN-2019-18,IBM855,9820,9807,0.0004\nCC-MAIN-2019-18,IBM866,26295,26229,0.0011\nCC-MAIN-2019-18,ISO-2022-JP,41715,41640,0.0017\nCC-MAIN-2019-18,ISO-8859-1,108347978,107517682,
4.3377\nCC-MAIN-2019-18,ISO-8859-13,5810,5807,0.0002\nCC-MAIN-2019-18,ISO-8859-15,4353462,4311103,0.1743\nCC-MAIN-2019-18,ISO-8859-2,5213051,5182143,0.2087\nCC-MAIN-2019-18,ISO-8859-3,5387,5139,0.0002\nCC-MAIN-2019-18,ISO-8859-4,24641,24395,0.0010\nCC-MAIN-2019-18,ISO-8859-5,48155,48055,0.0019\nCC-MAIN-2019-18,ISO-8859-6,9068,9025,0.0004\nCC-MAIN-2019-18,ISO-8859-7,348268,347295,0.0139\nCC-MAIN-2019-18,ISO-8859-8,26392,26285,0.0011\nCC-MAIN-2019-18,ISO-8859-9,1220179,1212710,0.0488\nCC-MAIN-2019-18,KOI8-R,368388,359362,0.0147\nCC-MAIN-2019-18,KOI8-U,7596,7584,0.0003\nCC-MAIN-2019-18,Shift_JIS,11705143,11638976,0.4686\nCC-MAIN-2019-18,TIS-620,349856,347165,0.0140\nCC-MAIN-2019-18,US-ASCII,1426268,1423382,0.0571\nCC-MAIN-2019-18,UTF-16,76456,76046,0.0031\nCC-MAIN-2019-18,UTF-16BE,1935,1873,0.0001\nCC-MAIN-2019-18,UTF-16LE,53329,53022,0.0021\nCC-MAIN-2019-18,UTF-32,1387,1385,0.0001\nCC-MAIN-2019-18,UTF-32LE,3,3,0.0000\nCC-MAIN-2019-18,UTF-8,2201291410,2177523946,88.1286\nCC-MAIN-2019-18,windows-1250,3779472,3758417,0.1513\nCC-MAIN-2019-18,windows-1251,40381447,40159222,1.6167\nCC-MAIN-2019-18,windows-1252,19497979,19337887,0.7806\nCC-MAIN-2019-18,windows-1253,159211,158538,0.0064\nCC-MAIN-2019-18,windows-1254,810043,805072,0.0324\nCC-MAIN-2019-18,windows-1255,470592,468818,0.0188\nCC-MAIN-2019-18,windows-1256,2682398,2672153,0.1074\nCC-MAIN-2019-18,windows-1257,170918,170245,0.0068\nCC-MAIN-2019-18,windows-31j,32261,32171,0.0013\nCC-MAIN-2019-18,x-MacCyrillic,125089,124466,0.0050\nCC-MAIN-2019-18,x-iso-8859-11,1692,1688,0.0001\nCC-MAIN-2019-18,x-windows-874,514486,511990,0.0206\nCC-MAIN-2019-18,x-windows-949,566,565,0.0000\nCC-MAIN-2019-22,<other>,4968,4943,0.0002\nCC-MAIN-2019-22,<unknown>,46863427,46863427,1.7488\nCC-MAIN-2019-22,Big5,2114327,2107121,0.0789\nCC-MAIN-2019-22,Big5-HKSCS,9414,9412,0.0004\nCC-MAIN-2019-22,EUC-JP,8118566,8075679,0.3030\nCC-MAIN-2019-22,EUC-KR,4245169,4237810,0.1584\nCC-MAIN-2019-22,GB18030,1916563,1904649,0.0715\nCC-MAIN-2019-22,GB2312,37
764375,37535054,1.4093\nCC-MAIN-2019-22,GBK,17754834,17582866,0.6626\nCC-MAIN-2019-22,IBM500,12,12,0.0000\nCC-MAIN-2019-22,IBM855,7195,7154,0.0003\nCC-MAIN-2019-22,IBM866,20834,20700,0.0008\nCC-MAIN-2019-22,ISO-2022-JP,34965,34899,0.0013\nCC-MAIN-2019-22,ISO-8859-1,112836792,112004100,4.2107\nCC-MAIN-2019-22,ISO-8859-13,7596,7591,0.0003\nCC-MAIN-2019-22,ISO-8859-15,4166799,4119990,0.1555\nCC-MAIN-2019-22,ISO-8859-2,5730823,5695820,0.2139\nCC-MAIN-2019-22,ISO-8859-3,4648,4637,0.0002\nCC-MAIN-2019-22,ISO-8859-4,26507,26305,0.0010\nCC-MAIN-2019-22,ISO-8859-5,73518,73425,0.0027\nCC-MAIN-2019-22,ISO-8859-6,9518,9422,0.0004\nCC-MAIN-2019-22,ISO-8859-7,389807,387105,0.0145\nCC-MAIN-2019-22,ISO-8859-8,27222,27070,0.0010\nCC-MAIN-2019-22,ISO-8859-9,1402019,1393732,0.0523\nCC-MAIN-2019-22,KOI8-R,347580,344349,0.0130\nCC-MAIN-2019-22,KOI8-U,7848,7833,0.0003\nCC-MAIN-2019-22,Shift_JIS,11346769,11275595,0.4234\nCC-MAIN-2019-22,TIS-620,412412,409685,0.0154\nCC-MAIN-2019-22,US-ASCII,1274724,1272200,0.0476\nCC-MAIN-2019-22,UTF-16,72452,71974,0.0027\nCC-MAIN-2019-22,UTF-16BE,1931,1871,0.0001\nCC-MAIN-2019-22,UTF-16LE,47776,47510,0.0018\nCC-MAIN-2019-22,UTF-32,1710,1654,0.0001\nCC-MAIN-2019-22,UTF-32LE,1,1,0.0000\nCC-MAIN-2019-22,UTF-8,2353847190,2328732692,87.8384\nCC-MAIN-2019-22,windows-1250,4126784,4099125,0.1540\nCC-MAIN-2019-22,windows-1251,39983416,39800506,1.4921\nCC-MAIN-2019-22,windows-1252,19001139,18857340,0.7091\nCC-MAIN-2019-22,windows-1253,165998,163797,0.0062\nCC-MAIN-2019-22,windows-1254,973150,963652,0.0363\nCC-MAIN-2019-22,windows-1255,532456,530369,0.0199\nCC-MAIN-2019-22,windows-1256,3143909,3129264,0.1173\nCC-MAIN-2019-22,windows-1257,221860,220732,0.0083\nCC-MAIN-2019-22,windows-31j,39772,39505,0.0015\nCC-MAIN-2019-22,x-MacCyrillic,126398,125348,0.0047\nCC-MAIN-2019-22,x-iso-8859-11,2023,2022,0.0001\nCC-MAIN-2019-22,x-windows-874,538205,535932,0.0201\nCC-MAIN-2019-22,x-windows-949,849,849,0.0000\nCC-MAIN-2019-26,<other>,2985,2953,0.0001\nCC-MAIN-2019-26,<unknow
n>,40453891,40453891,1.5594\nCC-MAIN-2019-26,Big5,1907242,1902387,0.0735\nCC-MAIN-2019-26,Big5-HKSCS,8496,8492,0.0003\nCC-MAIN-2019-26,EUC-JP,8057033,8019763,0.3106\nCC-MAIN-2019-26,EUC-KR,4083750,4075810,0.1574\nCC-MAIN-2019-26,GB18030,3065659,3050805,0.1182\nCC-MAIN-2019-26,GB2312,28766705,28485048,1.1089\nCC-MAIN-2019-26,GBK,14792756,14495897,0.5702\nCC-MAIN-2019-26,IBM500,9,9,0.0000\nCC-MAIN-2019-26,IBM855,6719,6622,0.0003\nCC-MAIN-2019-26,IBM866,23393,23041,0.0009\nCC-MAIN-2019-26,ISO-2022-JP,23340,23280,0.0009\nCC-MAIN-2019-26,ISO-8859-1,102272433,101552428,3.9423\nCC-MAIN-2019-26,ISO-8859-13,7510,7507,0.0003\nCC-MAIN-2019-26,ISO-8859-15,4666521,4621017,0.1799\nCC-MAIN-2019-26,ISO-8859-2,5584913,5556819,0.2153\nCC-MAIN-2019-26,ISO-8859-3,3968,3954,0.0002\nCC-MAIN-2019-26,ISO-8859-4,34092,33646,0.0013\nCC-MAIN-2019-26,ISO-8859-5,68089,68011,0.0026\nCC-MAIN-2019-26,ISO-8859-6,7863,7820,0.0003\nCC-MAIN-2019-26,ISO-8859-7,383549,380449,0.0148\nCC-MAIN-2019-26,ISO-8859-8,26514,26416,0.0010\nCC-MAIN-2019-26,ISO-8859-9,1298646,1290845,0.0501\nCC-MAIN-2019-26,KOI8-R,283874,282448,0.0109\nCC-MAIN-2019-26,KOI8-U,6344,6271,0.0002\nCC-MAIN-2019-26,Shift_JIS,9330788,9275830,0.3597\nCC-MAIN-2019-26,TIS-620,426501,424839,0.0164\nCC-MAIN-2019-26,US-ASCII,1110555,1108819,0.0428\nCC-MAIN-2019-26,UTF-16,76735,75942,0.0030\nCC-MAIN-2019-26,UTF-16BE,1477,1444,0.0001\nCC-MAIN-2019-26,UTF-16LE,28998,28827,0.0011\nCC-MAIN-2019-26,UTF-32,1810,1760,0.0001\nCC-MAIN-2019-26,UTF-32LE,1,1,0.0000\nCC-MAIN-2019-26,UTF-8,2306319918,2285269523,88.9008\nCC-MAIN-2019-26,windows-1250,3920225,3897007,0.1511\nCC-MAIN-2019-26,windows-1251,36374114,36209887,1.4021\nCC-MAIN-2019-26,windows-1252,15090729,14990992,0.5817\nCC-MAIN-2019-26,windows-1253,145595,144931,0.0056\nCC-MAIN-2019-26,windows-1254,914768,903513,0.0353\nCC-MAIN-2019-26,windows-1255,628662,625767,0.0242\nCC-MAIN-2019-26,windows-1256,3147674,3135791,0.1213\nCC-MAIN-2019-26,windows-1257,232978,231485,0.0090\nCC-MAIN-2019-26,windows-31j,5
8970,58111,0.0023\nCC-MAIN-2019-26,x-MacCyrillic,111476,110995,0.0043\nCC-MAIN-2019-26,x-iso-8859-11,1410,1406,0.0001\nCC-MAIN-2019-26,x-windows-874,500850,499566,0.0193\nCC-MAIN-2019-26,x-windows-949,589,585,0.0000\nCC-MAIN-2019-30,<other>,3015,2992,0.0001\nCC-MAIN-2019-30,<unknown>,30026440,30026440,1.1572\nCC-MAIN-2019-30,Big5,1840594,1834540,0.0709\nCC-MAIN-2019-30,Big5-HKSCS,7869,7866,0.0003\nCC-MAIN-2019-30,EUC-JP,7317903,7280775,0.2820\nCC-MAIN-2019-30,EUC-KR,3787271,3778885,0.1460\nCC-MAIN-2019-30,GB18030,2001230,1983853,0.0771\nCC-MAIN-2019-30,GB2312,29216429,28935636,1.1260\nCC-MAIN-2019-30,GBK,16738888,16419697,0.6451\nCC-MAIN-2019-30,IBM500,14,14,0.0000\nCC-MAIN-2019-30,IBM855,7465,7420,0.0003\nCC-MAIN-2019-30,IBM866,26101,26039,0.0010\nCC-MAIN-2019-30,ISO-2022-JP,20167,20137,0.0008\nCC-MAIN-2019-30,ISO-8859-1,98723653,98007577,3.8047\nCC-MAIN-2019-30,ISO-8859-13,7853,7845,0.0003\nCC-MAIN-2019-30,ISO-8859-15,5031316,4980591,0.1939\nCC-MAIN-2019-30,ISO-8859-2,5110326,5083583,0.1969\nCC-MAIN-2019-30,ISO-8859-3,4386,4368,0.0002\nCC-MAIN-2019-30,ISO-8859-4,32048,31718,0.0012\nCC-MAIN-2019-30,ISO-8859-5,58457,58270,0.0023\nCC-MAIN-2019-30,ISO-8859-6,8011,7966,0.0003\nCC-MAIN-2019-30,ISO-8859-7,358069,355628,0.0138\nCC-MAIN-2019-30,ISO-8859-8,22781,22709,0.0009\nCC-MAIN-2019-30,ISO-8859-9,1216842,1209106,0.0469\nCC-MAIN-2019-30,KOI8-R,267930,266646,0.0103\nCC-MAIN-2019-30,KOI8-U,6798,6789,0.0003\nCC-MAIN-2019-30,Shift_JIS,8575703,8514296,0.3305\nCC-MAIN-2019-30,TIS-620,383243,381517,0.0148\nCC-MAIN-2019-30,US-ASCII,1051410,1048736,0.0405\nCC-MAIN-2019-30,UTF-16,87728,87204,0.0034\nCC-MAIN-2019-30,UTF-16BE,2134,2124,0.0001\nCC-MAIN-2019-30,UTF-16LE,18042,17861,0.0007\nCC-MAIN-2019-30,UTF-32,1897,1705,0.0001\nCC-MAIN-2019-30,UTF-8,2326454221,2304488544,89.6584\nCC-MAIN-2019-30,windows-1250,3866661,3842799,0.1490\nCC-MAIN-2019-30,windows-1251,33124425,32973228,1.2766\nCC-MAIN-2019-30,windows-1252,13838772,13737200,0.5333\nCC-MAIN-2019-30,windows-1253,140509,14006
8,0.0054\nCC-MAIN-2019-30,windows-1254,885756,876081,0.0341\nCC-MAIN-2019-30,windows-1255,641886,638864,0.0247\nCC-MAIN-2019-30,windows-1256,2975692,2965036,0.1147\nCC-MAIN-2019-30,windows-1257,247624,246395,0.0095\nCC-MAIN-2019-30,windows-31j,77300,76864,0.0030\nCC-MAIN-2019-30,x-MacCyrillic,111290,110635,0.0043\nCC-MAIN-2019-30,x-iso-8859-11,1270,1269,0.0000\nCC-MAIN-2019-30,x-windows-874,470056,466601,0.0181\nCC-MAIN-2019-30,x-windows-949,900,898,0.0000\nCC-MAIN-2019-35,<other>,3320,3301,0.0001\nCC-MAIN-2019-35,<unknown>,32202508,32202508,1.0898\nCC-MAIN-2019-35,Big5,1988059,1982152,0.0673\nCC-MAIN-2019-35,Big5-HKSCS,8543,8539,0.0003\nCC-MAIN-2019-35,EUC-JP,7637465,7591120,0.2585\nCC-MAIN-2019-35,EUC-KR,4663964,4650064,0.1578\nCC-MAIN-2019-35,GB18030,2380719,2359272,0.0806\nCC-MAIN-2019-35,GB2312,42877030,42483833,1.4511\nCC-MAIN-2019-35,GBK,36126613,35730816,1.2226\nCC-MAIN-2019-35,IBM500,10,10,0.0000\nCC-MAIN-2019-35,IBM855,7398,7367,0.0003\nCC-MAIN-2019-35,IBM866,27254,27130,0.0009\nCC-MAIN-2019-35,ISO-2022-JP,30744,30590,0.0010\nCC-MAIN-2019-35,ISO-8859-1,106567851,105801841,3.6066\nCC-MAIN-2019-35,ISO-8859-13,16695,16690,0.0006\nCC-MAIN-2019-35,ISO-8859-15,4880299,4825997,0.1652\nCC-MAIN-2019-35,ISO-8859-2,5885857,5854922,0.1992\nCC-MAIN-2019-35,ISO-8859-3,3471,3467,0.0001\nCC-MAIN-2019-35,ISO-8859-4,50112,49735,0.0017\nCC-MAIN-2019-35,ISO-8859-5,65960,65850,0.0022\nCC-MAIN-2019-35,ISO-8859-6,12789,12607,0.0004\nCC-MAIN-2019-35,ISO-8859-7,402205,399630,0.0136\nCC-MAIN-2019-35,ISO-8859-8,30417,30286,0.0010\nCC-MAIN-2019-35,ISO-8859-9,1393901,1385884,0.0472\nCC-MAIN-2019-35,KOI8-R,282815,281820,0.0096\nCC-MAIN-2019-35,KOI8-U,4755,4747,0.0002\nCC-MAIN-2019-35,Shift_JIS,9422487,9354153,0.3189\nCC-MAIN-2019-35,TIS-620,436930,435237,0.0148\nCC-MAIN-2019-35,US-ASCII,1031285,1028965,0.0349\nCC-MAIN-2019-35,UTF-16,99924,98930,0.0034\nCC-MAIN-2019-35,UTF-16BE,2116,2108,0.0001\nCC-MAIN-2019-35,UTF-16LE,27443,27243,0.0009\nCC-MAIN-2019-35,UTF-32,2584,2476,0.0001\nCC-MAI
N-2019-35,UTF-32LE,2,2,0.0000\nCC-MAIN-2019-35,UTF-8,2635346008,2610600587,89.1876\nCC-MAIN-2019-35,windows-1250,3951657,3929786,0.1337\nCC-MAIN-2019-35,windows-1251,34846898,34684908,1.1793\nCC-MAIN-2019-35,windows-1252,15593679,15466247,0.5277\nCC-MAIN-2019-35,windows-1253,175283,174762,0.0059\nCC-MAIN-2019-35,windows-1254,985216,974651,0.0333\nCC-MAIN-2019-35,windows-1255,827097,823489,0.0280\nCC-MAIN-2019-35,windows-1256,3432212,3419195,0.1162\nCC-MAIN-2019-35,windows-1257,357600,355393,0.0121\nCC-MAIN-2019-35,windows-31j,69178,68990,0.0023\nCC-MAIN-2019-35,x-MacCyrillic,115937,114997,0.0039\nCC-MAIN-2019-35,x-iso-8859-11,2491,2486,0.0001\nCC-MAIN-2019-35,x-windows-874,558167,554938,0.0189\nCC-MAIN-2019-35,x-windows-949,1117,1114,0.0000\nCC-MAIN-2019-39,<other>,3102,3088,0.0001\nCC-MAIN-2019-39,<unknown>,51214718,51214718,1.9997\nCC-MAIN-2019-39,Big5,1662412,1656484,0.0649\nCC-MAIN-2019-39,Big5-HKSCS,11241,11239,0.0004\nCC-MAIN-2019-39,EUC-JP,6657154,6620897,0.2599\nCC-MAIN-2019-39,EUC-KR,3740983,3733788,0.1461\nCC-MAIN-2019-39,GB18030,1946824,1912166,0.0760\nCC-MAIN-2019-39,GB2312,28523770,28140317,1.1137\nCC-MAIN-2019-39,GBK,21765704,21326745,0.8499\nCC-MAIN-2019-39,IBM500,8,8,0.0000\nCC-MAIN-2019-39,IBM855,5749,5724,0.0002\nCC-MAIN-2019-39,IBM866,18855,18744,0.0007\nCC-MAIN-2019-39,ISO-2022-JP,16892,16867,0.0007\nCC-MAIN-2019-39,ISO-8859-1,92311849,91649146,3.6044\nCC-MAIN-2019-39,ISO-8859-13,13920,13916,0.0005\nCC-MAIN-2019-39,ISO-8859-15,4433324,4388602,0.1731\nCC-MAIN-2019-39,ISO-8859-2,5465900,5436126,0.2134\nCC-MAIN-2019-39,ISO-8859-3,5592,5575,0.0002\nCC-MAIN-2019-39,ISO-8859-4,49925,49678,0.0019\nCC-MAIN-2019-39,ISO-8859-5,60446,60353,0.0024\nCC-MAIN-2019-39,ISO-8859-6,12282,12162,0.0005\nCC-MAIN-2019-39,ISO-8859-7,344776,342931,0.0135\nCC-MAIN-2019-39,ISO-8859-8,28421,28249,0.0011\nCC-MAIN-2019-39,ISO-8859-9,1249981,1242659,0.0488\nCC-MAIN-2019-39,KOI8-R,231624,231007,0.0090\nCC-MAIN-2019-39,KOI8-U,3475,3474,0.0001\nCC-MAIN-2019-39,Shift_JIS,7879945,7
837418,0.3077\nCC-MAIN-2019-39,TIS-620,387297,384876,0.0151\nCC-MAIN-2019-39,US-ASCII,1092812,1087857,0.0427\nCC-MAIN-2019-39,UTF-16,88200,87817,0.0034\nCC-MAIN-2019-39,UTF-16BE,1054,1032,0.0000\nCC-MAIN-2019-39,UTF-16LE,17460,17366,0.0007\nCC-MAIN-2019-39,UTF-32,1971,1901,0.0001\nCC-MAIN-2019-39,UTF-32LE,1,1,0.0000\nCC-MAIN-2019-39,UTF-8,2279847342,2259633933,89.0196\nCC-MAIN-2019-39,windows-1250,4195074,4169420,0.1638\nCC-MAIN-2019-39,windows-1251,28402934,28263939,1.1090\nCC-MAIN-2019-39,windows-1252,13338428,13252165,0.5208\nCC-MAIN-2019-39,windows-1253,141359,140738,0.0055\nCC-MAIN-2019-39,windows-1254,903946,892843,0.0353\nCC-MAIN-2019-39,windows-1255,864449,860423,0.0338\nCC-MAIN-2019-39,windows-1256,3109658,3095537,0.1214\nCC-MAIN-2019-39,windows-1257,382749,380612,0.0149\nCC-MAIN-2019-39,windows-31j,63073,62867,0.0025\nCC-MAIN-2019-39,x-MacCyrillic,111324,110828,0.0043\nCC-MAIN-2019-39,x-iso-8859-11,1419,1418,0.0001\nCC-MAIN-2019-39,x-windows-874,452276,451640,0.0177\nCC-MAIN-2019-39,x-windows-949,1214,1211,0.0000\nCC-MAIN-2019-43,<other>,3004,2993,0.0001\nCC-MAIN-2019-43,<unknown>,37914225,37914225,1.2558\nCC-MAIN-2019-43,Big5,2359825,2352480,0.0782\nCC-MAIN-2019-43,Big5-HKSCS,19447,19441,0.0006\nCC-MAIN-2019-43,EUC-JP,7613133,7573651,0.2522\nCC-MAIN-2019-43,EUC-KR,4713043,4703292,0.1561\nCC-MAIN-2019-43,GB18030,2564504,2533654,0.0849\nCC-MAIN-2019-43,GB2312,50371192,49974212,1.6685\nCC-MAIN-2019-43,GBK,33671600,33290777,1.1153\nCC-MAIN-2019-43,IBM500,11,11,0.0000\nCC-MAIN-2019-43,IBM855,10452,10416,0.0003\nCC-MAIN-2019-43,IBM866,17156,17047,0.0006\nCC-MAIN-2019-43,ISO-2022-JP,17239,17120,0.0006\nCC-MAIN-2019-43,ISO-8859-1,110727645,109904997,3.6676\nCC-MAIN-2019-43,ISO-8859-13,11916,11914,0.0004\nCC-MAIN-2019-43,ISO-8859-15,3773306,3723106,0.1250\nCC-MAIN-2019-43,ISO-8859-2,6567560,6532123,0.2175\nCC-MAIN-2019-43,ISO-8859-3,15364,15326,0.0005\nCC-MAIN-2019-43,ISO-8859-4,60112,59807,0.0020\nCC-MAIN-2019-43,ISO-8859-5,86684,86538,0.0029\nCC-MAIN-2019-43,ISO
-8859-6,12349,12260,0.0004\nCC-MAIN-2019-43,ISO-8859-7,418379,412741,0.0139\nCC-MAIN-2019-43,ISO-8859-8,23091,23034,0.0008\nCC-MAIN-2019-43,ISO-8859-9,1354451,1346958,0.0449\nCC-MAIN-2019-43,KOI8-R,301949,300458,0.0100\nCC-MAIN-2019-43,KOI8-U,5249,5243,0.0002\nCC-MAIN-2019-43,Shift_JIS,10027447,9958281,0.3321\nCC-MAIN-2019-43,TIS-620,612670,596770,0.0203\nCC-MAIN-2019-43,US-ASCII,1174526,1172617,0.0389\nCC-MAIN-2019-43,UTF-16,114301,113875,0.0038\nCC-MAIN-2019-43,UTF-16BE,1198,1151,0.0000\nCC-MAIN-2019-43,UTF-16LE,19188,19060,0.0006\nCC-MAIN-2019-43,UTF-32,1889,1846,0.0001\nCC-MAIN-2019-43,UTF-32LE,5,5,0.0000\nCC-MAIN-2019-43,UTF-8,2685611162,2662490705,88.9559\nCC-MAIN-2019-43,windows-1250,4387881,4357537,0.1453\nCC-MAIN-2019-43,windows-1251,32271777,32103269,1.0689\nCC-MAIN-2019-43,windows-1252,15661410,15555070,0.5188\nCC-MAIN-2019-43,windows-1253,160598,160267,0.0053\nCC-MAIN-2019-43,windows-1254,896358,888585,0.0297\nCC-MAIN-2019-43,windows-1255,873843,867247,0.0289\nCC-MAIN-2019-43,windows-1256,3348831,3332815,0.1109\nCC-MAIN-2019-43,windows-1257,386227,383426,0.0128\nCC-MAIN-2019-43,windows-31j,93841,93453,0.0031\nCC-MAIN-2019-43,x-MacCyrillic,116017,115088,0.0038\nCC-MAIN-2019-43,x-iso-8859-11,1825,1824,0.0001\nCC-MAIN-2019-43,x-windows-874,641397,640623,0.0212\nCC-MAIN-2019-43,x-windows-949,1252,1249,0.0000\nCC-MAIN-2019-47,<other>,2965,2953,0.0001\nCC-MAIN-2019-47,<unknown>,36236307,36236307,1.3988\nCC-MAIN-2019-47,Big5,1698075,1693658,0.0655\nCC-MAIN-2019-47,Big5-HKSCS,17285,17284,0.0007\nCC-MAIN-2019-47,EUC-JP,6116548,6087748,0.2361\nCC-MAIN-2019-47,EUC-KR,3587831,3578481,0.1385\nCC-MAIN-2019-47,GB18030,2479348,2467026,0.0957\nCC-MAIN-2019-47,GB2312,35257790,35024243,1.3610\nCC-MAIN-2019-47,GBK,16265453,16097461,0.6279\nCC-MAIN-2019-47,IBM500,11,11,0.0000\nCC-MAIN-2019-47,IBM855,6867,6845,0.0003\nCC-MAIN-2019-47,IBM866,13562,13473,0.0005\nCC-MAIN-2019-47,ISO-2022-JP,13354,13330,0.0005\nCC-MAIN-2019-47,ISO-8859-1,89199718,88478327,3.4432\nCC-MAIN-2019-47,
ISO-8859-13,7974,7968,0.0003\nCC-MAIN-2019-47,ISO-8859-15,3135090,3090247,0.1210\nCC-MAIN-2019-47,ISO-8859-2,5168253,5140795,0.1995\nCC-MAIN-2019-47,ISO-8859-3,6912,6884,0.0003\nCC-MAIN-2019-47,ISO-8859-4,40539,40221,0.0016\nCC-MAIN-2019-47,ISO-8859-5,55422,55087,0.0021\nCC-MAIN-2019-47,ISO-8859-6,13701,13638,0.0005\nCC-MAIN-2019-47,ISO-8859-7,393536,389182,0.0152\nCC-MAIN-2019-47,ISO-8859-8,22106,21980,0.0009\nCC-MAIN-2019-47,ISO-8859-9,1088631,1080635,0.0420\nCC-MAIN-2019-47,KOI8-R,246032,245265,0.0095\nCC-MAIN-2019-47,KOI8-U,4016,3992,0.0002\nCC-MAIN-2019-47,Shift_JIS,8158759,8118535,0.3149\nCC-MAIN-2019-47,TIS-620,431058,428432,0.0166\nCC-MAIN-2019-47,US-ASCII,774010,772851,0.0299\nCC-MAIN-2019-47,UTF-16,95263,94783,0.0037\nCC-MAIN-2019-47,UTF-16BE,4548,4527,0.0002\nCC-MAIN-2019-47,UTF-16LE,20624,20489,0.0008\nCC-MAIN-2019-47,UTF-32,1474,1450,0.0001\nCC-MAIN-2019-47,UTF-8,2333007909,2311721182,90.0568\nCC-MAIN-2019-47,windows-1250,3652709,3616634,0.1410\nCC-MAIN-2019-47,windows-1251,25629236,25490060,0.9893\nCC-MAIN-2019-47,windows-1252,12419323,12330078,0.4794\nCC-MAIN-2019-47,windows-1253,153378,152982,0.0059\nCC-MAIN-2019-47,windows-1254,774292,763478,0.0299\nCC-MAIN-2019-47,windows-1255,799661,796535,0.0309\nCC-MAIN-2019-47,windows-1256,2622282,2605580,0.1012\nCC-MAIN-2019-47,windows-1257,348839,345315,0.0135\nCC-MAIN-2019-47,windows-31j,59474,59244,0.0023\nCC-MAIN-2019-47,x-MacCyrillic,96028,95642,0.0037\nCC-MAIN-2019-47,x-iso-8859-11,1066,1065,0.0000\nCC-MAIN-2019-47,x-windows-874,466714,466280,0.0180\nCC-MAIN-2019-47,x-windows-949,1200,1197,0.0000\nCC-MAIN-2019-51,<other>,2527,2521,0.0001\nCC-MAIN-2019-51,<unknown>,27153781,27153781,1.0985\nCC-MAIN-2019-51,Big5,1919171,1915182,0.0776\nCC-MAIN-2019-51,Big5-HKSCS,23218,23217,0.0009\nCC-MAIN-2019-51,EUC-JP,6232852,6200973,0.2521\nCC-MAIN-2019-51,EUC-KR,3822915,3812645,0.1547\nCC-MAIN-2019-51,GB18030,2435624,2427734,0.0985\nCC-MAIN-2019-51,GB2312,35439680,35218130,1.4337\nCC-MAIN-2019-51,GBK,15437184,15288384
,0.6245\nCC-MAIN-2019-51,IBM500,8,8,0.0000\nCC-MAIN-2019-51,IBM855,9924,9901,0.0004\nCC-MAIN-2019-51,IBM866,15786,15688,0.0006\nCC-MAIN-2019-51,ISO-2022-JP,15540,15499,0.0006\nCC-MAIN-2019-51,ISO-8859-1,87922506,87257787,3.5569\nCC-MAIN-2019-51,ISO-8859-13,7716,7713,0.0003\nCC-MAIN-2019-51,ISO-8859-15,2988745,2946613,0.1209\nCC-MAIN-2019-51,ISO-8859-2,5031907,5009135,0.2036\nCC-MAIN-2019-51,ISO-8859-3,6615,6601,0.0003\nCC-MAIN-2019-51,ISO-8859-4,35356,35182,0.0014\nCC-MAIN-2019-51,ISO-8859-5,54988,54801,0.0022\nCC-MAIN-2019-51,ISO-8859-6,11740,11668,0.0005\nCC-MAIN-2019-51,ISO-8859-7,363660,358421,0.0147\nCC-MAIN-2019-51,ISO-8859-8,17852,17693,0.0007\nCC-MAIN-2019-51,ISO-8859-9,1036658,1030699,0.0419\nCC-MAIN-2019-51,KOI8-R,249920,249055,0.0101\nCC-MAIN-2019-51,KOI8-U,3344,3330,0.0001\nCC-MAIN-2019-51,Shift_JIS,8370222,8321571,0.3386\nCC-MAIN-2019-51,TIS-620,436104,432589,0.0176\nCC-MAIN-2019-51,US-ASCII,726463,725458,0.0294\nCC-MAIN-2019-51,UTF-16,79822,79539,0.0032\nCC-MAIN-2019-51,UTF-16BE,6522,6517,0.0003\nCC-MAIN-2019-51,UTF-16LE,20666,20564,0.0008\nCC-MAIN-2019-51,UTF-32,2023,1985,0.0001\nCC-MAIN-2019-51,UTF-8,2225372765,2206434139,90.0266\nCC-MAIN-2019-51,windows-1250,3454030,3423985,0.1397\nCC-MAIN-2019-51,windows-1251,25692678,25560335,1.0394\nCC-MAIN-2019-51,windows-1252,12352793,12280023,0.4997\nCC-MAIN-2019-51,windows-1253,159263,158874,0.0064\nCC-MAIN-2019-51,windows-1254,741650,730565,0.0300\nCC-MAIN-2019-51,windows-1255,686277,683814,0.0278\nCC-MAIN-2019-51,windows-1256,2697203,2681009,0.1091\nCC-MAIN-2019-51,windows-1257,274912,272690,0.0111\nCC-MAIN-2019-51,windows-31j,59882,59657,0.0024\nCC-MAIN-2019-51,x-MacCyrillic,110798,109656,0.0045\nCC-MAIN-2019-51,x-iso-8859-11,1752,1752,0.0001\nCC-MAIN-2019-51,x-windows-874,418453,418103,0.0169\nCC-MAIN-2019-51,x-windows-949,1470,1465,0.0001\nCC-MAIN-2020-05,<other>,3625,3622,0.0001\nCC-MAIN-2020-05,<unknown>,28931553,28931553,0.9329\nCC-MAIN-2020-05,Big5,1970663,1966464,0.0635\nCC-MAIN-2020-05,Big5-HKSCS,2
3041,22700,0.0007\nCC-MAIN-2020-05,EUC-JP,7893108,7851476,0.2545\nCC-MAIN-2020-05,EUC-KR,4504500,4490367,0.1453\nCC-MAIN-2020-05,GB18030,3063488,3055018,0.0988\nCC-MAIN-2020-05,GB2312,34551093,34333869,1.1142\nCC-MAIN-2020-05,GBK,15129860,14984358,0.4879\nCC-MAIN-2020-05,IBM500,18,18,0.0000\nCC-MAIN-2020-05,IBM855,8840,8806,0.0003\nCC-MAIN-2020-05,IBM866,15935,15887,0.0005\nCC-MAIN-2020-05,ISO-2022-JP,23204,23158,0.0007\nCC-MAIN-2020-05,ISO-8859-1,103949213,103062291,3.3520\nCC-MAIN-2020-05,ISO-8859-13,8165,8162,0.0003\nCC-MAIN-2020-05,ISO-8859-15,3548052,3499623,0.1144\nCC-MAIN-2020-05,ISO-8859-2,5794535,5765862,0.1869\nCC-MAIN-2020-05,ISO-8859-3,8076,8057,0.0003\nCC-MAIN-2020-05,ISO-8859-4,42836,42614,0.0014\nCC-MAIN-2020-05,ISO-8859-5,58429,58255,0.0019\nCC-MAIN-2020-05,ISO-8859-6,20187,20091,0.0007\nCC-MAIN-2020-05,ISO-8859-7,424289,416474,0.0137\nCC-MAIN-2020-05,ISO-8859-8,23827,23537,0.0008\nCC-MAIN-2020-05,ISO-8859-9,1190057,1183715,0.0384\nCC-MAIN-2020-05,KOI8-R,305377,303643,0.0098\nCC-MAIN-2020-05,KOI8-U,5243,5235,0.0002\nCC-MAIN-2020-05,Shift_JIS,11145787,11094716,0.3594\nCC-MAIN-2020-05,TIS-620,478490,474971,0.0154\nCC-MAIN-2020-05,US-ASCII,917488,915158,0.0296\nCC-MAIN-2020-05,UTF-16,92256,91955,0.0030\nCC-MAIN-2020-05,UTF-16BE,4458,4454,0.0001\nCC-MAIN-2020-05,UTF-16LE,29580,29427,0.0010\nCC-MAIN-2020-05,UTF-32,2668,2614,0.0001\nCC-MAIN-2020-05,UTF-32LE,1,1,0.0000\nCC-MAIN-2020-05,UTF-8,2820276978,2794406933,90.9445\nCC-MAIN-2020-05,windows-1250,4164581,4129447,0.1343\nCC-MAIN-2020-05,windows-1251,31259368,31093576,1.0080\nCC-MAIN-2020-05,windows-1252,15713096,15604299,0.5067\nCC-MAIN-2020-05,windows-1253,193046,191984,0.0062\nCC-MAIN-2020-05,windows-1254,838443,828507,0.0270\nCC-MAIN-2020-05,windows-1255,740287,737239,0.0239\nCC-MAIN-2020-05,windows-1256,2753473,2736835,0.0888\nCC-MAIN-2020-05,windows-1257,291902,289876,0.0094\nCC-MAIN-2020-05,windows-31j,57207,57045,0.0018\nCC-MAIN-2020-05,x-MacCyrillic,117786,117379,0.0038\nCC-MAIN-2020-05,x-iso-885
9-11,1609,1608,0.0001\nCC-MAIN-2020-05,x-windows-874,519799,518615,0.0168\nCC-MAIN-2020-05,x-windows-949,1656,1650,0.0001\nCC-MAIN-2020-10,<other>,4291,4274,0.0002\nCC-MAIN-2020-10,<unknown>,32286792,32286792,1.2277\nCC-MAIN-2020-10,Big5,2419707,2413997,0.0920\nCC-MAIN-2020-10,Big5-HKSCS,9541,9456,0.0004\nCC-MAIN-2020-10,EUC-JP,6933734,6904423,0.2636\nCC-MAIN-2020-10,EUC-KR,4454057,4443238,0.1694\nCC-MAIN-2020-10,GB18030,3147669,3142964,0.1197\nCC-MAIN-2020-10,GB2312,41194583,40982657,1.5664\nCC-MAIN-2020-10,GBK,18089994,18037151,0.6878\nCC-MAIN-2020-10,IBM500,9,9,0.0000\nCC-MAIN-2020-10,IBM855,11656,11634,0.0004\nCC-MAIN-2020-10,IBM866,16226,16201,0.0006\nCC-MAIN-2020-10,ISO-2022-JP,33267,33070,0.0013\nCC-MAIN-2020-10,ISO-8859-1,105474985,104735857,4.0105\nCC-MAIN-2020-10,ISO-8859-13,8255,8252,0.0003\nCC-MAIN-2020-10,ISO-8859-15,3273073,3234247,0.1245\nCC-MAIN-2020-10,ISO-8859-2,5836188,5805283,0.2219\nCC-MAIN-2020-10,ISO-8859-3,8713,8699,0.0003\nCC-MAIN-2020-10,ISO-8859-4,40161,39605,0.0015\nCC-MAIN-2020-10,ISO-8859-5,58754,58576,0.0022\nCC-MAIN-2020-10,ISO-8859-6,18937,18866,0.0007\nCC-MAIN-2020-10,ISO-8859-7,367955,364146,0.0140\nCC-MAIN-2020-10,ISO-8859-8,22215,21843,0.0008\nCC-MAIN-2020-10,ISO-8859-9,1254073,1247981,0.0477\nCC-MAIN-2020-10,KOI8-R,298413,296860,0.0113\nCC-MAIN-2020-10,KOI8-U,3643,3637,0.0001\nCC-MAIN-2020-10,Shift_JIS,11266553,11214020,0.4284\nCC-MAIN-2020-10,TIS-620,456575,454082,0.0174\nCC-MAIN-2020-10,US-ASCII,1242784,1241010,0.0473\nCC-MAIN-2020-10,UTF-16,96072,95751,0.0037\nCC-MAIN-2020-10,UTF-16BE,6363,6355,0.0002\nCC-MAIN-2020-10,UTF-16LE,45441,45266,0.0017\nCC-MAIN-2020-10,UTF-32,3136,3055,0.0001\nCC-MAIN-2020-10,UTF-32LE,1,1,0.0000\nCC-MAIN-2020-10,UTF-8,2334619990,2314440913,88.7701\nCC-MAIN-2020-10,windows-1250,3985793,3949020,0.1516\nCC-MAIN-2020-10,windows-1251,30588669,30448539,1.1631\nCC-MAIN-2020-10,windows-1252,16855760,16767735,0.6409\nCC-MAIN-2020-10,windows-1253,175159,174530,0.0067\nCC-MAIN-2020-10,windows-1254,855727,84676
2,0.0325\nCC-MAIN-2020-10,windows-1255,753360,749881,0.0286\nCC-MAIN-2020-10,windows-1256,2801075,2779176,0.1065\nCC-MAIN-2020-10,windows-1257,287933,286703,0.0109\nCC-MAIN-2020-10,windows-31j,42246,42150,0.0016\nCC-MAIN-2020-10,x-MacCyrillic,124812,124536,0.0047\nCC-MAIN-2020-10,x-iso-8859-11,1016,1015,0.0000\nCC-MAIN-2020-10,x-windows-874,485743,484348,0.0185\nCC-MAIN-2020-10,x-windows-949,2363,2358,0.0001\nCC-MAIN-2020-16,<other>,3292,3275,0.0001\nCC-MAIN-2020-16,<unknown>,45105718,45105718,1.5628\nCC-MAIN-2020-16,Big5,2122512,2116270,0.0735\nCC-MAIN-2020-16,Big5-HKSCS,8755,8686,0.0003\nCC-MAIN-2020-16,EUC-JP,7302850,7268227,0.2530\nCC-MAIN-2020-16,EUC-KR,4042334,4029157,0.1401\nCC-MAIN-2020-16,GB18030,3448391,3440156,0.1195\nCC-MAIN-2020-16,GB2312,36453295,36248063,1.2630\nCC-MAIN-2020-16,GBK,15730109,15682885,0.5450\nCC-MAIN-2020-16,IBM500,8,8,0.0000\nCC-MAIN-2020-16,IBM855,10528,10508,0.0004\nCC-MAIN-2020-16,IBM866,17779,17714,0.0006\nCC-MAIN-2020-16,ISO-2022-JP,20679,20288,0.0007\nCC-MAIN-2020-16,ISO-8859-1,93970128,93283249,3.2558\nCC-MAIN-2020-16,ISO-8859-13,10081,10080,0.0003\nCC-MAIN-2020-16,ISO-8859-15,3406846,3364307,0.1180\nCC-MAIN-2020-16,ISO-8859-2,5596638,5556891,0.1939\nCC-MAIN-2020-16,ISO-8859-3,8146,8130,0.0003\nCC-MAIN-2020-16,ISO-8859-4,53860,53507,0.0019\nCC-MAIN-2020-16,ISO-8859-5,51269,51160,0.0018\nCC-MAIN-2020-16,ISO-8859-6,12806,12760,0.0004\nCC-MAIN-2020-16,ISO-8859-7,328507,325517,0.0114\nCC-MAIN-2020-16,ISO-8859-8,24993,24845,0.0009\nCC-MAIN-2020-16,ISO-8859-9,1228622,1220821,0.0426\nCC-MAIN-2020-16,KOI8-R,274999,274000,0.0095\nCC-MAIN-2020-16,KOI8-U,6264,6232,0.0002\nCC-MAIN-2020-16,Shift_JIS,9504310,9458289,0.3293\nCC-MAIN-2020-16,TIS-620,398750,396607,0.0138\nCC-MAIN-2020-16,US-ASCII,1055179,1053228,0.0366\nCC-MAIN-2020-16,UTF-16,103223,102858,0.0036\nCC-MAIN-2020-16,UTF-16BE,3336,3326,0.0001\nCC-MAIN-2020-16,UTF-16LE,25977,25833,0.0009\nCC-MAIN-2020-16,UTF-32,5500,5315,0.0002\nCC-MAIN-2020-16,UTF-32LE,1,1,0.0000\nCC-MAIN-2020-16,UT
F-8,2601391266,2578817812,90.1309\nCC-MAIN-2020-16,windows-1250,3764978,3731356,0.1304\nCC-MAIN-2020-16,windows-1251,31548380,31376748,1.0931\nCC-MAIN-2020-16,windows-1252,14022218,13938692,0.4858\nCC-MAIN-2020-16,windows-1253,160888,160070,0.0056\nCC-MAIN-2020-16,windows-1254,825008,815186,0.0286\nCC-MAIN-2020-16,windows-1255,848938,845613,0.0294\nCC-MAIN-2020-16,windows-1256,2408664,2394725,0.0835\nCC-MAIN-2020-16,windows-1257,333784,332518,0.0116\nCC-MAIN-2020-16,windows-31j,36671,36515,0.0013\nCC-MAIN-2020-16,x-MacCyrillic,103138,102743,0.0036\nCC-MAIN-2020-16,x-iso-8859-11,1170,1169,0.0000\nCC-MAIN-2020-16,x-windows-874,453394,452857,0.0157\nCC-MAIN-2020-16,x-windows-949,2055,2050,0.0001\nCC-MAIN-2020-24,<other>,4454,4430,0.0002\nCC-MAIN-2020-24,<unknown>,31381479,31381479,1.1357\nCC-MAIN-2020-24,Big5,2718136,2711526,0.0984\nCC-MAIN-2020-24,Big5-HKSCS,3751,3749,0.0001\nCC-MAIN-2020-24,EUC-JP,7184618,7154089,0.2600\nCC-MAIN-2020-24,EUC-KR,4850767,4838788,0.1755\nCC-MAIN-2020-24,GB18030,2302572,2296557,0.0833\nCC-MAIN-2020-24,GB2312,34674630,34518554,1.2549\nCC-MAIN-2020-24,GBK,15926785,15861824,0.5764\nCC-MAIN-2020-24,IBM500,11,11,0.0000\nCC-MAIN-2020-24,IBM855,14842,14803,0.0005\nCC-MAIN-2020-24,IBM866,19524,19450,0.0007\nCC-MAIN-2020-24,ISO-2022-JP,15901,15885,0.0006\nCC-MAIN-2020-24,ISO-8859-1,96353602,95646442,3.4870\nCC-MAIN-2020-24,ISO-8859-13,9044,9042,0.0003\nCC-MAIN-2020-24,ISO-8859-15,3315230,3278613,0.1200\nCC-MAIN-2020-24,ISO-8859-2,5899923,5867869,0.2135\nCC-MAIN-2020-24,ISO-8859-3,10732,10709,0.0004\nCC-MAIN-2020-24,ISO-8859-4,57279,56005,0.0021\nCC-MAIN-2020-24,ISO-8859-5,52745,52547,0.0019\nCC-MAIN-2020-24,ISO-8859-6,24029,23871,0.0009\nCC-MAIN-2020-24,ISO-8859-7,390180,386158,0.0141\nCC-MAIN-2020-24,ISO-8859-8,20193,19823,0.0007\nCC-MAIN-2020-24,ISO-8859-9,1390217,1381965,0.0503\nCC-MAIN-2020-24,KOI8-R,295596,294625,0.0107\nCC-MAIN-2020-24,KOI8-U,4967,4963,0.0002\nCC-MAIN-2020-24,Shift_JIS,8782819,8738110,0.3178\nCC-MAIN-2020-24,TIS-620,481502,4
79760,0.0174\nCC-MAIN-2020-24,US-ASCII,883310,881914,0.0320\nCC-MAIN-2020-24,UTF-16,130716,130338,0.0047\nCC-MAIN-2020-24,UTF-16BE,5870,5866,0.0002\nCC-MAIN-2020-24,UTF-16LE,20333,20223,0.0007\nCC-MAIN-2020-24,UTF-32,3918,3800,0.0001\nCC-MAIN-2020-24,UTF-32LE,2,2,0.0000\nCC-MAIN-2020-24,UTF-8,2490545822,2468096354,90.1324\nCC-MAIN-2020-24,windows-1250,3768055,3742210,0.1364\nCC-MAIN-2020-24,windows-1251,30998405,30831598,1.1218\nCC-MAIN-2020-24,windows-1252,14385182,14272775,0.5206\nCC-MAIN-2020-24,windows-1253,161891,161210,0.0059\nCC-MAIN-2020-24,windows-1254,956528,943847,0.0346\nCC-MAIN-2020-24,windows-1255,904858,900882,0.0327\nCC-MAIN-2020-24,windows-1256,3186385,3172628,0.1153\nCC-MAIN-2020-24,windows-1257,392405,387376,0.0142\nCC-MAIN-2020-24,windows-31j,36703,36566,0.0013\nCC-MAIN-2020-24,x-MacCyrillic,113789,113417,0.0041\nCC-MAIN-2020-24,x-iso-8859-11,975,975,0.0000\nCC-MAIN-2020-24,x-windows-874,524805,523258,0.0190\nCC-MAIN-2020-24,x-windows-949,1282,1277,0.0000\nCC-MAIN-2020-29,<other>,3091,3069,0.0001\nCC-MAIN-2020-29,<unknown>,31549599,31549599,1.0033\nCC-MAIN-2020-29,Big5,2756068,2747602,0.0876\nCC-MAIN-2020-29,Big5-HKSCS,3305,3300,0.0001\nCC-MAIN-2020-29,EUC-JP,7927401,7887190,0.2521\nCC-MAIN-2020-29,EUC-KR,4779609,4768370,0.1520\nCC-MAIN-2020-29,GB18030,2099801,2094980,0.0668\nCC-MAIN-2020-29,GB2312,30988828,30882168,0.9854\nCC-MAIN-2020-29,GBK,14565912,14506836,0.4632\nCC-MAIN-2020-29,IBM500,13,13,0.0000\nCC-MAIN-2020-29,IBM855,13224,13153,0.0004\nCC-MAIN-2020-29,IBM866,22616,22504,0.0007\nCC-MAIN-2020-29,ISO-2022-JP,21958,21926,0.0007\nCC-MAIN-2020-29,ISO-8859-1,102192979,101396689,3.2497\nCC-MAIN-2020-29,ISO-8859-13,7714,7711,0.0002\nCC-MAIN-2020-29,ISO-8859-15,3553302,3515461,0.1130\nCC-MAIN-2020-29,ISO-8859-2,5908380,5874172,0.1879\nCC-MAIN-2020-29,ISO-8859-3,9594,9562,0.0003\nCC-MAIN-2020-29,ISO-8859-4,49865,49649,0.0016\nCC-MAIN-2020-29,ISO-8859-5,63924,63768,0.0020\nCC-MAIN-2020-29,ISO-8859-6,10811,10764,0.0003\nCC-MAIN-2020-29,ISO-8859-7,
414126,410271,0.0132\nCC-MAIN-2020-29,ISO-8859-8,24023,23806,0.0008\nCC-MAIN-2020-29,ISO-8859-9,1300992,1292534,0.0414\nCC-MAIN-2020-29,KOI8-R,310410,309351,0.0099\nCC-MAIN-2020-29,KOI8-U,5221,5210,0.0002\nCC-MAIN-2020-29,Shift_JIS,10181692,10136441,0.3238\nCC-MAIN-2020-29,TIS-620,463678,461262,0.0147\nCC-MAIN-2020-29,US-ASCII,769200,767676,0.0245\nCC-MAIN-2020-29,UTF-16,142579,142091,0.0045\nCC-MAIN-2020-29,UTF-16BE,5675,5672,0.0002\nCC-MAIN-2020-29,UTF-16LE,28110,27851,0.0009\nCC-MAIN-2020-29,UTF-32,5542,5468,0.0002\nCC-MAIN-2020-29,UTF-8,2866203511,2838254531,91.1430\nCC-MAIN-2020-29,windows-1250,4004210,3970088,0.1273\nCC-MAIN-2020-29,windows-1251,34388531,34169013,1.0935\nCC-MAIN-2020-29,windows-1252,14174964,14068161,0.4508\nCC-MAIN-2020-29,windows-1253,188040,186763,0.0060\nCC-MAIN-2020-29,windows-1254,862784,855739,0.0274\nCC-MAIN-2020-29,windows-1255,811296,802825,0.0258\nCC-MAIN-2020-29,windows-1256,2859652,2848306,0.0909\nCC-MAIN-2020-29,windows-1257,329040,325908,0.0105\nCC-MAIN-2020-29,windows-31j,59295,59020,0.0019\nCC-MAIN-2020-29,x-MacCyrillic,122517,122194,0.0039\nCC-MAIN-2020-29,x-iso-8859-11,1586,1585,0.0001\nCC-MAIN-2020-29,x-windows-874,547707,545401,0.0174\nCC-MAIN-2020-29,x-windows-949,1045,1040,0.0000\nCC-MAIN-2020-34,<other>,2430,2397,0.0001\nCC-MAIN-2020-34,<unknown>,30202420,30202420,1.2328\nCC-MAIN-2020-34,Big5,2296290,2287976,0.0937\nCC-MAIN-2020-34,Big5-HKSCS,2314,2314,0.0001\nCC-MAIN-2020-34,EUC-JP,6803300,6772022,0.2777\nCC-MAIN-2020-34,EUC-KR,3731692,3721766,0.1523\nCC-MAIN-2020-34,GB18030,1702014,1698623,0.0695\nCC-MAIN-2020-34,GB2312,25212566,25131193,1.0292\nCC-MAIN-2020-34,GBK,11738021,11693746,0.4791\nCC-MAIN-2020-34,IBM500,12,12,0.0000\nCC-MAIN-2020-34,IBM855,8641,8637,0.0004\nCC-MAIN-2020-34,IBM866,19982,19889,0.0008\nCC-MAIN-2020-34,ISO-2022-JP,17893,17844,0.0007\nCC-MAIN-2020-34,ISO-8859-1,85569092,84987641,3.4929\nCC-MAIN-2020-34,ISO-8859-13,7131,7102,0.0003\nCC-MAIN-2020-34,ISO-8859-15,2856821,2832480,0.1166\nCC-MAIN-2020-
34,ISO-8859-2,4834520,4800982,0.1973\nCC-MAIN-2020-34,ISO-8859-3,10635,10580,0.0004\nCC-MAIN-2020-34,ISO-8859-4,31297,31093,0.0013\nCC-MAIN-2020-34,ISO-8859-5,71515,71389,0.0029\nCC-MAIN-2020-34,ISO-8859-6,10300,10267,0.0004\nCC-MAIN-2020-34,ISO-8859-7,325182,321611,0.0133\nCC-MAIN-2020-34,ISO-8859-8,17421,17298,0.0007\nCC-MAIN-2020-34,ISO-8859-9,989704,983098,0.0404\nCC-MAIN-2020-34,KOI8-R,248608,247860,0.0101\nCC-MAIN-2020-34,KOI8-U,3252,3249,0.0001\nCC-MAIN-2020-34,Shift_JIS,8587127,8546403,0.3505\nCC-MAIN-2020-34,TIS-620,380007,377607,0.0155\nCC-MAIN-2020-34,US-ASCII,803600,802046,0.0328\nCC-MAIN-2020-34,UTF-16,140207,139867,0.0057\nCC-MAIN-2020-34,UTF-16BE,4219,4217,0.0002\nCC-MAIN-2020-34,UTF-16LE,15713,15599,0.0006\nCC-MAIN-2020-34,UTF-32,2335,2322,0.0001\nCC-MAIN-2020-34,UTF-32LE,2,2,0.0000\nCC-MAIN-2020-34,UTF-8,2218490687,2199279340,90.5568\nCC-MAIN-2020-34,windows-1250,2964278,2945284,0.1210\nCC-MAIN-2020-34,windows-1251,25651480,25497441,1.0471\nCC-MAIN-2020-34,windows-1252,11318952,11242527,0.4620\nCC-MAIN-2020-34,windows-1253,127004,126517,0.0052\nCC-MAIN-2020-34,windows-1254,653428,648196,0.0267\nCC-MAIN-2020-34,windows-1255,641618,638137,0.0262\nCC-MAIN-2020-34,windows-1256,2445592,2436956,0.0998\nCC-MAIN-2020-34,windows-1257,262050,260772,0.0107\nCC-MAIN-2020-34,windows-31j,55313,53974,0.0023\nCC-MAIN-2020-34,x-MacCyrillic,103279,103092,0.0042\nCC-MAIN-2020-34,x-iso-8859-11,585,585,0.0000\nCC-MAIN-2020-34,x-windows-874,472831,472161,0.0193\nCC-MAIN-2020-34,x-windows-949,879,876,0.0000\nCC-MAIN-2020-40,<other>,2853,2835,0.0001\nCC-MAIN-2020-40,<unknown>,66263569,66263569,1.9076\nCC-MAIN-2020-40,Big5,2400643,2392890,0.0691\nCC-MAIN-2020-40,Big5-HKSCS,2975,2883,0.0001\nCC-MAIN-2020-40,EUC-JP,6871809,6836299,0.1978\nCC-MAIN-2020-40,EUC-KR,3820835,3811766,0.1100\nCC-MAIN-2020-40,GB18030,1823621,1818742,0.0525\nCC-MAIN-2020-40,GB2312,31535254,31444302,0.9079\nCC-MAIN-2020-40,GBK,11160914,11126933,0.3213\nCC-MAIN-2020-40,IBM500,11,10,0.0000\nCC-MAIN-2020-4
0,IBM855,10291,10227,0.0003\nCC-MAIN-2020-40,IBM866,25370,25223,0.0007\nCC-MAIN-2020-40,ISO-2022-JP,17333,17300,0.0005\nCC-MAIN-2020-40,ISO-8859-1,97796569,97131167,2.8154\nCC-MAIN-2020-40,ISO-8859-13,6442,6441,0.0002\nCC-MAIN-2020-40,ISO-8859-15,3576596,3543781,0.1030\nCC-MAIN-2020-40,ISO-8859-2,4870099,4841695,0.1402\nCC-MAIN-2020-40,ISO-8859-3,8944,8923,0.0003\nCC-MAIN-2020-40,ISO-8859-4,35399,35232,0.0010\nCC-MAIN-2020-40,ISO-8859-5,76082,75481,0.0022\nCC-MAIN-2020-40,ISO-8859-6,10326,10038,0.0003\nCC-MAIN-2020-40,ISO-8859-7,341684,338804,0.0098\nCC-MAIN-2020-40,ISO-8859-8,17247,17142,0.0005\nCC-MAIN-2020-40,ISO-8859-9,1182475,1175296,0.0340\nCC-MAIN-2020-40,KOI8-R,301118,300407,0.0087\nCC-MAIN-2020-40,KOI8-U,5187,5061,0.0001\nCC-MAIN-2020-40,Shift_JIS,8803971,8759528,0.2535\nCC-MAIN-2020-40,TIS-620,404607,402676,0.0116\nCC-MAIN-2020-40,US-ASCII,785653,784096,0.0226\nCC-MAIN-2020-40,UTF-16,103996,101442,0.0030\nCC-MAIN-2020-40,UTF-16BE,32108,32107,0.0009\nCC-MAIN-2020-40,UTF-16LE,23270,23104,0.0007\nCC-MAIN-2020-40,UTF-32,2587,2549,0.0001\nCC-MAIN-2020-40,UTF-8,3174210781,3148643781,91.3818\nCC-MAIN-2020-40,windows-1250,3524110,3493824,0.1015\nCC-MAIN-2020-40,windows-1251,36215160,36034094,1.0426\nCC-MAIN-2020-40,windows-1252,12649080,12565017,0.3642\nCC-MAIN-2020-40,windows-1253,129730,129120,0.0037\nCC-MAIN-2020-40,windows-1254,700741,695282,0.0202\nCC-MAIN-2020-40,windows-1255,610445,607272,0.0176\nCC-MAIN-2020-40,windows-1256,2322579,2311483,0.0669\nCC-MAIN-2020-40,windows-1257,236223,234761,0.0068\nCC-MAIN-2020-40,windows-31j,59501,58692,0.0017\nCC-MAIN-2020-40,x-MacCyrillic,113544,113228,0.0033\nCC-MAIN-2020-40,x-iso-8859-11,457,457,0.0000\nCC-MAIN-2020-40,x-windows-874,477353,476734,0.0137\nCC-MAIN-2020-40,x-windows-949,1664,1656,0.0000\nCC-MAIN-2020-45,<other>,2060,2020,0.0001\nCC-MAIN-2020-45,<unknown>,50169903,50169903,1.8370\nCC-MAIN-2020-45,Big5,1901239,1889753,0.0696\nCC-MAIN-2020-45,Big5-HKSCS,3604,3602,0.0001\nCC-MAIN-2020-45,EUC-JP,5434883,540600
2,0.1990\nCC-MAIN-2020-45,EUC-KR,3050595,3041546,0.1117\nCC-MAIN-2020-45,GB18030,1591767,1587932,0.0583\nCC-MAIN-2020-45,GB2312,27658775,27577521,1.0127\nCC-MAIN-2020-45,GBK,8820877,8802153,0.3230\nCC-MAIN-2020-45,IBM500,13,11,0.0000\nCC-MAIN-2020-45,IBM855,8027,8015,0.0003\nCC-MAIN-2020-45,IBM866,30284,30103,0.0011\nCC-MAIN-2020-45,ISO-2022-JP,12244,12225,0.0004\nCC-MAIN-2020-45,ISO-8859-1,80822792,80223502,2.9594\nCC-MAIN-2020-45,ISO-8859-13,1804,1804,0.0001\nCC-MAIN-2020-45,ISO-8859-15,2804646,2781225,0.1027\nCC-MAIN-2020-45,ISO-8859-2,4159141,4137911,0.1523\nCC-MAIN-2020-45,ISO-8859-3,5357,5319,0.0002\nCC-MAIN-2020-45,ISO-8859-4,22483,22412,0.0008\nCC-MAIN-2020-45,ISO-8859-5,66648,66457,0.0024\nCC-MAIN-2020-45,ISO-8859-6,9699,9476,0.0004\nCC-MAIN-2020-45,ISO-8859-7,309392,305971,0.0113\nCC-MAIN-2020-45,ISO-8859-8,13276,13223,0.0005\nCC-MAIN-2020-45,ISO-8859-9,1040157,1035075,0.0381\nCC-MAIN-2020-45,KOI8-R,240493,239537,0.0088\nCC-MAIN-2020-45,KOI8-U,3342,3317,0.0001\nCC-MAIN-2020-45,Shift_JIS,7966262,7919592,0.2917\nCC-MAIN-2020-45,TIS-620,355247,353114,0.0130\nCC-MAIN-2020-45,US-ASCII,743305,741667,0.0272\nCC-MAIN-2020-45,UTF-16,66773,66416,0.0024\nCC-MAIN-2020-45,UTF-16BE,10481,10479,0.0004\nCC-MAIN-2020-45,UTF-16LE,20331,20197,0.0007\nCC-MAIN-2020-45,UTF-32,827,820,0.0000\nCC-MAIN-2020-45,UTF-32LE,1,1,0.0000\nCC-MAIN-2020-45,UTF-8,2491526564,2471541264,91.2292\nCC-MAIN-2020-45,windows-1250,2863761,2834650,0.1049\nCC-MAIN-2020-45,windows-1251,25034558,24900774,0.9167\nCC-MAIN-2020-45,windows-1252,10410333,10334898,0.3812\nCC-MAIN-2020-45,windows-1253,95265,94649,0.0035\nCC-MAIN-2020-45,windows-1254,592775,584526,0.0217\nCC-MAIN-2020-45,windows-1255,487122,485103,0.0178\nCC-MAIN-2020-45,windows-1256,1945951,1934930,0.0713\nCC-MAIN-2020-45,windows-1257,215887,214564,0.0079\nCC-MAIN-2020-45,windows-31j,56451,55921,0.0021\nCC-MAIN-2020-45,x-MacCyrillic,90251,90051,0.0033\nCC-MAIN-2020-45,x-iso-8859-11,404,403,0.0000\nCC-MAIN-2020-45,x-windows-874,395723,395147,0.0
145\nCC-MAIN-2020-45,x-windows-949,1470,1466,0.0001\nCC-MAIN-2020-50,<other>,2377,2365,0.0001\nCC-MAIN-2020-50,<unknown>,42217071,42217071,1.5976\nCC-MAIN-2020-50,Big5,1799403,1790205,0.0681\nCC-MAIN-2020-50,Big5-HKSCS,393,393,0.0000\nCC-MAIN-2020-50,EUC-JP,4752682,4726084,0.1799\nCC-MAIN-2020-50,EUC-KR,2846259,2835099,0.1077\nCC-MAIN-2020-50,GB18030,1598545,1592614,0.0605\nCC-MAIN-2020-50,GB2312,24203095,24127390,0.9159\nCC-MAIN-2020-50,GBK,7125972,7108290,0.2697\nCC-MAIN-2020-50,IBM500,15,15,0.0000\nCC-MAIN-2020-50,IBM855,6711,6694,0.0003\nCC-MAIN-2020-50,IBM866,38330,37878,0.0015\nCC-MAIN-2020-50,ISO-2022-JP,12341,12322,0.0005\nCC-MAIN-2020-50,ISO-8859-1,75957669,75241920,2.8745\nCC-MAIN-2020-50,ISO-8859-13,2038,2031,0.0001\nCC-MAIN-2020-50,ISO-8859-15,2674673,2653407,0.1012\nCC-MAIN-2020-50,ISO-8859-2,3915707,3883189,0.1482\nCC-MAIN-2020-50,ISO-8859-3,5808,5775,0.0002\nCC-MAIN-2020-50,ISO-8859-4,21487,21303,0.0008\nCC-MAIN-2020-50,ISO-8859-5,64225,62814,0.0024\nCC-MAIN-2020-50,ISO-8859-6,9934,9904,0.0004\nCC-MAIN-2020-50,ISO-8859-7,305720,300771,0.0116\nCC-MAIN-2020-50,ISO-8859-8,9451,9406,0.0004\nCC-MAIN-2020-50,ISO-8859-9,952209,943516,0.0360\nCC-MAIN-2020-50,KOI8-R,238524,237032,0.0090\nCC-MAIN-2020-50,KOI8-U,2312,2307,0.0001\nCC-MAIN-2020-50,Shift_JIS,7110497,7073937,0.2691\nCC-MAIN-2020-50,TIS-620,342774,340380,0.0130\nCC-MAIN-2020-50,US-ASCII,648962,648123,0.0246\nCC-MAIN-2020-50,UTF-16,61540,60826,0.0023\nCC-MAIN-2020-50,UTF-16BE,2856,2855,0.0001\nCC-MAIN-2020-50,UTF-16LE,14782,14698,0.0006\nCC-MAIN-2020-50,UTF-32,998,986,0.0000\nCC-MAIN-2020-50,UTF-8,2426351092,2408242335,91.8213\nCC-MAIN-2020-50,windows-1250,2765560,2738016,0.1047\nCC-MAIN-2020-50,windows-1251,23248535,23135584,0.8798\nCC-MAIN-2020-50,windows-1252,9468095,9405615,0.3583\nCC-MAIN-2020-50,windows-1253,87711,87293,0.0033\nCC-MAIN-2020-50,windows-1254,545074,534788,0.0206\nCC-MAIN-2020-50,windows-1255,418218,415166,0.0158\nCC-MAIN-2020-50,windows-1256,1940040,1909061,0.0734\nCC-MAIN-2020-50
,windows-1257,187998,183365,0.0071\nCC-MAIN-2020-50,windows-31j,52576,52340,0.0020\nCC-MAIN-2020-50,x-MacCyrillic,89215,88961,0.0034\nCC-MAIN-2020-50,x-iso-8859-11,182,182,0.0000\nCC-MAIN-2020-50,x-windows-874,370156,368445,0.0140\nCC-MAIN-2020-50,x-windows-949,1689,1683,0.0001\nCC-MAIN-2021-04,<other>,2338,2325,0.0001\nCC-MAIN-2021-04,<unknown>,53845776,53845776,1.5831\nCC-MAIN-2021-04,Big5,1999085,1993183,0.0588\nCC-MAIN-2021-04,Big5-HKSCS,708,708,0.0000\nCC-MAIN-2021-04,EUC-JP,5959968,5917673,0.1752\nCC-MAIN-2021-04,EUC-KR,3564494,3553547,0.1048\nCC-MAIN-2021-04,GB18030,1581479,1575203,0.0465\nCC-MAIN-2021-04,GB2312,23433512,23326518,0.6890\nCC-MAIN-2021-04,GBK,7563646,7540951,0.2224\nCC-MAIN-2021-04,IBM500,12,12,0.0000\nCC-MAIN-2021-04,IBM855,6547,6526,0.0002\nCC-MAIN-2021-04,IBM866,37136,36880,0.0011\nCC-MAIN-2021-04,ISO-2022-JP,16397,15939,0.0005\nCC-MAIN-2021-04,ISO-8859-1,88382156,87694564,2.5985\nCC-MAIN-2021-04,ISO-8859-13,1817,1817,0.0001\nCC-MAIN-2021-04,ISO-8859-15,3255099,3199802,0.0957\nCC-MAIN-2021-04,ISO-8859-2,4657477,4629187,0.1369\nCC-MAIN-2021-04,ISO-8859-3,6849,6812,0.0002\nCC-MAIN-2021-04,ISO-8859-4,31326,31166,0.0009\nCC-MAIN-2021-04,ISO-8859-5,64716,64422,0.0019\nCC-MAIN-2021-04,ISO-8859-6,10283,10242,0.0003\nCC-MAIN-2021-04,ISO-8859-7,338694,335287,0.0100\nCC-MAIN-2021-04,ISO-8859-8,17911,17836,0.0005\nCC-MAIN-2021-04,ISO-8859-9,1155421,1146748,0.0340\nCC-MAIN-2021-04,KOI8-R,253555,252532,0.0075\nCC-MAIN-2021-04,KOI8-U,3711,3704,0.0001\nCC-MAIN-2021-04,Shift_JIS,8654875,8614424,0.2545\nCC-MAIN-2021-04,TIS-620,387926,384133,0.0114\nCC-MAIN-2021-04,US-ASCII,722698,721075,0.0212\nCC-MAIN-2021-04,UTF-16,77295,77129,0.0023\nCC-MAIN-2021-04,UTF-16BE,2437,2433,0.0001\nCC-MAIN-2021-04,UTF-16LE,19107,18799,0.0006\nCC-MAIN-2021-04,UTF-32,3927,3908,0.0001\nCC-MAIN-2021-04,UTF-8,3146509284,3120947864,92.5094\nCC-MAIN-2021-04,windows-1250,3425147,3384176,0.1007\nCC-MAIN-2021-04,windows-1251,29526027,29379875,0.8681\nCC-MAIN-2021-04,windows-1252,11628757
,11545709,0.3419\nCC-MAIN-2021-04,windows-1253,127646,126374,0.0038\nCC-MAIN-2021-04,windows-1254,654763,644525,0.0193\nCC-MAIN-2021-04,windows-1255,473295,470660,0.0139\nCC-MAIN-2021-04,windows-1256,2061513,2043364,0.0606\nCC-MAIN-2021-04,windows-1257,210245,208483,0.0062\nCC-MAIN-2021-04,windows-31j,46472,46241,0.0014\nCC-MAIN-2021-04,x-MacCyrillic,95750,95467,0.0028\nCC-MAIN-2021-04,x-iso-8859-11,476,476,0.0000\nCC-MAIN-2021-04,x-windows-874,466404,465457,0.0137\nCC-MAIN-2021-04,x-windows-949,2250,2244,0.0001\nCC-MAIN-2021-10,<other>,1796,1774,0.0001\nCC-MAIN-2021-10,<unknown>,39295634,39295634,1.4359\nCC-MAIN-2021-10,Big5,2166825,2156473,0.0792\nCC-MAIN-2021-10,Big5-HKSCS,374,374,0.0000\nCC-MAIN-2021-10,EUC-JP,4719299,4692921,0.1724\nCC-MAIN-2021-10,EUC-KR,2828980,2821127,0.1034\nCC-MAIN-2021-10,GB18030,1207495,1202562,0.0441\nCC-MAIN-2021-10,GB2312,17788214,17713666,0.6500\nCC-MAIN-2021-10,GBK,5914499,5895270,0.2161\nCC-MAIN-2021-10,IBM500,10,10,0.0000\nCC-MAIN-2021-10,IBM855,5583,5524,0.0002\nCC-MAIN-2021-10,IBM866,28015,27900,0.0010\nCC-MAIN-2021-10,ISO-2022-JP,14778,14746,0.0005\nCC-MAIN-2021-10,ISO-8859-1,72032312,71544886,2.6320\nCC-MAIN-2021-10,ISO-8859-13,2425,2425,0.0001\nCC-MAIN-2021-10,ISO-8859-15,2556345,2527978,0.0934\nCC-MAIN-2021-10,ISO-8859-2,3784146,3765055,0.1383\nCC-MAIN-2021-10,ISO-8859-3,4927,4899,0.0002\nCC-MAIN-2021-10,ISO-8859-4,23736,23622,0.0009\nCC-MAIN-2021-10,ISO-8859-5,70132,69976,0.0026\nCC-MAIN-2021-10,ISO-8859-6,10261,10229,0.0004\nCC-MAIN-2021-10,ISO-8859-7,252347,250253,0.0092\nCC-MAIN-2021-10,ISO-8859-8,10603,10565,0.0004\nCC-MAIN-2021-10,ISO-8859-9,881061,873651,0.0322\nCC-MAIN-2021-10,KOI8-R,237429,236491,0.0087\nCC-MAIN-2021-10,KOI8-U,2972,2970,0.0001\nCC-MAIN-2021-10,Shift_JIS,6764022,6727617,0.2472\nCC-MAIN-2021-10,TIS-620,257983,257607,0.0094\nCC-MAIN-2021-10,US-ASCII,714332,713270,0.0261\nCC-MAIN-2021-10,UTF-16,79426,79140,0.0029\nCC-MAIN-2021-10,UTF-16BE,1279,1277,0.0000\nCC-MAIN-2021-10,UTF-16LE,23271,23038,0.0009\nCC
-MAIN-2021-10,UTF-32,803,800,0.0000\nCC-MAIN-2021-10,UTF-32LE,1,1,0.0000\nCC-MAIN-2021-10,UTF-8,2536144829,2517997184,92.6700\nCC-MAIN-2021-10,windows-1250,2678024,2659337,0.0979\nCC-MAIN-2021-10,windows-1251,23658589,23542420,0.8645\nCC-MAIN-2021-10,windows-1252,9300578,9241356,0.3398\nCC-MAIN-2021-10,windows-1253,90849,90446,0.0033\nCC-MAIN-2021-10,windows-1254,440475,435329,0.0161\nCC-MAIN-2021-10,windows-1255,405050,403320,0.0148\nCC-MAIN-2021-10,windows-1256,1687320,1674078,0.0617\nCC-MAIN-2021-10,windows-1257,185239,184323,0.0068\nCC-MAIN-2021-10,windows-31j,41846,41599,0.0015\nCC-MAIN-2021-10,x-MacCyrillic,77349,77070,0.0028\nCC-MAIN-2021-10,x-iso-8859-11,206,206,0.0000\nCC-MAIN-2021-10,x-windows-874,356966,356454,0.0130\nCC-MAIN-2021-10,x-windows-949,1248,1242,0.0000\nCC-MAIN-2021-17,<other>,1865,1846,0.0001\nCC-MAIN-2021-17,<unknown>,42757729,42757729,1.3641\nCC-MAIN-2021-17,Big5,2407559,2400459,0.0768\nCC-MAIN-2021-17,Big5-HKSCS,1302,1302,0.0000\nCC-MAIN-2021-17,EUC-JP,5532339,5506437,0.1765\nCC-MAIN-2021-17,EUC-KR,3108914,3103026,0.0992\nCC-MAIN-2021-17,GB18030,1168864,1165870,0.0373\nCC-MAIN-2021-17,GB2312,16499397,16455383,0.5264\nCC-MAIN-2021-17,GBK,6044823,6029891,0.1929\nCC-MAIN-2021-17,IBM500,34,34,0.0000\nCC-MAIN-2021-17,IBM855,5977,5961,0.0002\nCC-MAIN-2021-17,IBM866,40862,40717,0.0013\nCC-MAIN-2021-17,ISO-2022-JP,19253,19226,0.0006\nCC-MAIN-2021-17,ISO-8859-1,81600463,81146077,2.6034\nCC-MAIN-2021-17,ISO-8859-13,2497,2496,0.0001\nCC-MAIN-2021-17,ISO-8859-15,2866574,2849670,0.0915\nCC-MAIN-2021-17,ISO-8859-2,4254396,4236833,0.1357\nCC-MAIN-2021-17,ISO-8859-3,3399,3376,0.0001\nCC-MAIN-2021-17,ISO-8859-4,27317,27181,0.0009\nCC-MAIN-2021-17,ISO-8859-5,70564,70444,0.0023\nCC-MAIN-2021-17,ISO-8859-6,9219,9124,0.0003\nCC-MAIN-2021-17,ISO-8859-7,303374,301164,0.0097\nCC-MAIN-2021-17,ISO-8859-8,16396,16291,0.0005\nCC-MAIN-2021-17,ISO-8859-9,994568,987480,0.0317\nCC-MAIN-2021-17,KOI8-R,208821,207964,0.0067\nCC-MAIN-2021-17,KOI8-U,3707,3704,0.0001\nCC-MAIN-
2021-17,Shift_JIS,7837701,7778061,0.2501\nCC-MAIN-2021-17,TIS-620,279209,278783,0.0089\nCC-MAIN-2021-17,US-ASCII,794564,791837,0.0253\nCC-MAIN-2021-17,UTF-16,98707,98476,0.0031\nCC-MAIN-2021-17,UTF-16BE,1157,1152,0.0000\nCC-MAIN-2021-17,UTF-16LE,21957,21654,0.0007\nCC-MAIN-2021-17,UTF-32,1454,1447,0.0000\nCC-MAIN-2021-17,UTF-32LE,1,1,0.0000\nCC-MAIN-2021-17,UTF-8,2912037572,2894874209,92.9050\nCC-MAIN-2021-17,windows-1250,3170528,3153060,0.1012\nCC-MAIN-2021-17,windows-1251,27705582,27594877,0.8839\nCC-MAIN-2021-17,windows-1252,10988861,10933194,0.3506\nCC-MAIN-2021-17,windows-1253,115973,115512,0.0037\nCC-MAIN-2021-17,windows-1254,499875,495352,0.0159\nCC-MAIN-2021-17,windows-1255,465812,464244,0.0149\nCC-MAIN-2021-17,windows-1256,1710964,1699780,0.0546\nCC-MAIN-2021-17,windows-1257,222205,220573,0.0071\nCC-MAIN-2021-17,windows-31j,40997,40480,0.0013\nCC-MAIN-2021-17,x-MacCyrillic,86078,85912,0.0027\nCC-MAIN-2021-17,x-iso-8859-11,1217,1177,0.0000\nCC-MAIN-2021-17,x-windows-874,392226,391892,0.0125\nCC-MAIN-2021-17,x-windows-949,1953,1948,0.0001\nCC-MAIN-2021-21,<other>,2135,2124,0.0001\nCC-MAIN-2021-21,<unknown>,52756157,52756157,2.0043\nCC-MAIN-2021-21,Big5,1569297,1562021,0.0596\nCC-MAIN-2021-21,Big5-HKSCS,366,365,0.0000\nCC-MAIN-2021-21,EUC-JP,3422627,3404736,0.1300\nCC-MAIN-2021-21,EUC-KR,2266279,2260438,0.0861\nCC-MAIN-2021-21,GB18030,823206,818455,0.0313\nCC-MAIN-2021-21,GB2312,11258201,11227827,0.4277\nCC-MAIN-2021-21,GBK,4388647,4377503,0.1667\nCC-MAIN-2021-21,IBM500,5,5,0.0000\nCC-MAIN-2021-21,IBM855,6204,6190,0.0002\nCC-MAIN-2021-21,IBM866,34318,34191,0.0013\nCC-MAIN-2021-21,ISO-2022-JP,25969,25926,0.0010\nCC-MAIN-2021-21,ISO-8859-1,76698209,76259223,2.9139\nCC-MAIN-2021-21,ISO-8859-13,1183,1183,0.0000\nCC-MAIN-2021-21,ISO-8859-15,2507969,2492262,0.0953\nCC-MAIN-2021-21,ISO-8859-2,3650410,3630124,0.1387\nCC-MAIN-2021-21,ISO-8859-3,2724,2702,0.0001\nCC-MAIN-2021-21,ISO-8859-4,16415,16327,0.0006\nCC-MAIN-2021-21,ISO-8859-5,43368,43245,0.0016\nCC-MAIN-2021-2
1,ISO-8859-6,8510,8311,0.0003\nCC-MAIN-2021-21,ISO-8859-7,263242,261002,0.0100\nCC-MAIN-2021-21,ISO-8859-8,18914,18866,0.0007\nCC-MAIN-2021-21,ISO-8859-9,846434,841006,0.0322\nCC-MAIN-2021-21,KOI8-R,180043,179236,0.0068\nCC-MAIN-2021-21,KOI8-U,2697,2697,0.0001\nCC-MAIN-2021-21,Shift_JIS,7517656,7479658,0.2856\nCC-MAIN-2021-21,TIS-620,193213,192822,0.0073\nCC-MAIN-2021-21,US-ASCII,971231,968352,0.0369\nCC-MAIN-2021-21,UTF-16,81967,81320,0.0031\nCC-MAIN-2021-21,UTF-16BE,1201,1200,0.0000\nCC-MAIN-2021-21,UTF-16LE,38591,38321,0.0015\nCC-MAIN-2021-21,UTF-32,2162,2160,0.0001\nCC-MAIN-2021-21,UTF-32LE,4,4,0.0000\nCC-MAIN-2021-21,UTF-8,2421689193,2406714651,92.0045\nCC-MAIN-2021-21,windows-1250,2912529,2897836,0.1107\nCC-MAIN-2021-21,windows-1251,22245601,22162163,0.8452\nCC-MAIN-2021-21,windows-1252,12473334,12409602,0.4739\nCC-MAIN-2021-21,windows-1253,103074,102387,0.0039\nCC-MAIN-2021-21,windows-1254,435695,430534,0.0166\nCC-MAIN-2021-21,windows-1255,355264,352657,0.0135\nCC-MAIN-2021-21,windows-1256,1679015,1668614,0.0638\nCC-MAIN-2021-21,windows-1257,209519,208411,0.0080\nCC-MAIN-2021-21,windows-31j,36124,35954,0.0014\nCC-MAIN-2021-21,x-MacCyrillic,88495,88323,0.0034\nCC-MAIN-2021-21,x-iso-8859-11,133,132,0.0000\nCC-MAIN-2021-21,x-windows-874,314100,313897,0.0119\nCC-MAIN-2021-21,x-windows-949,835,826,0.0000\nCC-MAIN-2021-25,<other>,2548,2530,0.0001\nCC-MAIN-2021-25,<unknown>,37897657,37897657,1.5420\nCC-MAIN-2021-25,Big5,1876778,1872546,0.0764\nCC-MAIN-2021-25,Big5-HKSCS,390,390,0.0000\nCC-MAIN-2021-25,EUC-JP,3259616,3242140,0.1326\nCC-MAIN-2021-25,EUC-KR,1988090,1984450,0.0809\nCC-MAIN-2021-25,GB18030,845492,840405,0.0344\nCC-MAIN-2021-25,GB2312,32385844,32349877,1.3178\nCC-MAIN-2021-25,GBK,4784883,4775601,0.1947\nCC-MAIN-2021-25,IBM500,6,6,0.0000\nCC-MAIN-2021-25,IBM855,4578,4549,0.0002\nCC-MAIN-2021-25,IBM866,31399,31277,0.0013\nCC-MAIN-2021-25,ISO-2022-JP,20670,20640,0.0008\nCC-MAIN-2021-25,ISO-8859-1,65509175,65164042,2.6655\nCC-MAIN-2021-25,ISO-8859-13,1147,114
5,0.0000\nCC-MAIN-2021-25,ISO-8859-15,2319193,2307114,0.0944\nCC-MAIN-2021-25,ISO-8859-2,2948728,2935867,0.1200\nCC-MAIN-2021-25,ISO-8859-3,2164,2137,0.0001\nCC-MAIN-2021-25,ISO-8859-4,15003,14965,0.0006\nCC-MAIN-2021-25,ISO-8859-5,64860,64757,0.0026\nCC-MAIN-2021-25,ISO-8859-6,6804,6681,0.0003\nCC-MAIN-2021-25,ISO-8859-7,223876,221277,0.0091\nCC-MAIN-2021-25,ISO-8859-8,11855,11832,0.0005\nCC-MAIN-2021-25,ISO-8859-9,696138,691576,0.0283\nCC-MAIN-2021-25,KOI8-R,153243,152786,0.0062\nCC-MAIN-2021-25,KOI8-U,1871,1870,0.0001\nCC-MAIN-2021-25,Shift_JIS,5553639,5533177,0.2260\nCC-MAIN-2021-25,TIS-620,227539,226915,0.0093\nCC-MAIN-2021-25,US-ASCII,1247684,1243268,0.0508\nCC-MAIN-2021-25,UTF-16,87036,86709,0.0035\nCC-MAIN-2021-25,UTF-16BE,1105,1102,0.0000\nCC-MAIN-2021-25,UTF-16LE,800046,799748,0.0326\nCC-MAIN-2021-25,UTF-32,887,883,0.0000\nCC-MAIN-2021-25,UTF-8,2263285212,2249525530,92.0921\nCC-MAIN-2021-25,windows-1250,2342452,2322446,0.0953\nCC-MAIN-2021-25,windows-1251,16721466,16667727,0.6804\nCC-MAIN-2021-25,windows-1252,9647066,9587278,0.3925\nCC-MAIN-2021-25,windows-1253,90123,89720,0.0037\nCC-MAIN-2021-25,windows-1254,394487,390801,0.0161\nCC-MAIN-2021-25,windows-1255,297442,296000,0.0121\nCC-MAIN-2021-25,windows-1256,1283939,1276475,0.0522\nCC-MAIN-2021-25,windows-1257,172058,171816,0.0070\nCC-MAIN-2021-25,windows-31j,43862,43824,0.0018\nCC-MAIN-2021-25,x-MacCyrillic,68857,68747,0.0028\nCC-MAIN-2021-25,x-iso-8859-11,109,109,0.0000\nCC-MAIN-2021-25,x-windows-874,314181,314023,0.0128\nCC-MAIN-2021-25,x-windows-949,558,552,0.0000\nCC-MAIN-2021-31,<other>,941,931,0.0000\nCC-MAIN-2021-31,<unknown>,33101540,33101540,1.0458\nCC-MAIN-2021-31,Big5,1746082,1739249,0.0552\nCC-MAIN-2021-31,Big5-HKSCS,368,368,0.0000\nCC-MAIN-2021-31,EUC-JP,3601242,3586893,0.1138\nCC-MAIN-2021-31,EUC-KR,2061584,2056162,0.0651\nCC-MAIN-2021-31,GB18030,776964,774391,0.0245\nCC-MAIN-2021-31,GB2312,16228604,16204501,0.5127\nCC-MAIN-2021-31,GBK,4770079,4761315,0.1507\nCC-MAIN-2021-31,IBM855,5916,589
1,0.0002\nCC-MAIN-2021-31,IBM866,34789,34684,0.0011\nCC-MAIN-2021-31,ISO-2022-JP,16968,16934,0.0005\nCC-MAIN-2021-31,ISO-8859-1,69704534,69314967,2.2023\nCC-MAIN-2021-31,ISO-8859-13,967,967,0.0000\nCC-MAIN-2021-31,ISO-8859-15,2690413,2678357,0.0850\nCC-MAIN-2021-31,ISO-8859-2,3112912,3096704,0.0984\nCC-MAIN-2021-31,ISO-8859-3,1981,1969,0.0001\nCC-MAIN-2021-31,ISO-8859-4,15140,15112,0.0005\nCC-MAIN-2021-31,ISO-8859-5,39741,39486,0.0013\nCC-MAIN-2021-31,ISO-8859-6,8839,8495,0.0003\nCC-MAIN-2021-31,ISO-8859-7,248078,245501,0.0078\nCC-MAIN-2021-31,ISO-8859-8,13862,13839,0.0004\nCC-MAIN-2021-31,ISO-8859-9,812828,807988,0.0257\nCC-MAIN-2021-31,KOI8-R,153962,153571,0.0049\nCC-MAIN-2021-31,KOI8-U,2130,2130,0.0001\nCC-MAIN-2021-31,Shift_JIS,5459517,5439606,0.1725\nCC-MAIN-2021-31,TIS-620,213316,212638,0.0067\nCC-MAIN-2021-31,US-ASCII,969686,966874,0.0306\nCC-MAIN-2021-31,UTF-16,59499,59277,0.0019\nCC-MAIN-2021-31,UTF-16BE,496,495,0.0000\nCC-MAIN-2021-31,UTF-16LE,1009122,1008974,0.0319\nCC-MAIN-2021-31,UTF-32,2173,2169,0.0001\nCC-MAIN-2021-31,UTF-8,2983654138,2967559386,94.2676\nCC-MAIN-2021-31,windows-1250,2642704,2625640,0.0835\nCC-MAIN-2021-31,windows-1251,19819117,19755751,0.6262\nCC-MAIN-2021-31,windows-1252,9331815,9287319,0.2948\nCC-MAIN-2021-31,windows-1253,80898,80393,0.0026\nCC-MAIN-2021-31,windows-1254,433628,431608,0.0137\nCC-MAIN-2021-31,windows-1255,330829,329309,0.0105\nCC-MAIN-2021-31,windows-1256,1340695,1332182,0.0424\nCC-MAIN-2021-31,windows-1257,191335,189990,0.0060\nCC-MAIN-2021-31,windows-31j,36941,36910,0.0012\nCC-MAIN-2021-31,x-MacCyrillic,70916,70740,0.0022\nCC-MAIN-2021-31,x-iso-8859-11,187,187,0.0000\nCC-MAIN-2021-31,x-windows-874,291907,291468,0.0092\nCC-MAIN-2021-31,x-windows-949,472,466,0.0000\nCC-MAIN-2021-39,<other>,2394,2364,0.0001\nCC-MAIN-2021-39,<unknown>,60375930,60375930,2.0398\nCC-MAIN-2021-39,Big5,2540677,2529693,0.0858\nCC-MAIN-2021-39,Big5-HKSCS,330,330,0.0000\nCC-MAIN-2021-39,EUC-JP,4484534,4468010,0.1515\nCC-MAIN-2021-39,EUC-KR,2842
226,2835924,0.0960\nCC-MAIN-2021-39,GB18030,883901,881113,0.0299\nCC-MAIN-2021-39,GB2312,18416820,18388759,0.6222\nCC-MAIN-2021-39,GBK,5942448,5933998,0.2008\nCC-MAIN-2021-39,IBM500,3,3,0.0000\nCC-MAIN-2021-39,IBM855,6203,6179,0.0002\nCC-MAIN-2021-39,IBM866,35731,35648,0.0012\nCC-MAIN-2021-39,ISO-2022-JP,24955,24909,0.0008\nCC-MAIN-2021-39,ISO-8859-1,76893067,76519387,2.5978\nCC-MAIN-2021-39,ISO-8859-13,1663,1660,0.0001\nCC-MAIN-2021-39,ISO-8859-15,2905762,2891181,0.0982\nCC-MAIN-2021-39,ISO-8859-16,2097,2092,0.0001\nCC-MAIN-2021-39,ISO-8859-2,3997367,3979679,0.1351\nCC-MAIN-2021-39,ISO-8859-3,2521,2501,0.0001\nCC-MAIN-2021-39,ISO-8859-4,22885,22840,0.0008\nCC-MAIN-2021-39,ISO-8859-5,68229,68099,0.0023\nCC-MAIN-2021-39,ISO-8859-6,10722,10370,0.0004\nCC-MAIN-2021-39,ISO-8859-7,278143,275072,0.0094\nCC-MAIN-2021-39,ISO-8859-8,13860,13688,0.0005\nCC-MAIN-2021-39,ISO-8859-9,791086,788076,0.0267\nCC-MAIN-2021-39,KOI8-R,205060,204605,0.0069\nCC-MAIN-2021-39,KOI8-U,3402,3402,0.0001\nCC-MAIN-2021-39,Shift_JIS,6564609,6535249,0.2218\nCC-MAIN-2021-39,TIS-620,273629,272934,0.0092\nCC-MAIN-2021-39,US-ASCII,1005558,1003021,0.0340\nCC-MAIN-2021-39,UTF-16,90792,90586,0.0031\nCC-MAIN-2021-39,UTF-16BE,1122,1119,0.0000\nCC-MAIN-2021-39,UTF-16LE,1213545,1213386,0.0410\nCC-MAIN-2021-39,UTF-32,3393,3386,0.0001\nCC-MAIN-2021-39,UTF-32LE,1,1,0.0000\nCC-MAIN-2021-39,UTF-8,2731852151,2715118313,92.2953\nCC-MAIN-2021-39,windows-1250,2742707,2728801,0.0927\nCC-MAIN-2021-39,windows-1251,20967421,20900251,0.7084\nCC-MAIN-2021-39,windows-1252,11069833,11010136,0.3740\nCC-MAIN-2021-39,windows-1253,103943,103653,0.0035\nCC-MAIN-2021-39,windows-1254,496627,494709,0.0168\nCC-MAIN-2021-39,windows-1255,426528,422898,0.0144\nCC-MAIN-2021-39,windows-1256,1532448,1523604,0.0518\nCC-MAIN-2021-39,windows-1257,255772,254811,0.0086\nCC-MAIN-2021-39,windows-31j,37837,37733,0.0013\nCC-MAIN-2021-39,x-MacCyrillic,82907,82764,0.0028\nCC-MAIN-2021-39,x-iso-8859-11,394,394,0.0000\nCC-MAIN-2021-39,x-windows-874,4300
20,429402,0.0145\nCC-MAIN-2021-39,x-windows-949,526,523,0.0000\nCC-MAIN-2021-43,<other>,3039,3002,0.0001\nCC-MAIN-2021-43,<unknown>,67951923,67951923,2.0289\nCC-MAIN-2021-43,Big5,2136494,2128115,0.0638\nCC-MAIN-2021-43,Big5-HKSCS,308,308,0.0000\nCC-MAIN-2021-43,EUC-JP,4558758,4543028,0.1361\nCC-MAIN-2021-43,EUC-KR,2840702,2832140,0.0848\nCC-MAIN-2021-43,GB18030,861998,859150,0.0257\nCC-MAIN-2021-43,GB2312,14354260,14330158,0.4286\nCC-MAIN-2021-43,GBK,6909888,6896660,0.2063\nCC-MAIN-2021-43,IBM500,11,11,0.0000\nCC-MAIN-2021-43,IBM855,6844,6816,0.0002\nCC-MAIN-2021-43,IBM866,35429,35378,0.0011\nCC-MAIN-2021-43,ISO-2022-JP,39608,39570,0.0012\nCC-MAIN-2021-43,ISO-8859-1,83533670,83157057,2.4942\nCC-MAIN-2021-43,ISO-8859-13,1895,1894,0.0001\nCC-MAIN-2021-43,ISO-8859-15,2966167,2946401,0.0886\nCC-MAIN-2021-43,ISO-8859-16,5129,5095,0.0002\nCC-MAIN-2021-43,ISO-8859-2,4211845,4189546,0.1258\nCC-MAIN-2021-43,ISO-8859-3,4831,4803,0.0001\nCC-MAIN-2021-43,ISO-8859-4,28573,28471,0.0009\nCC-MAIN-2021-43,ISO-8859-5,90386,89950,0.0027\nCC-MAIN-2021-43,ISO-8859-6,9357,9167,0.0003\nCC-MAIN-2021-43,ISO-8859-7,321631,318246,0.0096\nCC-MAIN-2021-43,ISO-8859-8,14818,14751,0.0004\nCC-MAIN-2021-43,ISO-8859-9,856416,852004,0.0256\nCC-MAIN-2021-43,KOI8-R,247700,246990,0.0074\nCC-MAIN-2021-43,KOI8-U,2975,2973,0.0001\nCC-MAIN-2021-43,Shift_JIS,6894989,6867435,0.2059\nCC-MAIN-2021-43,TIS-620,282908,281922,0.0084\nCC-MAIN-2021-43,US-ASCII,1326446,1309113,0.0396\nCC-MAIN-2021-43,UTF-16,74587,74391,0.0022\nCC-MAIN-2021-43,UTF-16BE,1254,1252,0.0000\nCC-MAIN-2021-43,UTF-16LE,1283333,1283091,0.0383\nCC-MAIN-2021-43,UTF-32,1499,1494,0.0000\nCC-MAIN-2021-43,UTF-32LE,1,1,0.0000\nCC-MAIN-2021-43,UTF-8,3105556653,3089479136,92.7259\nCC-MAIN-2021-43,windows-1250,2909080,2897780,0.0869\nCC-MAIN-2021-43,windows-1251,22979951,22911361,0.6861\nCC-MAIN-2021-43,windows-1252,12296119,12233230,0.3671\nCC-MAIN-2021-43,windows-1253,99677,99445,0.0030\nCC-MAIN-2021-43,windows-1254,572127,569356,0.0171\nCC-MAIN-2021-43
,windows-1255,483166,481249,0.0144\nCC-MAIN-2021-43,windows-1256,1569198,1556843,0.0469\nCC-MAIN-2021-43,windows-1257,254234,251837,0.0076\nCC-MAIN-2021-43,windows-31j,59062,58985,0.0018\nCC-MAIN-2021-43,x-MacCyrillic,96339,96189,0.0029\nCC-MAIN-2021-43,x-iso-8859-11,637,637,0.0000\nCC-MAIN-2021-43,x-windows-874,441543,440830,0.0132\nCC-MAIN-2021-43,x-windows-949,557,544,0.0000\nCC-MAIN-2021-49,<other>,2361,2335,0.0001\nCC-MAIN-2021-49,<unknown>,70534571,70534571,2.7912\nCC-MAIN-2021-49,Big5,2152904,2143292,0.0852\nCC-MAIN-2021-49,Big5-HKSCS,1093,1088,0.0000\nCC-MAIN-2021-49,EUC-JP,4060922,4043119,0.1607\nCC-MAIN-2021-49,EUC-KR,2722855,2715454,0.1077\nCC-MAIN-2021-49,GB18030,784345,781630,0.0310\nCC-MAIN-2021-49,GB2312,12086646,12062146,0.4783\nCC-MAIN-2021-49,GBK,5951196,5941694,0.2355\nCC-MAIN-2021-49,IBM420,227256,226867,0.0090\nCC-MAIN-2021-49,IBM424,64129,63995,0.0025\nCC-MAIN-2021-49,IBM500,22537,22412,0.0009\nCC-MAIN-2021-49,IBM855,55,54,0.0000\nCC-MAIN-2021-49,IBM866,8208,8200,0.0003\nCC-MAIN-2021-49,ISO-2022-JP,38251,38221,0.0015\nCC-MAIN-2021-49,ISO-8859-1,85945252,85418910,3.4010\nCC-MAIN-2021-49,ISO-8859-13,1754,1754,0.0001\nCC-MAIN-2021-49,ISO-8859-15,2305718,2282248,0.0912\nCC-MAIN-2021-49,ISO-8859-16,2189,2161,0.0001\nCC-MAIN-2021-49,ISO-8859-2,4493856,4447362,0.1778\nCC-MAIN-2021-49,ISO-8859-3,7806,7778,0.0003\nCC-MAIN-2021-49,ISO-8859-4,22841,22785,0.0009\nCC-MAIN-2021-49,ISO-8859-5,95938,92908,0.0038\nCC-MAIN-2021-49,ISO-8859-6,8856,8522,0.0004\nCC-MAIN-2021-49,ISO-8859-7,271281,265653,0.0107\nCC-MAIN-2021-49,ISO-8859-8,12665,12593,0.0005\nCC-MAIN-2021-49,ISO-8859-9,993407,987300,0.0393\nCC-MAIN-2021-49,KOI8-R,216880,215702,0.0086\nCC-MAIN-2021-49,KOI8-U,3170,3169,0.0001\nCC-MAIN-2021-49,Shift_JIS,6560521,6530688,0.2596\nCC-MAIN-2021-49,TIS-620,258124,257032,0.0102\nCC-MAIN-2021-49,US-ASCII,1052515,1041593,0.0416\nCC-MAIN-2021-49,UTF-16,62756,62577,0.0025\nCC-MAIN-2021-49,UTF-16BE,2794,2791,0.0001\nCC-MAIN-2021-49,UTF-16LE,1195402,1194998,0.0473\nC
C-MAIN-2021-49,UTF-32,1115,1110,0.0000\nCC-MAIN-2021-49,UTF-32LE,4875,4868,0.0002\nCC-MAIN-2021-49,UTF-8,2293597685,2278173858,90.7609\nCC-MAIN-2021-49,windows-1250,2474049,2460919,0.0979\nCC-MAIN-2021-49,windows-1251,18240239,18163881,0.7218\nCC-MAIN-2021-49,windows-1252,7182076,7148646,0.2842\nCC-MAIN-2021-49,windows-1253,93198,92977,0.0037\nCC-MAIN-2021-49,windows-1254,499832,497348,0.0198\nCC-MAIN-2021-49,windows-1255,411765,409482,0.0163\nCC-MAIN-2021-49,windows-1256,1715161,1692693,0.0679\nCC-MAIN-2021-49,windows-1257,227816,223747,0.0090\nCC-MAIN-2021-49,windows-31j,56315,56265,0.0022\nCC-MAIN-2021-49,x-iso-8859-11,520,520,0.0000\nCC-MAIN-2021-49,x-windows-874,399807,399269,0.0158\nCC-MAIN-2021-49,x-windows-949,292,288,0.0000\nCC-MAIN-2022-05,<other>,3070,3043,0.0001\nCC-MAIN-2022-05,<unknown>,58272468,58272468,1.9513\nCC-MAIN-2022-05,Big5,1873930,1868039,0.0627\nCC-MAIN-2022-05,Big5-HKSCS,113,108,0.0000\nCC-MAIN-2022-05,EUC-JP,4398007,4377526,0.1473\nCC-MAIN-2022-05,EUC-KR,2865968,2860221,0.0960\nCC-MAIN-2022-05,GB18030,852411,848946,0.0285\nCC-MAIN-2022-05,GB2312,12358589,12337655,0.4138\nCC-MAIN-2022-05,GBK,6220013,6209247,0.2083\nCC-MAIN-2022-05,IBM420,227480,227074,0.0076\nCC-MAIN-2022-05,IBM424,55769,55653,0.0019\nCC-MAIN-2022-05,IBM500,62491,62358,0.0021\nCC-MAIN-2022-05,IBM855,64,64,0.0000\nCC-MAIN-2022-05,IBM866,8894,8887,0.0003\nCC-MAIN-2022-05,ISO-2022-JP,30364,30335,0.0010\nCC-MAIN-2022-05,ISO-8859-1,86510692,86100816,2.8968\nCC-MAIN-2022-05,ISO-8859-13,1533,1530,0.0001\nCC-MAIN-2022-05,ISO-8859-15,2470741,2425354,0.0827\nCC-MAIN-2022-05,ISO-8859-16,2526,2495,0.0001\nCC-MAIN-2022-05,ISO-8859-2,4261200,4243257,0.1427\nCC-MAIN-2022-05,ISO-8859-3,6633,6601,0.0002\nCC-MAIN-2022-05,ISO-8859-4,28285,28219,0.0009\nCC-MAIN-2022-05,ISO-8859-5,76399,75986,0.0026\nCC-MAIN-2022-05,ISO-8859-6,7819,7702,0.0003\nCC-MAIN-2022-05,ISO-8859-7,255321,252973,0.0085\nCC-MAIN-2022-05,ISO-8859-8,13631,13593,0.0005\nCC-MAIN-2022-05,ISO-8859-9,921323,916895,0.0309\nCC-MAIN
-2022-05,KOI8-R,214403,212805,0.0072\nCC-MAIN-2022-05,KOI8-U,2338,2335,0.0001\nCC-MAIN-2022-05,Shift_JIS,6391799,6368519,0.2140\nCC-MAIN-2022-05,TIS-620,267181,266527,0.0089\nCC-MAIN-2022-05,US-ASCII,1231162,1223229,0.0412\nCC-MAIN-2022-05,UTF-16,69580,69372,0.0023\nCC-MAIN-2022-05,UTF-16BE,2296,2293,0.0001\nCC-MAIN-2022-05,UTF-16LE,50067,49840,0.0017\nCC-MAIN-2022-05,UTF-32,1352,1348,0.0000\nCC-MAIN-2022-05,UTF-32LE,8185,8182,0.0003\nCC-MAIN-2022-05,UTF-8,2763729059,2749217235,92.5441\nCC-MAIN-2022-05,windows-1250,2653864,2639730,0.0889\nCC-MAIN-2022-05,windows-1251,19702502,19643385,0.6597\nCC-MAIN-2022-05,windows-1252,7165279,7134530,0.2399\nCC-MAIN-2022-05,windows-1253,103735,103471,0.0035\nCC-MAIN-2022-05,windows-1254,465119,462321,0.0156\nCC-MAIN-2022-05,windows-1255,380462,378929,0.0127\nCC-MAIN-2022-05,windows-1256,1529271,1517419,0.0512\nCC-MAIN-2022-05,windows-1257,181867,180023,0.0061\nCC-MAIN-2022-05,windows-31j,67199,67135,0.0023\nCC-MAIN-2022-05,x-iso-8859-11,333,332,0.0000\nCC-MAIN-2022-05,x-windows-874,388728,388294,0.0130\nCC-MAIN-2022-05,x-windows-949,515,508,0.0000\nCC-MAIN-2022-21,<other>,4459,4383,0.0001\nCC-MAIN-2022-21,<unknown>,62534913,62534913,1.8127\nCC-MAIN-2022-21,Big5,2130286,2122150,0.0618\nCC-MAIN-2022-21,Big5-HKSCS,264,259,0.0000\nCC-MAIN-2022-21,EUC-JP,4391507,4367821,0.1273\nCC-MAIN-2022-21,EUC-KR,2621982,2616295,0.0760\nCC-MAIN-2022-21,GB18030,778934,775683,0.0226\nCC-MAIN-2022-21,GB2312,12490980,12470478,0.3621\nCC-MAIN-2022-21,GBK,5857490,5849073,0.1698\nCC-MAIN-2022-21,IBM420,202995,202557,0.0059\nCC-MAIN-2022-21,IBM424,37597,37478,0.0011\nCC-MAIN-2022-21,IBM500,47536,47448,0.0014\nCC-MAIN-2022-21,IBM855,100,100,0.0000\nCC-MAIN-2022-21,IBM866,10292,10286,0.0003\nCC-MAIN-2022-21,ISO-2022-JP,40207,40164,0.0012\nCC-MAIN-2022-21,ISO-8859-1,85691240,85206626,2.4839\nCC-MAIN-2022-21,ISO-8859-13,1736,1734,0.0001\nCC-MAIN-2022-21,ISO-8859-15,2530790,2511429,0.0734\nCC-MAIN-2022-21,ISO-8859-16,2157,2154,0.0001\nCC-MAIN-2022-21,ISO-8859-
2,3918750,3887658,0.1136\nCC-MAIN-2022-21,ISO-8859-3,22733,22654,0.0007\nCC-MAIN-2022-21,ISO-8859-4,30950,30864,0.0009\nCC-MAIN-2022-21,ISO-8859-5,80101,78792,0.0023\nCC-MAIN-2022-21,ISO-8859-6,11501,11311,0.0003\nCC-MAIN-2022-21,ISO-8859-7,294177,291481,0.0085\nCC-MAIN-2022-21,ISO-8859-8,10859,10828,0.0003\nCC-MAIN-2022-21,ISO-8859-9,903881,896769,0.0262\nCC-MAIN-2022-21,KOI8-R,188401,186948,0.0055\nCC-MAIN-2022-21,KOI8-U,4582,4579,0.0001\nCC-MAIN-2022-21,Shift_JIS,6525666,6495930,0.1892\nCC-MAIN-2022-21,TIS-620,254564,253517,0.0074\nCC-MAIN-2022-21,US-ASCII,1072834,1071238,0.0311\nCC-MAIN-2022-21,UTF-16,73723,73370,0.0021\nCC-MAIN-2022-21,UTF-16BE,5207,5193,0.0002\nCC-MAIN-2022-21,UTF-16LE,37050,36805,0.0011\nCC-MAIN-2022-21,UTF-32,2180,2155,0.0001\nCC-MAIN-2022-21,UTF-32LE,3056,3055,0.0001\nCC-MAIN-2022-21,UTF-8,3223670170,3202581798,93.4445\nCC-MAIN-2022-21,windows-1250,2684314,2667317,0.0778\nCC-MAIN-2022-21,windows-1251,20758411,20659810,0.6017\nCC-MAIN-2022-21,windows-1252,6960710,6926645,0.2018\nCC-MAIN-2022-21,windows-1253,99534,99052,0.0029\nCC-MAIN-2022-21,windows-1254,482690,480043,0.0140\nCC-MAIN-2022-21,windows-1255,349916,348570,0.0101\nCC-MAIN-2022-21,windows-1256,1348945,1329862,0.0391\nCC-MAIN-2022-21,windows-1257,219168,214824,0.0064\nCC-MAIN-2022-21,windows-31j,39038,38933,0.0011\nCC-MAIN-2022-21,x-iso-8859-11,474,470,0.0000\nCC-MAIN-2022-21,x-windows-874,394930,393891,0.0114\nCC-MAIN-2022-21,x-windows-949,235,231,0.0000\nCC-MAIN-2022-27,<other>,3131,3104,0.0001\nCC-MAIN-2022-27,<unknown>,65588883,65588883,2.1092\nCC-MAIN-2022-27,Big5,2098710,2093634,0.0675\nCC-MAIN-2022-27,Big5-HKSCS,936,932,0.0000\nCC-MAIN-2022-27,EUC-JP,4327367,4307364,0.1392\nCC-MAIN-2022-27,EUC-KR,2797852,2791842,0.0900\nCC-MAIN-2022-27,GB18030,772832,770608,0.0249\nCC-MAIN-2022-27,GB2312,11921681,11872646,0.3834\nCC-MAIN-2022-27,GBK,5607801,5599121,0.1803\nCC-MAIN-2022-27,IBM420,201882,201538,0.0065\nCC-MAIN-2022-27,IBM424,35765,35667,0.0012\nCC-MAIN-2022-27,IBM500,47212,47
144,0.0015\nCC-MAIN-2022-27,IBM855,86,86,0.0000\nCC-MAIN-2022-27,IBM866,8385,8374,0.0003\nCC-MAIN-2022-27,ISO-2022-JP,40607,40555,0.0013\nCC-MAIN-2022-27,ISO-8859-1,80145325,79792550,2.5773\nCC-MAIN-2022-27,ISO-8859-13,1897,1897,0.0001\nCC-MAIN-2022-27,ISO-8859-15,2337951,2321222,0.0752\nCC-MAIN-2022-27,ISO-8859-16,2686,2680,0.0001\nCC-MAIN-2022-27,ISO-8859-2,3936593,3922466,0.1266\nCC-MAIN-2022-27,ISO-8859-3,19388,19299,0.0006\nCC-MAIN-2022-27,ISO-8859-4,34033,33908,0.0011\nCC-MAIN-2022-27,ISO-8859-5,62090,61803,0.0020\nCC-MAIN-2022-27,ISO-8859-6,9789,9745,0.0003\nCC-MAIN-2022-27,ISO-8859-7,270080,268471,0.0087\nCC-MAIN-2022-27,ISO-8859-8,12245,12212,0.0004\nCC-MAIN-2022-27,ISO-8859-9,908910,906441,0.0292\nCC-MAIN-2022-27,KOI8-R,177437,176655,0.0057\nCC-MAIN-2022-27,KOI8-U,1543,1531,0.0000\nCC-MAIN-2022-27,Shift_JIS,6305180,6276730,0.2028\nCC-MAIN-2022-27,TIS-620,266252,264700,0.0086\nCC-MAIN-2022-27,US-ASCII,1020560,1018212,0.0328\nCC-MAIN-2022-27,UTF-16,82083,81789,0.0026\nCC-MAIN-2022-27,UTF-16BE,5774,5768,0.0002\nCC-MAIN-2022-27,UTF-16LE,48010,47704,0.0015\nCC-MAIN-2022-27,UTF-32,1999,1995,0.0001\nCC-MAIN-2022-27,UTF-32LE,3817,3814,0.0001\nCC-MAIN-2022-27,UTF-8,2888546541,2871491753,92.8910\nCC-MAIN-2022-27,windows-1250,2645076,2631695,0.0851\nCC-MAIN-2022-27,windows-1251,19604528,19538685,0.6304\nCC-MAIN-2022-27,windows-1252,6750056,6720927,0.2171\nCC-MAIN-2022-27,windows-1253,106944,106265,0.0034\nCC-MAIN-2022-27,windows-1254,477813,475307,0.0154\nCC-MAIN-2022-27,windows-1255,357812,356860,0.0115\nCC-MAIN-2022-27,windows-1256,1368775,1356327,0.0440\nCC-MAIN-2022-27,windows-1257,203210,202544,0.0065\nCC-MAIN-2022-27,windows-31j,28637,28509,0.0009\nCC-MAIN-2022-27,x-iso-8859-11,2161,1958,0.0001\nCC-MAIN-2022-27,x-windows-874,411102,410637,0.0132\nCC-MAIN-2022-27,x-windows-949,245,242,0.0000\nCC-MAIN-2022-33,<other>,4048,3955,0.0002\nCC-MAIN-2022-33,<unknown>,63474865,63474865,2.4520\nCC-MAIN-2022-33,Big5,2046173,2036954,0.0790\nCC-MAIN-2022-33,Big5-HKSCS,301,29
0,0.0000\nCC-MAIN-2022-33,EUC-JP,3781250,3760292,0.1461\nCC-MAIN-2022-33,EUC-KR,2797914,2790295,0.1081\nCC-MAIN-2022-33,GB18030,699511,698244,0.0270\nCC-MAIN-2022-33,GB2312,10563345,10547117,0.4081\nCC-MAIN-2022-33,GBK,4837357,4827515,0.1869\nCC-MAIN-2022-33,IBM420,208751,208111,0.0081\nCC-MAIN-2022-33,IBM424,41882,41765,0.0016\nCC-MAIN-2022-33,IBM500,48788,48653,0.0019\nCC-MAIN-2022-33,IBM855,74,74,0.0000\nCC-MAIN-2022-33,IBM866,11425,11412,0.0004\nCC-MAIN-2022-33,ISO-2022-JP,35906,35867,0.0014\nCC-MAIN-2022-33,ISO-8859-1,78089451,77555842,3.0166\nCC-MAIN-2022-33,ISO-8859-13,3228,3226,0.0001\nCC-MAIN-2022-33,ISO-8859-15,2103144,2088779,0.0812\nCC-MAIN-2022-33,ISO-8859-16,2587,2560,0.0001\nCC-MAIN-2022-33,ISO-8859-2,3922148,3884502,0.1515\nCC-MAIN-2022-33,ISO-8859-3,17022,16966,0.0007\nCC-MAIN-2022-33,ISO-8859-4,28474,28343,0.0011\nCC-MAIN-2022-33,ISO-8859-5,68943,67114,0.0027\nCC-MAIN-2022-33,ISO-8859-6,11268,11198,0.0004\nCC-MAIN-2022-33,ISO-8859-7,274412,271033,0.0106\nCC-MAIN-2022-33,ISO-8859-8,9916,9881,0.0004\nCC-MAIN-2022-33,ISO-8859-9,868130,862279,0.0335\nCC-MAIN-2022-33,KOI8-R,187929,186688,0.0073\nCC-MAIN-2022-33,KOI8-U,2421,2420,0.0001\nCC-MAIN-2022-33,Shift_JIS,5822621,5798117,0.2249\nCC-MAIN-2022-33,TIS-620,255991,252946,0.0099\nCC-MAIN-2022-33,US-ASCII,1028880,1026114,0.0397\nCC-MAIN-2022-33,UTF-16,81345,80992,0.0031\nCC-MAIN-2022-33,UTF-16BE,2739,2728,0.0001\nCC-MAIN-2022-33,UTF-16LE,47817,47534,0.0018\nCC-MAIN-2022-33,UTF-32,1053,1048,0.0000\nCC-MAIN-2022-33,UTF-32LE,3193,3186,0.0001\nCC-MAIN-2022-33,UTF-8,2378134910,2360525191,91.8663\nCC-MAIN-2022-33,windows-1250,2398981,2386016,0.0927\nCC-MAIN-2022-33,windows-1251,17367262,17294922,0.6709\nCC-MAIN-2022-33,windows-1252,6346278,6311706,0.2452\nCC-MAIN-2022-33,windows-1253,98373,97990,0.0038\nCC-MAIN-2022-33,windows-1254,441583,438539,0.0171\nCC-MAIN-2022-33,windows-1255,354620,351541,0.0137\nCC-MAIN-2022-33,windows-1256,1534004,1511112,0.0593\nCC-MAIN-2022-33,windows-1257,228480,222615,0.0088\nCC-M
AIN-2022-33,windows-31j,36863,36738,0.0014\nCC-MAIN-2022-33,x-iso-8859-11,1457,1290,0.0001\nCC-MAIN-2022-33,x-windows-874,362783,360689,0.0140\nCC-MAIN-2022-33,x-windows-949,354,352,0.0000\nCC-MAIN-2022-40,<other>,3838,3804,0.0001\nCC-MAIN-2022-40,<unknown>,54853944,54853944,1.7267\nCC-MAIN-2022-40,Big5,1990520,1985842,0.0627\nCC-MAIN-2022-40,Big5-HKSCS,395,390,0.0000\nCC-MAIN-2022-40,EUC-JP,3534560,3517634,0.1113\nCC-MAIN-2022-40,EUC-KR,2633133,2627691,0.0829\nCC-MAIN-2022-40,GB18030,712242,711201,0.0224\nCC-MAIN-2022-40,GB2312,11998590,11988411,0.3777\nCC-MAIN-2022-40,GBK,4968851,4960990,0.1564\nCC-MAIN-2022-40,IBM420,192614,192271,0.0061\nCC-MAIN-2022-40,IBM424,54171,54086,0.0017\nCC-MAIN-2022-40,IBM500,50098,49891,0.0016\nCC-MAIN-2022-40,IBM855,86,86,0.0000\nCC-MAIN-2022-40,IBM866,7565,7555,0.0002\nCC-MAIN-2022-40,ISO-2022-JP,28347,28311,0.0009\nCC-MAIN-2022-40,ISO-8859-1,73062040,72676985,2.2999\nCC-MAIN-2022-40,ISO-8859-13,3337,3337,0.0001\nCC-MAIN-2022-40,ISO-8859-15,2214200,2192838,0.0697\nCC-MAIN-2022-40,ISO-8859-16,4067,4057,0.0001\nCC-MAIN-2022-40,ISO-8859-2,3748136,3724055,0.1180\nCC-MAIN-2022-40,ISO-8859-3,11781,11742,0.0004\nCC-MAIN-2022-40,ISO-8859-4,23528,23437,0.0007\nCC-MAIN-2022-40,ISO-8859-5,60789,60179,0.0019\nCC-MAIN-2022-40,ISO-8859-6,16036,15939,0.0005\nCC-MAIN-2022-40,ISO-8859-7,240785,237898,0.0076\nCC-MAIN-2022-40,ISO-8859-8,12537,12513,0.0004\nCC-MAIN-2022-40,ISO-8859-9,631209,628336,0.0199\nCC-MAIN-2022-40,KOI8-R,186416,185379,0.0059\nCC-MAIN-2022-40,KOI8-U,911,909,0.0000\nCC-MAIN-2022-40,Shift_JIS,5003109,4990509,0.1575\nCC-MAIN-2022-40,TIS-620,239820,237555,0.0075\nCC-MAIN-2022-40,US-ASCII,930477,928739,0.0293\nCC-MAIN-2022-40,UTF-16,75083,74864,0.0024\nCC-MAIN-2022-40,UTF-16BE,4094,4091,0.0001\nCC-MAIN-2022-40,UTF-16LE,41253,41018,0.0013\nCC-MAIN-2022-40,UTF-32,1776,1776,0.0001\nCC-MAIN-2022-40,UTF-32LE,6654,6654,0.0002\nCC-MAIN-2022-40,UTF-8,2980330903,2964437256,93.8166\nCC-MAIN-2022-40,windows-1250,2489660,2477890,0.0784\nCC-MAIN-2
022-40,windows-1251,17828058,17762216,0.5612\nCC-MAIN-2022-40,windows-1252,5944137,5915876,0.1871\nCC-MAIN-2022-40,windows-1253,78423,78242,0.0025\nCC-MAIN-2022-40,windows-1254,372193,369163,0.0117\nCC-MAIN-2022-40,windows-1255,136627,136222,0.0043\nCC-MAIN-2022-40,windows-1256,1481807,1466796,0.0466\nCC-MAIN-2022-40,windows-1257,211528,208148,0.0067\nCC-MAIN-2022-40,windows-31j,30196,30108,0.0010\nCC-MAIN-2022-40,x-iso-8859-11,634,618,0.0000\nCC-MAIN-2022-40,x-windows-874,311583,311424,0.0098\nCC-MAIN-2022-40,x-windows-949,307,304,0.0000\nCC-MAIN-2022-49,<other>,3783,3756,0.0001\nCC-MAIN-2022-49,<unknown>,60767969,60767969,1.7970\nCC-MAIN-2022-49,Big5,1900927,1899531,0.0562\nCC-MAIN-2022-49,Big5-HKSCS,496,491,0.0000\nCC-MAIN-2022-49,EUC-JP,3990047,3969969,0.1180\nCC-MAIN-2022-49,EUC-KR,2843354,2835955,0.0841\nCC-MAIN-2022-49,GB18030,675698,674292,0.0200\nCC-MAIN-2022-49,GB2312,11153118,11139987,0.3298\nCC-MAIN-2022-49,GBK,4664932,4655033,0.1379\nCC-MAIN-2022-49,IBM420,189924,189434,0.0056\nCC-MAIN-2022-49,IBM424,37172,37076,0.0011\nCC-MAIN-2022-49,IBM500,21192,21083,0.0006\nCC-MAIN-2022-49,IBM855,66,66,0.0000\nCC-MAIN-2022-49,IBM866,5015,5006,0.0001\nCC-MAIN-2022-49,ISO-2022-JP,32421,32059,0.0010\nCC-MAIN-2022-49,ISO-8859-1,79859205,79271758,2.3616\nCC-MAIN-2022-49,ISO-8859-13,1754,1754,0.0001\nCC-MAIN-2022-49,ISO-8859-15,2472403,2454169,0.0731\nCC-MAIN-2022-49,ISO-8859-16,7447,7236,0.0002\nCC-MAIN-2022-49,ISO-8859-2,4386349,4335950,0.1297\nCC-MAIN-2022-49,ISO-8859-3,11400,11363,0.0003\nCC-MAIN-2022-49,ISO-8859-4,30532,30464,0.0009\nCC-MAIN-2022-49,ISO-8859-5,84907,82672,0.0025\nCC-MAIN-2022-49,ISO-8859-6,3322,3314,0.0001\nCC-MAIN-2022-49,ISO-8859-7,294476,286493,0.0087\nCC-MAIN-2022-49,ISO-8859-8,14583,14538,0.0004\nCC-MAIN-2022-49,ISO-8859-9,786517,782149,0.0233\nCC-MAIN-2022-49,KOI8-R,209553,208622,0.0062\nCC-MAIN-2022-49,KOI8-U,393,390,0.0000\nCC-MAIN-2022-49,Shift_JIS,5475663,5458830,0.1619\nCC-MAIN-2022-49,TIS-620,227363,225238,0.0067\nCC-MAIN-2022-49,US-ASCI
I,909753,907902,0.0269\nCC-MAIN-2022-49,UTF-16,88406,88065,0.0026\nCC-MAIN-2022-49,UTF-16BE,3710,3707,0.0001\nCC-MAIN-2022-49,UTF-16LE,51583,51409,0.0015\nCC-MAIN-2022-49,UTF-32,2101,2096,0.0001\nCC-MAIN-2022-49,UTF-32LE,5158,5157,0.0002\nCC-MAIN-2022-49,UTF-8,3169345819,3149457005,93.7229\nCC-MAIN-2022-49,windows-1250,2670026,2654677,0.0790\nCC-MAIN-2022-49,windows-1251,18903183,18828157,0.5590\nCC-MAIN-2022-49,windows-1252,6303996,6277921,0.1864\nCC-MAIN-2022-49,windows-1253,98073,97845,0.0029\nCC-MAIN-2022-49,windows-1254,407609,403722,0.0121\nCC-MAIN-2022-49,windows-1255,130171,129505,0.0038\nCC-MAIN-2022-49,windows-1256,1850776,1807164,0.0547\nCC-MAIN-2022-49,windows-1257,320523,311722,0.0095\nCC-MAIN-2022-49,windows-31j,38170,38081,0.0011\nCC-MAIN-2022-49,x-iso-8859-11,448,444,0.0000\nCC-MAIN-2022-49,x-windows-874,331305,330582,0.0098\nCC-MAIN-2022-49,x-windows-949,97,93,0.0000\nCC-MAIN-2023-06,<other>,3880,3843,0.0001\nCC-MAIN-2023-06,<unknown>,53428296,53428296,1.6751\nCC-MAIN-2023-06,Big5,1570920,1569402,0.0493\nCC-MAIN-2023-06,Big5-HKSCS,301,295,0.0000\nCC-MAIN-2023-06,EUC-JP,3339173,3324099,0.1047\nCC-MAIN-2023-06,EUC-KR,2669622,2662035,0.0837\nCC-MAIN-2023-06,GB18030,585122,583976,0.0183\nCC-MAIN-2023-06,GB2312,9505113,9496219,0.2980\nCC-MAIN-2023-06,GBK,3711529,3706098,0.1164\nCC-MAIN-2023-06,IBM420,168803,168447,0.0053\nCC-MAIN-2023-06,IBM424,49221,49064,0.0015\nCC-MAIN-2023-06,IBM500,17843,17763,0.0006\nCC-MAIN-2023-06,IBM855,41,41,0.0000\nCC-MAIN-2023-06,IBM866,8946,8934,0.0003\nCC-MAIN-2023-06,ISO-2022-JP,26872,26844,0.0008\nCC-MAIN-2023-06,ISO-8859-1,72180857,71649429,2.2630\nCC-MAIN-2023-06,ISO-8859-13,1607,1606,0.0001\nCC-MAIN-2023-06,ISO-8859-15,2062642,2052508,0.0647\nCC-MAIN-2023-06,ISO-8859-16,5384,5370,0.0002\nCC-MAIN-2023-06,ISO-8859-2,3984824,3933910,0.1249\nCC-MAIN-2023-06,ISO-8859-3,12821,12809,0.0004\nCC-MAIN-2023-06,ISO-8859-4,25396,25102,0.0008\nCC-MAIN-2023-06,ISO-8859-5,76695,73844,0.0024\nCC-MAIN-2023-06,ISO-8859-6,2440,2435,0.0001
\nCC-MAIN-2023-06,ISO-8859-7,278963,274064,0.0087\nCC-MAIN-2023-06,ISO-8859-8,11821,11787,0.0004\nCC-MAIN-2023-06,ISO-8859-9,927456,923200,0.0291\nCC-MAIN-2023-06,KOI8-R,219761,219287,0.0069\nCC-MAIN-2023-06,KOI8-U,568,567,0.0000\nCC-MAIN-2023-06,Shift_JIS,5163212,5150045,0.1619\nCC-MAIN-2023-06,TIS-620,217860,217446,0.0068\nCC-MAIN-2023-06,US-ASCII,902631,899855,0.0283\nCC-MAIN-2023-06,UTF-16,91248,90796,0.0029\nCC-MAIN-2023-06,UTF-16BE,3315,3315,0.0001\nCC-MAIN-2023-06,UTF-16LE,39931,39806,0.0013\nCC-MAIN-2023-06,UTF-32,1685,1682,0.0001\nCC-MAIN-2023-06,UTF-32LE,7348,7334,0.0002\nCC-MAIN-2023-06,UTF-8,2999989926,2982783247,94.0560\nCC-MAIN-2023-06,windows-1250,2422373,2410889,0.0759\nCC-MAIN-2023-06,windows-1251,17439310,17375702,0.5468\nCC-MAIN-2023-06,windows-1252,5643941,5621522,0.1769\nCC-MAIN-2023-06,windows-1253,93613,93247,0.0029\nCC-MAIN-2023-06,windows-1254,368597,365235,0.0116\nCC-MAIN-2023-06,windows-1255,116710,116294,0.0037\nCC-MAIN-2023-06,windows-1256,1593051,1567879,0.0499\nCC-MAIN-2023-06,windows-1257,258990,250402,0.0081\nCC-MAIN-2023-06,windows-31j,35098,35012,0.0011\nCC-MAIN-2023-06,x-iso-8859-11,360,356,0.0000\nCC-MAIN-2023-06,x-windows-874,311823,311501,0.0098\nCC-MAIN-2023-06,x-windows-949,268,265,0.0000\nCC-MAIN-2023-14,<other>,4618,4592,0.0001\nCC-MAIN-2023-14,<unknown>,58906019,58906019,1.8888\nCC-MAIN-2023-14,Big5,2150925,2149054,0.0690\nCC-MAIN-2023-14,Big5-HKSCS,341,336,0.0000\nCC-MAIN-2023-14,EUC-JP,3395888,3382463,0.1089\nCC-MAIN-2023-14,EUC-KR,2555606,2549371,0.0819\nCC-MAIN-2023-14,GB18030,593142,591733,0.0190\nCC-MAIN-2023-14,GB2312,12887775,12877560,0.4133\nCC-MAIN-2023-14,GBK,3714792,3707332,0.1191\nCC-MAIN-2023-14,IBM420,187269,187035,0.0060\nCC-MAIN-2023-14,IBM424,59188,59048,0.0019\nCC-MAIN-2023-14,IBM500,25439,25352,0.0008\nCC-MAIN-2023-14,IBM855,58,58,0.0000\nCC-MAIN-2023-14,IBM866,9920,9875,0.0003\nCC-MAIN-2023-14,ISO-2022-JP,26178,26129,0.0008\nCC-MAIN-2023-14,ISO-8859-1,74036527,73536838,2.3740\nCC-MAIN-2023-14,ISO-8859-
13,1526,1526,0.0000\nCC-MAIN-2023-14,ISO-8859-15,1940614,1928641,0.0622\nCC-MAIN-2023-14,ISO-8859-16,4985,4977,0.0002\nCC-MAIN-2023-14,ISO-8859-2,4091809,4049180,0.1312\nCC-MAIN-2023-14,ISO-8859-3,10869,10852,0.0003\nCC-MAIN-2023-14,ISO-8859-4,25770,25687,0.0008\nCC-MAIN-2023-14,ISO-8859-5,100026,97848,0.0032\nCC-MAIN-2023-14,ISO-8859-6,1406,1401,0.0000\nCC-MAIN-2023-14,ISO-8859-7,314452,311467,0.0101\nCC-MAIN-2023-14,ISO-8859-8,12221,12175,0.0004\nCC-MAIN-2023-14,ISO-8859-9,691831,686978,0.0222\nCC-MAIN-2023-14,KOI8-R,220806,219853,0.0071\nCC-MAIN-2023-14,KOI8-U,783,662,0.0000\nCC-MAIN-2023-14,Shift_JIS,5642872,5626208,0.1809\nCC-MAIN-2023-14,TIS-620,224666,224206,0.0072\nCC-MAIN-2023-14,US-ASCII,906418,904653,0.0291\nCC-MAIN-2023-14,UTF-16,94648,94194,0.0030\nCC-MAIN-2023-14,UTF-16BE,16776,16775,0.0005\nCC-MAIN-2023-14,UTF-16LE,42411,42022,0.0014\nCC-MAIN-2023-14,UTF-32,1181,1178,0.0000\nCC-MAIN-2023-14,UTF-32LE,16797,16794,0.0005\nCC-MAIN-2023-14,UTF-8,2915713807,2898388221,93.4933\nCC-MAIN-2023-14,windows-1250,2570643,2557733,0.0824\nCC-MAIN-2023-14,windows-1251,18292778,18228550,0.5866\nCC-MAIN-2023-14,windows-1252,6085325,6063386,0.1951\nCC-MAIN-2023-14,windows-1253,101576,101320,0.0033\nCC-MAIN-2023-14,windows-1254,339145,335873,0.0109\nCC-MAIN-2023-14,windows-1255,117077,116200,0.0038\nCC-MAIN-2023-14,windows-1256,1815160,1790190,0.0582\nCC-MAIN-2023-14,windows-1257,324496,316878,0.0104\nCC-MAIN-2023-14,windows-31j,28536,28318,0.0009\nCC-MAIN-2023-14,x-iso-8859-11,116,116,0.0000\nCC-MAIN-2023-14,x-windows-874,326783,326411,0.0105\nCC-MAIN-2023-14,x-windows-949,1419,1417,0.0000\nCC-MAIN-2023-23,<other>,5344,5295,0.0002\nCC-MAIN-2023-23,<unknown>,56906950,56906950,1.8120\nCC-MAIN-2023-23,Big5,2154853,2152531,0.0686\nCC-MAIN-2023-23,Big5-HKSCS,223,218,0.0000\nCC-MAIN-2023-23,EUC-JP,3482633,3465709,0.1109\nCC-MAIN-2023-23,EUC-KR,2696277,2690769,0.0859\nCC-MAIN-2023-23,GB18030,539109,537660,0.0172\nCC-MAIN-2023-23,GB2312,8488485,8477902,0.2703\nCC-MAIN-2023-23,GB
K,3473607,3465693,0.1106\nCC-MAIN-2023-23,IBM420,185631,185343,0.0059\nCC-MAIN-2023-23,IBM424,53698,53507,0.0017\nCC-MAIN-2023-23,IBM500,42054,41968,0.0013\nCC-MAIN-2023-23,IBM855,166,166,0.0000\nCC-MAIN-2023-23,IBM866,8632,8624,0.0003\nCC-MAIN-2023-23,ISO-2022-JP,28498,28458,0.0009\nCC-MAIN-2023-23,ISO-8859-1,74871124,74495497,2.3840\nCC-MAIN-2023-23,ISO-8859-13,3656,3656,0.0001\nCC-MAIN-2023-23,ISO-8859-15,1885893,1874477,0.0600\nCC-MAIN-2023-23,ISO-8859-16,4695,4684,0.0001\nCC-MAIN-2023-23,ISO-8859-2,4145594,4114850,0.1320\nCC-MAIN-2023-23,ISO-8859-3,14600,14571,0.0005\nCC-MAIN-2023-23,ISO-8859-4,29561,29516,0.0009\nCC-MAIN-2023-23,ISO-8859-5,99109,98903,0.0032\nCC-MAIN-2023-23,ISO-8859-6,1402,1398,0.0000\nCC-MAIN-2023-23,ISO-8859-7,316559,314996,0.0101\nCC-MAIN-2023-23,ISO-8859-8,10974,10938,0.0003\nCC-MAIN-2023-23,ISO-8859-9,754595,752159,0.0240\nCC-MAIN-2023-23,KOI8-R,198601,198057,0.0063\nCC-MAIN-2023-23,KOI8-U,635,629,0.0000\nCC-MAIN-2023-23,Shift_JIS,5541495,5527965,0.1764\nCC-MAIN-2023-23,TIS-620,226449,225973,0.0072\nCC-MAIN-2023-23,US-ASCII,1046476,1044597,0.0333\nCC-MAIN-2023-23,UTF-16,99457,98953,0.0032\nCC-MAIN-2023-23,UTF-16BE,4172,4169,0.0001\nCC-MAIN-2023-23,UTF-16LE,44526,44350,0.0014\nCC-MAIN-2023-23,UTF-32,1150,1146,0.0000\nCC-MAIN-2023-23,UTF-32LE,24812,24810,0.0008\nCC-MAIN-2023-23,UTF-8,2943485993,2925548997,93.7245\nCC-MAIN-2023-23,windows-1250,2605021,2591390,0.0829\nCC-MAIN-2023-23,windows-1251,17888671,17819618,0.5696\nCC-MAIN-2023-23,windows-1252,6049554,6024689,0.1926\nCC-MAIN-2023-23,windows-1253,99826,99314,0.0032\nCC-MAIN-2023-23,windows-1254,321021,318038,0.0102\nCC-MAIN-2023-23,windows-1255,116547,115121,0.0037\nCC-MAIN-2023-23,windows-1256,1894910,1872893,0.0603\nCC-MAIN-2023-23,windows-1257,356216,355356,0.0113\nCC-MAIN-2023-23,windows-31j,27559,27519,0.0009\nCC-MAIN-2023-23,x-iso-8859-11,155,155,0.0000\nCC-MAIN-2023-23,x-windows-874,335280,334753,0.0107\nCC-MAIN-2023-23,x-windows-949,1520,1517,0.0000\nCC-MAIN-2023-40,<other>,185
5,1850,0.0001\nCC-MAIN-2023-40,<unknown>,61153290,61153290,1.7751\nCC-MAIN-2023-40,Big5,2141625,2138751,0.0622\nCC-MAIN-2023-40,Big5-HKSCS,357,353,0.0000\nCC-MAIN-2023-40,EUC-JP,3752516,3733652,0.1089\nCC-MAIN-2023-40,EUC-KR,2867330,2861428,0.0832\nCC-MAIN-2023-40,GB18030,572545,571176,0.0166\nCC-MAIN-2023-40,GB2312,8559894,8548049,0.2485\nCC-MAIN-2023-40,GBK,3360215,3351905,0.0975\nCC-MAIN-2023-40,IBM420,208112,207754,0.0060\nCC-MAIN-2023-40,IBM424,80668,80391,0.0023\nCC-MAIN-2023-40,IBM500,25820,25542,0.0007\nCC-MAIN-2023-40,IBM855,98,98,0.0000\nCC-MAIN-2023-40,IBM866,8161,8157,0.0002\nCC-MAIN-2023-40,ISO-2022-JP,27858,27835,0.0008\nCC-MAIN-2023-40,ISO-8859-1,77355587,76980197,2.2454\nCC-MAIN-2023-40,ISO-8859-13,2939,2939,0.0001\nCC-MAIN-2023-40,ISO-8859-15,2012269,1995088,0.0584\nCC-MAIN-2023-40,ISO-8859-16,5449,5432,0.0002\nCC-MAIN-2023-40,ISO-8859-2,4257742,4229792,0.1236\nCC-MAIN-2023-40,ISO-8859-3,16905,16856,0.0005\nCC-MAIN-2023-40,ISO-8859-4,38934,38786,0.0011\nCC-MAIN-2023-40,ISO-8859-5,97869,97695,0.0028\nCC-MAIN-2023-40,ISO-8859-6,1641,1637,0.0000\nCC-MAIN-2023-40,ISO-8859-7,297351,296316,0.0086\nCC-MAIN-2023-40,ISO-8859-8,15567,15369,0.0005\nCC-MAIN-2023-40,ISO-8859-9,756751,753104,0.0220\nCC-MAIN-2023-40,KOI8-R,207469,206842,0.0060\nCC-MAIN-2023-40,KOI8-U,860,860,0.0000\nCC-MAIN-2023-40,Shift_JIS,5525259,5508618,0.1604\nCC-MAIN-2023-40,TIS-620,255011,254437,0.0074\nCC-MAIN-2023-40,US-ASCII,935658,934166,0.0272\nCC-MAIN-2023-40,UTF-16,115730,115188,0.0034\nCC-MAIN-2023-40,UTF-16BE,26868,26810,0.0008\nCC-MAIN-2023-40,UTF-16LE,47720,47356,0.0014\nCC-MAIN-2023-40,UTF-32,1749,1735,0.0001\nCC-MAIN-2023-40,UTF-32LE,20448,20443,0.0006\nCC-MAIN-2023-40,UTF-8,3239527476,3214272438,94.0352\nCC-MAIN-2023-40,windows-1250,2830948,2807781,0.0822\nCC-MAIN-2023-40,windows-1251,18307827,18235841,0.5314\nCC-MAIN-2023-40,windows-1252,6305859,6273119,0.1830\nCC-MAIN-2023-40,windows-1253,106562,106099,0.0031\nCC-MAIN-2023-40,windows-1254,353062,346894,0.0102\nCC-MAIN-2023-4
0,windows-1255,139823,138389,0.0041\nCC-MAIN-2023-40,windows-1256,1901824,1892293,0.0552\nCC-MAIN-2023-40,windows-1257,382691,381949,0.0111\nCC-MAIN-2023-40,windows-31j,30180,30137,0.0009\nCC-MAIN-2023-40,x-iso-8859-11,131,131,0.0000\nCC-MAIN-2023-40,x-windows-874,370804,369903,0.0108\nCC-MAIN-2023-40,x-windows-949,1730,1729,0.0001\nCC-MAIN-2023-50,<other>,2448,2441,0.0001\nCC-MAIN-2023-50,<unknown>,67071530,67071530,1.9997\nCC-MAIN-2023-50,Big5,2046752,2043034,0.0610\nCC-MAIN-2023-50,Big5-HKSCS,335,330,0.0000\nCC-MAIN-2023-50,EUC-JP,3723916,3706186,0.1110\nCC-MAIN-2023-50,EUC-KR,3208670,3200738,0.0957\nCC-MAIN-2023-50,GB18030,684571,682974,0.0204\nCC-MAIN-2023-50,GB2312,12228519,12212523,0.3646\nCC-MAIN-2023-50,GBK,4464341,4448812,0.1331\nCC-MAIN-2023-50,IBM420,186075,185676,0.0055\nCC-MAIN-2023-50,IBM424,115361,114858,0.0034\nCC-MAIN-2023-50,IBM500,27745,27652,0.0008\nCC-MAIN-2023-50,IBM855,111,111,0.0000\nCC-MAIN-2023-50,IBM866,6118,6093,0.0002\nCC-MAIN-2023-50,ISO-2022-JP,36404,36325,0.0011\nCC-MAIN-2023-50,ISO-8859-1,76978661,76632626,2.2951\nCC-MAIN-2023-50,ISO-8859-13,1443,1443,0.0000\nCC-MAIN-2023-50,ISO-8859-15,1854467,1837185,0.0553\nCC-MAIN-2023-50,ISO-8859-16,5649,5646,0.0002\nCC-MAIN-2023-50,ISO-8859-2,4146488,4129071,0.1236\nCC-MAIN-2023-50,ISO-8859-3,15829,15802,0.0005\nCC-MAIN-2023-50,ISO-8859-4,27964,27878,0.0008\nCC-MAIN-2023-50,ISO-8859-5,93841,93764,0.0028\nCC-MAIN-2023-50,ISO-8859-6,1584,1579,0.0000\nCC-MAIN-2023-50,ISO-8859-7,283394,282267,0.0084\nCC-MAIN-2023-50,ISO-8859-8,22187,22037,0.0007\nCC-MAIN-2023-50,ISO-8859-9,884541,881970,0.0264\nCC-MAIN-2023-50,KOI8-R,213311,212498,0.0064\nCC-MAIN-2023-50,KOI8-U,1717,1616,0.0001\nCC-MAIN-2023-50,Shift_JIS,6551152,6521040,0.1953\nCC-MAIN-2023-50,TIS-620,207091,206747,0.0062\nCC-MAIN-2023-50,US-ASCII,1084046,1081949,0.0323\nCC-MAIN-2023-50,UTF-16,112859,111831,0.0034\nCC-MAIN-2023-50,UTF-16BE,17020,17010,0.0005\nCC-MAIN-2023-50,UTF-16LE,62286,62032,0.0019\nCC-MAIN-2023-50,UTF-32,1747,1744,0.0001\nCC-
MAIN-2023-50,UTF-32LE,18523,18520,0.0006\nCC-MAIN-2023-50,UTF-8,3136416289,3110998963,93.5115\nCC-MAIN-2023-50,windows-1250,2541731,2528588,0.0758\nCC-MAIN-2023-50,windows-1251,18844003,18766834,0.5618\nCC-MAIN-2023-50,windows-1252,6812501,6778504,0.2031\nCC-MAIN-2023-50,windows-1253,96776,96564,0.0029\nCC-MAIN-2023-50,windows-1254,412693,405520,0.0123\nCC-MAIN-2023-50,windows-1255,229807,228382,0.0069\nCC-MAIN-2023-50,windows-1256,1603266,1599761,0.0478\nCC-MAIN-2023-50,windows-1257,320486,320177,0.0096\nCC-MAIN-2023-50,windows-31j,31643,31577,0.0009\nCC-MAIN-2023-50,x-iso-8859-11,74,74,0.0000\nCC-MAIN-2023-50,x-windows-874,341034,340240,0.0102\nCC-MAIN-2023-50,x-windows-949,3125,3124,0.0001\nCC-MAIN-2024-10,<other>,1872,1866,0.0001\nCC-MAIN-2024-10,<unknown>,52474379,52474379,1.6892\nCC-MAIN-2024-10,Big5,1720776,1712010,0.0554\nCC-MAIN-2024-10,Big5-HKSCS,210,204,0.0000\nCC-MAIN-2024-10,EUC-JP,3291910,3276143,0.1060\nCC-MAIN-2024-10,EUC-KR,2502899,2492750,0.0806\nCC-MAIN-2024-10,GB18030,487187,485961,0.0157\nCC-MAIN-2024-10,GB2312,7563597,7553585,0.2435\nCC-MAIN-2024-10,GBK,3269448,3258878,0.1052\nCC-MAIN-2024-10,IBM420,173328,172952,0.0056\nCC-MAIN-2024-10,IBM424,69118,68817,0.0022\nCC-MAIN-2024-10,IBM500,21223,21107,0.0007\nCC-MAIN-2024-10,IBM855,92,92,0.0000\nCC-MAIN-2024-10,IBM866,4631,4624,0.0001\nCC-MAIN-2024-10,ISO-2022-JP,35887,35865,0.0012\nCC-MAIN-2024-10,ISO-8859-1,72252693,71438420,2.3258\nCC-MAIN-2024-10,ISO-8859-13,1086,1086,0.0000\nCC-MAIN-2024-10,ISO-8859-15,1552323,1541696,0.0500\nCC-MAIN-2024-10,ISO-8859-16,4004,4002,0.0001\nCC-MAIN-2024-10,ISO-8859-2,3917540,3842360,0.1261\nCC-MAIN-2024-10,ISO-8859-3,15595,15552,0.0005\nCC-MAIN-2024-10,ISO-8859-4,20994,20899,0.0007\nCC-MAIN-2024-10,ISO-8859-5,79595,75310,0.0026\nCC-MAIN-2024-10,ISO-8859-6,1619,1616,0.0001\nCC-MAIN-2024-10,ISO-8859-7,295016,289382,0.0095\nCC-MAIN-2024-10,ISO-8859-8,27932,27817,0.0009\nCC-MAIN-2024-10,ISO-8859-9,811766,802940,0.0261\nCC-MAIN-2024-10,KOI8-R,239687,239164,0.0077\nCC-
MAIN-2024-10,KOI8-U,1379,1371,0.0000\nCC-MAIN-2024-10,Shift_JIS,5793378,5767740,0.1865\nCC-MAIN-2024-10,TIS-620,157823,157481,0.0051\nCC-MAIN-2024-10,US-ASCII,1083391,1081894,0.0349\nCC-MAIN-2024-10,UTF-16,104664,104156,0.0034\nCC-MAIN-2024-10,UTF-16BE,8451,8447,0.0003\nCC-MAIN-2024-10,UTF-16LE,46440,46193,0.0015\nCC-MAIN-2024-10,UTF-32,780,778,0.0000\nCC-MAIN-2024-10,UTF-32LE,10093,10067,0.0003\nCC-MAIN-2024-10,UTF-8,2921155030,2897183678,94.0329\nCC-MAIN-2024-10,windows-1250,2323148,2305341,0.0748\nCC-MAIN-2024-10,windows-1251,16307933,16211375,0.5250\nCC-MAIN-2024-10,windows-1252,5703381,5672108,0.1836\nCC-MAIN-2024-10,windows-1253,81058,80831,0.0026\nCC-MAIN-2024-10,windows-1254,296493,295225,0.0095\nCC-MAIN-2024-10,windows-1255,236524,231027,0.0076\nCC-MAIN-2024-10,windows-1256,1669815,1609433,0.0538\nCC-MAIN-2024-10,windows-1257,388184,375050,0.0125\nCC-MAIN-2024-10,windows-31j,15814,15773,0.0005\nCC-MAIN-2024-10,x-iso-8859-11,100,99,0.0000\nCC-MAIN-2024-10,x-windows-874,302032,298336,0.0097\nCC-MAIN-2024-10,x-windows-949,3248,3248,0.0001\nCC-MAIN-2024-18,<other>,1977,1972,0.0001\nCC-MAIN-2024-18,<unknown>,47829408,47829408,1.7163\nCC-MAIN-2024-18,Big5,1013867,1012270,0.0364\nCC-MAIN-2024-18,Big5-HKSCS,336,330,0.0000\nCC-MAIN-2024-18,EUC-JP,3041374,3027518,0.1091\nCC-MAIN-2024-18,EUC-KR,2311955,2306712,0.0830\nCC-MAIN-2024-18,GB18030,464198,463159,0.0167\nCC-MAIN-2024-18,GB2312,7558004,7549228,0.2712\nCC-MAIN-2024-18,GBK,3017324,3006532,0.1083\nCC-MAIN-2024-18,IBM420,153722,153312,0.0055\nCC-MAIN-2024-18,IBM424,64375,64141,0.0023\nCC-MAIN-2024-18,IBM500,20314,20258,0.0007\nCC-MAIN-2024-18,IBM855,74,74,0.0000\nCC-MAIN-2024-18,IBM866,3789,3781,0.0001\nCC-MAIN-2024-18,ISO-2022-JP,38128,38105,0.0014\nCC-MAIN-2024-18,ISO-8859-1,63383714,63116762,2.2744\nCC-MAIN-2024-18,ISO-8859-13,1029,1029,0.0000\nCC-MAIN-2024-18,ISO-8859-15,1348064,1338622,0.0484\nCC-MAIN-2024-18,ISO-8859-16,2775,2771,0.0001\nCC-MAIN-2024-18,ISO-8859-2,3177508,3165093,0.1140\nCC-MAIN-2024-18,ISO-
8859-3,12816,12788,0.0005\nCC-MAIN-2024-18,ISO-8859-4,19217,19132,0.0007\nCC-MAIN-2024-18,ISO-8859-5,77348,77228,0.0028\nCC-MAIN-2024-18,ISO-8859-6,872,870,0.0000\nCC-MAIN-2024-18,ISO-8859-7,192635,191616,0.0069\nCC-MAIN-2024-18,ISO-8859-8,20632,20583,0.0007\nCC-MAIN-2024-18,ISO-8859-9,718711,715844,0.0258\nCC-MAIN-2024-18,KOI8-R,201004,200343,0.0072\nCC-MAIN-2024-18,KOI8-U,1932,1908,0.0001\nCC-MAIN-2024-18,Shift_JIS,5308720,5283622,0.1905\nCC-MAIN-2024-18,TIS-620,146415,146054,0.0053\nCC-MAIN-2024-18,US-ASCII,979685,978637,0.0352\nCC-MAIN-2024-18,UTF-16,102796,102360,0.0037\nCC-MAIN-2024-18,UTF-16BE,7087,7084,0.0003\nCC-MAIN-2024-18,UTF-16LE,43924,43719,0.0016\nCC-MAIN-2024-18,UTF-32,1045,1043,0.0000\nCC-MAIN-2024-18,UTF-32LE,9074,9041,0.0003\nCC-MAIN-2024-18,UTF-8,2622020716,2604378021,94.0871\nCC-MAIN-2024-18,windows-1250,2030728,2017148,0.0729\nCC-MAIN-2024-18,windows-1251,14188544,14139245,0.5091\nCC-MAIN-2024-18,windows-1252,5028420,5004230,0.1804\nCC-MAIN-2024-18,windows-1253,74539,74363,0.0027\nCC-MAIN-2024-18,windows-1254,318890,317465,0.0114\nCC-MAIN-2024-18,windows-1255,197246,196493,0.0071\nCC-MAIN-2024-18,windows-1256,1148870,1146118,0.0412\nCC-MAIN-2024-18,windows-1257,220736,220302,0.0079\nCC-MAIN-2024-18,windows-31j,13686,13646,0.0005\nCC-MAIN-2024-18,x-iso-8859-11,181,181,0.0000\nCC-MAIN-2024-18,x-windows-874,280475,279911,0.0101\nCC-MAIN-2024-18,x-windows-949,1178,1178,0.0000\nCC-MAIN-2024-22,<other>,1404,1398,0.0001\nCC-MAIN-2024-22,<unknown>,43411591,43411591,1.6020\nCC-MAIN-2024-22,Big5,1171026,1169365,0.0432\nCC-MAIN-2024-22,Big5-HKSCS,226,221,0.0000\nCC-MAIN-2024-22,EUC-JP,2744040,2732615,0.1013\nCC-MAIN-2024-22,EUC-KR,2105723,2101325,0.0777\nCC-MAIN-2024-22,GB18030,395136,392990,0.0146\nCC-MAIN-2024-22,GB2312,6953620,6944295,0.2566\nCC-MAIN-2024-22,GBK,2598924,2586090,0.0959\nCC-MAIN-2024-22,IBM420,141275,140831,0.0052\nCC-MAIN-2024-22,IBM424,56473,56054,0.0021\nCC-MAIN-2024-22,IBM500,22874,22772,0.0008\nCC-MAIN-2024-22,IBM855,125,125,0.0000\
nCC-MAIN-2024-22,IBM866,7584,7581,0.0003\nCC-MAIN-2024-22,ISO-2022-JP,30515,30433,0.0011\nCC-MAIN-2024-22,ISO-8859-1,61223679,60966692,2.2593\nCC-MAIN-2024-22,ISO-8859-13,1367,1367,0.0001\nCC-MAIN-2024-22,ISO-8859-15,1311792,1302334,0.0484\nCC-MAIN-2024-22,ISO-8859-16,3821,3820,0.0001\nCC-MAIN-2024-22,ISO-8859-2,3066427,3055840,0.1132\nCC-MAIN-2024-22,ISO-8859-3,13496,13457,0.0005\nCC-MAIN-2024-22,ISO-8859-4,20222,19889,0.0007\nCC-MAIN-2024-22,ISO-8859-5,78337,78233,0.0029\nCC-MAIN-2024-22,ISO-8859-6,843,841,0.0000\nCC-MAIN-2024-22,ISO-8859-7,174024,173207,0.0064\nCC-MAIN-2024-22,ISO-8859-8,21912,21828,0.0008\nCC-MAIN-2024-22,ISO-8859-9,647082,644602,0.0239\nCC-MAIN-2024-22,KOI8-R,204198,203799,0.0075\nCC-MAIN-2024-22,KOI8-U,1910,1905,0.0001\nCC-MAIN-2024-22,Shift_JIS,4804651,4781236,0.1773\nCC-MAIN-2024-22,TIS-620,142571,142118,0.0053\nCC-MAIN-2024-22,US-ASCII,916151,915327,0.0338\nCC-MAIN-2024-22,UTF-16,112990,112525,0.0042\nCC-MAIN-2024-22,UTF-16BE,6301,6282,0.0002\nCC-MAIN-2024-22,UTF-16LE,38257,37981,0.0014\nCC-MAIN-2024-22,UTF-32,780,776,0.0000\nCC-MAIN-2024-22,UTF-32LE,6651,6646,0.0002\nCC-MAIN-2024-22,UTF-8,2555015059,2538661023,94.2852\nCC-MAIN-2024-22,windows-1250,2072892,2060577,0.0765\nCC-MAIN-2024-22,windows-1251,13581833,13522159,0.5012\nCC-MAIN-2024-22,windows-1252,4589483,4564922,0.1694\nCC-MAIN-2024-22,windows-1253,69755,69440,0.0026\nCC-MAIN-2024-22,windows-1254,288709,287525,0.0107\nCC-MAIN-2024-22,windows-1255,178911,178268,0.0066\nCC-MAIN-2024-22,windows-1256,1168831,1165469,0.0431\nCC-MAIN-2024-22,windows-1257,229334,228674,0.0085\nCC-MAIN-2024-22,windows-31j,13866,13837,0.0005\nCC-MAIN-2024-22,x-iso-8859-11,162,162,0.0000\nCC-MAIN-2024-22,x-windows-874,230630,230127,0.0085\nCC-MAIN-2024-22,x-windows-949,512,512,0.0000\nCC-MAIN-2024-26,<other>,1224,1222,0.0000\nCC-MAIN-2024-26,<unknown>,45669572,45669572,1.6322\nCC-MAIN-2024-26,Big5,2070303,2068739,0.0740\nCC-MAIN-2024-26,Big5-HKSCS,195,191,0.0000\nCC-MAIN-2024-26,EUC-JP,3009909,2996499,0.1076\
nCC-MAIN-2024-26,EUC-KR,2894265,2888299,0.1034\nCC-MAIN-2024-26,GB18030,497841,496779,0.0178\nCC-MAIN-2024-26,GB2312,13205028,13194697,0.4719\nCC-MAIN-2024-26,GBK,3753402,3740946,0.1341\nCC-MAIN-2024-26,IBM420,144802,144507,0.0052\nCC-MAIN-2024-26,IBM424,54945,54668,0.0020\nCC-MAIN-2024-26,IBM500,20338,20230,0.0007\nCC-MAIN-2024-26,IBM855,101,101,0.0000\nCC-MAIN-2024-26,IBM866,6808,6802,0.0002\nCC-MAIN-2024-26,ISO-2022-JP,31692,31665,0.0011\nCC-MAIN-2024-26,ISO-8859-1,65073220,64823485,2.3257\nCC-MAIN-2024-26,ISO-8859-13,2365,2365,0.0001\nCC-MAIN-2024-26,ISO-8859-15,1363702,1351379,0.0487\nCC-MAIN-2024-26,ISO-8859-16,3951,3949,0.0001\nCC-MAIN-2024-26,ISO-8859-2,3256427,3246283,0.1164\nCC-MAIN-2024-26,ISO-8859-3,12579,12516,0.0004\nCC-MAIN-2024-26,ISO-8859-4,20744,20601,0.0007\nCC-MAIN-2024-26,ISO-8859-5,85523,85435,0.0031\nCC-MAIN-2024-26,ISO-8859-6,1239,1235,0.0000\nCC-MAIN-2024-26,ISO-8859-7,199401,198552,0.0071\nCC-MAIN-2024-26,ISO-8859-8,17022,16973,0.0006\nCC-MAIN-2024-26,ISO-8859-9,690987,688933,0.0247\nCC-MAIN-2024-26,KOI8-R,200409,199968,0.0072\nCC-MAIN-2024-26,KOI8-U,1604,1599,0.0001\nCC-MAIN-2024-26,Shift_JIS,4980877,4961431,0.1780\nCC-MAIN-2024-26,TIS-620,168974,168236,0.0060\nCC-MAIN-2024-26,US-ASCII,915318,914665,0.0327\nCC-MAIN-2024-26,UTF-16,136799,136280,0.0049\nCC-MAIN-2024-26,UTF-16BE,12031,12025,0.0004\nCC-MAIN-2024-26,UTF-16LE,41367,41171,0.0015\nCC-MAIN-2024-26,UTF-32,1170,1170,0.0000\nCC-MAIN-2024-26,UTF-32LE,4528,4522,0.0002\nCC-MAIN-2024-26,UTF-8,2625577704,2608644334,93.8361\nCC-MAIN-2024-26,windows-1250,2186998,2175826,0.0782\nCC-MAIN-2024-26,windows-1251,14460243,14411845,0.5168\nCC-MAIN-2024-26,windows-1252,4814212,4790777,0.1721\nCC-MAIN-2024-26,windows-1253,73051,72707,0.0026\nCC-MAIN-2024-26,windows-1254,318057,317036,0.0114\nCC-MAIN-2024-26,windows-1255,174759,173691,0.0062\nCC-MAIN-2024-26,windows-1256,1362844,1357494,0.0487\nCC-MAIN-2024-26,windows-1257,269857,269252,0.0096\nCC-MAIN-2024-26,windows-31j,14142,14059,0.0005\nCC-MAIN-20
24-26,x-iso-8859-11,988,988,0.0000\nCC-MAIN-2024-26,x-windows-874,243248,242683,0.0087\nCC-MAIN-2024-26,x-windows-949,261,260,0.0000\nCC-MAIN-2024-30,<other>,1462,1455,0.0001\nCC-MAIN-2024-30,<unknown>,50126888,50126888,1.9684\nCC-MAIN-2024-30,Big5,1983809,1981792,0.0779\nCC-MAIN-2024-30,Big5-HKSCS,231,226,0.0000\nCC-MAIN-2024-30,EUC-JP,2706192,2697078,0.1063\nCC-MAIN-2024-30,EUC-KR,2574833,2570811,0.1011\nCC-MAIN-2024-30,GB18030,436148,435449,0.0171\nCC-MAIN-2024-30,GB2312,7335104,7325195,0.2880\nCC-MAIN-2024-30,GBK,3521610,3514329,0.1383\nCC-MAIN-2024-30,IBM420,132789,132013,0.0052\nCC-MAIN-2024-30,IBM424,52232,51932,0.0021\nCC-MAIN-2024-30,IBM500,16727,16655,0.0007\nCC-MAIN-2024-30,IBM855,106,106,0.0000\nCC-MAIN-2024-30,IBM866,4112,4109,0.0002\nCC-MAIN-2024-30,ISO-2022-JP,24855,24827,0.0010\nCC-MAIN-2024-30,ISO-8859-1,57830372,57587150,2.2709\nCC-MAIN-2024-30,ISO-8859-13,2688,2687,0.0001\nCC-MAIN-2024-30,ISO-8859-15,1289068,1278851,0.0506\nCC-MAIN-2024-30,ISO-8859-16,4163,4162,0.0002\nCC-MAIN-2024-30,ISO-8859-2,2998441,2987812,0.1177\nCC-MAIN-2024-30,ISO-8859-3,13502,13443,0.0005\nCC-MAIN-2024-30,ISO-8859-4,16309,16202,0.0006\nCC-MAIN-2024-30,ISO-8859-5,53388,53178,0.0021\nCC-MAIN-2024-30,ISO-8859-6,1052,1048,0.0000\nCC-MAIN-2024-30,ISO-8859-7,158814,157328,0.0062\nCC-MAIN-2024-30,ISO-8859-8,22046,21982,0.0009\nCC-MAIN-2024-30,ISO-8859-9,646590,645128,0.0254\nCC-MAIN-2024-30,KOI8-R,179104,178263,0.0070\nCC-MAIN-2024-30,KOI8-U,1558,1553,0.0001\nCC-MAIN-2024-30,Shift_JIS,4448392,4432725,0.1747\nCC-MAIN-2024-30,TIS-620,150531,150128,0.0059\nCC-MAIN-2024-30,US-ASCII,876495,875511,0.0344\nCC-MAIN-2024-30,UTF-16,138002,137517,0.0054\nCC-MAIN-2024-30,UTF-16BE,7176,7169,0.0003\nCC-MAIN-2024-30,UTF-16LE,40475,40232,0.0016\nCC-MAIN-2024-30,UTF-32,1277,1277,0.0001\nCC-MAIN-2024-30,UTF-32LE,6170,6161,0.0002\nCC-MAIN-2024-30,UTF-8,2386051828,2372309651,93.6945\nCC-MAIN-2024-30,windows-1250,2009646,2001529,0.0789\nCC-MAIN-2024-30,windows-1251,14134764,14089437,0.5550\nCC-MAIN-
2024-30,windows-1252,4500454,4482070,0.1767\nCC-MAIN-2024-30,windows-1253,73363,73011,0.0029\nCC-MAIN-2024-30,windows-1254,297702,296787,0.0117\nCC-MAIN-2024-30,windows-1255,185901,183393,0.0073\nCC-MAIN-2024-30,windows-1256,1141482,1133636,0.0448\nCC-MAIN-2024-30,windows-1257,207680,206480,0.0082\nCC-MAIN-2024-30,windows-31j,17310,17282,0.0007\nCC-MAIN-2024-30,x-iso-8859-11,602,602,0.0000\nCC-MAIN-2024-30,x-windows-874,205196,204392,0.0081\nCC-MAIN-2024-30,x-windows-949,1756,1755,0.0001\nCC-MAIN-2024-33,<other>,1799,1797,0.0001\nCC-MAIN-2024-33,<unknown>,47230244,47230244,2.0394\nCC-MAIN-2024-33,Big5,1981425,1979391,0.0856\nCC-MAIN-2024-33,Big5-HKSCS,685,675,0.0000\nCC-MAIN-2024-33,EUC-JP,2454822,2447140,0.1060\nCC-MAIN-2024-33,EUC-KR,2278454,2274789,0.0984\nCC-MAIN-2024-33,GB18030,394725,393766,0.0170\nCC-MAIN-2024-33,GB2312,6363081,6352087,0.2748\nCC-MAIN-2024-33,GBK,3199389,3193455,0.1381\nCC-MAIN-2024-33,IBM420,129803,129474,0.0056\nCC-MAIN-2024-33,IBM424,50202,49914,0.0022\nCC-MAIN-2024-33,IBM500,15465,15390,0.0007\nCC-MAIN-2024-33,IBM855,121,121,0.0000\nCC-MAIN-2024-33,IBM866,4204,4203,0.0002\nCC-MAIN-2024-33,ISO-2022-JP,28186,28107,0.0012\nCC-MAIN-2024-33,ISO-8859-1,55520249,55303534,2.3973\nCC-MAIN-2024-33,ISO-8859-13,1957,1957,0.0001\nCC-MAIN-2024-33,ISO-8859-15,1223091,1214884,0.0528\nCC-MAIN-2024-33,ISO-8859-16,4248,4242,0.0002\nCC-MAIN-2024-33,ISO-8859-2,2960746,2949818,0.1278\nCC-MAIN-2024-33,ISO-8859-3,12767,12725,0.0006\nCC-MAIN-2024-33,ISO-8859-4,15900,15839,0.0007\nCC-MAIN-2024-33,ISO-8859-5,50598,50472,0.0022\nCC-MAIN-2024-33,ISO-8859-6,904,900,0.0000\nCC-MAIN-2024-33,ISO-8859-7,155270,153670,0.0067\nCC-MAIN-2024-33,ISO-8859-8,22574,22462,0.0010\nCC-MAIN-2024-33,ISO-8859-9,637203,635716,0.0275\nCC-MAIN-2024-33,KOI8-R,163293,162666,0.0071\nCC-MAIN-2024-33,KOI8-U,1927,1925,0.0001\nCC-MAIN-2024-33,Shift_JIS,4321118,4308424,0.1866\nCC-MAIN-2024-33,TIS-620,138754,138437,0.0060\nCC-MAIN-2024-33,US-ASCII,874394,871060,0.0378\nCC-MAIN-2024-33,UTF-16,13351
4,133065,0.0058\nCC-MAIN-2024-33,UTF-16BE,7316,7315,0.0003\nCC-MAIN-2024-33,UTF-16LE,29908,29747,0.0013\nCC-MAIN-2024-33,UTF-32,687,684,0.0000\nCC-MAIN-2024-33,UTF-32LE,8378,8368,0.0004\nCC-MAIN-2024-33,UTF-8,2163972033,2151951380,93.4387\nCC-MAIN-2024-33,windows-1250,1815055,1807303,0.0784\nCC-MAIN-2024-33,windows-1251,13224476,13180855,0.5710\nCC-MAIN-2024-33,windows-1252,4416268,4399407,0.1907\nCC-MAIN-2024-33,windows-1253,63926,63651,0.0028\nCC-MAIN-2024-33,windows-1254,301188,299934,0.0130\nCC-MAIN-2024-33,windows-1255,181403,180574,0.0078\nCC-MAIN-2024-33,windows-1256,1121736,1115630,0.0484\nCC-MAIN-2024-33,windows-1257,182849,181806,0.0079\nCC-MAIN-2024-33,windows-31j,14770,14737,0.0006\nCC-MAIN-2024-33,x-iso-8859-11,688,688,0.0000\nCC-MAIN-2024-33,x-windows-874,211973,211239,0.0092\nCC-MAIN-2024-33,x-windows-949,2650,2649,0.0001\nCC-MAIN-2024-38,<other>,1534,1534,0.0001\nCC-MAIN-2024-38,<unknown>,42174210,42174210,1.5057\nCC-MAIN-2024-38,Big5,2305326,2302485,0.0823\nCC-MAIN-2024-38,Big5-HKSCS,1469,1465,0.0001\nCC-MAIN-2024-38,EUC-JP,2818314,2809972,0.1006\nCC-MAIN-2024-38,EUC-KR,2343421,2340027,0.0837\nCC-MAIN-2024-38,GB18030,421529,420581,0.0150\nCC-MAIN-2024-38,GB2312,6246047,6236387,0.2230\nCC-MAIN-2024-38,GBK,3109518,3102607,0.1110\nCC-MAIN-2024-38,IBM420,111118,110892,0.0040\nCC-MAIN-2024-38,IBM424,39882,39627,0.0014\nCC-MAIN-2024-38,IBM500,18866,18787,0.0007\nCC-MAIN-2024-38,IBM855,138,138,0.0000\nCC-MAIN-2024-38,IBM866,7080,7075,0.0003\nCC-MAIN-2024-38,ISO-2022-JP,25527,25484,0.0009\nCC-MAIN-2024-38,ISO-8859-1,77270242,77025981,2.7588\nCC-MAIN-2024-38,ISO-8859-13,2329,2329,0.0001\nCC-MAIN-2024-38,ISO-8859-15,1305574,1297947,0.0466\nCC-MAIN-2024-38,ISO-8859-16,3544,3541,0.0001\nCC-MAIN-2024-38,ISO-8859-2,3003130,2992305,0.1072\nCC-MAIN-2024-38,ISO-8859-3,15048,15022,0.0005\nCC-MAIN-2024-38,ISO-8859-4,21291,21144,0.0008\nCC-MAIN-2024-38,ISO-8859-5,53106,53030,0.0019\nCC-MAIN-2024-38,ISO-8859-6,1969,1966,0.0001\nCC-MAIN-2024-38,ISO-8859-7,152033,150404,0
.0054\nCC-MAIN-2024-38,ISO-8859-8,22194,22081,0.0008\nCC-MAIN-2024-38,ISO-8859-9,658011,656370,0.0235\nCC-MAIN-2024-38,KOI8-R,182698,182240,0.0065\nCC-MAIN-2024-38,KOI8-U,2929,2856,0.0001\nCC-MAIN-2024-38,Shift_JIS,4488122,4475576,0.1602\nCC-MAIN-2024-38,TIS-620,149980,149660,0.0054\nCC-MAIN-2024-38,US-ASCII,947773,944998,0.0338\nCC-MAIN-2024-38,UTF-16,132622,132044,0.0047\nCC-MAIN-2024-38,UTF-16BE,8416,8413,0.0003\nCC-MAIN-2024-38,UTF-16LE,30065,29861,0.0011\nCC-MAIN-2024-38,UTF-32,701,701,0.0000\nCC-MAIN-2024-38,UTF-32LE,6253,6241,0.0002\nCC-MAIN-2024-38,UTF-8,2630507208,2616852308,93.9167\nCC-MAIN-2024-38,windows-1250,1948323,1939033,0.0696\nCC-MAIN-2024-38,windows-1251,13958747,13905586,0.4984\nCC-MAIN-2024-38,windows-1252,4348066,4329347,0.1552\nCC-MAIN-2024-38,windows-1253,62765,62531,0.0022\nCC-MAIN-2024-38,windows-1254,310754,309924,0.0111\nCC-MAIN-2024-38,windows-1255,188439,187370,0.0067\nCC-MAIN-2024-38,windows-1256,1063331,1055496,0.0380\nCC-MAIN-2024-38,windows-1257,208968,207319,0.0075\nCC-MAIN-2024-38,windows-31j,16172,16151,0.0006\nCC-MAIN-2024-38,x-iso-8859-11,351,351,0.0000\nCC-MAIN-2024-38,x-windows-874,197143,196283,0.0070\nCC-MAIN-2024-38,x-windows-949,1187,1187,0.0000\nCC-MAIN-2024-42,<other>,1278,1273,0.0001\nCC-MAIN-2024-42,<unknown>,50760125,50760125,2.0343\nCC-MAIN-2024-42,Big5,2148950,2147175,0.0861\nCC-MAIN-2024-42,Big5-HKSCS,2958,2956,0.0001\nCC-MAIN-2024-42,EUC-JP,3003270,2993481,0.1204\nCC-MAIN-2024-42,EUC-KR,2260919,2257110,0.0906\nCC-MAIN-2024-42,GB18030,353123,351972,0.0142\nCC-MAIN-2024-42,GB2312,5906657,5897799,0.2367\nCC-MAIN-2024-42,GBK,2729294,2724012,0.1094\nCC-MAIN-2024-42,IBM420,116974,116656,0.0047\nCC-MAIN-2024-42,IBM424,47783,47619,0.0019\nCC-MAIN-2024-42,IBM500,15757,15705,0.0006\nCC-MAIN-2024-42,IBM855,83,83,0.0000\nCC-MAIN-2024-42,IBM866,8646,8644,0.0003\nCC-MAIN-2024-42,ISO-2022-JP,25691,25670,0.0010\nCC-MAIN-2024-42,ISO-8859-1,66389299,66165111,2.6607\nCC-MAIN-2024-42,ISO-8859-13,4098,4098,0.0002\nCC-MAIN-2024-42,ISO
-8859-15,1287423,1277622,0.0516\nCC-MAIN-2024-42,ISO-8859-16,3742,3739,0.0001\nCC-MAIN-2024-42,ISO-8859-2,2863698,2852504,0.1148\nCC-MAIN-2024-42,ISO-8859-3,32267,32147,0.0013\nCC-MAIN-2024-42,ISO-8859-4,18232,18137,0.0007\nCC-MAIN-2024-42,ISO-8859-5,43586,43402,0.0017\nCC-MAIN-2024-42,ISO-8859-6,911,907,0.0000\nCC-MAIN-2024-42,ISO-8859-7,160860,159144,0.0064\nCC-MAIN-2024-42,ISO-8859-8,20493,20454,0.0008\nCC-MAIN-2024-42,ISO-8859-9,607698,606018,0.0244\nCC-MAIN-2024-42,KOI8-R,198139,197653,0.0079\nCC-MAIN-2024-42,KOI8-U,2560,2541,0.0001\nCC-MAIN-2024-42,Shift_JIS,4710780,4696626,0.1888\nCC-MAIN-2024-42,TIS-620,154819,154495,0.0062\nCC-MAIN-2024-42,US-ASCII,884607,883352,0.0355\nCC-MAIN-2024-42,UTF-16,143609,143244,0.0058\nCC-MAIN-2024-42,UTF-16BE,9466,9464,0.0004\nCC-MAIN-2024-42,UTF-16LE,33765,33576,0.0014\nCC-MAIN-2024-42,UTF-32,1365,1364,0.0001\nCC-MAIN-2024-42,UTF-32LE,4962,4957,0.0002\nCC-MAIN-2024-42,UTF-8,2328881681,2316239943,93.3348\nCC-MAIN-2024-42,windows-1250,1957705,1949412,0.0785\nCC-MAIN-2024-42,windows-1251,12955688,12896259,0.5192\nCC-MAIN-2024-42,windows-1252,4485885,4468593,0.1798\nCC-MAIN-2024-42,windows-1253,73342,73121,0.0029\nCC-MAIN-2024-42,windows-1254,302085,300964,0.0121\nCC-MAIN-2024-42,windows-1255,181480,180422,0.0073\nCC-MAIN-2024-42,windows-1256,1004430,997006,0.0403\nCC-MAIN-2024-42,windows-1257,187704,186054,0.0075\nCC-MAIN-2024-42,windows-31j,15661,15628,0.0006\nCC-MAIN-2024-42,x-iso-8859-11,770,736,0.0000\nCC-MAIN-2024-42,x-windows-874,186168,185823,0.0075\nCC-MAIN-2024-42,x-windows-949,268,267,0.0000\nCC-MAIN-2024-46,<other>,1187,1186,0.0000\nCC-MAIN-2024-46,<unknown>,47315879,47315879,1.7604\nCC-MAIN-2024-46,Big5,2302003,2300553,0.0856\nCC-MAIN-2024-46,Big5-HKSCS,4435,4427,0.0002\nCC-MAIN-2024-46,EUC-JP,3224004,3212952,0.1199\nCC-MAIN-2024-46,EUC-KR,2358863,2354719,0.0878\nCC-MAIN-2024-46,GB18030,402188,401457,0.0150\nCC-MAIN-2024-46,GB2312,6348147,6340428,0.2362\nCC-MAIN-2024-46,GBK,2994470,2987455,0.1114\nCC-MAIN-2024-46,IBM4
20,120050,119864,0.0045\nCC-MAIN-2024-46,IBM424,44160,43815,0.0016\nCC-MAIN-2024-46,IBM500,21785,21683,0.0008\nCC-MAIN-2024-46,IBM855,122,122,0.0000\nCC-MAIN-2024-46,IBM866,7766,7761,0.0003\nCC-MAIN-2024-46,ISO-2022-JP,30550,30512,0.0011\nCC-MAIN-2024-46,ISO-8859-1,60469167,60249738,2.2498\nCC-MAIN-2024-46,ISO-8859-13,1875,1875,0.0001\nCC-MAIN-2024-46,ISO-8859-15,1265691,1256256,0.0471\nCC-MAIN-2024-46,ISO-8859-16,4169,4166,0.0002\nCC-MAIN-2024-46,ISO-8859-2,2783810,2773513,0.1036\nCC-MAIN-2024-46,ISO-8859-3,24928,24709,0.0009\nCC-MAIN-2024-46,ISO-8859-4,19516,19423,0.0007\nCC-MAIN-2024-46,ISO-8859-5,27581,27484,0.0010\nCC-MAIN-2024-46,ISO-8859-6,933,932,0.0000\nCC-MAIN-2024-46,ISO-8859-7,155153,153858,0.0058\nCC-MAIN-2024-46,ISO-8859-8,20925,20884,0.0008\nCC-MAIN-2024-46,ISO-8859-9,609322,607664,0.0227\nCC-MAIN-2024-46,KOI8-R,201563,201122,0.0075\nCC-MAIN-2024-46,KOI8-U,2132,2131,0.0001\nCC-MAIN-2024-46,Shift_JIS,4801682,4790675,0.1786\nCC-MAIN-2024-46,TIS-620,170665,170391,0.0063\nCC-MAIN-2024-46,US-ASCII,950829,949547,0.0354\nCC-MAIN-2024-46,UTF-16,144774,144375,0.0054\nCC-MAIN-2024-46,UTF-16BE,5091,5091,0.0002\nCC-MAIN-2024-46,UTF-16LE,32535,32364,0.0012\nCC-MAIN-2024-46,UTF-32,957,955,0.0000\nCC-MAIN-2024-46,UTF-32LE,4517,4513,0.0002\nCC-MAIN-2024-46,UTF-8,2529301253,2516709153,94.1026\nCC-MAIN-2024-46,windows-1250,1967219,1959508,0.0732\nCC-MAIN-2024-46,windows-1251,13468081,13413916,0.5011\nCC-MAIN-2024-46,windows-1252,4273838,4255362,0.1590\nCC-MAIN-2024-46,windows-1253,69137,68952,0.0026\nCC-MAIN-2024-46,windows-1254,306779,305695,0.0114\nCC-MAIN-2024-46,windows-1255,193848,193256,0.0072\nCC-MAIN-2024-46,windows-1256,994337,987884,0.0370\nCC-MAIN-2024-46,windows-1257,158826,158492,0.0059\nCC-MAIN-2024-46,windows-31j,13706,13683,0.0005\nCC-MAIN-2024-46,x-iso-8859-11,981,978,0.0000\nCC-MAIN-2024-46,x-windows-874,190124,189806,0.0071\nCC-MAIN-2024-46,x-windows-949,194,194,0.0000\nCC-MAIN-2024-51,<other>,1274,1272,0.0000\nCC-MAIN-2024-51,<unknown>,47187575,4718
7575,1.7906\nCC-MAIN-2024-51,Big5,1206353,1204605,0.0458\nCC-MAIN-2024-51,Big5-HKSCS,400,394,0.0000\nCC-MAIN-2024-51,EUC-JP,3371585,3362924,0.1279\nCC-MAIN-2024-51,EUC-KR,2416116,2411786,0.0917\nCC-MAIN-2024-51,GB18030,401866,401082,0.0152\nCC-MAIN-2024-51,GB2312,6526881,6517321,0.2477\nCC-MAIN-2024-51,GBK,3146965,3141884,0.1194\nCC-MAIN-2024-51,IBM420,166002,165760,0.0063\nCC-MAIN-2024-51,IBM424,45711,45603,0.0017\nCC-MAIN-2024-51,IBM500,31025,30886,0.0012\nCC-MAIN-2024-51,IBM855,151,151,0.0000\nCC-MAIN-2024-51,IBM866,8448,8445,0.0003\nCC-MAIN-2024-51,ISO-2022-JP,30505,30476,0.0012\nCC-MAIN-2024-51,ISO-8859-1,63504298,63258927,2.4097\nCC-MAIN-2024-51,ISO-8859-13,2479,2479,0.0001\nCC-MAIN-2024-51,ISO-8859-15,1306796,1296807,0.0496\nCC-MAIN-2024-51,ISO-8859-16,4234,4227,0.0002\nCC-MAIN-2024-51,ISO-8859-2,3070449,3060006,0.1165\nCC-MAIN-2024-51,ISO-8859-3,14388,14245,0.0005\nCC-MAIN-2024-51,ISO-8859-4,20839,20761,0.0008\nCC-MAIN-2024-51,ISO-8859-5,30483,30362,0.0012\nCC-MAIN-2024-51,ISO-8859-6,1000,998,0.0000\nCC-MAIN-2024-51,ISO-8859-7,171196,170071,0.0065\nCC-MAIN-2024-51,ISO-8859-8,21399,21371,0.0008\nCC-MAIN-2024-51,ISO-8859-9,582115,580544,0.0221\nCC-MAIN-2024-51,KOI8-R,160430,160144,0.0061\nCC-MAIN-2024-51,KOI8-U,2598,2588,0.0001\nCC-MAIN-2024-51,Shift_JIS,4799756,4785359,0.1821\nCC-MAIN-2024-51,TIS-620,148139,147731,0.0056\nCC-MAIN-2024-51,US-ASCII,1072204,1070607,0.0407\nCC-MAIN-2024-51,UTF-16,144490,144157,0.0055\nCC-MAIN-2024-51,UTF-16BE,5194,5189,0.0002\nCC-MAIN-2024-51,UTF-16LE,28887,28633,0.0011\nCC-MAIN-2024-51,UTF-32,668,666,0.0000\nCC-MAIN-2024-51,UTF-32LE,3667,3661,0.0001\nCC-MAIN-2024-51,UTF-8,2473135386,2460159208,93.8442\nCC-MAIN-2024-51,windows-1250,1933166,1925202,0.0734\nCC-MAIN-2024-51,windows-1251,14328868,14240942,0.5437\nCC-MAIN-2024-51,windows-1252,4291453,4271564,0.1628\nCC-MAIN-2024-51,windows-1253,71306,71147,0.0027\nCC-MAIN-2024-51,windows-1254,335539,334409,0.0127\nCC-MAIN-2024-51,windows-1255,199088,198244,0.0076\nCC-MAIN-2024-51,wind
ows-1256,1032673,1029340,0.0392\nCC-MAIN-2024-51,windows-1257,167720,167297,0.0064\nCC-MAIN-2024-51,windows-31j,13824,13796,0.0005\nCC-MAIN-2024-51,x-iso-8859-11,1277,1233,0.0000\nCC-MAIN-2024-51,x-windows-874,215305,214845,0.0082\nCC-MAIN-2024-51,x-windows-949,185,184,0.0000\nCC-MAIN-2025-05,<other>,1080,1077,0.0000\nCC-MAIN-2025-05,<unknown>,44450246,44450246,1.4664\nCC-MAIN-2025-05,Big5,1402185,1400787,0.0463\nCC-MAIN-2025-05,Big5-HKSCS,691,691,0.0000\nCC-MAIN-2025-05,EUC-JP,3578703,3568794,0.1181\nCC-MAIN-2025-05,EUC-KR,2542723,2538696,0.0839\nCC-MAIN-2025-05,GB18030,390125,389065,0.0129\nCC-MAIN-2025-05,GB2312,6558289,6546033,0.2164\nCC-MAIN-2025-05,GBK,3075795,3067449,0.1015\nCC-MAIN-2025-05,IBM420,123308,123070,0.0041\nCC-MAIN-2025-05,IBM424,43160,43057,0.0014\nCC-MAIN-2025-05,IBM500,38549,38434,0.0013\nCC-MAIN-2025-05,IBM855,141,141,0.0000\nCC-MAIN-2025-05,IBM866,7660,7656,0.0003\nCC-MAIN-2025-05,ISO-2022-JP,26906,26865,0.0009\nCC-MAIN-2025-05,ISO-8859-1,69572300,69321393,2.2951\nCC-MAIN-2025-05,ISO-8859-13,2384,2384,0.0001\nCC-MAIN-2025-05,ISO-8859-15,1311374,1303348,0.0433\nCC-MAIN-2025-05,ISO-8859-16,4681,4675,0.0002\nCC-MAIN-2025-05,ISO-8859-2,3211126,3199696,0.1059\nCC-MAIN-2025-05,ISO-8859-3,1627,1611,0.0001\nCC-MAIN-2025-05,ISO-8859-4,24112,23998,0.0008\nCC-MAIN-2025-05,ISO-8859-5,37712,37599,0.0012\nCC-MAIN-2025-05,ISO-8859-6,1142,1140,0.0000\nCC-MAIN-2025-05,ISO-8859-7,181891,180956,0.0060\nCC-MAIN-2025-05,ISO-8859-8,24536,24487,0.0008\nCC-MAIN-2025-05,ISO-8859-9,692056,689926,0.0228\nCC-MAIN-2025-05,KOI8-R,173002,172508,0.0057\nCC-MAIN-2025-05,KOI8-U,1480,1480,0.0000\nCC-MAIN-2025-05,Shift_JIS,4816608,4802127,0.1589\nCC-MAIN-2025-05,TIS-620,141902,141516,0.0047\nCC-MAIN-2025-05,US-ASCII,950801,949750,0.0314\nCC-MAIN-2025-05,UTF-16,153763,153388,0.0051\nCC-MAIN-2025-05,UTF-16BE,6889,6885,0.0002\nCC-MAIN-2025-05,UTF-16LE,29619,29418,0.0010\nCC-MAIN-2025-05,UTF-32,1393,1391,0.0000\nCC-MAIN-2025-05,UTF-32LE,9939,9936,0.0003\nCC-MAIN-2025-05,UTF-8,28640
99311,2848376924,94.4849\nCC-MAIN-2025-05,windows-1250,2053330,2044147,0.0677\nCC-MAIN-2025-05,windows-1251,14932215,14846516,0.4926\nCC-MAIN-2025-05,windows-1252,4227941,4209471,0.1395\nCC-MAIN-2025-05,windows-1253,76474,76254,0.0025\nCC-MAIN-2025-05,windows-1254,371714,369625,0.0123\nCC-MAIN-2025-05,windows-1255,225199,224486,0.0074\nCC-MAIN-2025-05,windows-1256,1223891,1218817,0.0404\nCC-MAIN-2025-05,windows-1257,214733,214160,0.0071\nCC-MAIN-2025-05,windows-31j,14743,14708,0.0005\nCC-MAIN-2025-05,x-iso-8859-11,1490,1444,0.0000\nCC-MAIN-2025-05,x-windows-874,247285,246880,0.0082\nCC-MAIN-2025-05,x-windows-949,113,112,0.0000\nCC-MAIN-2025-08,<other>,1174,1172,0.0000\nCC-MAIN-2025-08,<unknown>,45158818,45158818,1.6852\nCC-MAIN-2025-08,Big5,1334506,1333488,0.0498\nCC-MAIN-2025-08,Big5-HKSCS,780,780,0.0000\nCC-MAIN-2025-08,EUC-JP,3391910,3381727,0.1266\nCC-MAIN-2025-08,EUC-KR,2579057,2575750,0.0962\nCC-MAIN-2025-08,GB18030,404996,404419,0.0151\nCC-MAIN-2025-08,GB2312,6302774,6294060,0.2352\nCC-MAIN-2025-08,GBK,3122826,3117988,0.1165\nCC-MAIN-2025-08,IBM420,126916,126706,0.0047\nCC-MAIN-2025-08,IBM424,43153,43060,0.0016\nCC-MAIN-2025-08,IBM500,40340,40216,0.0015\nCC-MAIN-2025-08,IBM855,140,140,0.0000\nCC-MAIN-2025-08,IBM866,7820,7817,0.0003\nCC-MAIN-2025-08,ISO-2022-JP,29183,29161,0.0011\nCC-MAIN-2025-08,ISO-8859-1,68874319,68633172,2.5702\nCC-MAIN-2025-08,ISO-8859-13,2565,2565,0.0001\nCC-MAIN-2025-08,ISO-8859-15,1253979,1246484,0.0468\nCC-MAIN-2025-08,ISO-8859-16,7401,7395,0.0003\nCC-MAIN-2025-08,ISO-8859-2,3362145,3348430,0.1255\nCC-MAIN-2025-08,ISO-8859-3,1221,1213,0.0000\nCC-MAIN-2025-08,ISO-8859-4,20068,19984,0.0007\nCC-MAIN-2025-08,ISO-8859-5,28924,28804,0.0011\nCC-MAIN-2025-08,ISO-8859-6,935,933,0.0000\nCC-MAIN-2025-08,ISO-8859-7,231284,230500,0.0086\nCC-MAIN-2025-08,ISO-8859-8,19743,19690,0.0007\nCC-MAIN-2025-08,ISO-8859-9,708719,707080,0.0264\nCC-MAIN-2025-08,KOI8-R,211061,209994,0.0079\nCC-MAIN-2025-08,KOI8-U,875,875,0.0000\nCC-MAIN-2025-08,Shift_JIS,4689378
,4677080,0.1750\nCC-MAIN-2025-08,TIS-620,133625,133157,0.0050\nCC-MAIN-2025-08,US-ASCII,754956,754301,0.0282\nCC-MAIN-2025-08,UTF-16,158668,158362,0.0059\nCC-MAIN-2025-08,UTF-16BE,8422,8417,0.0003\nCC-MAIN-2025-08,UTF-16LE,30106,29985,0.0011\nCC-MAIN-2025-08,UTF-32,1438,1435,0.0001\nCC-MAIN-2025-08,UTF-32LE,7131,7129,0.0003\nCC-MAIN-2025-08,UTF-8,2513990443,2500127577,93.8159\nCC-MAIN-2025-08,windows-1250,1952802,1944380,0.0729\nCC-MAIN-2025-08,windows-1251,13992815,13920117,0.5222\nCC-MAIN-2025-08,windows-1252,4000199,3982937,0.1493\nCC-MAIN-2025-08,windows-1253,82159,81907,0.0031\nCC-MAIN-2025-08,windows-1254,379348,377724,0.0142\nCC-MAIN-2025-08,windows-1255,246396,245635,0.0092\nCC-MAIN-2025-08,windows-1256,1395826,1390331,0.0521\nCC-MAIN-2025-08,windows-1257,314968,314720,0.0118\nCC-MAIN-2025-08,windows-31j,14755,14691,0.0006\nCC-MAIN-2025-08,x-iso-8859-11,1869,1852,0.0001\nCC-MAIN-2025-08,x-windows-874,283027,282710,0.0106\nCC-MAIN-2025-08,x-windows-949,93,92,0.0000\nCC-MAIN-2025-13,<other>,992,988,0.0000\nCC-MAIN-2025-13,<unknown>,44296617,44296617,1.6162\nCC-MAIN-2025-13,Big5,1262970,1261385,0.0461\nCC-MAIN-2025-13,Big5-HKSCS,688,683,0.0000\nCC-MAIN-2025-13,EUC-JP,3305316,3290963,0.1206\nCC-MAIN-2025-13,EUC-KR,2505472,2502019,0.0914\nCC-MAIN-2025-13,GB18030,406263,405642,0.0148\nCC-MAIN-2025-13,GB2312,5873359,5865192,0.2143\nCC-MAIN-2025-13,GBK,2980349,2976282,0.1087\nCC-MAIN-2025-13,IBM420,114378,114187,0.0042\nCC-MAIN-2025-13,IBM424,38536,38461,0.0014\nCC-MAIN-2025-13,IBM500,24315,24256,0.0009\nCC-MAIN-2025-13,IBM855,409,409,0.0000\nCC-MAIN-2025-13,IBM866,6271,6266,0.0002\nCC-MAIN-2025-13,ISO-2022-JP,28946,28933,0.0011\nCC-MAIN-2025-13,ISO-8859-1,77356120,77072471,2.8223\nCC-MAIN-2025-13,ISO-8859-13,3611,3611,0.0001\nCC-MAIN-2025-13,ISO-8859-15,1243277,1235240,0.0454\nCC-MAIN-2025-13,ISO-8859-16,10604,10566,0.0004\nCC-MAIN-2025-13,ISO-8859-2,2807747,2795379,0.1024\nCC-MAIN-2025-13,ISO-8859-3,539,517,0.0000\nCC-MAIN-2025-13,ISO-8859-4,16622,16575,0.0006\nCC
-MAIN-2025-13,ISO-8859-5,56649,56492,0.0021\nCC-MAIN-2025-13,ISO-8859-6,808,807,0.0000\nCC-MAIN-2025-13,ISO-8859-7,192354,190924,0.0070\nCC-MAIN-2025-13,ISO-8859-8,19994,19953,0.0007\nCC-MAIN-2025-13,ISO-8859-9,629898,627978,0.0230\nCC-MAIN-2025-13,KOI8-R,168651,168427,0.0062\nCC-MAIN-2025-13,KOI8-U,835,832,0.0000\nCC-MAIN-2025-13,Shift_JIS,4796194,4785050,0.1750\nCC-MAIN-2025-13,TIS-620,134764,134211,0.0049\nCC-MAIN-2025-13,US-ASCII,635472,634859,0.0232\nCC-MAIN-2025-13,UTF-16,153804,153365,0.0056\nCC-MAIN-2025-13,UTF-16BE,7164,7162,0.0003\nCC-MAIN-2025-13,UTF-16LE,29764,29704,0.0011\nCC-MAIN-2025-13,UTF-32,1303,1301,0.0000\nCC-MAIN-2025-13,UTF-32LE,3493,3491,0.0001\nCC-MAIN-2025-13,UTF-8,2569938370,2555558838,93.7645\nCC-MAIN-2025-13,windows-1250,1993370,1979952,0.0727\nCC-MAIN-2025-13,windows-1251,13827787,13770937,0.5045\nCC-MAIN-2025-13,windows-1252,3831129,3815546,0.1398\nCC-MAIN-2025-13,windows-1253,68529,68293,0.0025\nCC-MAIN-2025-13,windows-1254,347411,345541,0.0127\nCC-MAIN-2025-13,windows-1255,190707,190160,0.0070\nCC-MAIN-2025-13,windows-1256,1083883,1077212,0.0395\nCC-MAIN-2025-13,windows-1257,210284,209888,0.0077\nCC-MAIN-2025-13,windows-31j,14154,14123,0.0005\nCC-MAIN-2025-13,x-iso-8859-11,2442,2442,0.0001\nCC-MAIN-2025-13,x-windows-874,221338,220938,0.0081\nCC-MAIN-2025-13,x-windows-949,235,234,0.0000\nCC-MAIN-2025-18,<other>,1071,1066,0.0000\nCC-MAIN-2025-18,<unknown>,43903696,43903696,1.5980\nCC-MAIN-2025-18,Big5,1232310,1231135,0.0449\nCC-MAIN-2025-18,Big5-HKSCS,809,802,0.0000\nCC-MAIN-2025-18,EUC-JP,3403002,3393427,0.1239\nCC-MAIN-2025-18,EUC-KR,2498785,2495457,0.0910\nCC-MAIN-2025-18,GB18030,363490,362814,0.0132\nCC-MAIN-2025-18,GB2312,5593701,5585528,0.2036\nCC-MAIN-2025-18,GBK,2695316,2691078,0.0981\nCC-MAIN-2025-18,IBM420,119566,119384,0.0044\nCC-MAIN-2025-18,IBM424,39826,39745,0.0014\nCC-MAIN-2025-18,IBM500,23469,23414,0.0009\nCC-MAIN-2025-18,IBM855,113,113,0.0000\nCC-MAIN-2025-18,IBM866,6172,6168,0.0002\nCC-MAIN-2025-18,ISO-2022-JP,29336,29
224,0.0011\nCC-MAIN-2025-18,ISO-8859-1,72698018,72400765,2.6461\nCC-MAIN-2025-18,ISO-8859-13,2401,2401,0.0001\nCC-MAIN-2025-18,ISO-8859-15,1291687,1283631,0.0470\nCC-MAIN-2025-18,ISO-8859-16,10412,10380,0.0004\nCC-MAIN-2025-18,ISO-8859-2,2921597,2907679,0.1063\nCC-MAIN-2025-18,ISO-8859-3,531,515,0.0000\nCC-MAIN-2025-18,ISO-8859-4,20662,20578,0.0008\nCC-MAIN-2025-18,ISO-8859-5,61894,61722,0.0023\nCC-MAIN-2025-18,ISO-8859-6,780,776,0.0000\nCC-MAIN-2025-18,ISO-8859-7,180387,179162,0.0066\nCC-MAIN-2025-18,ISO-8859-8,22485,22455,0.0008\nCC-MAIN-2025-18,ISO-8859-9,709847,707290,0.0258\nCC-MAIN-2025-18,KOI8-R,175901,174672,0.0064\nCC-MAIN-2025-18,KOI8-U,1449,1446,0.0001\nCC-MAIN-2025-18,Shift_JIS,5039728,5028599,0.1834\nCC-MAIN-2025-18,TIS-620,130116,129749,0.0047\nCC-MAIN-2025-18,US-ASCII,649677,648684,0.0236\nCC-MAIN-2025-18,UTF-16,160808,160396,0.0059\nCC-MAIN-2025-18,UTF-16BE,3765,3763,0.0001\nCC-MAIN-2025-18,UTF-16LE,26057,25964,0.0009\nCC-MAIN-2025-18,UTF-32,1005,1005,0.0000\nCC-MAIN-2025-18,UTF-32LE,7380,7373,0.0003\nCC-MAIN-2025-18,UTF-8,2581926189,2566911455,93.9793\nCC-MAIN-2025-18,windows-1250,2047571,2030509,0.0745\nCC-MAIN-2025-18,windows-1251,13283557,13237287,0.4835\nCC-MAIN-2025-18,windows-1252,3899964,3882498,0.1420\nCC-MAIN-2025-18,windows-1253,65864,65678,0.0024\nCC-MAIN-2025-18,windows-1254,332145,330604,0.0121\nCC-MAIN-2025-18,windows-1255,212419,207822,0.0077\nCC-MAIN-2025-18,windows-1256,1071482,1065812,0.0390\nCC-MAIN-2025-18,windows-1257,212042,211580,0.0077\nCC-MAIN-2025-18,windows-31j,13553,13514,0.0005\nCC-MAIN-2025-18,x-iso-8859-11,2076,2061,0.0001\nCC-MAIN-2025-18,x-windows-874,241621,241258,0.0088\nCC-MAIN-2025-18,x-windows-949,378,377,0.0000\nCC-MAIN-2025-21,<other>,1367,1366,0.0001\nCC-MAIN-2025-21,<unknown>,37149924,37149924,1.4997\nCC-MAIN-2025-21,Big5,1074429,1073389,0.0434\nCC-MAIN-2025-21,Big5-HKSCS,1674,1669,0.0001\nCC-MAIN-2025-21,EUC-JP,2774205,2764740,0.1120\nCC-MAIN-2025-21,EUC-KR,1882063,1879486,0.0760\nCC-MAIN-2025-21,GB18030,30
3471,302538,0.0123\nCC-MAIN-2025-21,GB2312,4753996,4747155,0.1919\nCC-MAIN-2025-21,GBK,2453235,2449450,0.0990\nCC-MAIN-2025-21,IBM420,88647,88495,0.0036\nCC-MAIN-2025-21,IBM424,29330,29255,0.0012\nCC-MAIN-2025-21,IBM500,21768,21714,0.0009\nCC-MAIN-2025-21,IBM855,98,98,0.0000\nCC-MAIN-2025-21,IBM866,4081,4078,0.0002\nCC-MAIN-2025-21,ISO-2022-JP,23532,23512,0.0009\nCC-MAIN-2025-21,ISO-8859-1,62642882,62416804,2.5288\nCC-MAIN-2025-21,ISO-8859-13,2174,2173,0.0001\nCC-MAIN-2025-21,ISO-8859-15,1176126,1170344,0.0475\nCC-MAIN-2025-21,ISO-8859-16,4433,4420,0.0002\nCC-MAIN-2025-21,ISO-8859-2,2433369,2423614,0.0982\nCC-MAIN-2025-21,ISO-8859-3,6417,6399,0.0003\nCC-MAIN-2025-21,ISO-8859-4,14018,13970,0.0006\nCC-MAIN-2025-21,ISO-8859-5,54291,54168,0.0022\nCC-MAIN-2025-21,ISO-8859-6,416,414,0.0000\nCC-MAIN-2025-21,ISO-8859-7,126228,125841,0.0051\nCC-MAIN-2025-21,ISO-8859-8,18088,18072,0.0007\nCC-MAIN-2025-21,ISO-8859-9,598713,597204,0.0242\nCC-MAIN-2025-21,KOI8-R,182298,178258,0.0074\nCC-MAIN-2025-21,KOI8-U,1052,1052,0.0000\nCC-MAIN-2025-21,Shift_JIS,3854741,3840138,0.1556\nCC-MAIN-2025-21,TIS-620,114355,114121,0.0046\nCC-MAIN-2025-21,US-ASCII,547751,547292,0.0221\nCC-MAIN-2025-21,UTF-16,123216,122723,0.0050\nCC-MAIN-2025-21,UTF-16BE,5002,5001,0.0002\nCC-MAIN-2025-21,UTF-16LE,25194,25079,0.0010\nCC-MAIN-2025-21,UTF-32,2245,2241,0.0001\nCC-MAIN-2025-21,UTF-32LE,4430,4429,0.0002\nCC-MAIN-2025-21,UTF-8,2336377362,2323905197,94.3166\nCC-MAIN-2025-21,windows-1250,1642324,1634166,0.0663\nCC-MAIN-2025-21,windows-1251,11512357,11473429,0.4647\nCC-MAIN-2025-21,windows-1252,3393991,3380091,0.1370\nCC-MAIN-2025-21,windows-1253,55317,55154,0.0022\nCC-MAIN-2025-21,windows-1254,261876,260615,0.0106\nCC-MAIN-2025-21,windows-1255,178444,177826,0.0072\nCC-MAIN-2025-21,windows-1256,866716,863673,0.0350\nCC-MAIN-2025-21,windows-1257,166216,165891,0.0067\nCC-MAIN-2025-21,windows-31j,13547,13492,0.0005\nCC-MAIN-2025-21,x-iso-8859-11,2224,2213,0.0001\nCC-MAIN-2025-21,x-windows-874,195561,195200,0.0079
\nCC-MAIN-2025-21,x-windows-949,408,407,0.0000\nCC-MAIN-2025-26,<other>,828,827,0.0000\nCC-MAIN-2025-26,<unknown>,37191934,37191934,1.5590\nCC-MAIN-2025-26,Big5,1033295,1032581,0.0433\nCC-MAIN-2025-26,Big5-HKSCS,1619,1617,0.0001\nCC-MAIN-2025-26,EUC-JP,2908511,2897504,0.1219\nCC-MAIN-2025-26,EUC-KR,1947703,1944881,0.0816\nCC-MAIN-2025-26,GB18030,309758,309481,0.0130\nCC-MAIN-2025-26,GB2312,5071945,5064945,0.2126\nCC-MAIN-2025-26,GBK,2596719,2592422,0.1088\nCC-MAIN-2025-26,IBM420,83804,83648,0.0035\nCC-MAIN-2025-26,IBM424,27706,27631,0.0012\nCC-MAIN-2025-26,IBM500,30926,30732,0.0013\nCC-MAIN-2025-26,IBM855,107,107,0.0000\nCC-MAIN-2025-26,IBM866,3997,3994,0.0002\nCC-MAIN-2025-26,ISO-2022-JP,22854,22838,0.0010\nCC-MAIN-2025-26,ISO-8859-1,168284041,167949327,7.0541\nCC-MAIN-2025-26,ISO-8859-13,2822,2822,0.0001\nCC-MAIN-2025-26,ISO-8859-15,1163891,1158196,0.0488\nCC-MAIN-2025-26,ISO-8859-16,4712,4706,0.0002\nCC-MAIN-2025-26,ISO-8859-2,2296796,2286454,0.0963\nCC-MAIN-2025-26,ISO-8859-3,7429,7402,0.0003\nCC-MAIN-2025-26,ISO-8859-4,15373,15316,0.0006\nCC-MAIN-2025-26,ISO-8859-5,40946,40844,0.0017\nCC-MAIN-2025-26,ISO-8859-6,462,460,0.0000\nCC-MAIN-2025-26,ISO-8859-7,117275,117004,0.0049\nCC-MAIN-2025-26,ISO-8859-8,17017,17005,0.0007\nCC-MAIN-2025-26,ISO-8859-9,526916,523646,0.0221\nCC-MAIN-2025-26,KOI8-R,173353,171474,0.0073\nCC-MAIN-2025-26,KOI8-U,1454,1454,0.0001\nCC-MAIN-2025-26,Shift_JIS,3692081,3683643,0.1548\nCC-MAIN-2025-26,TIS-620,85040,84707,0.0036\nCC-MAIN-2025-26,US-ASCII,492939,492450,0.0207\nCC-MAIN-2025-26,UTF-16,110746,110495,0.0046\nCC-MAIN-2025-26,UTF-16BE,3692,3687,0.0002\nCC-MAIN-2025-26,UTF-16LE,24840,24756,0.0010\nCC-MAIN-2025-26,UTF-32,1362,1361,0.0001\nCC-MAIN-2025-26,UTF-32LE,7482,7402,0.0003\nCC-MAIN-2025-26,UTF-8,2139113219,2127172772,89.6676\nCC-MAIN-2025-26,windows-1250,1639878,1632729,0.0687\nCC-MAIN-2025-26,windows-1251,11528263,11484003,0.4832\nCC-MAIN-2025-26,windows-1252,3382750,3368261,0.1418\nCC-MAIN-2025-26,windows-1253,55128,54967,0.0023
\nCC-MAIN-2025-26,windows-1254,228908,228151,0.0096\nCC-MAIN-2025-26,windows-1255,168184,167466,0.0070\nCC-MAIN-2025-26,windows-1256,833176,828918,0.0349\nCC-MAIN-2025-26,windows-1257,156068,155814,0.0065\nCC-MAIN-2025-26,windows-31j,15222,15177,0.0006\nCC-MAIN-2025-26,x-iso-8859-11,1896,1861,0.0001\nCC-MAIN-2025-26,x-windows-874,178787,178407,0.0075\nCC-MAIN-2025-26,x-windows-949,95,94,0.0000\nCC-MAIN-2025-30,<other>,872,868,0.0000\nCC-MAIN-2025-30,<unknown>,38564663,38564663,1.5919\nCC-MAIN-2025-30,Big5,1012969,1012074,0.0418\nCC-MAIN-2025-30,Big5-HKSCS,1940,1935,0.0001\nCC-MAIN-2025-30,EUC-JP,3105789,3095480,0.1282\nCC-MAIN-2025-30,EUC-KR,1969995,1967357,0.0813\nCC-MAIN-2025-30,GB18030,388313,387109,0.0160\nCC-MAIN-2025-30,GB2312,5166377,5159977,0.2133\nCC-MAIN-2025-30,GBK,2642594,2636926,0.1091\nCC-MAIN-2025-30,IBM420,88160,87997,0.0036\nCC-MAIN-2025-30,IBM424,27071,26991,0.0011\nCC-MAIN-2025-30,IBM500,15420,15375,0.0006\nCC-MAIN-2025-30,IBM855,49,49,0.0000\nCC-MAIN-2025-30,IBM866,3439,3437,0.0001\nCC-MAIN-2025-30,ISO-2022-JP,22663,22641,0.0009\nCC-MAIN-2025-30,ISO-8859-1,131474166,131173098,5.4270\nCC-MAIN-2025-30,ISO-8859-13,2599,2599,0.0001\nCC-MAIN-2025-30,ISO-8859-15,1188872,1181513,0.0491\nCC-MAIN-2025-30,ISO-8859-16,3406,3401,0.0001\nCC-MAIN-2025-30,ISO-8859-2,2265941,2257446,0.0935\nCC-MAIN-2025-30,ISO-8859-3,5839,5819,0.0002\nCC-MAIN-2025-30,ISO-8859-4,13232,13178,0.0005\nCC-MAIN-2025-30,ISO-8859-5,34924,34809,0.0014\nCC-MAIN-2025-30,ISO-8859-6,615,613,0.0000\nCC-MAIN-2025-30,ISO-8859-7,121249,120946,0.0050\nCC-MAIN-2025-30,ISO-8859-8,16136,16124,0.0007\nCC-MAIN-2025-30,ISO-8859-9,556602,555055,0.0230\nCC-MAIN-2025-30,KOI8-R,173852,173202,0.0072\nCC-MAIN-2025-30,KOI8-U,915,915,0.0000\nCC-MAIN-2025-30,Shift_JIS,3790761,3781458,0.1565\nCC-MAIN-2025-30,TIS-620,109059,108772,0.0045\nCC-MAIN-2025-30,US-ASCII,492050,491608,0.0203\nCC-MAIN-2025-30,UTF-16,107744,107499,0.0044\nCC-MAIN-2025-30,UTF-16BE,3007,3001,0.0001\nCC-MAIN-2025-30,UTF-16LE,26963,26870,0.001
1\nCC-MAIN-2025-30,UTF-32,1162,1160,0.0000\nCC-MAIN-2025-30,UTF-32LE,6068,6057,0.0003\nCC-MAIN-2025-30,UTF-8,2210783390,2198589842,91.2574\nCC-MAIN-2025-30,windows-1250,1681942,1675224,0.0694\nCC-MAIN-2025-30,windows-1251,11830821,11749310,0.4884\nCC-MAIN-2025-30,windows-1252,3236647,3223751,0.1336\nCC-MAIN-2025-30,windows-1253,60396,60119,0.0025\nCC-MAIN-2025-30,windows-1254,222987,222398,0.0092\nCC-MAIN-2025-30,windows-1255,142031,141616,0.0059\nCC-MAIN-2025-30,windows-1256,864986,861517,0.0357\nCC-MAIN-2025-30,windows-1257,150655,150341,0.0062\nCC-MAIN-2025-30,windows-31j,8890,8868,0.0004\nCC-MAIN-2025-30,x-MacCyrillic,1,1,0.0000\nCC-MAIN-2025-30,x-iso-8859-11,986,975,0.0000\nCC-MAIN-2025-30,x-windows-874,191183,190750,0.0079\nCC-MAIN-2025-30,x-windows-949,116,115,0.0000\nCC-MAIN-2025-33,<other>,848,844,0.0000\nCC-MAIN-2025-33,<unknown>,36807594,36807594,1.5070\nCC-MAIN-2025-33,Big5,1087240,1086215,0.0445\nCC-MAIN-2025-33,Big5-HKSCS,1838,1838,0.0001\nCC-MAIN-2025-33,EUC-JP,2993213,2982017,0.1225\nCC-MAIN-2025-33,EUC-KR,1921943,1919315,0.0787\nCC-MAIN-2025-33,GB18030,330486,329575,0.0135\nCC-MAIN-2025-33,GB2312,4673540,4666581,0.1913\nCC-MAIN-2025-33,GBK,2351339,2346979,0.0963\nCC-MAIN-2025-33,IBM420,87009,86872,0.0036\nCC-MAIN-2025-33,IBM424,25245,25177,0.0010\nCC-MAIN-2025-33,IBM500,18429,18376,0.0008\nCC-MAIN-2025-33,IBM855,88,88,0.0000\nCC-MAIN-2025-33,IBM866,5907,5900,0.0002\nCC-MAIN-2025-33,ISO-2022-JP,23367,23302,0.0010\nCC-MAIN-2025-33,ISO-8859-1,127289796,126995095,5.2115\nCC-MAIN-2025-33,ISO-8859-13,3067,3067,0.0001\nCC-MAIN-2025-33,ISO-8859-15,1154742,1147302,0.0473\nCC-MAIN-2025-33,ISO-8859-16,3489,3482,0.0001\nCC-MAIN-2025-33,ISO-8859-2,2106941,2099184,0.0863\nCC-MAIN-2025-33,ISO-8859-3,5861,5841,0.0002\nCC-MAIN-2025-33,ISO-8859-4,11963,11894,0.0005\nCC-MAIN-2025-33,ISO-8859-5,37781,37693,0.0015\nCC-MAIN-2025-33,ISO-8859-6,578,575,0.0000\nCC-MAIN-2025-33,ISO-8859-7,119068,118803,0.0049\nCC-MAIN-2025-33,ISO-8859-8,16358,16338,0.0007\nCC-MAIN-2025-33,IS
O-8859-9,488383,486758,0.0200\nCC-MAIN-2025-33,KOI8-R,167180,166712,0.0068\nCC-MAIN-2025-33,KOI8-U,1016,1016,0.0000\nCC-MAIN-2025-33,Shift_JIS,3842639,3832127,0.1573\nCC-MAIN-2025-33,TIS-620,116829,115796,0.0048\nCC-MAIN-2025-33,US-ASCII,489906,489481,0.0201\nCC-MAIN-2025-33,UTF-16,115296,115108,0.0047\nCC-MAIN-2025-33,UTF-16BE,4307,4303,0.0002\nCC-MAIN-2025-33,UTF-16LE,23629,23544,0.0010\nCC-MAIN-2025-33,UTF-32,1218,1214,0.0000\nCC-MAIN-2025-33,UTF-32LE,8121,8106,0.0003\nCC-MAIN-2025-33,UTF-8,2238370031,2226276990,91.6428\nCC-MAIN-2025-33,windows-1250,1630940,1624343,0.0668\nCC-MAIN-2025-33,windows-1251,11542574,11486834,0.4726\nCC-MAIN-2025-33,windows-1252,3031887,3019919,0.1241\nCC-MAIN-2025-33,windows-1253,55916,55675,0.0023\nCC-MAIN-2025-33,windows-1254,236877,235763,0.0097\nCC-MAIN-2025-33,windows-1255,151612,151100,0.0062\nCC-MAIN-2025-33,windows-1256,805554,802103,0.0330\nCC-MAIN-2025-33,windows-1257,154964,154708,0.0063\nCC-MAIN-2025-33,windows-31j,9270,9242,0.0004\nCC-MAIN-2025-33,x-iso-8859-11,1202,1187,0.0000\nCC-MAIN-2025-33,x-windows-874,166090,165796,0.0068\nCC-MAIN-2025-33,x-windows-949,307,306,0.0000\nCC-MAIN-2025-38,<other>,951,950,0.0000\nCC-MAIN-2025-38,<unknown>,35532031,35532031,1.4892\nCC-MAIN-2025-38,Big5,1114232,1113528,0.0467\nCC-MAIN-2025-38,Big5-HKSCS,1390,1383,0.0001\nCC-MAIN-2025-38,EUC-JP,2992921,2986314,0.1254\nCC-MAIN-2025-38,EUC-KR,1853771,1851104,0.0777\nCC-MAIN-2025-38,GB18030,348181,346974,0.0146\nCC-MAIN-2025-38,GB2312,4704297,4696996,0.1972\nCC-MAIN-2025-38,GBK,2387939,2383793,0.1001\nCC-MAIN-2025-38,IBM420,82263,82152,0.0034\nCC-MAIN-2025-38,IBM424,24217,24125,0.0010\nCC-MAIN-2025-38,IBM500,18645,18602,0.0008\nCC-MAIN-2025-38,IBM855,3,3,0.0000\nCC-MAIN-2025-38,IBM866,6067,6062,0.0003\nCC-MAIN-2025-38,ISO-2022-JP,19244,19203,0.0008\nCC-MAIN-2025-38,ISO-8859-1,133825145,133526028,5.6088\nCC-MAIN-2025-38,ISO-8859-13,2819,2819,0.0001\nCC-MAIN-2025-38,ISO-8859-15,1058288,1051621,0.0444\nCC-MAIN-2025-38,ISO-8859-16,4330,4317,0.0002\
nCC-MAIN-2025-38,ISO-8859-2,1880185,1871949,0.0788\nCC-MAIN-2025-38,ISO-8859-3,7792,7743,0.0003\nCC-MAIN-2025-38,ISO-8859-4,9594,9531,0.0004\nCC-MAIN-2025-38,ISO-8859-5,36749,36653,0.0015\nCC-MAIN-2025-38,ISO-8859-6,467,465,0.0000\nCC-MAIN-2025-38,ISO-8859-7,105092,104878,0.0044\nCC-MAIN-2025-38,ISO-8859-8,15234,15223,0.0006\nCC-MAIN-2025-38,ISO-8859-9,550453,548582,0.0231\nCC-MAIN-2025-38,KOI8-R,145472,145258,0.0061\nCC-MAIN-2025-38,KOI8-U,671,671,0.0000\nCC-MAIN-2025-38,Shift_JIS,3740013,3728069,0.1568\nCC-MAIN-2025-38,TIS-620,126507,125899,0.0053\nCC-MAIN-2025-38,US-ASCII,457708,457252,0.0192\nCC-MAIN-2025-38,UTF-16,104524,104395,0.0044\nCC-MAIN-2025-38,UTF-16BE,5769,5766,0.0002\nCC-MAIN-2025-38,UTF-16LE,22858,22792,0.0010\nCC-MAIN-2025-38,UTF-32,897,896,0.0000\nCC-MAIN-2025-38,UTF-32LE,7223,7210,0.0003\nCC-MAIN-2025-38,UTF-8,2177507389,2165401450,91.2632\nCC-MAIN-2025-38,windows-1250,1479383,1473300,0.0620\nCC-MAIN-2025-38,windows-1251,11152909,11095127,0.4674\nCC-MAIN-2025-38,windows-1252,3080462,3049521,0.1291\nCC-MAIN-2025-38,windows-1253,41734,41473,0.0017\nCC-MAIN-2025-38,windows-1254,258677,257043,0.0108\nCC-MAIN-2025-38,windows-1255,109504,109207,0.0046\nCC-MAIN-2025-38,windows-1256,804761,801565,0.0337\nCC-MAIN-2025-38,windows-1257,149372,149161,0.0063\nCC-MAIN-2025-38,windows-31j,10137,10104,0.0004\nCC-MAIN-2025-38,x-iso-8859-11,1275,1267,0.0001\nCC-MAIN-2025-38,x-windows-874,174619,174338,0.0073\nCC-MAIN-2025-38,x-windows-949,45,45,0.0000\nCC-MAIN-2025-43,<other>,1153,1148,0.0000\nCC-MAIN-2025-43,<unknown>,37453021,37453021,1.4313\nCC-MAIN-2025-43,Big5,1124779,1123864,0.0430\nCC-MAIN-2025-43,Big5-HKSCS,1398,1398,0.0001\nCC-MAIN-2025-43,EUC-JP,3146123,3139443,0.1202\nCC-MAIN-2025-43,EUC-KR,1836383,1833588,0.0702\nCC-MAIN-2025-43,GB18030,338949,336860,0.0130\nCC-MAIN-2025-43,GB2312,5494610,5486693,0.2100\nCC-MAIN-2025-43,GBK,2533095,2529358,0.0968\nCC-MAIN-2025-43,IBM420,86563,86423,0.0033\nCC-MAIN-2025-43,IBM424,38599,38522,0.0015\nCC-MAIN-2025-43,IBM50
0,25613,25493,0.0010\nCC-MAIN-2025-43,IBM855,2,2,0.0000\nCC-MAIN-2025-43,IBM866,6247,6242,0.0002\nCC-MAIN-2025-43,ISO-2022-JP,24358,24299,0.0009\nCC-MAIN-2025-43,ISO-8859-1,143034496,142716588,5.4660\nCC-MAIN-2025-43,ISO-8859-13,2013,2012,0.0001\nCC-MAIN-2025-43,ISO-8859-15,1053262,1047401,0.0403\nCC-MAIN-2025-43,ISO-8859-16,4471,4456,0.0002\nCC-MAIN-2025-43,ISO-8859-2,2120995,2113723,0.0811\nCC-MAIN-2025-43,ISO-8859-3,7211,7166,0.0003\nCC-MAIN-2025-43,ISO-8859-4,14735,14681,0.0006\nCC-MAIN-2025-43,ISO-8859-5,25536,25437,0.0010\nCC-MAIN-2025-43,ISO-8859-6,508,504,0.0000\nCC-MAIN-2025-43,ISO-8859-7,115117,114769,0.0044\nCC-MAIN-2025-43,ISO-8859-8,16579,16559,0.0006\nCC-MAIN-2025-43,ISO-8859-9,554398,552990,0.0212\nCC-MAIN-2025-43,KOI8-R,170087,169344,0.0065\nCC-MAIN-2025-43,KOI8-U,853,853,0.0000\nCC-MAIN-2025-43,Shift_JIS,3819837,3808500,0.1460\nCC-MAIN-2025-43,TIS-620,123733,123075,0.0047\nCC-MAIN-2025-43,US-ASCII,400399,400050,0.0153\nCC-MAIN-2025-43,UTF-16,112747,112457,0.0043\nCC-MAIN-2025-43,UTF-16BE,4434,4431,0.0002\nCC-MAIN-2025-43,UTF-16LE,22656,22550,0.0009\nCC-MAIN-2025-43,UTF-32,1000,998,0.0000\nCC-MAIN-2025-43,UTF-32LE,6361,6343,0.0002\nCC-MAIN-2025-43,UTF-8,2395035360,2382270083,91.5255\nCC-MAIN-2025-43,windows-1250,1715297,1708444,0.0655\nCC-MAIN-2025-43,windows-1251,11375260,11320356,0.4347\nCC-MAIN-2025-43,windows-1252,3351883,3338358,0.1281\nCC-MAIN-2025-43,windows-1253,50858,50755,0.0019\nCC-MAIN-2025-43,windows-1254,265939,263968,0.0102\nCC-MAIN-2025-43,windows-1255,157376,155638,0.0060\nCC-MAIN-2025-43,windows-1256,776448,773805,0.0297\nCC-MAIN-2025-43,windows-1257,154565,154173,0.0059\nCC-MAIN-2025-43,windows-31j,10524,10494,0.0004\nCC-MAIN-2025-43,x-iso-8859-11,1763,1751,0.0001\nCC-MAIN-2025-43,x-windows-874,179141,178748,0.0068\nCC-MAIN-2025-43,x-windows-949,122,121,0.0000\nCC-MAIN-2025-47,<other>,1317,1315,0.0001\nCC-MAIN-2025-47,<unknown>,39443469,39443469,1.7191\nCC-MAIN-2025-47,Big5,1063523,1062806,0.0464\nCC-MAIN-2025-47,Big5-HKSCS,859,856
,0.0000\nCC-MAIN-2025-47,EUC-JP,3086185,3079651,0.1345\nCC-MAIN-2025-47,EUC-KR,1795791,1793520,0.0783\nCC-MAIN-2025-47,GB18030,367754,365496,0.0160\nCC-MAIN-2025-47,GB2312,5715599,5679107,0.2491\nCC-MAIN-2025-47,GBK,2391833,2383579,0.1042\nCC-MAIN-2025-47,IBM420,86580,86451,0.0038\nCC-MAIN-2025-47,IBM424,32971,32565,0.0014\nCC-MAIN-2025-47,IBM500,27152,27098,0.0012\nCC-MAIN-2025-47,IBM866,5042,5031,0.0002\nCC-MAIN-2025-47,ISO-2022-JP,24412,24340,0.0011\nCC-MAIN-2025-47,ISO-8859-1,131865822,131568817,5.7471\nCC-MAIN-2025-47,ISO-8859-13,2591,2591,0.0001\nCC-MAIN-2025-47,ISO-8859-15,1031064,1025229,0.0449\nCC-MAIN-2025-47,ISO-8859-16,4748,4730,0.0002\nCC-MAIN-2025-47,ISO-8859-2,2037113,2031794,0.0888\nCC-MAIN-2025-47,ISO-8859-3,10162,10086,0.0004\nCC-MAIN-2025-47,ISO-8859-4,15507,15444,0.0007\nCC-MAIN-2025-47,ISO-8859-5,26512,26415,0.0012\nCC-MAIN-2025-47,ISO-8859-6,438,437,0.0000\nCC-MAIN-2025-47,ISO-8859-7,102631,102290,0.0045\nCC-MAIN-2025-47,ISO-8859-8,16610,16594,0.0007\nCC-MAIN-2025-47,ISO-8859-9,502346,501160,0.0219\nCC-MAIN-2025-47,KOI8-R,160423,160036,0.0070\nCC-MAIN-2025-47,KOI8-U,1146,1047,0.0000\nCC-MAIN-2025-47,Shift_JIS,3557286,3549729,0.1550\nCC-MAIN-2025-47,TIS-620,94238,93994,0.0041\nCC-MAIN-2025-47,US-ASCII,423256,422779,0.0184\nCC-MAIN-2025-47,UTF-16,110179,109844,0.0048\nCC-MAIN-2025-47,UTF-16BE,8083,8080,0.0004\nCC-MAIN-2025-47,UTF-16LE,25975,25887,0.0011\nCC-MAIN-2025-47,UTF-32,2003,1995,0.0001\nCC-MAIN-2025-47,UTF-32LE,5377,5362,0.0002\nCC-MAIN-2025-47,UTF-8,2083125185,2071782858,90.7888\nCC-MAIN-2025-47,windows-1250,1618940,1612817,0.0706\nCC-MAIN-2025-47,windows-1251,10937095,10880107,0.4767\nCC-MAIN-2025-47,windows-1252,3223407,3210025,0.1405\nCC-MAIN-2025-47,windows-1253,48328,48190,0.0021\nCC-MAIN-2025-47,windows-1254,248498,247261,0.0108\nCC-MAIN-2025-47,windows-1255,148494,148058,0.0065\nCC-MAIN-2025-47,windows-1256,739186,736908,0.0322\nCC-MAIN-2025-47,windows-1257,154463,154125,0.0067\nCC-MAIN-2025-47,windows-31j,9500,9464,0.0004\nCC-MAI
N-2025-47,x-iso-8859-11,1334,1329,0.0001\nCC-MAIN-2025-47,x-windows-874,172331,172137,0.0075\nCC-MAIN-2025-47,x-windows-949,154,153,0.0000\nCC-MAIN-2025-51,<other>,1188,1187,0.0001\nCC-MAIN-2025-51,<unknown>,38863941,38863941,1.7917\nCC-MAIN-2025-51,Big5,1241259,1240349,0.0572\nCC-MAIN-2025-51,Big5-HKSCS,529,529,0.0000\nCC-MAIN-2025-51,EUC-JP,2960023,2951962,0.1365\nCC-MAIN-2025-51,EUC-KR,1744249,1742092,0.0804\nCC-MAIN-2025-51,GB18030,454626,452920,0.0210\nCC-MAIN-2025-51,GB2312,6501585,6488201,0.2997\nCC-MAIN-2025-51,GBK,2555350,2551418,0.1178\nCC-MAIN-2025-51,IBM420,114468,114295,0.0053\nCC-MAIN-2025-51,IBM424,32270,32203,0.0015\nCC-MAIN-2025-51,IBM500,23153,23096,0.0011\nCC-MAIN-2025-51,IBM855,1,1,0.0000\nCC-MAIN-2025-51,IBM866,5307,5300,0.0002\nCC-MAIN-2025-51,ISO-2022-JP,23068,23020,0.0011\nCC-MAIN-2025-51,ISO-8859-1,120412093,120124319,5.5513\nCC-MAIN-2025-51,ISO-8859-13,3175,3174,0.0001\nCC-MAIN-2025-51,ISO-8859-15,997847,991538,0.0460\nCC-MAIN-2025-51,ISO-8859-16,4622,4613,0.0002\nCC-MAIN-2025-51,ISO-8859-2,1846923,1841685,0.0851\nCC-MAIN-2025-51,ISO-8859-3,908,904,0.0000\nCC-MAIN-2025-51,ISO-8859-4,15157,15099,0.0007\nCC-MAIN-2025-51,ISO-8859-5,24200,24106,0.0011\nCC-MAIN-2025-51,ISO-8859-6,565,564,0.0000\nCC-MAIN-2025-51,ISO-8859-7,98902,98617,0.0046\nCC-MAIN-2025-51,ISO-8859-8,17503,17486,0.0008\nCC-MAIN-2025-51,ISO-8859-9,483913,482829,0.0223\nCC-MAIN-2025-51,KOI8-R,135451,135201,0.0062\nCC-MAIN-2025-51,KOI8-U,1079,1079,0.0000\nCC-MAIN-2025-51,Shift_JIS,3541809,3533191,0.1633\nCC-MAIN-2025-51,TIS-620,92549,92264,0.0043\nCC-MAIN-2025-51,US-ASCII,448995,448647,0.0207\nCC-MAIN-2025-51,UTF-16,78492,78280,0.0036\nCC-MAIN-2025-51,UTF-16BE,4193,4190,0.0002\nCC-MAIN-2025-51,UTF-16LE,24320,24245,0.0011\nCC-MAIN-2025-51,UTF-32,921,918,0.0000\nCC-MAIN-2025-51,UTF-32LE,5334,5325,0.0002\nCC-MAIN-2025-51,UTF-8,1969723245,1959074053,90.8089\nCC-MAIN-2025-51,windows-1250,1542348,1536348,0.0711\nCC-MAIN-2025-51,windows-1251,10746918,10686998,0.4955\nCC-MAIN-2025-51,wind
ows-1252,2886755,2873286,0.1331\nCC-MAIN-2025-51,windows-1253,47285,47144,0.0022\nCC-MAIN-2025-51,windows-1254,214500,213371,0.0099\nCC-MAIN-2025-51,windows-1255,139587,139240,0.0064\nCC-MAIN-2025-51,windows-1256,714645,712244,0.0329\nCC-MAIN-2025-51,windows-1257,138423,138186,0.0064\nCC-MAIN-2025-51,windows-31j,8737,8699,0.0004\nCC-MAIN-2025-51,x-iso-8859-11,1475,1468,0.0001\nCC-MAIN-2025-51,x-windows-874,163280,163073,0.0075\nCC-MAIN-2025-51,x-windows-949,113,112,0.0000\nCC-MAIN-2026-04,<other>,1400,1396,0.0001\nCC-MAIN-2026-04,<unknown>,37907015,37907015,1.6272\nCC-MAIN-2026-04,Big5,588266,587325,0.0253\nCC-MAIN-2026-04,Big5-HKSCS,477,477,0.0000\nCC-MAIN-2026-04,EUC-JP,2993867,2986734,0.1285\nCC-MAIN-2026-04,EUC-KR,1794412,1792192,0.0770\nCC-MAIN-2026-04,GB18030,384621,382169,0.0165\nCC-MAIN-2026-04,GB2312,5112611,5104768,0.2195\nCC-MAIN-2026-04,GBK,2309171,2304002,0.0991\nCC-MAIN-2026-04,IBM420,93194,93016,0.0040\nCC-MAIN-2026-04,IBM424,41331,40895,0.0018\nCC-MAIN-2026-04,IBM500,23922,23855,0.0010\nCC-MAIN-2026-04,IBM855,3,3,0.0000\nCC-MAIN-2026-04,IBM866,5088,5084,0.0002\nCC-MAIN-2026-04,ISO-2022-JP,20237,20196,0.0009\nCC-MAIN-2026-04,ISO-8859-1,102486936,102206718,4.3993\nCC-MAIN-2026-04,ISO-8859-13,1716,1716,0.0001\nCC-MAIN-2026-04,ISO-8859-15,1062047,1056392,0.0456\nCC-MAIN-2026-04,ISO-8859-16,6228,6197,0.0003\nCC-MAIN-2026-04,ISO-8859-2,1918889,1912884,0.0824\nCC-MAIN-2026-04,ISO-8859-3,871,869,0.0000\nCC-MAIN-2026-04,ISO-8859-4,14261,14186,0.0006\nCC-MAIN-2026-04,ISO-8859-5,35470,35348,0.0015\nCC-MAIN-2026-04,ISO-8859-6,433,431,0.0000\nCC-MAIN-2026-04,ISO-8859-7,106736,106442,0.0046\nCC-MAIN-2026-04,ISO-8859-8,14485,14468,0.0006\nCC-MAIN-2026-04,ISO-8859-9,461234,460059,0.0198\nCC-MAIN-2026-04,KOI8-R,132262,132087,0.0057\nCC-MAIN-2026-04,KOI8-U,1445,1445,0.0001\nCC-MAIN-2026-04,Shift_JIS,3741883,3731593,0.1606\nCC-MAIN-2026-04,TIS-620,86399,86022,0.0037\nCC-MAIN-2026-04,US-ASCII,452975,452564,0.0194\nCC-MAIN-2026-04,UTF-16,58474,58258,0.0025\nCC-MAIN-2026-
04,UTF-16BE,4048,4043,0.0002\nCC-MAIN-2026-04,UTF-16LE,28665,28565,0.0012\nCC-MAIN-2026-04,UTF-32,1286,1282,0.0001\nCC-MAIN-2026-04,UTF-32LE,4183,4164,0.0002\nCC-MAIN-2026-04,UTF-8,2150861477,2139789123,92.3263\nCC-MAIN-2026-04,windows-1250,1556707,1550366,0.0668\nCC-MAIN-2026-04,windows-1251,10903988,10852460,0.4681\nCC-MAIN-2026-04,windows-1252,2960777,2948671,0.1271\nCC-MAIN-2026-04,windows-1253,47352,47208,0.0020\nCC-MAIN-2026-04,windows-1254,233063,232035,0.0100\nCC-MAIN-2026-04,windows-1255,137339,136816,0.0059\nCC-MAIN-2026-04,windows-1256,721134,719124,0.0310\nCC-MAIN-2026-04,windows-1257,138057,137791,0.0059\nCC-MAIN-2026-04,windows-31j,8699,8637,0.0004\nCC-MAIN-2026-04,x-iso-8859-11,1303,1294,0.0001\nCC-MAIN-2026-04,x-windows-874,164215,163950,0.0070\nCC-MAIN-2026-04,x-windows-949,103,102,0.0000\nCC-MAIN-2026-08,<other>,1107,1102,0.0001\nCC-MAIN-2026-08,<unknown>,39361187,39361187,1.8164\nCC-MAIN-2026-08,Big5,475412,474249,0.0219\nCC-MAIN-2026-08,Big5-HKSCS,354,354,0.0000\nCC-MAIN-2026-08,EUC-JP,2841869,2834745,0.1311\nCC-MAIN-2026-08,EUC-KR,1700919,1698442,0.0785\nCC-MAIN-2026-08,GB18030,322227,320876,0.0149\nCC-MAIN-2026-08,GB2312,4998687,4986918,0.2307\nCC-MAIN-2026-08,GBK,2196094,2189822,0.1013\nCC-MAIN-2026-08,IBM420,111253,111107,0.0051\nCC-MAIN-2026-08,IBM424,50533,48749,0.0023\nCC-MAIN-2026-08,IBM500,22862,22795,0.0011\nCC-MAIN-2026-08,IBM866,5491,5468,0.0003\nCC-MAIN-2026-08,ISO-2022-JP,21464,21441,0.0010\nCC-MAIN-2026-08,ISO-8859-1,144044345,143728455,6.6472\nCC-MAIN-2026-08,ISO-8859-13,909,909,0.0000\nCC-MAIN-2026-08,ISO-8859-15,1009980,1004835,0.0466\nCC-MAIN-2026-08,ISO-8859-16,3992,3982,0.0002\nCC-MAIN-2026-08,ISO-8859-2,1964087,1958260,0.0906\nCC-MAIN-2026-08,ISO-8859-3,4088,4081,0.0002\nCC-MAIN-2026-08,ISO-8859-4,12139,12065,0.0006\nCC-MAIN-2026-08,ISO-8859-5,34324,34208,0.0016\nCC-MAIN-2026-08,ISO-8859-6,369,366,0.0000\nCC-MAIN-2026-08,ISO-8859-7,93850,93579,0.0043\nCC-MAIN-2026-08,ISO-8859-8,15080,15069,0.0007\nCC-MAIN-2026-08,ISO-8859-9,
423726,422618,0.0196\nCC-MAIN-2026-08,KOI8-R,144967,144761,0.0067\nCC-MAIN-2026-08,KOI8-U,1187,1187,0.0001\nCC-MAIN-2026-08,Shift_JIS,3789895,3779981,0.1749\nCC-MAIN-2026-08,TIS-620,82849,82650,0.0038\nCC-MAIN-2026-08,US-ASCII,410131,409733,0.0189\nCC-MAIN-2026-08,UTF-16,58772,58452,0.0027\nCC-MAIN-2026-08,UTF-16BE,4114,4110,0.0002\nCC-MAIN-2026-08,UTF-16LE,32287,32162,0.0015\nCC-MAIN-2026-08,UTF-32,1301,1297,0.0001\nCC-MAIN-2026-08,UTF-32LE,3846,3813,0.0002\nCC-MAIN-2026-08,UTF-8,1946369417,1935479110,89.8190\nCC-MAIN-2026-08,windows-1250,1474703,1468675,0.0681\nCC-MAIN-2026-08,windows-1251,10445933,10390217,0.4820\nCC-MAIN-2026-08,windows-1252,3104479,3091168,0.1433\nCC-MAIN-2026-08,windows-1253,41837,41721,0.0019\nCC-MAIN-2026-08,windows-1254,224389,223535,0.0104\nCC-MAIN-2026-08,windows-1255,128927,128435,0.0059\nCC-MAIN-2026-08,windows-1256,655622,653668,0.0303\nCC-MAIN-2026-08,windows-1257,134133,133863,0.0062\nCC-MAIN-2026-08,windows-31j,8160,8131,0.0004\nCC-MAIN-2026-08,x-iso-8859-11,2443,2407,0.0001\nCC-MAIN-2026-08,x-windows-874,155917,155638,0.0072\nCC-MAIN-2026-08,x-windows-949,65,64,0.0000\nCC-MAIN-2026-12,<other>,1361,1356,0.0001\nCC-MAIN-2026-12,<unknown>,36005030,36005030,1.8232\nCC-MAIN-2026-12,Big5,391629,390834,0.0198\nCC-MAIN-2026-12,Big5-HKSCS,353,353,0.0000\nCC-MAIN-2026-12,EUC-JP,2647198,2639972,0.1340\nCC-MAIN-2026-12,EUC-KR,1617501,1615292,0.0819\nCC-MAIN-2026-12,GB18030,325641,324955,0.0165\nCC-MAIN-2026-12,GB2312,4715643,4708447,0.2388\nCC-MAIN-2026-12,GBK,1975372,1972356,0.1000\nCC-MAIN-2026-12,IBM420,96205,96013,0.0049\nCC-MAIN-2026-12,IBM424,40627,40428,0.0021\nCC-MAIN-2026-12,IBM500,20849,20773,0.0011\nCC-MAIN-2026-12,IBM855,2,2,0.0000\nCC-MAIN-2026-12,IBM866,3139,3139,0.0002\nCC-MAIN-2026-12,ISO-2022-JP,23099,23078,0.0012\nCC-MAIN-2026-12,ISO-8859-1,65925622,65713352,3.3383\nCC-MAIN-2026-12,ISO-8859-13,616,616,0.0000\nCC-MAIN-2026-12,ISO-8859-15,944960,940381,0.0478\nCC-MAIN-2026-12,ISO-8859-16,6257,6235,0.0003\nCC-MAIN-2026-12,ISO-88
59-2,1742113,1736983,0.0882\nCC-MAIN-2026-12,ISO-8859-3,6679,6673,0.0003\nCC-MAIN-2026-12,ISO-8859-4,12876,12816,0.0007\nCC-MAIN-2026-12,ISO-8859-5,28746,28653,0.0015\nCC-MAIN-2026-12,ISO-8859-6,366,363,0.0000\nCC-MAIN-2026-12,ISO-8859-7,85880,85660,0.0043\nCC-MAIN-2026-12,ISO-8859-8,16121,16106,0.0008\nCC-MAIN-2026-12,ISO-8859-9,396267,395249,0.0201\nCC-MAIN-2026-12,KOI8-R,129674,129487,0.0066\nCC-MAIN-2026-12,KOI8-U,1227,1226,0.0001\nCC-MAIN-2026-12,Shift_JIS,3579430,3569741,0.1813\nCC-MAIN-2026-12,TIS-620,74370,74216,0.0038\nCC-MAIN-2026-12,US-ASCII,395393,394971,0.0200\nCC-MAIN-2026-12,UTF-16,44781,44548,0.0023\nCC-MAIN-2026-12,UTF-16BE,3684,3674,0.0002\nCC-MAIN-2026-12,UTF-16LE,29448,29123,0.0015\nCC-MAIN-2026-12,UTF-32,992,988,0.0001\nCC-MAIN-2026-12,UTF-32LE,4546,4516,0.0002\nCC-MAIN-2026-12,UTF-8,1837974229,1827614246,93.0693\nCC-MAIN-2026-12,windows-1250,1359762,1354264,0.0689\nCC-MAIN-2026-12,windows-1251,9919771,9867155,0.5023\nCC-MAIN-2026-12,windows-1252,3075119,3060164,0.1557\nCC-MAIN-2026-12,windows-1253,46720,46373,0.0024\nCC-MAIN-2026-12,windows-1254,255609,253011,0.0129\nCC-MAIN-2026-12,windows-1255,115854,115475,0.0059\nCC-MAIN-2026-12,windows-1256,545093,543005,0.0276\nCC-MAIN-2026-12,windows-1257,116683,116435,0.0059\nCC-MAIN-2026-12,windows-31j,7656,7636,0.0004\nCC-MAIN-2026-12,x-iso-8859-11,2578,2562,0.0001\nCC-MAIN-2026-12,x-windows-874,132392,132120,0.0067\nCC-MAIN-2026-12,x-windows-949,71,70,0.0000\nCC-MAIN-2026-17,<other>,2318,2314,0.0001\nCC-MAIN-2026-17,<unknown>,41467368,41467368,1.8918\nCC-MAIN-2026-17,Big5,652206,651651,0.0298\nCC-MAIN-2026-17,Big5-HKSCS,772,772,0.0000\nCC-MAIN-2026-17,EUC-JP,2774903,2767865,0.1266\nCC-MAIN-2026-17,EUC-KR,1691059,1688850,0.0771\nCC-MAIN-2026-17,GB18030,328133,327466,0.0150\nCC-MAIN-2026-17,GB2312,4407671,4401246,0.2011\nCC-MAIN-2026-17,GBK,2047427,2043670,0.0934\nCC-MAIN-2026-17,IBM420,110960,110719,0.0051\nCC-MAIN-2026-17,IBM424,25193,25072,0.0011\nCC-MAIN-2026-17,IBM500,17952,17908,0.0008\nCC-MAIN-2
026-17,IBM866,2526,2523,0.0001\nCC-MAIN-2026-17,ISO-2022-JP,22833,22808,0.0010\nCC-MAIN-2026-17,ISO-8859-1,59456401,59246052,2.7125\nCC-MAIN-2026-17,ISO-8859-13,620,620,0.0000\nCC-MAIN-2026-17,ISO-8859-15,973840,967873,0.0444\nCC-MAIN-2026-17,ISO-8859-16,6935,6917,0.0003\nCC-MAIN-2026-17,ISO-8859-2,1791551,1785905,0.0817\nCC-MAIN-2026-17,ISO-8859-3,7325,7305,0.0003\nCC-MAIN-2026-17,ISO-8859-4,14715,14662,0.0007\nCC-MAIN-2026-17,ISO-8859-5,16730,16638,0.0008\nCC-MAIN-2026-17,ISO-8859-6,449,447,0.0000\nCC-MAIN-2026-17,ISO-8859-7,88024,87744,0.0040\nCC-MAIN-2026-17,ISO-8859-8,14271,14251,0.0007\nCC-MAIN-2026-17,ISO-8859-9,516036,514479,0.0235\nCC-MAIN-2026-17,KOI8-R,167093,166532,0.0076\nCC-MAIN-2026-17,KOI8-U,1905,1905,0.0001\nCC-MAIN-2026-17,Shift_JIS,3241088,3230774,0.1479\nCC-MAIN-2026-17,TIS-620,79240,79071,0.0036\nCC-MAIN-2026-17,US-ASCII,445179,444631,0.0203\nCC-MAIN-2026-17,UTF-16,47193,47017,0.0022\nCC-MAIN-2026-17,UTF-16BE,6708,6706,0.0003\nCC-MAIN-2026-17,UTF-16LE,84922,84770,0.0039\nCC-MAIN-2026-17,UTF-32,1021,1017,0.0000\nCC-MAIN-2026-17,UTF-32LE,3372,3352,0.0002\nCC-MAIN-2026-17,UTF-8,2054795645,2042701966,93.7434\nCC-MAIN-2026-17,windows-1250,1459400,1453648,0.0666\nCC-MAIN-2026-17,windows-1251,10605458,10541589,0.4838\nCC-MAIN-2026-17,windows-1252,3344637,3329213,0.1526\nCC-MAIN-2026-17,windows-1253,52150,51994,0.0024\nCC-MAIN-2026-17,windows-1254,270316,267976,0.0123\nCC-MAIN-2026-17,windows-1255,116790,116111,0.0053\nCC-MAIN-2026-17,windows-1256,526124,524625,0.0240\nCC-MAIN-2026-17,windows-1257,115165,114923,0.0053\nCC-MAIN-2026-17,windows-31j,7881,7830,0.0004\nCC-MAIN-2026-17,x-iso-8859-11,855,852,0.0000\nCC-MAIN-2026-17,x-windows-874,125810,125471,0.0057\nCC-MAIN-2026-17,x-windows-949,130,129,0.0000\n"
  },
  {
    "path": "plots/charsets.md",
    "content": "---\nlayout: table\ntable_include: charsets-top-100.html\ntable_sortlist: \"{sortList: [[1,1]]}\"\n---\n\nCharacter Encoding of HTML Pages\n================================\n\nThe [character set or encoding](https://en.wikipedia.org/wiki/Character_encoding) of HTML pages only is identified by [Tika](https://tika.apache.org/)'s [AutoDetectReader](https://tika.apache.org/1.25/api/org/apache/tika/detect/AutoDetectReader.html). The table shows the percentage how character sets have been used to encode HTML pages crawled by the latest monthly crawls. The underlying data including page counts is provided in [charsets.csv](./charsets.csv).\n"
  },
  {
    "path": "plots/crawlermetrics.md",
    "content": "Crawler-Related Metrics\n=======================\n\nCrawler-related metrics are extracted from the crawler log files, cf. [../stats/crawler/](https://github.com/commoncrawl/cc-crawl-statistics/blob/master/stats/crawler/) and include\n- the size of the URL database (CrawlDb)\n- the fetch list size (number of URLs scheduled for fetching)\n- the response status of the fetch:\n  - success\n  - redirect\n  - denied (forbidden by HTTP 403 or robots.txt)\n  - failed (404, host not found, etc.)\n- usage of http/https URL protocols (schemes)\n\nThe first plot shows absolute number for the metrics.\n\n![Crawler metrics](./crawler/metrics.png)\n\nThe relative portion of the fetch status is shown in the second graphics.\n\n![Percentage of fetch status](./crawler/fetch_status_percentage.png)\n\nThe next figure shows the relative usage of http and https URL protocols (schemes). The increasing usage HTTPS on the web is reflected. But also crawler properties such as sampling, deduplication and URL canonicalization) may influence the actual amount of HTTPS URLs in a single monthly crawl.\n\n![Percentage of HTTP vs. HTTPS URLs](./crawler/url_protocols_percentage.png)\n\nThe crawls are backed by a CrawlDb which stores URLs, fetch time, status information, content checksum and various other metadata. HTTP response codes are mapped to coarse [CrawlDatum states](https://cwiki.apache.org/confluence/display/NUTCH/CrawlDatumStates) and so are other status signals, such as disallowed by robots.txt or the result of a deduplication job. By adding permanently new URLs, the CrawlDb is growing and requires a permanent cleanup which removes stale URLs. The figure below shows the development of the CrawlDb over time, including the amount of CrawlDatum states. Size and counts are recorded before the fetching of a monthly crawl.\n\n![CrawlDb size and status counts](./crawler/crawldb_status.png)\n\n"
  },
  {
    "path": "plots/crawloverlap.md",
    "content": "Overlaps between Common Crawl Monthly Archives\n==============================================\n\nOverlaps between monthly crawl archives are calculated and plotted as [Jaccard similarity](https://en.wikipedia.org/wiki/Jaccard_index) of unique URLs or content digests. The cardinality of the monthly crawls and the union of two crawls are [Hyperloglog](https://en.wikipedia.org/wiki/HyperLogLog) estimates, cf. [plot/overlap.py](https://github.com/commoncrawl/cc-crawl-statistics/blob/master/plot/overlap.py) for details.\n\n![URL overlap (Jaccard similarity) between Common Crawl monthly crawls](./crawloverlap/crawlsimilarity_matrix_url.png)\n\n![Content overlap between Common Crawl monthly crawls (Jaccard similarity on unique content digests)](./crawloverlap/crawlsimilarity_matrix_digest.png)\n\nNote, that the content overlaps are small and in the same order of magnitude as the 1% error rate of the Hyperloglog cardinality estimates.\n"
  },
  {
    "path": "plots/crawlsize/cumulative.csv",
    "content": "crawl,digest estim.,page,url estim.\nCC-MAIN-2008-2009,1804803498,1798158091,1799114116\nCC-MAIN-2009-2010,4339999986,4661653302,3824634756\nCC-MAIN-2012,7847769263,8490193179,6700436803\nCC-MAIN-2013-20,9490547971,10286291822,8195754186\nCC-MAIN-2013-48,11503581137,12532065489,9346464155\nCC-MAIN-2014-10,13572625500,14833288963,9832774963\nCC-MAIN-2014-15,15602447332,17474660279,9950397001\nCC-MAIN-2014-23,18641073418,21083381155,10354691655\nCC-MAIN-2014-35,20956079021,23954073578,10458526844\nCC-MAIN-2014-41,23507937056,26933817121,10595820253\nCC-MAIN-2014-42,26228211380,30655948799,10668931260\nCC-MAIN-2014-49,27770806276,32604459232,10722997344\nCC-MAIN-2014-52,29465863477,34690436439,10815040325\nCC-MAIN-2015-06,30940526320,36516460542,10880192370\nCC-MAIN-2015-11,32463979449,38353656631,11021004856\nCC-MAIN-2015-14,33766065049,40000354165,11087874963\nCC-MAIN-2015-18,35326761691,42116172224,11179957192\nCC-MAIN-2015-22,36837279660,44131633672,11276662468\nCC-MAIN-2015-27,38376895047,45807252770,11338154181\nCC-MAIN-2015-32,39907079198,47622745179,11405145059\nCC-MAIN-2015-35,41467358985,49470767654,11453781702\nCC-MAIN-2015-40,42565334478,50792755033,11497150192\nCC-MAIN-2015-48,44230018316,52616925560,11605145185\nCC-MAIN-2016-07,45520871944,54350210682,11686758494\nCC-MAIN-2016-18,46751042145,55685257605,11708221081\nCC-MAIN-2016-22,47857808281,57151478403,11859582835\nCC-MAIN-2016-26,48868077184,58388294063,11902605722\nCC-MAIN-2016-30,50237632397,60125616367,12075123774\nCC-MAIN-2016-36,51295633217,61737229457,12189524326\nCC-MAIN-2016-40,52743152144,63459885850,12331627743\nCC-MAIN-2016-44,55627173775,66714862581,14005397439\nCC-MAIN-2016-50,57996438129,69581144971,14490820500\nCC-MAIN-2017-04,60876695619,72727642997,14906550735\nCC-MAIN-2017-09,63865800399,75812009659,15323698796\nCC-MAIN-2017-13,67119410032,78882730235,16014267196\nCC-MAIN-2017-17,69744509254,81825660717,16583912416\nCC-MAIN-2017-22,72316052190,84792954416,17055886868\
nCC-MAIN-2017-26,75085000318,87958168502,17825096347\nCC-MAIN-2017-30,77552853745,90850382154,18351199107\nCC-MAIN-2017-34,81109194156,94130463064,19177390204\nCC-MAIN-2017-39,83965683990,97147643627,20016213244\nCC-MAIN-2017-43,87295397289,100798073845,20918444015\nCC-MAIN-2017-47,90375199278,104003017418,21711675713\nCC-MAIN-2017-51,93221122901,106917021841,22349157985\nCC-MAIN-2018-05,96431621375,110381559046,23511097105\nCC-MAIN-2018-09,99564273220,113870022365,24583073520\nCC-MAIN-2018-13,102885914035,117102760383,25385911908\nCC-MAIN-2018-17,105613732494,120204114372,25968567715\nCC-MAIN-2018-22,108421602628,122992502379,26505324121\nCC-MAIN-2018-26,111159265312,126061916626,27237490288\nCC-MAIN-2018-30,114425901875,129325874826,27870676728\nCC-MAIN-2018-34,116854075023,132012198184,28504107420\nCC-MAIN-2018-39,119462460866,134853393013,28993693320\nCC-MAIN-2018-43,122415800423,137895177536,29566931364\nCC-MAIN-2018-47,124525048786,140541746080,30203725220\nCC-MAIN-2018-51,127384661711,143705993715,30922118054\nCC-MAIN-2019-04,130280036558,146595720357,31789761988\nCC-MAIN-2019-09,133310062247,149509453779,32532956245\nCC-MAIN-2019-13,135678206416,152079135624,33219709036\nCC-MAIN-2019-18,137745300121,154576954231,33985148178\nCC-MAIN-2019-22,140219941044,157256700481,34776143018\nCC-MAIN-2019-26,142888639070,159850961598,35657441452\nCC-MAIN-2019-30,145327203530,162445759973,36488951083\nCC-MAIN-2019-35,147887838188,165400596038,37629104062\nCC-MAIN-2019-39,150653922510,167961658950,38621609347\nCC-MAIN-2019-43,153231541805,170980695479,39774629837\nCC-MAIN-2019-47,155332742333,173571290652,40909225217\nCC-MAIN-2019-51,157413646943,176043195617,41825244065\nCC-MAIN-2020-05,160461668413,179144292790,42724695533\nCC-MAIN-2020-10,162830752567,181774256252,43809199716\nCC-MAIN-2020-16,165689194086,184660492489,44789599932\nCC-MAIN-2020-24,168064599874,187423699251,46040917543\nCC-MAIN-2020-29,171062084908,190568432671,47154203497\nCC-MAIN-2020-34,173509592974,193
018266910,48095676013\nCC-MAIN-2020-40,176656257005,196491838116,49670234250\nCC-MAIN-2020-45,179298763005,199222901359,51240666293\nCC-MAIN-2020-50,182035630890,201865372860,52618423533\nCC-MAIN-2021-04,184853874152,205266659267,53781737753\nCC-MAIN-2021-10,187408406769,208003409150,55021667409\nCC-MAIN-2021-17,190496420723,211137833956,56407546066\nCC-MAIN-2021-21,192909177042,213769976421,57687854581\nCC-MAIN-2021-25,195201841501,216227608177,59031676141\nCC-MAIN-2021-31,198169308063,219392698032,60025581192\nCC-MAIN-2021-39,201225712241,222352601811,61352022578\nCC-MAIN-2021-43,204833406728,225701779826,62715848469\nCC-MAIN-2021-49,207179211585,228228855625,63924776338\nCC-MAIN-2022-05,210188022512,231215247655,65293210195\nCC-MAIN-2022-21,213617877949,234665071870,66696778543\nCC-MAIN-2022-27,216701932808,237774681542,68119489942\nCC-MAIN-2022-33,219573338989,240363371792,69439230091\nCC-MAIN-2022-40,223169646311,243540134840,70741828607\nCC-MAIN-2022-49,227141025821,246921747728,72000883063\nCC-MAIN-2023-06,229964599953,250111325935,73327803656\nCC-MAIN-2023-14,233370072352,253229959348,74604374730\nCC-MAIN-2023-23,235805412777,256370533316,75614359781\nCC-MAIN-2023-40,239485697308,259815548353,76838156387\nCC-MAIN-2023-50,243498181317,263169590477,78252035354\nCC-MAIN-2024-10,246441310436,266276116043,79643622874\nCC-MAIN-2024-18,249355638842,269062916100,80624442373\nCC-MAIN-2024-22,251639784779,271772794075,81543301245\nCC-MAIN-2024-26,253997038560,274570841101,82488799113\nCC-MAIN-2024-30,256394048536,277117471496,83437816689\nCC-MAIN-2024-33,259118617115,279433397912,84287023650\nCC-MAIN-2024-38,261724865107,282234291375,85282072602\nCC-MAIN-2024-42,263714594810,284729482129,86315032134\nCC-MAIN-2024-46,266385356719,287417293876,87294467131\nCC-MAIN-2024-51,269430609904,290052656232,88348928908\nCC-MAIN-2025-05,272915812712,293083934569,89334444115\nCC-MAIN-2025-08,276246105116,295763640625,90367464910\nCC-MAIN-2025-13,278777325777,298504484812,9127034425
3\nCC-MAIN-2025-18,280809279268,301251820922,92108476329\nCC-MAIN-2025-21,282504734859,303728986524,92762606290\nCC-MAIN-2025-26,284791401008,306114590473,93475687576\nCC-MAIN-2025-30,287064143452,308537170980,94238953789\nCC-MAIN-2025-33,289427337023,310979664458,94914252824\nCC-MAIN-2025-38,291730810048,313365628667,95715270548\nCC-MAIN-2025-43,293577931360,315982425524,96462869345\nCC-MAIN-2025-47,296088842711,318276898436,97099631663\nCC-MAIN-2025-51,298445856189,320445985715,97883155597\nCC-MAIN-2026-04,301026872854,322775616470,98499220111\nCC-MAIN-2026-08,302693544790,324942608192,99125333660\nCC-MAIN-2026-12,304458347420,326917453426,99725480448\nCC-MAIN-2026-17,306800659832,329109389726,100385941968\n"
  },
  {
    "path": "plots/crawlsize/domain.csv",
    "content": "crawl,domain,host,tld,url\nCC-MAIN-2008-2009,15045431,32086112,1496,1790932667\nCC-MAIN-2009-2010,30794437,68991076,4711,2301135881\nCC-MAIN-2012,41205862,108312113,4533,3597338329\nCC-MAIN-2013-20,13146177,24715985,3557,1666857706\nCC-MAIN-2013-48,13811062,26865697,3587,2085501361\nCC-MAIN-2014-10,15573396,30260036,3805,2032050611\nCC-MAIN-2014-15,15617272,30432463,3844,1718646762\nCC-MAIN-2014-23,16427529,32047686,3997,2116640253\nCC-MAIN-2014-35,16035620,31236378,3986,1877746879\nCC-MAIN-2014-41,16193652,31899800,4043,1980620845\nCC-MAIN-2014-42,16130921,30903420,4038,1602175249\nCC-MAIN-2014-49,14841151,25341644,3961,1321875973\nCC-MAIN-2014-52,15659214,26944971,4053,1905493151\nCC-MAIN-2015-06,15069183,25388182,4028,1679287071\nCC-MAIN-2015-11,14894291,26083379,4042,1685659195\nCC-MAIN-2015-14,14489203,25268429,4018,1514869973\nCC-MAIN-2015-18,15205382,26713877,4071,1934559347\nCC-MAIN-2015-22,15152686,26650871,4084,1836492906\nCC-MAIN-2015-27,14020009,24412992,4009,1531042999\nCC-MAIN-2015-32,14309119,25082257,4049,1649248826\nCC-MAIN-2015-35,14538242,25493476,4086,1673197542\nCC-MAIN-2015-40,12405056,21201836,3927,1215112821\nCC-MAIN-2015-48,14336765,25267526,4083,1644173738\nCC-MAIN-2016-07,14015346,24559106,4092,1560185771\nCC-MAIN-2016-18,13267938,23006430,4049,1335046923\nCC-MAIN-2016-22,20350958,32432769,4505,1466220798\nCC-MAIN-2016-26,18960939,29359449,4266,1236815660\nCC-MAIN-2016-30,20846085,33908950,4566,1632457174\nCC-MAIN-2016-36,28693907,52508908,4944,1558553055\nCC-MAIN-2016-40,28180171,51543077,4774,1690810255\nCC-MAIN-2016-44,34243794,60710319,4772,3200654906\nCC-MAIN-2016-50,30479701,49920842,4701,2822871128\nCC-MAIN-2017-04,29850051,49381625,4597,3116143133\nCC-MAIN-2017-09,27330988,49058582,4465,2927969262\nCC-MAIN-2017-13,20191742,41050117,4421,3036216177\nCC-MAIN-2017-17,24910163,46613678,4551,2907715349\nCC-MAIN-2017-22,23868267,45591275,5013,2918934207\nCC-MAIN-2017-26,23350329,49246271,4847,3134206224\nCC-MAIN-2017-30,2
8203688,56656354,4961,2845357895\nCC-MAIN-2017-34,21860809,50282581,4834,3256820690\nCC-MAIN-2017-39,25543915,68834916,4990,2981741134\nCC-MAIN-2017-43,26443475,64582863,4990,3612710595\nCC-MAIN-2017-47,25418336,59250305,4913,3176376980\nCC-MAIN-2017-51,23514587,50537187,4992,2894523756\nCC-MAIN-2018-05,29769642,60598789,5045,3433021579\nCC-MAIN-2018-09,31215472,71316578,5147,3457773652\nCC-MAIN-2018-13,31051894,64663019,5180,3198644180\nCC-MAIN-2018-17,31132878,66341003,5158,3075796938\nCC-MAIN-2018-22,30953922,61359667,5184,2760510003\nCC-MAIN-2018-26,31959458,62303176,5138,3035256963\nCC-MAIN-2018-30,30534423,62451023,5150,3216428094\nCC-MAIN-2018-34,30085546,54331757,5115,2651873292\nCC-MAIN-2018-39,29832599,56474429,5122,2809230609\nCC-MAIN-2018-43,31963859,62069483,5180,3009250058\nCC-MAIN-2018-47,33389605,57213346,5204,2613775730\nCC-MAIN-2018-51,35271439,63270632,5257,3126936231\nCC-MAIN-2019-04,33634695,60242330,5198,2862395712\nCC-MAIN-2019-09,35484698,49287179,5250,2884823295\nCC-MAIN-2019-13,34974874,48929500,5201,2543088606\nCC-MAIN-2019-18,33191518,45686480,5146,2472089618\nCC-MAIN-2019-22,35605554,49283908,5180,2652632174\nCC-MAIN-2019-26,31556662,43324846,4982,2571282259\nCC-MAIN-2019-30,31115231,42885276,4986,2570908353\nCC-MAIN-2019-35,36290400,49943451,4985,2927837229\nCC-MAIN-2019-39,31452367,43145761,4912,2538726203\nCC-MAIN-2019-43,35197133,47657983,4955,2993600398\nCC-MAIN-2019-47,33253379,44286957,4884,2567604470\nCC-MAIN-2019-51,32939357,44413500,4879,2451407069\nCC-MAIN-2020-05,34258638,46981558,4880,3073345461\nCC-MAIN-2020-10,36078526,50557611,5031,2608200380\nCC-MAIN-2020-16,34740004,48417633,4995,2862109363\nCC-MAIN-2020-24,35144434,48003638,4980,2739217355\nCC-MAIN-2020-29,35992413,49631406,4973,3115135038\nCC-MAIN-2020-34,35784429,48620941,4992,2429402562\nCC-MAIN-2020-40,35651678,52327922,4997,3446549212\nCC-MAIN-2020-45,35366328,52252895,4974,2709830599\nCC-MAIN-2020-50,34705193,50489412,4967,2623030081\nCC-MAIN-2021-04,35260454,491
15244,4987,3374268802\nCC-MAIN-2021-10,34030905,45169589,4965,2717572573\nCC-MAIN-2021-17,34010292,44536533,4962,3116314669\nCC-MAIN-2021-21,36693656,47079406,5018,2616289925\nCC-MAIN-2021-25,35932515,47815503,4953,2443174594\nCC-MAIN-2021-31,36229096,46990262,4901,3148285250\nCC-MAIN-2021-39,35400842,46419761,4941,2942372881\nCC-MAIN-2021-43,36268319,46356937,4950,3332276463\nCC-MAIN-2021-49,35886138,45134961,4906,2510642167\nCC-MAIN-2022-05,35485371,44368670,4908,2971085259\nCC-MAIN-2022-21,36239867,45672763,4903,3427800099\nCC-MAIN-2022-27,35465507,44649210,4877,3091798575\nCC-MAIN-2022-33,36634288,46272964,4908,2570114162\nCC-MAIN-2022-40,34439244,43813671,4889,3160148440\nCC-MAIN-2022-49,34827992,44158815,4901,3360693494\nCC-MAIN-2023-06,33172138,41677455,4853,3171463873\nCC-MAIN-2023-14,34430126,43564649,4889,3100440521\nCC-MAIN-2023-23,35465162,44538755,4920,3121917891\nCC-MAIN-2023-40,34751623,43774397,4922,3419001876\nCC-MAIN-2023-50,37753297,47588945,4944,3327873282\nCC-MAIN-2024-10,37076380,46400316,4909,3081216032\nCC-MAIN-2024-18,37650533,47249591,4895,2768587136\nCC-MAIN-2024-22,39672464,50329468,4908,2692942753\nCC-MAIN-2024-26,41422679,52714606,4903,2780577813\nCC-MAIN-2024-30,40022641,49631224,4891,2532418706\nCC-MAIN-2024-33,38314355,47646699,4876,2303470630\nCC-MAIN-2024-38,38600392,47667694,4910,2786769935\nCC-MAIN-2024-42,38304026,47552457,4886,2482057519\nCC-MAIN-2024-46,38369536,47545592,4897,2674779340\nCC-MAIN-2024-51,38347759,47522314,4883,2621880944\nCC-MAIN-2025-05,39321583,48854520,4863,3015035656\nCC-MAIN-2025-08,38551855,47641976,4833,2665362477\nCC-MAIN-2025-13,38048218,46701762,4816,2725953839\nCC-MAIN-2025-18,38885373,47557674,4794,2731781792\nCC-MAIN-2025-21,38251838,46976773,4784,2464239933\nCC-MAIN-2025-26,38512437,47435427,4806,2373133460\nCC-MAIN-2025-30,39091572,47641753,4771,2409871272\nCC-MAIN-2025-33,38893957,47529915,4748,2429917832\nCC-MAIN-2025-38,38618249,47001434,4760,2373363904\nCC-MAIN-2025-43,38536490,47028412,4759,
2603532961\nCC-MAIN-2025-47,36858566,45278203,4743,2282620113\nCC-MAIN-2025-51,36971985,46060332,4794,2157963360\nCC-MAIN-2026-04,36977003,44962815,4789,2318103719\nCC-MAIN-2026-08,37153380,45570756,4808,2155602565\nCC-MAIN-2026-12,36172833,44065210,4777,1964104377\nCC-MAIN-2026-17,35359712,43212465,4753,2179433788\n"
  },
  {
    "path": "plots/crawlsize/monthly.csv",
    "content": "crawl,digest estim.,page,url\nCC-MAIN-2008-2009,1804803498,1798158091,1790932667\nCC-MAIN-2009-2010,2631454016,2863495211,2301135881\nCC-MAIN-2012,3472132880,3828539877,3597338329\nCC-MAIN-2013-20,1675186145,1796098643,1666857706\nCC-MAIN-2013-48,2123908635,2245773667,2085501361\nCC-MAIN-2014-10,2115654671,2301223474,2032050611\nCC-MAIN-2014-15,2250363653,2641371316,1718646762\nCC-MAIN-2014-23,3127260498,3608720876,2116640253\nCC-MAIN-2014-35,2513136600,2870692423,1877746879\nCC-MAIN-2014-41,2643268717,2979743543,1980620845\nCC-MAIN-2014-42,3004865099,3722131678,1602175249\nCC-MAIN-2014-49,1675826663,1948510433,1321875973\nCC-MAIN-2014-52,1917739931,2085977207,1905493151\nCC-MAIN-2015-06,1663353964,1826024103,1679287071\nCC-MAIN-2015-11,1660875177,1837196089,1685659195\nCC-MAIN-2015-14,1497626091,1646697534,1514869973\nCC-MAIN-2015-18,1910978257,2115818059,1934559347\nCC-MAIN-2015-22,1821352251,2015461448,1836492906\nCC-MAIN-2015-27,1525928862,1675619098,1531042999\nCC-MAIN-2015-32,1613612273,1815492409,1649248826\nCC-MAIN-2015-35,1677929649,1848022475,1673197542\nCC-MAIN-2015-40,1188702135,1321987379,1215112821\nCC-MAIN-2015-48,1643268398,1824170527,1644173738\nCC-MAIN-2016-07,1546567872,1733285122,1560185771\nCC-MAIN-2016-18,1211048216,1335046923,1335046923\nCC-MAIN-2016-22,1308787436,1466220798,1466220798\nCC-MAIN-2016-26,1080537066,1236815660,1236815660\nCC-MAIN-2016-30,1537831071,1737322304,1632457174\nCC-MAIN-2016-36,1435966389,1611613090,1558553055\nCC-MAIN-2016-40,1538695808,1722656393,1690810255\nCC-MAIN-2016-44,3040453061,3254976731,3200654906\nCC-MAIN-2016-50,2835369567,2866282390,2822871128\nCC-MAIN-2017-04,3124474229,3146498026,3116143133\nCC-MAIN-2017-09,3075159558,3084366662,2927969262\nCC-MAIN-2017-13,3076918527,3070720576,3036216177\nCC-MAIN-2017-17,2915114582,2942930482,2907715349\nCC-MAIN-2017-22,2913487045,2967293699,2918934207\nCC-MAIN-2017-26,3090678021,3165214086,3134206224\nCC-MAIN-2017-30,2731370763,2892213652,2845357895\nCC-
MAIN-2017-34,3321321532,3280080910,3256820690\nCC-MAIN-2017-39,2954936664,3017180563,2981741134\nCC-MAIN-2017-43,3568900959,3650430218,3612710595\nCC-MAIN-2017-47,3147013327,3204943573,3176376980\nCC-MAIN-2017-51,2838391323,2914004423,2894523756\nCC-MAIN-2018-05,3405797273,3464537205,3433021579\nCC-MAIN-2018-09,3473010805,3488463319,3457773652\nCC-MAIN-2018-13,3159524180,3232738018,3198644180\nCC-MAIN-2018-17,3012333785,3101353989,3075796938\nCC-MAIN-2018-22,2744992004,2788388007,2760510003\nCC-MAIN-2018-26,2987363973,3069414247,3035256963\nCC-MAIN-2018-30,3179521724,3263958200,3216428094\nCC-MAIN-2018-34,2622248769,2686323358,2651873292\nCC-MAIN-2018-39,2779896284,2841194829,2809230609\nCC-MAIN-2018-43,3015132452,3041784523,3009250058\nCC-MAIN-2018-47,2561180363,2646568544,2613775730\nCC-MAIN-2018-51,3119954567,3164247635,3126936231\nCC-MAIN-2019-04,2783709611,2889726642,2862395712\nCC-MAIN-2019-09,2803066951,2913733422,2884823295\nCC-MAIN-2019-13,2497065618,2569681845,2543088606\nCC-MAIN-2019-18,2438027577,2497818607,2472089618\nCC-MAIN-2019-22,2630765347,2679746250,2652632174\nCC-MAIN-2019-26,2554582339,2594261117,2571282259\nCC-MAIN-2019-30,2531580647,2594798375,2570908353\nCC-MAIN-2019-35,2833688958,2954836065,2927837229\nCC-MAIN-2019-39,2492717822,2561062912,2538726203\nCC-MAIN-2019-43,2924967393,3019036529,2993600398\nCC-MAIN-2019-47,2514913197,2590595173,2567604470\nCC-MAIN-2019-51,2406286576,2471904965,2451407069\nCC-MAIN-2020-05,3028524398,3101097173,3073345461\nCC-MAIN-2020-10,2598864641,2629963462,2608200380\nCC-MAIN-2020-16,2865127577,2886236237,2862109363\nCC-MAIN-2020-24,2685892317,2763206762,2739217355\nCC-MAIN-2020-29,3040070894,3144733420,3115135038\nCC-MAIN-2020-34,2354875952,2449834239,2429402562\nCC-MAIN-2020-40,3407171814,3473571206,3446549212\nCC-MAIN-2020-45,2627114869,2731063243,2709830599\nCC-MAIN-2020-50,2556108707,2642471501,2623030081\nCC-MAIN-2021-04,3317353644,3401286407,3374268802\nCC-MAIN-2021-10,2698208760,2736749883,2717572573\nCC-
MAIN-2021-17,3057706409,3134424806,3116314669\nCC-MAIN-2021-21,2590708976,2632142465,2616289925\nCC-MAIN-2021-25,2404813154,2457631756,2443174594\nCC-MAIN-2021-31,3060540112,3165089855,3148285250\nCC-MAIN-2021-39,2880390023,2959903779,2942372881\nCC-MAIN-2021-43,3304468971,3349178015,3332276463\nCC-MAIN-2021-49,2445330855,2527075799,2510642167\nCC-MAIN-2022-05,2923130207,2986392030,2971085259\nCC-MAIN-2022-21,3397499191,3449824215,3427800099\nCC-MAIN-2022-27,3065329274,3109609672,3091798575\nCC-MAIN-2022-33,2506544286,2588690250,2570114162\nCC-MAIN-2022-40,3100384124,3176763048,3160148440\nCC-MAIN-2022-49,3327669734,3381612888,3360693494\nCC-MAIN-2023-06,3129891467,3189578207,3171463873\nCC-MAIN-2023-14,3061148112,3118633413,3100440521\nCC-MAIN-2023-23,3063301913,3140573968,3121917891\nCC-MAIN-2023-40,3398196830,3445015037,3419001876\nCC-MAIN-2023-50,3296666094,3354042124,3327873282\nCC-MAIN-2024-10,3005351878,3106525566,3081216032\nCC-MAIN-2024-18,2736902585,2786800057,2768587136\nCC-MAIN-2024-22,2639673318,2709877975,2692942753\nCC-MAIN-2024-26,2751769686,2798047026,2780577813\nCC-MAIN-2024-30,2456863301,2546630395,2532418706\nCC-MAIN-2024-33,2261433594,2315926416,2303470630\nCC-MAIN-2024-38,2721268713,2800893463,2786769935\nCC-MAIN-2024-42,2425001789,2495190754,2482057519\nCC-MAIN-2024-46,2626639405,2687811747,2674779340\nCC-MAIN-2024-51,2574983678,2635362356,2621880944\nCC-MAIN-2025-05,2970641172,3031278337,3015035656\nCC-MAIN-2025-08,2609966983,2679706056,2665362477\nCC-MAIN-2025-13,2674329452,2740844187,2725953839\nCC-MAIN-2025-18,2671584365,2747336110,2731781792\nCC-MAIN-2025-21,2399538709,2477165602,2464239933\nCC-MAIN-2025-26,2314401772,2385603949,2373133460\nCC-MAIN-2025-30,2353198706,2422580507,2409871272\nCC-MAIN-2025-33,2368713079,2442493478,2429917832\nCC-MAIN-2025-38,2322577046,2385964209,2373363904\nCC-MAIN-2025-43,2585129731,2616796857,2603532961\nCC-MAIN-2025-47,2243496646,2294472912,2282620113\nCC-MAIN-2025-51,2089652489,2169087279,2157963360\nCC-
MAIN-2026-04,2306342206,2329630755,2318103719\nCC-MAIN-2026-08,2092658715,2166991722,2155602565\nCC-MAIN-2026-12,1919920870,1974845234,1964104377\nCC-MAIN-2026-17,2137917323,2191936300,2179433788\n"
  },
  {
    "path": "plots/crawlsize/monthly_new.csv",
    "content": "crawl,url estim. new\nCC-MAIN-2008-2009,1799114116\nCC-MAIN-2009-2010,2025520640\nCC-MAIN-2012,2875802047\nCC-MAIN-2013-20,1495317383\nCC-MAIN-2013-48,1150709969\nCC-MAIN-2014-10,486310808\nCC-MAIN-2014-15,117622038\nCC-MAIN-2014-23,404294654\nCC-MAIN-2014-35,103835189\nCC-MAIN-2014-41,137293409\nCC-MAIN-2014-42,73111007\nCC-MAIN-2014-49,54066084\nCC-MAIN-2014-52,92042981\nCC-MAIN-2015-06,65152045\nCC-MAIN-2015-11,140812486\nCC-MAIN-2015-14,66870107\nCC-MAIN-2015-18,92082229\nCC-MAIN-2015-22,96705276\nCC-MAIN-2015-27,61491713\nCC-MAIN-2015-32,66990878\nCC-MAIN-2015-35,48636643\nCC-MAIN-2015-40,43368490\nCC-MAIN-2015-48,107994993\nCC-MAIN-2016-07,81613309\nCC-MAIN-2016-18,21462587\nCC-MAIN-2016-22,151361754\nCC-MAIN-2016-26,43022887\nCC-MAIN-2016-30,172518052\nCC-MAIN-2016-36,114400552\nCC-MAIN-2016-40,142103417\nCC-MAIN-2016-44,1673769696\nCC-MAIN-2016-50,485423061\nCC-MAIN-2017-04,415730235\nCC-MAIN-2017-09,417148061\nCC-MAIN-2017-13,690568400\nCC-MAIN-2017-17,569645220\nCC-MAIN-2017-22,471974452\nCC-MAIN-2017-26,769209479\nCC-MAIN-2017-30,526102760\nCC-MAIN-2017-34,826191097\nCC-MAIN-2017-39,838823040\nCC-MAIN-2017-43,902230771\nCC-MAIN-2017-47,793231698\nCC-MAIN-2017-51,637482272\nCC-MAIN-2018-05,1161939120\nCC-MAIN-2018-09,1071976415\nCC-MAIN-2018-13,802838388\nCC-MAIN-2018-17,582655807\nCC-MAIN-2018-22,536756406\nCC-MAIN-2018-26,732166167\nCC-MAIN-2018-30,633186440\nCC-MAIN-2018-34,633430692\nCC-MAIN-2018-39,489585900\nCC-MAIN-2018-43,573238044\nCC-MAIN-2018-47,636793856\nCC-MAIN-2018-51,718392834\nCC-MAIN-2019-04,867643934\nCC-MAIN-2019-09,743194257\nCC-MAIN-2019-13,686752791\nCC-MAIN-2019-18,765439142\nCC-MAIN-2019-22,790994840\nCC-MAIN-2019-26,881298434\nCC-MAIN-2019-30,831509631\nCC-MAIN-2019-35,1140152979\nCC-MAIN-2019-39,992505285\nCC-MAIN-2019-43,1153020490\nCC-MAIN-2019-47,1134595380\nCC-MAIN-2019-51,916018848\nCC-MAIN-2020-05,899451468\nCC-MAIN-2020-10,1084504183\nCC-MAIN-2020-16,980400216\nCC-MAIN-2020-24,1251317611\nCC-MAIN-2020-29,11
13285954\nCC-MAIN-2020-34,941472516\nCC-MAIN-2020-40,1574558237\nCC-MAIN-2020-45,1570432043\nCC-MAIN-2020-50,1377757240\nCC-MAIN-2021-04,1163314220\nCC-MAIN-2021-10,1239929656\nCC-MAIN-2021-17,1385878657\nCC-MAIN-2021-21,1280308515\nCC-MAIN-2021-25,1343821560\nCC-MAIN-2021-31,993905051\nCC-MAIN-2021-39,1326441386\nCC-MAIN-2021-43,1363825891\nCC-MAIN-2021-49,1208927869\nCC-MAIN-2022-05,1368433857\nCC-MAIN-2022-21,1403568348\nCC-MAIN-2022-27,1422711399\nCC-MAIN-2022-33,1319740149\nCC-MAIN-2022-40,1302598516\nCC-MAIN-2022-49,1259054456\nCC-MAIN-2023-06,1326920593\nCC-MAIN-2023-14,1276571074\nCC-MAIN-2023-23,1009985051\nCC-MAIN-2023-40,1223796606\nCC-MAIN-2023-50,1413878967\nCC-MAIN-2024-10,1391587520\nCC-MAIN-2024-18,980819499\nCC-MAIN-2024-22,918858872\nCC-MAIN-2024-26,945497868\nCC-MAIN-2024-30,949017576\nCC-MAIN-2024-33,849206961\nCC-MAIN-2024-38,995048952\nCC-MAIN-2024-42,1032959532\nCC-MAIN-2024-46,979434997\nCC-MAIN-2024-51,1054461777\nCC-MAIN-2025-05,985515207\nCC-MAIN-2025-08,1033020795\nCC-MAIN-2025-13,902879343\nCC-MAIN-2025-18,838132076\nCC-MAIN-2025-21,654129961\nCC-MAIN-2025-26,713081286\nCC-MAIN-2025-30,763266213\nCC-MAIN-2025-33,675299035\nCC-MAIN-2025-38,801017724\nCC-MAIN-2025-43,747598797\nCC-MAIN-2025-47,636762318\nCC-MAIN-2025-51,783523934\nCC-MAIN-2026-04,616064514\nCC-MAIN-2026-08,626113549\nCC-MAIN-2026-12,600146788\nCC-MAIN-2026-17,660461520\n"
  },
  {
    "path": "plots/crawlsize/url_last_n_crawls.csv",
    "content": "crawl,1,12,2,3,4,6,9\nCC-MAIN-2008-2009,1790932667,nan,nan,nan,nan,nan,nan\nCC-MAIN-2009-2010,2301135881,nan,3824634756,nan,nan,nan,nan\nCC-MAIN-2012,3597338329,nan,5338230492,6700436803,nan,nan,nan\nCC-MAIN-2013-20,1666857706,nan,5102564526,6794857295,8195754186,nan,nan\nCC-MAIN-2013-48,2085501361,nan,2814463798,6240947269,7934679100,nan,nan\nCC-MAIN-2014-10,2032050611,nan,2670134814,3337225376,6725333686,9832774963,nan\nCC-MAIN-2014-15,1718646762,nan,2269648596,2804213185,3467517290,8545885193,nan\nCC-MAIN-2014-23,2116640253,nan,2508686420,2814919207,3225671322,7252594573,nan\nCC-MAIN-2014-35,1877746879,nan,2378823435,2688988045,2947488273,3964962965,10458526844\nCC-MAIN-2014-41,1980620845,nan,2272644005,2601497773,2889897351,3501256106,9209551673\nCC-MAIN-2014-42,1602175249,nan,2167042315,2415496146,2698811403,3205015840,7590387789\nCC-MAIN-2014-49,1321875973,10722997344,1856602934,2272718194,2498752932,3039372985,4245175437\nCC-MAIN-2014-52,1905493151,9419407885,2048360670,2239881411,2492504015,2892401473,3725944955\nCC-MAIN-2015-06,1679287071,7775153522,2100950452,2208216202,2375016211,2753064126,3428622028\nCC-MAIN-2015-11,1685659195,4547219851,2070364891,2361569754,2452617129,2807861364,3381927848\nCC-MAIN-2015-14,1514869973,3978557342,1995315397,2247254101,2490479859,2707608520,3233872061\nCC-MAIN-2015-18,1934559347,3733516984,2129341154,2313250930,2479757369,2738619103,3171193476\nCC-MAIN-2015-22,1836492906,3637184874,2210849367,2336416081,2474778730,2773418454,3124299031\nCC-MAIN-2015-27,1531042999,3504376280,2074983989,2354812587,2466265633,2713029125,3047351063\nCC-MAIN-2015-32,1649248826,3411454100,1957222773,2252288208,2480722496,2691372578,3013328428\nCC-MAIN-2015-35,1673197542,3356264728,1960637890,2150631881,2385683293,2680198957,3036367263\nCC-MAIN-2015-40,1215112821,3272730053,1880574946,2102012064,2265845388,2671200407,2969836620\nCC-MAIN-2015-48,1644173738,3269369708,1874444927,2124422294,2291480136,2627452451,2973683472\nCC-MAIN
-2016-07,1560185771,3302286301,1938230429,2095920811,2294445055,2569770285,2982529495\nCC-MAIN-2016-18,1335046923,3221940976,1762852237,2056977558,2195060854,2502413881,2944935037\nCC-MAIN-2016-22,1466220798,3318087171,1720103378,2023116266,2298830078,2591699621,3006564226\nCC-MAIN-2016-26,1236815660,3277132629,1687590694,1874360729,2145998219,2519975153,2904804076\nCC-MAIN-2016-30,1632457174,3395341138,1821143340,2033027096,2170980278,2625071858,2993482544\nCC-MAIN-2016-36,1558553055,3383126164,1943622715,2066276054,2220373904,2558454276,3014372483\nCC-MAIN-2016-40,1690810255,3421186613,1924600759,2194852775,2297154694,2558817748,3072547225\nCC-MAIN-2016-44,3200654906,4989344103,3521602715,3685227823,3924042245,4156389144,4660920304\nCC-MAIN-2016-50,2822871128,5358777996,3865932493,4081634184,4222536091,4507176714,4960693985\nCC-MAIN-2017-04,3116143133,5714674302,3733768705,4455059090,4634572990,4950240900,5262628013\nCC-MAIN-2017-09,2927969262,6079377490,3935057069,4354453546,4965823742,5263421140,5614505233\nCC-MAIN-2017-13,3036216177,6653640531,4058774798,4781357539,5149796452,5894926449,6236818461\nCC-MAIN-2017-17,2907715349,7021341798,4335119428,5003153239,5411920389,6335193937,6727708548\nCC-MAIN-2017-22,2918934207,7407877742,4722225671,5247275367,5584480004,6263883681,7067706901\nCC-MAIN-2017-26,3134206224,8072789255,5025036839,5779803610,6112818705,6759925393,7761965864\nCC-MAIN-2017-30,2845357895,8561307519,5458538980,6208963954,6536861924,7114582528,8190227801\nCC-MAIN-2017-34,3256820690,9260741526,5756777618,6430357494,7112877630,7686106569,8594561433\nCC-MAIN-2017-39,2981741134,10045005372,5940034058,6989390788,7555704239,8321913096,9204158854\nCC-MAIN-2017-43,3612710595,10821737191,6510094580,7319682064,8174062430,9014909756,9835397477\nCC-MAIN-2017-47,3176376980,11217349783,6710795851,7722206045,8375247142,9532840451,10349835157\nCC-MAIN-2017-51,2894523756,11642030295,6045013407,7681214257,8484310391,9952200757,10827795343\nCC-MAIN-2018-05,3433021579,
12470563915,6245202192,8281354819,9244957448,10611300741,11716360337\nCC-MAIN-2018-09,3457773652,13322412540,6879055877,8753463733,9684354163,11295089182,12548963665\nCC-MAIN-2018-13,3198644180,13885356708,6620223851,9092911747,9845201117,11460743447,13045614992\nCC-MAIN-2018-17,3075796938,14276375332,6173779601,8595591919,9982712294,11393256342,13234300556\nCC-MAIN-2018-22,2760510003,14593795578,5730210533,7981653671,9630374744,11367149069,13388852674\nCC-MAIN-2018-26,3035256963,15000574113,5765513719,7818358756,9314231857,11539161457,13417447203\nCC-MAIN-2018-30,3216428094,15159747362,6224839843,8300831228,9527768209,11291063248,13386164986\nCC-MAIN-2018-34,2651873292,15349186887,5860690482,7916325236,9244077886,11120699520,13437470142\nCC-MAIN-2018-39,2809230609,15244154700,5444842794,7408970490,8739344993,10973721782,13453198523\nCC-MAIN-2018-43,3009250058,15204706752,5809500310,6903649830,8247279458,10664093214,13134798674\nCC-MAIN-2018-47,2613775730,15285198672,5604096569,7124978165,7908935774,10303607798,13034660078\nCC-MAIN-2018-51,3126936231,15537877536,5638710615,7365584034,8200552050,10003441223,13143506966\nCC-MAIN-2019-04,2862395712,15465738071,6027205484,7329545621,8380441558,9768293009,13078783242\nCC-MAIN-2019-09,2884823295,15424307911,5651701997,7426849816,8312709397,10000849820,12782712914\nCC-MAIN-2019-13,2543088606,15368676187,5330417167,6909270598,8329726406,10045283284,12375359274\nCC-MAIN-2019-18,2472089618,15176654917,4988463746,6595046308,7912728102,9984314003,12020808632\nCC-MAIN-2019-22,2652632174,15079501231,5085892921,6575963620,7810471953,10225944748,12353912414\nCC-MAIN-2019-26,2571282259,14972269495,5188411493,6634008519,7762961532,10004482307,12689935261\nCC-MAIN-2019-30,2570908353,14663012628,5012203245,6607458427,7780181445,9819185899,12750013623\nCC-MAIN-2019-35,2927837229,15360386075,5405804678,6902465484,8175093156,10122619342,13310865078\nCC-MAIN-2019-39,2538726203,15852601084,5422687509,7062830456,8243843855,10349355860,133470
01708\nCC-MAIN-2019-43,2993600398,16194261848,5420555922,7318981335,8539983786,10735558696,13469604952\nCC-MAIN-2019-47,2567604470,16689389386,5406243082,7056681768,8686549176,10841741253,13697889358\nCC-MAIN-2019-51,2451407069,16651071975,4897364558,7010240087,8523324012,10887406425,13748244251\nCC-MAIN-2020-05,3073345461,16612681521,4866838888,6579469907,8450624455,10924768940,13924676092\nCC-MAIN-2020-10,2608200380,16846620247,5374716471,6922864426,8413345899,11119748687,14114627495\nCC-MAIN-2020-16,2862109363,17072531233,4884563161,6814012518,8280608793,11263044403,14322438231\nCC-MAIN-2020-24,2739217355,17385530205,5295535145,7086553027,8796836054,11276575427,14608017700\nCC-MAIN-2020-29,3115135038,17575587786,5761148134,7314502707,8970998929,11648711820,14861414998\nCC-MAIN-2020-34,2429402562,17740048551,5506384671,7579860899,8986058099,11851444284,15056541648\nCC-MAIN-2020-40,3446549212,18472665636,5770323568,7891993007,9773754487,12427161838,15469338063\nCC-MAIN-2020-45,2709830599,19066253268,6070506795,7827673474,9787709971,12726651229,16144851741\nCC-MAIN-2020-50,2623030081,19568235827,5300297356,7799175349,9467573340,12981490742,16576920480\nCC-MAIN-2021-04,3374268802,19786340303,5889311083,7720391747,9574225899,12903059456,16953858229\nCC-MAIN-2021-10,2717572573,20297261720,5990832044,7676032540,9295491663,12575242600,17160672855\nCC-MAIN-2021-17,3116314669,20872200529,5802784011,7893431719,9432293889,12683145383,17508283534\nCC-MAIN-2021-21,2616289925,21190983173,5718251449,7656768040,9572349264,12457802579,17211843630\nCC-MAIN-2021-25,2443174594,21247885942,5008082717,7882003922,9442957535,12557820570,16962863821\nCC-MAIN-2021-31,3148285250,21236090301,5479050129,7308069398,9307036599,12524665742,16796276362\nCC-MAIN-2021-39,2942372881,21205644873,6022435140,7672066493,9289153628,12452033994,16754719401\nCC-MAIN-2021-43,3332276463,21205538070,6262527417,8126259455,9629124215,12791724784,17011781635\nCC-MAIN-2021-49,2510642167,21498748761,5739798414,854
7339940,10108588582,13018149788,17387061597\nCC-MAIN-2022-05,2971085259,21439066834,5407415444,8210859755,10320657898,13200772000,17474990755\nCC-MAIN-2022-21,3427800099,21776694542,6229843408,8144898287,10172428320,13488816376,17764575900\nCC-MAIN-2022-27,3091798575,22289192042,6439594860,8420653437,10232704215,13963486656,17978912106\nCC-MAIN-2022-33,2570114162,22249936543,5662213396,8862564477,10444459889,13831769405,18134805197\nCC-MAIN-2022-40,3160148440,22418263241,5658203891,8501893826,10699660390,13863384133,18388522390\nCC-MAIN-2022-49,3360693494,22370950615,6484203306,8486922386,10513615955,13931460230,18677976033\nCC-MAIN-2023-06,3171463873,22519495870,6506734493,8407253553,10221653234,13947797962,18501742387\nCC-MAIN-2023-14,3100440521,22538145885,6216918640,8463876604,10179447007,13686732579,18320001561\nCC-MAIN-2023-23,3121917891,22602803052,6150896632,8265712739,10180474290,13378355910,17958568615\nCC-MAIN-2023-40,3419001876,22469965483,6228906585,8401830837,10203917135,13425574456,18231303879\nCC-MAIN-2023-50,3327873282,22521123399,6706221284,8691583101,10475591287,13692382999,18213156599\nCC-MAIN-2024-10,3081216032,22317048979,6263566448,8936952554,10581417342,13593463584,18068153613\nCC-MAIN-2024-18,2768587136,22190181208,5832675481,8524203336,10676017752,13624395460,17820810768\nCC-MAIN-2024-22,2692942753,21905836569,5390835671,8301503828,10189852106,13441143799,17656169037\nCC-MAIN-2024-26,2780577813,21596557359,5409455504,8107769333,10114514729,13406407335,17400651453\nCC-MAIN-2024-30,2532418706,21237485769,5290227057,7873980261,10039848139,13091771451,17290503423\nCC-MAIN-2024-33,2303470630,21001059427,4751305847,7435937093,9840290625,13061891489,17006403865\nCC-MAIN-2024-38,2786769935,20684915191,5066981627,7507006248,9679315995,13025708402,16923493316\nCC-MAIN-2024-42,2482057519,20528572812,5200858747,7392984819,9499694430,12908023463,16771800001\nCC-MAIN-2024-46,2674779340,20344721467,5132015471,7844620801,9692411198,12925722525,16791557983\
nCC-MAIN-2024-51,2621880944,20456250957,5290877126,7688554165,10007488015,12982902859,17030167896\nCC-MAIN-2025-05,3015035656,20338241132,5618696000,8139967689,10074727253,13052703347,17011102575\nCC-MAIN-2025-08,2665362477,20353835726,5663457487,8140995932,10240046634,13274553247,17081560125\nCC-MAIN-2025-13,2725953839,20505037034,5348413205,8271240792,10317939697,13391610670,17093218772\nCC-MAIN-2025-18,2731781792,20504705850,5467358518,7958409633,10292525107,13535389576,17199819070\nCC-MAIN-2025-21,2464239933,20307381436,5188671695,7940153305,10023619078,13408521057,17172775559\nCC-MAIN-2025-26,2373133460,20204598763,4817550388,7601979898,10010192726,13331057454,17110644544\nCC-MAIN-2025-30,2409871272,20113218203,4763393384,7156349483,9687833895,13128018719,17115824556\nCC-MAIN-2025-33,2429917832,20093604947,4833380611,7159008177,9289000131,12948189373,16942737047\nCC-MAIN-2025-38,2373363904,19892564238,4747712181,7098425422,9205559994,12623234533,16683672770\nCC-MAIN-2025-43,2603532961,19844686095,4894153297,7262710418,9218032019,12290784914,16494270875\nCC-MAIN-2025-47,2282620113,19716225295,4853160261,7097396721,9135371922,12234766779,16382766239\nCC-MAIN-2025-51,2157963360,19475195731,4404296244,6986097888,8981797278,12127695964,16112247373\nCC-MAIN-2026-04,2318103719,19218203008,4483573493,6680398525,8737502321,11908164793,15686863059\nCC-MAIN-2026-08,2155602565,19042411083,4433808464,6484334872,8374645042,11635353490,15511978549\nCC-MAIN-2026-12,1964104377,18535612694,4068889092,6328116802,8109670903,11227186513,15157870015\nCC-MAIN-2026-17,2179433788,18249591530,4099292003,6115052549,8061035202,10884500104,14961464255\n"
  },
  {
    "path": "plots/crawlsize/url_page_ratio_last_n_crawls.csv",
    "content": "crawl,12,2,3,4,6,9\nCC-MAIN-2009-2010,,0.8204459894859851,,,,\nCC-MAIN-2012,,0.7976991186989425,0.7891972139777857,,,\nCC-MAIN-2013-20,,0.9071808806657321,0.8005125166895182,0.796764696921312,,\nCC-MAIN-2013-48,,0.6963267471455574,0.7929632045585264,0.7392162803154453,,\nCC-MAIN-2014-10,,0.5872303701103206,0.5261193413503087,0.6611850748632512,0.6628856882331876,\nCC-MAIN-2014-15,,0.45920183475125625,0.3901042638221014,0.38594579415845376,0.5451397952498407,\nCC-MAIN-2014-23,,0.40138390649838274,0.3291796627496876,0.2987537865544119,0.44164625293525744,\nCC-MAIN-2014-35,,0.3671356225056882,0.2948198163322158,0.2580534219581395,0.2564015539887648,0.4366074442388523\nCC-MAIN-2014-41,,0.38845720527624694,0.27502427715850747,0.2388240672858075,0.21031691155984109,0.3663938813781721\nCC-MAIN-2014-42,,0.32334865146544034,0.252335239178384,0.20474564371344176,0.17683935529598155,0.29200205829298226\nCC-MAIN-2014-49,0.32888131245175806,0.3274061204459602,0.26273027410622773,0.2168853396617772,0.17102829689848154,0.17604414862428988\nCC-MAIN-2014-52,0.28637140259311783,0.5077127141725486,0.28877031592902,0.23215534415794184,0.1680087755625187,0.1526767282146204\nCC-MAIN-2015-06,0.24408100992169118,0.5370525941873981,0.3767957985303196,0.24784562115660508,0.1783872198777798,0.14295219956240438\nCC-MAIN-2015-11,0.15226699536404462,0.5651762063119792,0.4107651190426624,0.31861655216430407,0.19499601854200993,0.14378720161765118\nCC-MAIN-2015-14,0.13389476322941293,0.572725695132397,0.4232182525157265,0.3367381340002062,0.20721699336882085,0.14356370451300024\nCC-MAIN-2015-18,0.1262000917399002,0.5659355028219812,0.41310179190757845,0.3339409643431045,0.2389673395918108,0.15077378297519378\nCC-MAIN-2015-22,0.12414301593232033,0.535148823325548,0.40436576061500484,0.3249799692997919,0.24059828958396504,0.15484027882682613\nCC-MAIN-2015-27,0.1236871027991238,0.5621616659784482,0.4055198389330237,0.33088264872516726,0.2440473103288154,0.16146244487083952\nCC-MAIN-20
15-32,0.128543174467744,0.5606302660558359,0.40901813639913903,0.32545201255664685,0.2423287954491851,0.1776014965059656\nCC-MAIN-2015-35,0.13153211454444527,0.5351794525423853,0.40280537784788634,0.324379949340055,0.24108772067266238,0.18002559819429348\nCC-MAIN-2015-40,0.1371699807037077,0.5932394637912694,0.42162493428197245,0.34015975166977597,0.24750752308693802,0.1844353409518684\nCC-MAIN-2015-48,0.14887178032108295,0.595788572285348,0.42537956820346573,0.3365037068102651,0.2502156147209208,0.18469550219049455\nCC-MAIN-2016-07,0.15185891867627319,0.5448361470212105,0.4295409945300831,0.3410563835632945,0.25148024842257366,0.18644824913485364\nCC-MAIN-2016-18,0.1534636065973147,0.5745311169541301,0.42043464009036396,0.35321657470003365,0.2533319149767353,0.18775601955506843\nCC-MAIN-2016-22,0.16079885141612382,0.6140446216921942,0.4461556268162338,0.3615238380782085,0.27198784561123945,0.19996694381916252\nCC-MAIN-2016-26,0.16357334342201038,0.624331458425338,0.46417088310242594,0.3718352446017776,0.28258678891679184,0.20375066785162085\nCC-MAIN-2016-30,0.1687104050581055,0.6123264495607642,0.45785199011358624,0.3759009143961114,0.2812719233743198,0.20906596788945894\nCC-MAIN-2016-36,0.1724232350900049,0.5803703226052739,0.4505861809043592,0.3668843739361133,0.280522919509466,0.21356589611272228\nCC-MAIN-2016-40,0.17700444828084858,0.5772181189351094,0.4327739430105675,0.3641417763991172,0.28089011965964317,0.2196383776268724\nCC-MAIN-2016-44,0.23863770885828303,0.7074853906006754,0.5592791198437983,0.4712676340220083,0.3768393476506316,0.2927326228609394\nCC-MAIN-2016-50,0.24404228207705456,0.6315583798335336,0.5203567244847304,0.44656795699541624,0.3626144506244168,0.2924209988573579\nCC-MAIN-2017-04,0.24571978039689835,0.6209720706022204,0.4807052040031191,0.4216923205967007,0.3452207574266147,0.2863636183116042\nCC-MAIN-2017-09,0.242987953912996,0.6315426936775745,0.4786614428308576,0.4020218562237697,0.3355405568394313,0.27895734085342255\nCC-MAIN-2017-13,
0.25331950089969973,0.6594179157920166,0.514036844612426,0.42322916376453873,0.34381768869440016,0.28699766167248936\nCC-MAIN-2017-17,0.25554965574925115,0.7208797760609941,0.5499168492496627,0.44198729466030123,0.3449456384431242,0.28705053120171237\nCC-MAIN-2017-22,0.2544989316777723,0.7989926483974771,0.584267636532351,0.4628541949779904,0.34649031204017006,0.2865208595658144\nCC-MAIN-2017-26,0.26204662782848087,0.8194097773982687,0.636862203230058,0.5032717572702338,0.3678465874300458,0.29602165851798923\nCC-MAIN-2017-30,0.263732496042779,0.9011315059950287,0.6879950807727075,0.546210899869338,0.3925776598319552,0.29901713755379933\nCC-MAIN-2017-34,0.2723359293020135,0.932680312025588,0.6886587993016015,0.5780570406101786,0.41958272344662495,0.3134916354770109\nCC-MAIN-2017-39,0.2836737611645958,0.9432725770508911,0.7605865071646298,0.6115657067498531,0.45562291577276154,0.33388929689105307\nCC-MAIN-2017-43,0.28983027222556035,0.9763759154255288,0.735817141440195,0.6366139166638247,0.4751588369481346,0.3503828469986155\nCC-MAIN-2017-47,0.3008287707459672,0.9789102761705266,0.7821892661316413,0.6367733137802307,0.4962420190921558,0.3671325000325967\nCC-MAIN-2017-51,0.31181885282985183,0.9879171078021366,0.7862541595525948,0.6635335228944688,0.5249368502960811,0.38623395572737057\nCC-MAIN-2018-05,0.3311890295493233,0.9790956234549482,0.8641276785334705,0.6985806660610032,0.5433006315838758,0.4102956314668422\nCC-MAIN-2018-09,0.35005539156540527,0.9893650738634692,0.8871449624297021,0.7408500842994445,0.5722057422744891,0.4315759651905197\nCC-MAIN-2018-13,0.3633005168816331,0.9849762741901329,0.8927101073237032,0.7515568162905554,0.5743260531689971,0.4476170071369132\nCC-MAIN-2018-17,0.3719893318354178,0.9746905466761717,0.8750871472566547,0.7513090068959346,0.587098451440846,0.4508558045605048\nCC-MAIN-2018-22,0.3820410543113107,0.9729136754872547,0.8749433990264481,0.7636522098072931,0.5986022839663893,0.46389142942652806\nCC-MAIN-2018-26,0.3936771276196776,0.984
2451945288899,0.872666861023734,0.763969212462316,0.6027278596506531,0.46404235041510616\nCC-MAIN-2018-30,0.3940104806775429,0.9828633788856977,0.9100032027655349,0.7794877691304293,0.5960132516329919,0.4692322760844908\nCC-MAIN-2018-34,0.40518700736324664,0.9849433887914855,0.8776709777298304,0.7828601179647521,0.6129749612697213,0.47975234457094795\nCC-MAIN-2018-39,0.40429257999736495,0.9850429450970525,0.842744740912423,0.7368202998135831,0.6182158129650842,0.4815657137489582\nCC-MAIN-2018-43,0.40986236765671713,0.9875098929295035,0.8056256224842826,0.6969574592097793,0.602795497090341,0.47739262935458404\nCC-MAIN-2018-47,0.4183286948321355,0.9851878923464158,0.8353289355865292,0.7051557203975016,0.5871254609913973,0.4887070748513113\nCC-MAIN-2018-51,0.4223515022169222,0.9703818605341568,0.832024879687158,0.7012737676369074,0.5669574652468806,0.49405674874076994\nCC-MAIN-2019-04,0.42706326782452103,0.9955783107467604,0.8424239466196405,0.7136951059605888,0.5656271210686603,0.4955660238878032\nCC-MAIN-2019-09,0.43278771010193423,0.9738504159025088,0.8281770621078759,0.7157320200654022,0.5715667674682556,0.48205816427298653\nCC-MAIN-2019-13,0.4394016269869078,0.9720980278621674,0.825170607770718,0.7219766979552026,0.5831553106793371,0.4756603415204108\nCC-MAIN-2019-18,0.4415304344725601,0.9844032167833736,0.8263191396363284,0.7278775495830345,0.5985162243535235,0.47605127841068623\nCC-MAIN-2019-22,0.4400949698606783,0.9822943915659385,0.84881298775504,0.7326223163494193,0.6117841845496279,0.4893704089966595\nCC-MAIN-2019-26,0.4431101709861017,0.9837702399629583,0.8535971522256837,0.7506605098472633,0.6196656679344847,0.507646782440061\nCC-MAIN-2019-30,0.4427253465076758,0.9659174755516563,0.8397028270417811,0.7505028814659906,0.6195054483704832,0.519336502737489\nCC-MAIN-2019-35,0.46005160661399613,0.974083020502518,0.8475631146898805,0.7552996765573766,0.6369975913007149,0.535457798751319\nCC-MAIN-2019-39,0.4788109747023626,0.9831013097976106,0.8708043401790095,0.
7700958279168453,0.6516191191772345,0.5502632716393523\nCC-MAIN-2019-43,0.4894667774553086,0.9714084810339135,0.8575321195871729,0.767312487190636,0.6544579394233566,0.5523731266737193\nCC-MAIN-2019-47,0.5052866941480031,0.9637429637443959,0.8636575103307368,0.780776164897581,0.6645426663718306,0.5692786228374161\nCC-MAIN-2019-51,0.5149199991224398,0.9673806270620194,0.867439000261607,0.8008686175526364,0.6723844536970436,0.5737026303145594\nCC-MAIN-2020-05,0.5103966250807642,0.8732885377550882,0.8059522850465106,0.7556917785121721,0.6542352588532808,0.5667962794813537\nCC-MAIN-2020-10,0.5221361655970984,0.9378223008453652,0.8439465387981147,0.7794782533717615,0.6791241873635719,0.5756947236842894\nCC-MAIN-2020-16,0.523996937995541,0.8854942582817468,0.7907366566586126,0.7467272139795574,0.6744809077050349,0.5772958099822703\nCC-MAIN-2020-24,0.5292923300136483,0.9373552659859309,0.8559252478279795,0.7729742318010318,0.6857977765718413,0.5848367848690548\nCC-MAIN-2020-29,0.5276095426606514,0.9751534302179906,0.8317439130737547,0.7852669017052278,0.685333558252244,0.590492350006506\nCC-MAIN-2020-34,0.5348655365312904,0.9842377475124213,0.9069233646644744,0.7991861954174252,0.6981675705177847,0.6009010346506615\nCC-MAIN-2020-40,0.54257837153552,0.9741564411854978,0.8702990905289804,0.8260898460015887,0.71636428119744,0.6063757426750497\nCC-MAIN-2020-45,0.5637183239594823,0.9783826661985514,0.9044660921650329,0.8295230373555358,0.7293776193484706,0.6293893948965269\nCC-MAIN-2020-50,0.5771708633144256,0.9863707240226229,0.8815510284467657,0.8380652797665263,0.7545237433839522,0.6419644758845326\nCC-MAIN-2021-04,0.5770973925465431,0.9744452330237182,0.8798346557889861,0.7816720447829462,0.7231456801130345,0.6490169351206135\nCC-MAIN-2021-10,0.5894862879604394,0.9760176970214688,0.8742128271747467,0.8074911439581358,0.7212652460498912,0.654259515041697\nCC-MAIN-2021-17,0.5947404366268999,0.9883514489650369,0.8512768764708117,0.7916363615329984,0.6999695605751175,0.66125534
37746546\nCC-MAIN-2021-21,0.6120018711783048,0.991621389341458,0.9004448383297359,0.8040880332512234,0.7210153292611926,0.6532931965658813\nCC-MAIN-2021-25,0.6167146229560942,0.9839498766638907,0.9583916799828682,0.8615091277713108,0.7384908604661836,0.6610837443718134\nCC-MAIN-2021-31,0.6114236043751609,0.9744480534624143,0.8853046313926974,0.8171745133016286,0.7145794135210216,0.6368393799398211\nCC-MAIN-2021-39,0.6071088216004917,0.9832557386785359,0.8939067178603726,0.8282965593316778,0.7287882399190632,0.647881849066948\nCC-MAIN-2021-43,0.6035729523989329,0.9926210535034949,0.8577276996936959,0.8070133145979369,0.7227628473928568,0.6424660944836232\nCC-MAIN-2021-49,0.6105762370238745,0.9767785047550365,0.9673141125019317,0.8422948219174158,0.7616952362545155,0.6595130754151708\nCC-MAIN-2022-05,0.6174240121760066,0.9807648492220847,0.9264569406842249,0.87296380451826,0.7566962888070393,0.6734466820970254\nCC-MAIN-2022-21,0.6144289197875531,0.9679356893640232,0.9086949579481982,0.8261890807656663,0.731598261051556,0.6662966254791779\nCC-MAIN-2022-27,0.6207079127973506,0.9817302790050974,0.8821293736358423,0.8475762046036357,0.7596289403917543,0.6749639591529403\nCC-MAIN-2022-33,0.6339607029333868,0.9936671416924411,0.9687848945069469,0.8607232249938293,0.7679721310966422,0.6819289129501658\nCC-MAIN-2022-40,0.6308477442903098,0.9813979228593865,0.9579530708388878,0.8681345499877693,0.7771671839763061,0.673263320413001\nCC-MAIN-2022-49,0.6251677990713441,0.988690396719582,0.9278299963533247,0.8577868972636414,0.7452811557053901,0.6784824118252775\nCC-MAIN-2023-06,0.6196659224590622,0.9901910321784668,0.8624633876675798,0.8285602558018064,0.738131889343549,0.6665199129596711\nCC-MAIN-2023-14,0.6091003725910237,0.9855279141697533,0.8734808971010933,0.7911535955198221,0.7372375725529835,0.6654999305841857\nCC-MAIN-2023-23,0.6112527377117731,0.9826957724186004,0.8747910154186896,0.7934651686027651,0.7194268954490753,0.6381484718923967\nCC-MAIN-2023-40,0.599791729083796
1,0.9458389492983551,0.8657912478815157,0.7913816439208358,0.690183662167511,0.6374514754760918\nCC-MAIN-2023-50,0.601079246630572,0.9863457719501882,0.8744371886841275,0.802219257643831,0.6975426752635423,0.6389568212012289\nCC-MAIN-2024-10,0.586561259176545,0.9695071313462238,0.9022137112277332,0.8110754446215855,0.7023460214645605,0.6339383939557871\nCC-MAIN-2024-18,0.5863024624686363,0.9897086728479249,0.9217978098432814,0.8411358161572445,0.7189051336262896,0.6209440323075948\nCC-MAIN-2024-22,0.5903309410365356,0.9807443040353069,0.9649316947386742,0.8521905748956724,0.724869956341061,0.6253810131746875\nCC-MAIN-2024-26,0.5869242230122269,0.9821222153565776,0.9774608894577299,0.8871408113517495,0.7366033307441674,0.6293389522128835\nCC-MAIN-2024-30,0.5778263089025873,0.9898122263120958,0.9775809928516134,0.9260694552932301,0.7566656806180913,0.6402432877340885\nCC-MAIN-2024-33,0.5850975260976685,0.9771208916781539,0.9706724497467314,0.9488749706511708,0.803126299988684,0.6490142056533188\nCC-MAIN-2024-38,0.58576678581344,0.9902599166711844,0.9795856930747274,0.9252323751973821,0.8162404617701063,0.6543323393837196\nCC-MAIN-2024-42,0.5930001787778056,0.9820196458178791,0.9712262863834599,0.9351343751409502,0.8239216838652625,0.6731895553626521\nCC-MAIN-2024-46,0.5950952815680126,0.9901626460743241,0.982555488745344,0.9410270236135858,0.8262151356334054,0.6925009641817254\nCC-MAIN-2024-51,0.6073325902887992,0.9939327595951073,0.9833966955528077,0.9423904865514185,0.8385904849750915,0.7162592942718744\nCC-MAIN-2025-05,0.6113383739130269,0.9915391330423992,0.9743268930500968,0.9285768271689765,0.8175075022766127,0.7081757418801142\nCC-MAIN-2025-08,0.6244647607026195,0.9916779835612484,0.9753963233046118,0.9280314976182484,0.8128815646097249,0.7120032254551685\nCC-MAIN-2025-13,0.636241852045689,0.9866919344409442,0.9786332878985106,0.9306180218740304,0.8230763034166623,0.7141920795012039\nCC-MAIN-2025-18,0.6370116027055926,0.9962060687016092,0.9743536196579106,0.919
0439994324255,0.8192175300106135,0.7126696794847343\nCC-MAIN-2025-21,0.6354756270919715,0.9931419264505736,0.9968372253610276,0.9416223725701863,0.8220189864013921,0.7068268990411731\nCC-MAIN-2025-26,0.640526226756504,0.9907009446929886,0.9989322404494799,0.9670796277632587,0.8299783359821564,0.7165171790261636\nCC-MAIN-2025-30,0.640146740208077,0.9906844106315209,0.9822931535241268,0.9656271244584594,0.8495319925122706,0.7189200372669134\nCC-MAIN-2025-33,0.6369566718045697,0.9934855309297007,0.9873570778023196,0.9548879046649995,0.8509574850243335,0.7190591026500136\nCC-MAIN-2025-38,0.6389884267230598,0.98327716400676,0.97895297639912,0.9552663528848443,0.8494120409683633,0.7156390210007126\nCC-MAIN-2025-43,0.6349701480653132,0.9782904345086306,0.9754818153064881,0.934149382448975,0.8343707027701537,0.7203213044656287\nCC-MAIN-2025-47,0.6389007758238104,0.9881681294791037,0.9726146567860537,0.9379494409129799,0.8409981345094634,0.7276941603269592\nCC-MAIN-2025-51,0.6407720398613493,0.9867227180851071,0.9866872306917593,0.9488160219956921,0.8462327470013683,0.7343274940137308\nCC-MAIN-2026-04,0.6472588205706441,0.996633587416339,0.9833962534107163,0.9285349252221554,0.8363388265498076,0.7288149073901433\nCC-MAIN-2026-08,0.6526074316808949,0.9860308457467153,0.97278986174927,0.9346511507972752,0.8333023259033638,0.7312272648097271\nCC-MAIN-2026-12,0.6523645221945199,0.9823875577974345,0.9778487793802422,0.9385590291810643,0.8284630824748404,0.7286434587992163\nCC-MAIN-2026-17,0.6551035253076207,0.9838029590826155,0.9654675502011687,0.9304697312701604,0.8291711576650493,0.7272654660989866\n"
  },
  {
    "path": "plots/crawlsize.md",
    "content": "Size of Common Crawl Monthly Archives\n=====================================\n\nThe number of released pages per month varies over time due to changes to the number of available seeds, scheduling policy for page revisits and crawler operating issues. Because of duplicates the numbers of unique URLs or unique content digests (here Hyperloglog estimates) are lower than the number of page captures.\n\n![Size of crawl archives (pages, URLs, unique content digest)](./crawlsize/monthly.png)\n\n([Number of page captures, unique URLs and content digests as CSV](./crawlsize/monthly.csv))\n\nThe size on various aggregation levels (host, domain, top-level domain / public suffix) is shown in the next plot. Note that the scale differs per level of aggregation; see the exponential notation behind the labels.\n\n![Coverage of unique URLs, host and domain names, top-level domains (public suffixes)](./crawlsize/domain.png)\n\n([Unique URLs, host and domain names, top-level domains (public suffixes) as CSV](./crawlsize/domain.csv))\n\n\n## Size and URL Status Per Year\n\n![Captures per year and URL status (new/unknown URL, revisit, duplicate)](./crawlsize/url_status_by_year.png)\n\nThe plot above shows the number of page captures accumulated per year and their distribution by URL status – \"new\" URLs were visited for the first time, \"revisits\" have already been archived in a previous crawl, and \"duplicates\" designate captures of the same URL within a single, \"monthly\" crawl.\n\n\n## Cumulative Size\n\nEvery monthly crawl is a sample of the web and we try to make every monthly snapshot a representative and diverse sample on its own. We also try to make the sample diverse in time to cover more content over time while still providing fresh and frequent snapshots of popular pages. 
This and the following plots are based on Hyperloglog cardinality estimates with a 1% error rate.\n\n![Cumulative size of monthly crawl archives since 2013](./crawlsize/cumulative.png)\n\nThe next plot shows the difference in the cumulative size of URLs to the preceding crawl. In other words, it shows the number of new URLs not observed in any of the preceding crawls.\n\n![New URLs per Crawl, not observed in prior crawls](./crawlsize/monthly_new.png)\n\n([New URLs per crawl as CSV](./crawlsize/monthly_new.csv))\n\nHow many unique items (in terms of URLs or unique content by digest) are covered by the last n crawls? The coverage over certain time intervals went down in early 2015 when continuous donations of verified seeds stopped. Since autumn 2016 we have been able to extend the crawl on our own, and we try to increase the coverage for the last n crawls.\n\n![Number of unique URLs if the last n crawls are combined](./crawlsize/url_last_n_crawls.png)\n\n([Combined number of unique URLs over n last crawls as CSV](./crawlsize/url_last_n_crawls.csv))\n\n![Ratio of unique URLs by total pages captured over n last crawls](./crawlsize/url_page_ratio_last_n_crawls.png)\n\n![Number of unique content if the last n crawls are combined](./crawlsize/digest_last_n_crawls.png)\n"
  },
  {
    "path": "plots/domains-top-500.csv",
    "content": "domain,pages,urls,hosts,%pages,%urls\nblogspot.com,19780455,19755134,246742,0.902419,0.906434\nwikipedia.org,3899574,3856416,372,0.177905,0.176946\nwordpress.org,3330102,3329363,218,0.151925,0.152763\ngoogle.com,1839088,1803072,1809,0.083902,0.082731\nwiktionary.org,1607921,1596057,195,0.073356,0.073233\neuropa.eu,1556837,1551415,731,0.071026,0.071184\noclc.org,1495406,1488924,635,0.068223,0.068317\nmade-in-china.com,1306394,1300407,14971,0.059600,0.059667\naif.ru,1091748,1091655,114,0.049807,0.050089\napple.com,978593,970153,102,0.044645,0.044514\nhh.ru,960920,958755,3569,0.043839,0.043991\nqq.com,815785,814765,1006,0.037218,0.037384\nrakuten.co.jp,808679,804683,240,0.036893,0.036922\nnih.gov,796095,791971,291,0.036319,0.036338\nexblog.jp,734058,734032,10574,0.033489,0.033680\npixnet.net,726735,724013,10966,0.033155,0.033220\nwikimedia.org,708476,694668,134,0.032322,0.031874\nwikisource.org,686244,674136,85,0.031308,0.030932\nmicrosoft.com,639205,624974,176,0.029162,0.028676\nox.ac.uk,634415,614570,1236,0.028943,0.028199\nspydus.co.uk,620375,620374,54,0.028303,0.028465\napp.link,597697,597654,4048,0.027268,0.027422\nnoblenet.org,592844,592843,26,0.027047,0.027202\nindiatimes.com,589071,586931,87,0.026874,0.026930\namazonaws.com,588879,588388,4560,0.026866,0.026997\nspb.ru,585915,583123,3149,0.026730,0.026756\nairbnb.com,541856,541557,18,0.024720,0.024849\nnii.ac.jp,527465,527273,683,0.024064,0.024193\nalibaba.com,504793,504545,28961,0.023030,0.023150\nberkeley.edu,502282,501739,1408,0.022915,0.023022\nnasa.gov,494274,491674,401,0.022550,0.022560\ngooglesource.com,480793,480618,56,0.021935,0.022052\nnetlify.app,478768,478496,17666,0.021842,0.021955\nwisc.edu,463649,462946,2115,0.021152,0.021242\nweb.app,449481,449430,10752,0.020506,0.020621\nlibsyn.com,444502,444302,3990,0.020279,0.020386\nmail.ru,434680,432572,72,0.019831,0.019848\nmit.edu,412283,410143,1241,0.018809,0.018819\ndebian.org,411258,409970,89,0.018762,0.018811\nlinternaute.com,405535,395
168,14,0.018501,0.018132\nunam.mx,384003,382990,1346,0.017519,0.017573\nyandex.ru,382268,381870,129,0.017440,0.017522\n24tv.ua,381418,380815,45,0.017401,0.017473\nmozilla.org,373851,372514,57,0.017056,0.017092\noracle.com,370664,361221,58,0.016910,0.016574\nnsw.gov.au,368321,367498,2482,0.016803,0.016862\nsina.com.cn,364690,363771,349,0.016638,0.016691\nnoaa.gov,360939,360725,287,0.016467,0.016551\nadobe.com,360877,352743,110,0.016464,0.016185\ngodaddy.com,358683,343405,431,0.016364,0.015757\nuol.com.br,357558,356224,493,0.016312,0.016345\nyoutube.com,346960,344346,11,0.015829,0.015800\nvoanews.com,341842,340267,13,0.015595,0.015613\nworldbank.org,340176,339529,89,0.015519,0.015579\nhatenablog.com,338057,337969,3200,0.015423,0.015507\nyahoo.co.jp,337128,334645,132,0.015380,0.015355\nline.me,329069,324146,76,0.015013,0.014873\ngithub.io,327863,326380,33911,0.014958,0.014975\nyale.edu,326214,325419,858,0.014882,0.014931\nfree.fr,322481,322134,4231,0.014712,0.014781\nshein.com,322203,321997,45,0.014699,0.014774\nudn.com,320357,319932,59,0.014615,0.014680\nning.com,313598,313032,623,0.014307,0.014363\ngithub.com,301968,297839,41,0.013776,0.013666\nwixsite.com,296575,290601,88429,0.013530,0.013334\nsubstack.com,292141,287493,48941,0.013328,0.013191\nbing.com,290203,289883,26,0.013240,0.013301\ncornell.edu,289009,287737,796,0.013185,0.013202\nwikidot.com,287476,287014,14203,0.013115,0.013169\nstanford.edu,284007,283405,1627,0.012957,0.013004\nusda.gov,281485,278602,147,0.012842,0.012783\nduke.edu,278884,278290,713,0.012723,0.012769\nweebly.com,271097,266932,77340,0.012368,0.012248\nusp.br,270931,269153,1149,0.012360,0.012350\nimpress.co.jp,269711,268720,42,0.012305,0.012330\nsalesforce.com,269408,268497,55,0.012291,0.012320\nca.gov,268009,266253,1132,0.012227,0.012217\nubc.ca,267395,266896,1574,0.012199,0.012246\nrambler.ru,266885,266183,38,0.012176,0.012213\natlassian.net,265955,265004,5761,0.012133,0.012159\nbanggood.com,265607,265440,54,0.012117,0.012179\namazon.com,26
2154,254349,97,0.011960,0.011670\nrbc.ru,261968,261621,102,0.011951,0.012004\nsohu.com,255494,255007,183,0.011656,0.011701\nmathworks.com,255103,254225,29,0.011638,0.011665\n163.com,250397,250030,535,0.011424,0.011472\ntistory.com,249860,249825,2548,0.011399,0.011463\nblog.jp,246779,246663,1932,0.011258,0.011318\nmuni.cz,241737,241405,562,0.011028,0.011077\ncraigslist.org,240073,239862,665,0.010953,0.011006\nutoronto.ca,239646,239166,974,0.010933,0.010974\nsamsung.com,235545,233412,61,0.010746,0.010710\nillinois.edu,234987,234471,1694,0.010721,0.010758\nndl.go.jp,233653,233325,20,0.010660,0.010706\ncocolog-nifty.com,226030,225755,1703,0.010312,0.010358\niheart.com,225832,225418,964,0.010303,0.010343\nmpg.de,224016,223428,530,0.010220,0.010252\nopera.com,223863,222098,28,0.010213,0.010191\nadmin.ch,223528,208997,327,0.010198,0.009590\nappspot.com,222624,221182,1157,0.010156,0.010149\nubuntu.com,222331,221559,142,0.010143,0.010166\nharvard.edu,222222,221063,754,0.010138,0.010143\nupenn.edu,220443,219800,677,0.010057,0.010085\nfreelancer.com,220217,220088,9,0.010047,0.010098\nshopify.com,218276,215408,20,0.009958,0.009884\narchive.org,215667,192970,796,0.009839,0.008854\nibm.com,215131,213151,104,0.009815,0.009780\nover-blog.com,214758,214277,1719,0.009798,0.009832\naf.mil,212886,212703,335,0.009712,0.009760\nporsche.com,212521,211280,161,0.009696,0.009694\ncanalblog.com,210869,210328,1559,0.009620,0.009651\nafternic.com,208966,199302,5,0.009533,0.009145\nhotels.com,208779,208407,35,0.009525,0.009562\nsap.com,208262,194884,48,0.009501,0.008942\nkrakow.pl,207082,206315,1214,0.009447,0.009466\nhatenablog.jp,204606,204559,2555,0.009334,0.009386\nusu.edu,201493,199714,84,0.009192,0.009164\ncuni.cz,200724,199935,754,0.009157,0.009174\nuk.com,200178,192398,5221,0.009132,0.008828\ncloudfront.net,199005,198042,1858,0.009079,0.009087\ngov.ru,198296,197315,470,0.009047,0.009053\nredhat.com,197152,195886,46,0.008994,0.008988\nandroid.com,195412,189952,11,0.008915,0.008716\ncam.ac
.uk,194780,193856,846,0.008886,0.008895\nusgs.gov,189866,189464,101,0.008662,0.008693\nworkplace.com,188902,188760,291,0.008618,0.008661\npsu.edu,186946,183515,575,0.008529,0.008420\nbibliocommons.com,186576,186181,335,0.008512,0.008543\nbnf.fr,177176,177018,50,0.008083,0.008122\nonet.pl,176630,175822,47,0.008058,0.008067\nfedoraproject.org,176020,175738,73,0.008030,0.008063\nnist.gov,175987,175364,88,0.008029,0.008046\nun.org,175817,175067,242,0.008021,0.008033\nhindustantimes.com,175558,174920,14,0.008009,0.008026\nwashington.edu,174322,173261,378,0.007953,0.007950\nitmedia.co.jp,171201,170201,39,0.007810,0.007809\norg.ru,169636,164916,466,0.007739,0.007567\nprinceton.edu,169054,167003,520,0.007713,0.007663\nub.edu,168922,164590,110,0.007707,0.007552\nkayak.com,168854,168793,17,0.007703,0.007745\nnarod.ru,168468,168414,10483,0.007686,0.007727\nkremlin.ru,166712,165787,24,0.007606,0.007607\nntu.edu.tw,164907,164569,519,0.007523,0.007551\nseesaa.net,161429,160284,1984,0.007365,0.007354\nfoursquare.com,161125,160997,21,0.007351,0.007387\ndocomo.ne.jp,156735,156026,88,0.007151,0.007159\narchlinux.org,156131,155779,22,0.007123,0.007148\nuefa.com,153249,152266,25,0.006991,0.006986\nhatena.ne.jp,152722,148800,27,0.006967,0.006827\nhypotheses.org,152269,152147,1666,0.006947,0.006981\nyorku.ca,149121,148429,479,0.006803,0.006810\npchome.com.tw,148643,148497,18,0.006781,0.006814\narmy.mil,148389,147521,280,0.006770,0.006769\nuni-heidelberg.de,147395,144396,302,0.006724,0.006625\nwikiquote.org,146925,143298,100,0.006703,0.006575\numn.edu,146463,145864,1124,0.006682,0.006693\nintuit.com,145094,144701,85,0.006619,0.006639\narizona.edu,145014,142369,1228,0.006616,0.006532\njd.com,145013,144488,2329,0.006616,0.006630\nru-land.com,142630,142396,12,0.006507,0.006534\nelpais.com,142370,140938,29,0.006495,0.006467\nwikibooks.org,142004,139294,122,0.006478,0.006391\nsapo.pt,141847,140980,93,0.006471,0.006469\nchinadaily.com.cn,141828,141637,109,0.006470,0.006499\nlivejournal.com,1411
61,141156,1953,0.006440,0.006477\nobozrevatel.com,141062,140643,28,0.006435,0.006453\nhse.ru,139830,137442,479,0.006379,0.006306\nnicovideo.jp,139786,139610,35,0.006377,0.006406\nunibo.it,139536,138716,315,0.006366,0.006365\nhateblo.jp,139234,139210,1647,0.006352,0.006387\nglobalvoices.org,138602,137090,71,0.006323,0.006290\nutexas.edu,138577,138172,648,0.006322,0.006340\nceskatelevize.cz,138431,137890,17,0.006315,0.006327\nwikinews.org,137732,135089,36,0.006284,0.006198\ncern.ch,137615,137484,405,0.006278,0.006308\nerr.ee,137407,136960,27,0.006269,0.006284\ngoogle.cn,136705,133699,27,0.006237,0.006135\nfreebsd.org,136369,136163,90,0.006221,0.006248\nelespanol.com,135672,135266,13,0.006190,0.006206\ntexas.gov,135595,134955,268,0.006186,0.006192\nufsc.br,134827,132890,1690,0.006151,0.006097\naliyun.com,134706,132697,118,0.006146,0.006089\nlivedoor.biz,134433,134377,650,0.006133,0.006166\nhawaii.edu,133777,133466,309,0.006103,0.006124\nwix.com,133645,131864,40,0.006097,0.006050\npodbean.com,132784,132449,18246,0.006058,0.006077\napache.org,132197,131781,359,0.006031,0.006047\nacademic.ru,132021,131925,1051,0.006023,0.006053\nshop-pro.jp,131396,131069,3498,0.005995,0.006014\nhugedomains.com,129845,113843,1,0.005924,0.005224\npurdue.edu,129663,129124,232,0.005915,0.005925\nteachable.com,129623,129400,4337,0.005914,0.005937\nfrontiersin.org,129433,129202,13,0.005905,0.005928\nwalla.co.il,129330,129190,156,0.005900,0.005928\nunivie.ac.at,129252,128921,1235,0.005897,0.005915\nlibretexts.org,129195,127985,35,0.005894,0.005872\nkb.se,129119,126491,42,0.005891,0.005804\niu.edu,128288,127998,595,0.005853,0.005873\nsiemens.com,127994,125548,82,0.005839,0.005761\nwa.gov,127816,126643,286,0.005831,0.005811\ndict.cc,127624,127531,202,0.005822,0.005852\nspotify.com,127561,127167,29,0.005820,0.005835\nazurewebsites.net,126146,125642,4420,0.005755,0.005765\nt.me,125871,124106,2,0.005742,0.005694\nchinaz.com,125759,124914,61,0.005737,0.005731\nmsu.edu,125347,124969,744,0.005719,0.0057
34\niastate.edu,125018,124833,582,0.005704,0.005728\ninterfax.com.ua,124866,115330,4,0.005697,0.005292\nria.ru,124501,123247,28,0.005680,0.005655\nethz.ch,124381,123738,632,0.005674,0.005678\ncanada.ca,124356,122994,162,0.005673,0.005643\ntradingview.com,124105,124045,21,0.005662,0.005692\npeople.com.cn,123758,123725,144,0.005646,0.005677\ntelegram.org,123527,121721,19,0.005636,0.005585\nuscourts.gov,123424,123310,570,0.005631,0.005658\nhu-berlin.de,122930,122309,235,0.005608,0.005612\nsch.gr,121349,121157,937,0.005536,0.005559\nufl.edu,120992,120127,1019,0.005520,0.005512\nkit.edu,120801,120495,653,0.005511,0.005529\niol.pt,120231,119962,17,0.005485,0.005504\ncolumbia.edu,120174,119803,478,0.005483,0.005497\nvictoriassecret.com,120050,100454,17,0.005477,0.004609\nstatcounter.com,119793,110030,73,0.005465,0.005049\nweblio.jp,119737,119689,26,0.005463,0.005492\nmsu.ru,119653,119386,508,0.005459,0.005478\npoznan.pl,119436,119157,711,0.005449,0.005467\nnt.gov.au,118748,118444,55,0.005417,0.005435\nrutgers.edu,118701,118341,1005,0.005415,0.005430\ngouv.qc.ca,117229,116932,976,0.005348,0.005365\nvk.com,117035,116270,33,0.005339,0.005335\nuab.cat,116909,116417,121,0.005334,0.005342\nblog.hu,116747,116747,956,0.005326,0.005357\nunlp.edu.ar,116443,116319,382,0.005312,0.005337\nucsb.edu,115924,115821,800,0.005289,0.005314\ngva.es,114833,110420,218,0.005239,0.005066\nucla.edu,114537,114302,1042,0.005225,0.005245\nbuzzsprout.com,114484,114206,7247,0.005223,0.005240\ntrip.com,114407,114222,47,0.005219,0.005241\nhp.com,114200,111980,74,0.005210,0.005138\nst-andrews.ac.uk,114184,113488,400,0.005209,0.005207\numd.edu,113950,113627,735,0.005199,0.005214\nanu.edu.au,113510,112459,201,0.005179,0.005160\nugr.es,113389,112617,520,0.005173,0.005167\ncom.ru,113388,113118,1253,0.005173,0.005190\ngo.com,112631,112135,27,0.005138,0.005145\nservice.gov.uk,112505,112048,157,0.005133,0.005141\ncuny.edu,112467,111833,372,0.005131,0.005131\nvecteezy.com,111934,111508,10,0.005107,0.005116\ncolora
do.edu,111630,111443,145,0.005093,0.005113\nmsk.ru,111016,110904,852,0.005065,0.005089\nfinalsite.net,110857,106064,1,0.005057,0.004867\ngarmin.com,110855,108967,37,0.005057,0.005000\nncsu.edu,110326,110126,480,0.005033,0.005053\ncnr.it,110300,110180,679,0.005032,0.005055\nantaranews.com,109552,109354,53,0.004998,0.005018\nsi.edu,109493,109368,92,0.004995,0.005018\ntwitch.tv,109346,109081,29,0.004989,0.005005\nstripe.com,109324,104349,14,0.004988,0.004788\nin.gov,109169,108470,227,0.004980,0.004977\natlassian.com,108972,107892,62,0.004971,0.004950\ntelegra.ph,108906,88750,1,0.004968,0.004072\nindiana.edu,108667,108627,516,0.004958,0.004984\nmynavi.jp,108355,104469,101,0.004943,0.004793\nsnu.ac.kr,108131,107998,641,0.004933,0.004955\nsenate.gov,108026,107174,143,0.004928,0.004918\nuwaterloo.ca,107902,107330,179,0.004923,0.004925\nuni-tuebingen.de,107322,107073,158,0.004896,0.004913\nwustl.edu,107214,106898,329,0.004891,0.004905\nyoutube-nocookie.com,107099,107097,2,0.004886,0.004914\ndiva-portal.org,107055,106975,59,0.004884,0.004908\ntemple.edu,106812,106619,142,0.004873,0.004892\nfu-berlin.de,106807,106130,159,0.004873,0.004870\ntfrrs.org,106528,106426,15,0.004860,0.004883\nchina.com,106380,106368,88,0.004853,0.004881\nnrw.de,105906,105651,497,0.004832,0.004848\ngta5-mods.com,105667,105666,29,0.004821,0.004848\nicm.edu.pl,105520,105455,60,0.004814,0.004839\nunsplash.com,105481,105329,5,0.004812,0.004833\nmn.gov,105422,103707,99,0.004810,0.004758\nuc.pt,105280,105161,217,0.004803,0.004825\nas.com,105211,104799,16,0.004800,0.004809\nsemrush.com,104758,104554,27,0.004779,0.004797\nucm.es,104610,104499,129,0.004772,0.004795\nuni-bonn.de,103889,103325,330,0.004740,0.004741\nkhanacademy.org,102880,102824,72,0.004694,0.004718\nuchile.cl,102048,101328,439,0.004656,0.004649\nuni-lj.si,101688,101468,295,0.004639,0.004656\nplaystation.com,100986,100545,27,0.004607,0.004613\nwww.gov.uk,100841,86913,1,0.004601,0.003988\ntufts.edu,100834,100733,181,0.004600,0.004622\nvt.edu,1007
87,100512,724,0.004598,0.004612\nespn.com,100310,100261,14,0.004576,0.004600\nunb.br,99998,98047,518,0.004562,0.004499\nlegistar.com,99369,99178,301,0.004533,0.004551\ntableau.com,99086,98757,25,0.004520,0.004531\nunc.edu,98952,98190,890,0.004514,0.004505\nugent.be,98657,98449,428,0.004501,0.004517\nbme.hu,98566,98374,433,0.004497,0.004514\nvirginia.gov,98549,98099,255,0.004496,0.004501\nherokuapp.com,98514,98382,952,0.004494,0.004514\nmhlw.go.jp,98477,98306,113,0.004493,0.004511\nhouse.gov,97918,97761,556,0.004467,0.004486\nsld.cu,97726,97147,374,0.004458,0.004457\ner.ru,97698,97662,108,0.004457,0.004481\nyandex.com,97588,97572,50,0.004452,0.004477\nhubspot.com,96608,95539,48,0.004407,0.004384\nmediaset.it,96126,95897,20,0.004385,0.004400\ngamer.com.tw,95688,94963,15,0.004365,0.004357\nlodz.pl,95520,94803,542,0.004358,0.004350\nidnes.cz,95322,94714,254,0.004349,0.004346\nperfil.com,95285,95218,19,0.004347,0.004369\nsteampowered.com,95192,94231,6,0.004343,0.004324\nbyu.edu,95053,94826,598,0.004336,0.004351\ntrend.az,94932,94290,8,0.004331,0.004326\nnews12.com,94828,94716,10,0.004326,0.004346\nnyu.edu,94586,94087,217,0.004315,0.004317\nufrj.br,94573,94166,460,0.004315,0.004321\nhessen.de,93833,93660,462,0.004281,0.004297\nrozhlas.cz,93814,91265,59,0.004280,0.004188\nmarketscreener.com,93667,93460,16,0.004273,0.004288\npanasonic.com,93506,91828,126,0.004266,0.004213\neclipse.org,93444,93094,28,0.004263,0.004271\nhabr.com,93308,92803,17,0.004257,0.004258\nsky.it,92865,92393,24,0.004237,0.004239\nyahoo.com,92858,92806,31,0.004236,0.004258\nccm.net,92836,92822,12,0.004235,0.004259\ninteria.pl,92398,91704,30,0.004215,0.004208\ndonga.com,92349,91715,30,0.004213,0.004208\nomeka.net,92144,92135,588,0.004204,0.004227\ntum.de,91848,91303,405,0.004190,0.004189\ndartmouth.edu,91743,91555,204,0.004185,0.004201\nunicamp.br,91535,89742,424,0.004176,0.004118\nndtv.com,91292,90452,17,0.004165,0.004150\nexlibrisgroup.com,91113,91065,594,0.004157,0.004178\ncnrs.fr,90737,90519,636,0.004
140,0.004153\ntalent.com,90686,90661,79,0.004137,0.004160\nusc.edu,90661,89752,424,0.004136,0.004118\nwolfram.com,90448,90131,26,0.004126,0.004136\nvietnamplus.vn,90343,90339,22,0.004122,0.004145\nosu.edu,90339,89923,666,0.004121,0.004126\ntvbs.com.tw,89948,87014,23,0.004104,0.003993\nulisboa.pt,89861,89579,461,0.004100,0.004110\ncbsnews.com,89782,88627,5,0.004096,0.004067\nhpe.com,89568,88860,66,0.004086,0.004077\nuni-hamburg.de,89347,89114,378,0.004076,0.004089\nbaidu.com,89198,88939,227,0.004069,0.004081\nblic.rs,88958,88458,11,0.004058,0.004059\ncnet.com,88922,87014,7,0.004057,0.003993\nbsky.app,88672,88198,12,0.004045,0.004047\narcgis.com,88660,87772,4837,0.004045,0.004027\nfau.de,88500,88032,611,0.004038,0.004039\nbayern.de,88332,87681,531,0.004030,0.004023\noffice.com,88093,87989,16,0.004019,0.004037\nvirginia.edu,87929,87533,407,0.004011,0.004016\nodoo.com,87662,87247,3812,0.003999,0.004003\nnet.ru,87030,86554,357,0.003970,0.003971\nburberry.com,86877,84116,50,0.003963,0.003860\nvirgilio.it,86506,86275,15,0.003947,0.003959\njustice.gc.ca,86354,86287,12,0.003940,0.003959\ntoyota.com,86236,86120,22,0.003934,0.003951\nmain.jp,86187,86150,1311,0.003932,0.003953\nunistra.fr,85898,85665,564,0.003919,0.003931\nucsd.edu,85896,85466,1258,0.003919,0.003921\nrezdy.com,85840,85801,712,0.003916,0.003937\nvercel.app,85412,85029,8191,0.003897,0.003901\nuba.ar,85351,85130,447,0.003894,0.003906\nfao.org,85271,84854,63,0.003890,0.003893\nuv.es,84994,84825,359,0.003878,0.003892\ndeveloppement-durable.gouv.fr,84745,84579,174,0.003866,0.003881\nimgur.com,84684,84604,12,0.003863,0.003882\nmaryland.gov,84194,83739,198,0.003841,0.003842\nrs-online.com,84124,82058,34,0.003838,0.003765\nrediff.com,84034,83746,45,0.003834,0.003843\nus.es,83814,83745,179,0.003824,0.003843\nkeizai.biz,83773,83173,162,0.003822,0.003816\noverdrive.com,83740,83642,1100,0.003820,0.003838\nunesp.br,83690,83411,153,0.003818,0.003827\nwikileaks.org,83572,83221,17,0.003813,0.003818\nprnewswire.com,83352,83167,1
3,0.003803,0.003816\nupc.edu,83141,82510,527,0.003793,0.003786\n17173.com,83054,82565,259,0.003789,0.003788\narchives.gov,82767,82576,49,0.003776,0.003789\ndmm.com,82693,82537,77,0.003773,0.003787\naps.org,82561,81104,17,0.003767,0.003721\nculture.gouv.fr,82529,81646,51,0.003765,0.003746\ncopernicus.org,82287,82099,66,0.003754,0.003767\nilsole24ore.com,82263,82138,181,0.003753,0.003769\nutah.edu,82262,81571,737,0.003753,0.003743\nhelsinki.fi,82168,82016,75,0.003749,0.003763\nissuu.com,81791,81601,2,0.003731,0.003744\nu-tokyo.ac.jp,81733,81674,448,0.003729,0.003747\nunt.edu,81704,72232,193,0.003727,0.003314\nvice.com,81700,81134,10,0.003727,0.003723\nuni-stuttgart.de,81570,81290,320,0.003721,0.003730\ndnevnik.hr,81382,80739,20,0.003713,0.003705\nibiblio.org,81361,81352,9,0.003712,0.003733\nlenovo.com,80932,80274,60,0.003692,0.003683\ngov.sk,80624,80342,147,0.003678,0.003686\nucf.edu,80453,80191,296,0.003670,0.003679\nexcite.co.jp,80390,78966,20,0.003668,0.003623\nuq.edu.au,80350,80146,218,0.003666,0.003677\nniedersachsen.de,80186,79702,309,0.003658,0.003657\nbiglobe.ne.jp,80083,79885,101,0.003654,0.003665\nuniroma1.it,79767,78666,391,0.003639,0.003609\nfacebook.com,79393,79073,10,0.003622,0.003628\noverheid.nl,79325,76302,47,0.003619,0.003501\nuiowa.edu,79278,78991,783,0.003617,0.003624\nuber.com,79259,78016,20,0.003616,0.003580\nunl.pt,79069,78927,299,0.003607,0.003621\nuni-goettingen.de,78863,78512,239,0.003598,0.003602\nuni-muenchen.de,78782,78726,519,0.003594,0.003612\nrtp.pt,78512,76754,20,0.003582,0.003522\nakipress.org,78423,78399,29,0.003578,0.003597\nunimelb.edu.au,78419,78407,114,0.003578,0.003598\nkrymr.com,78276,78122,3,0.003571,0.003585\nbg.ac.rs,78252,78007,523,0.003570,0.003579\nrbc.ua,78249,78210,16,0.003570,0.003589\nicrt.cu,78194,78182,58,0.003567,0.003587\nunifr.ch,78091,77679,38,0.003563,0.003564\nsputniknews.ru,77854,77590,9,0.003552,0.003560\nmiami.edu,77729,77401,497,0.003546,0.003551\nbncollege.com,77409,77328,458,0.003532,0.003548\nsinica.edu
.tw,77283,77189,266,0.003526,0.003542\njotform.com,77248,77045,1041,0.003524,0.003535\nmetu.edu.tr,77021,76986,427,0.003514,0.003532\nuw.edu.pl,76960,76519,648,0.003511,0.003511\nneocities.org,76874,76667,11076,0.003507,0.003518\nhatenadiary.jp,76628,76616,692,0.003496,0.003515\nrp.pl,76273,75855,40,0.003480,0.003480\ngov.bc.ca,76125,75975,143,0.003473,0.003486\nstatcan.gc.ca,75890,75577,18,0.003462,0.003468\npp.ua,75844,75736,613,0.003460,0.003475\nlibreoffice.org,75742,75678,68,0.003455,0.003472\nuni-bremen.de,75569,75134,199,0.003448,0.003447\nbirdeye.com,75497,74654,6,0.003444,0.003425\nifeng.com,75485,75359,383,0.003444,0.003458\ngov.si,75406,75239,70,0.003440,0.003452\nunl.edu,75403,75214,580,0.003440,0.003451\ncheck24.de,75355,74878,49,0.003438,0.003436\nw3.org,75325,74994,14,0.003436,0.003441\npitt.edu,75288,74730,920,0.003435,0.003429\ncbssports.com,75278,74175,31,0.003434,0.003403\naljazeera.com,75185,73504,8,0.003430,0.003373\ndetik.com,75140,75020,28,0.003428,0.003442\naladin.co.kr,75123,74931,14,0.003427,0.003438\nbundestag.de,74854,74581,13,0.003415,0.003422\nucr.ac.cr,74786,74713,389,0.003412,0.003428\nutah.gov,74737,74535,376,0.003410,0.003420\nuzh.ch,74643,74365,746,0.003405,0.003412\nanswers.com,74640,74629,8,0.003405,0.003424\nkommersant.ru,74549,74500,18,0.003401,0.003418\ncancer.gov,74495,74235,89,0.003399,0.003406\nettoday.net,74306,74207,31,0.003390,0.003405\nhuaweicloud.com,74287,74267,51,0.003389,0.003408\nrug.nl,74179,73665,95,0.003384,0.003380\ncisco.com,74100,71722,103,0.003381,0.003291\nfreshdesk.com,73672,73272,2846,0.003361,0.003362\nnewsru.com,73106,73019,6,0.003335,0.003350\nuct.ac.za,73056,72591,141,0.003333,0.003331\ncorreiobraziliense.com.br,73027,72934,13,0.003332,0.003346\njst.go.jp,72982,72752,33,0.003330,0.003338\nut.ac.ir,72668,72516,299,0.003315,0.003327\ngatech.edu,72204,72071,736,0.003294,0.003307\nvlex.com,72158,72070,78,0.003292,0.003307\nchess-results.com,72013,71993,5,0.003285,0.003303\niprima.cz,71968,71915,12,0.00328
3,0.003300\nwroc.pl,71833,71619,548,0.003277,0.003286\nglobo.com,71818,71578,47,0.003276,0.003284\nunipd.it,71800,71563,408,0.003276,0.003284\ntyc.edu.tw,71731,71475,331,0.003272,0.003280\nacer.com,71666,71327,22,0.003270,0.003273\ntimesnownews.com,71304,71223,11,0.003253,0.003268\nchurchofjesuschrist.org,71219,70737,94,0.003249,0.003246\nwalmart.com,71135,70609,38,0.003245,0.003240\nstlouisfed.org,71127,71079,17,0.003245,0.003261\ntwitcasting.tv,70963,70681,38,0.003237,0.003243\nku.edu,70829,70683,608,0.003231,0.003243\nchinanews.com.cn,70809,70462,39,0.003230,0.003233\nlublin.pl,70809,70721,585,0.003230,0.003245\npraca.gov.pl,70655,70598,378,0.003223,0.003239\nindiamart.com,70203,70148,14,0.003203,0.003219\nfifa.com,70062,69257,32,0.003196,0.003178\nadelaide.edu.au,69949,66322,47,0.003191,0.003043\nbusiness-gazeta.ru,69908,69715,14,0.003189,0.003199\nnvidia.com,69859,68334,53,0.003187,0.003135\nshueisha.co.jp,69850,68877,53,0.003187,0.003160\nmoe.edu.tw,69805,69763,40,0.003185,0.003201\nfinalfantasyxiv.com,69804,69783,16,0.003185,0.003202\nepfl.ch,69568,68638,213,0.003174,0.003149\nnd.edu,69561,68584,123,0.003173,0.003147\nifixit.com,69486,69383,18,0.003170,0.003184\ndiscord.com,69437,67340,5,0.003168,0.003090\nkde.org,69415,69246,73,0.003167,0.003177\ncaixin.com,69160,68865,332,0.003155,0.003160\nfoxnews.com,69150,68965,14,0.003155,0.003164\nr-project.org,69077,68861,113,0.003151,0.003160\nhudl.com,69017,68782,61,0.003149,0.003156\nucdavis.edu,69002,68828,581,0.003148,0.003158\nuservoice.com,68975,68808,230,0.003147,0.003157\ninformator.ua,68851,68794,16,0.003141,0.003157\n"
  },
  {
    "path": "plots/domains-top-500.html",
    "content": "<table border=\"1\" class=\"dataframe tablesorter tablesearcher\">\n  <thead>\n    <tr style=\"text-align: right;\">\n      <th>domain</th>\n      <th>pages</th>\n      <th>urls</th>\n      <th>hosts</th>\n      <th>%pages</th>\n      <th>%urls</th>\n    </tr>\n  </thead>\n  <tbody>\n    <tr>\n      <th>blogspot.com</th>\n      <td>19780455</td>\n      <td>19755134</td>\n      <td>246742</td>\n      <td>0.902419</td>\n      <td>0.906434</td>\n    </tr>\n    <tr>\n      <th>wikipedia.org</th>\n      <td>3899574</td>\n      <td>3856416</td>\n      <td>372</td>\n      <td>0.177905</td>\n      <td>0.176946</td>\n    </tr>\n    <tr>\n      <th>wordpress.org</th>\n      <td>3330102</td>\n      <td>3329363</td>\n      <td>218</td>\n      <td>0.151925</td>\n      <td>0.152763</td>\n    </tr>\n    <tr>\n      <th>google.com</th>\n      <td>1839088</td>\n      <td>1803072</td>\n      <td>1809</td>\n      <td>0.083902</td>\n      <td>0.082731</td>\n    </tr>\n    <tr>\n      <th>wiktionary.org</th>\n      <td>1607921</td>\n      <td>1596057</td>\n      <td>195</td>\n      <td>0.073356</td>\n      <td>0.073233</td>\n    </tr>\n    <tr>\n      <th>europa.eu</th>\n      <td>1556837</td>\n      <td>1551415</td>\n      <td>731</td>\n      <td>0.071026</td>\n      <td>0.071184</td>\n    </tr>\n    <tr>\n      <th>oclc.org</th>\n      <td>1495406</td>\n      <td>1488924</td>\n      <td>635</td>\n      <td>0.068223</td>\n      <td>0.068317</td>\n    </tr>\n    <tr>\n      <th>made-in-china.com</th>\n      <td>1306394</td>\n      <td>1300407</td>\n      <td>14971</td>\n      <td>0.059600</td>\n      <td>0.059667</td>\n    </tr>\n    <tr>\n      <th>aif.ru</th>\n      <td>1091748</td>\n      <td>1091655</td>\n      <td>114</td>\n      <td>0.049807</td>\n      <td>0.050089</td>\n    </tr>\n    <tr>\n      <th>apple.com</th>\n      <td>978593</td>\n      <td>970153</td>\n      <td>102</td>\n      <td>0.044645</td>\n      <td>0.044514</td>\n    </tr>\n    <tr>\n      
<th>hh.ru</th>\n      <td>960920</td>\n      <td>958755</td>\n      <td>3569</td>\n      <td>0.043839</td>\n      <td>0.043991</td>\n    </tr>\n    <tr>\n      <th>qq.com</th>\n      <td>815785</td>\n      <td>814765</td>\n      <td>1006</td>\n      <td>0.037218</td>\n      <td>0.037384</td>\n    </tr>\n    <tr>\n      <th>rakuten.co.jp</th>\n      <td>808679</td>\n      <td>804683</td>\n      <td>240</td>\n      <td>0.036893</td>\n      <td>0.036922</td>\n    </tr>\n    <tr>\n      <th>nih.gov</th>\n      <td>796095</td>\n      <td>791971</td>\n      <td>291</td>\n      <td>0.036319</td>\n      <td>0.036338</td>\n    </tr>\n    <tr>\n      <th>exblog.jp</th>\n      <td>734058</td>\n      <td>734032</td>\n      <td>10574</td>\n      <td>0.033489</td>\n      <td>0.033680</td>\n    </tr>\n    <tr>\n      <th>pixnet.net</th>\n      <td>726735</td>\n      <td>724013</td>\n      <td>10966</td>\n      <td>0.033155</td>\n      <td>0.033220</td>\n    </tr>\n    <tr>\n      <th>wikimedia.org</th>\n      <td>708476</td>\n      <td>694668</td>\n      <td>134</td>\n      <td>0.032322</td>\n      <td>0.031874</td>\n    </tr>\n    <tr>\n      <th>wikisource.org</th>\n      <td>686244</td>\n      <td>674136</td>\n      <td>85</td>\n      <td>0.031308</td>\n      <td>0.030932</td>\n    </tr>\n    <tr>\n      <th>microsoft.com</th>\n      <td>639205</td>\n      <td>624974</td>\n      <td>176</td>\n      <td>0.029162</td>\n      <td>0.028676</td>\n    </tr>\n    <tr>\n      <th>ox.ac.uk</th>\n      <td>634415</td>\n      <td>614570</td>\n      <td>1236</td>\n      <td>0.028943</td>\n      <td>0.028199</td>\n    </tr>\n    <tr>\n      <th>spydus.co.uk</th>\n      <td>620375</td>\n      <td>620374</td>\n      <td>54</td>\n      <td>0.028303</td>\n      <td>0.028465</td>\n    </tr>\n    <tr>\n      <th>app.link</th>\n      <td>597697</td>\n      <td>597654</td>\n      <td>4048</td>\n      <td>0.027268</td>\n      <td>0.027422</td>\n    </tr>\n    <tr>\n      <th>noblenet.org</th>\n     
 <td>592844</td>\n      <td>592843</td>\n      <td>26</td>\n      <td>0.027047</td>\n      <td>0.027202</td>\n    </tr>\n    <tr>\n      <th>indiatimes.com</th>\n      <td>589071</td>\n      <td>586931</td>\n      <td>87</td>\n      <td>0.026874</td>\n      <td>0.026930</td>\n    </tr>\n    <tr>\n      <th>amazonaws.com</th>\n      <td>588879</td>\n      <td>588388</td>\n      <td>4560</td>\n      <td>0.026866</td>\n      <td>0.026997</td>\n    </tr>\n    <tr>\n      <th>spb.ru</th>\n      <td>585915</td>\n      <td>583123</td>\n      <td>3149</td>\n      <td>0.026730</td>\n      <td>0.026756</td>\n    </tr>\n    <tr>\n      <th>airbnb.com</th>\n      <td>541856</td>\n      <td>541557</td>\n      <td>18</td>\n      <td>0.024720</td>\n      <td>0.024849</td>\n    </tr>\n    <tr>\n      <th>nii.ac.jp</th>\n      <td>527465</td>\n      <td>527273</td>\n      <td>683</td>\n      <td>0.024064</td>\n      <td>0.024193</td>\n    </tr>\n    <tr>\n      <th>alibaba.com</th>\n      <td>504793</td>\n      <td>504545</td>\n      <td>28961</td>\n      <td>0.023030</td>\n      <td>0.023150</td>\n    </tr>\n    <tr>\n      <th>berkeley.edu</th>\n      <td>502282</td>\n      <td>501739</td>\n      <td>1408</td>\n      <td>0.022915</td>\n      <td>0.023022</td>\n    </tr>\n    <tr>\n      <th>nasa.gov</th>\n      <td>494274</td>\n      <td>491674</td>\n      <td>401</td>\n      <td>0.022550</td>\n      <td>0.022560</td>\n    </tr>\n    <tr>\n      <th>googlesource.com</th>\n      <td>480793</td>\n      <td>480618</td>\n      <td>56</td>\n      <td>0.021935</td>\n      <td>0.022052</td>\n    </tr>\n    <tr>\n      <th>netlify.app</th>\n      <td>478768</td>\n      <td>478496</td>\n      <td>17666</td>\n      <td>0.021842</td>\n      <td>0.021955</td>\n    </tr>\n    <tr>\n      <th>wisc.edu</th>\n      <td>463649</td>\n      <td>462946</td>\n      <td>2115</td>\n      <td>0.021152</td>\n      <td>0.021242</td>\n    </tr>\n    <tr>\n      <th>web.app</th>\n      <td>449481</td>\n     
 <td>449430</td>\n      <td>10752</td>\n      <td>0.020506</td>\n      <td>0.020621</td>\n    </tr>\n    <tr>\n      <th>libsyn.com</th>\n      <td>444502</td>\n      <td>444302</td>\n      <td>3990</td>\n      <td>0.020279</td>\n      <td>0.020386</td>\n    </tr>\n    <tr>\n      <th>mail.ru</th>\n      <td>434680</td>\n      <td>432572</td>\n      <td>72</td>\n      <td>0.019831</td>\n      <td>0.019848</td>\n    </tr>\n    <tr>\n      <th>mit.edu</th>\n      <td>412283</td>\n      <td>410143</td>\n      <td>1241</td>\n      <td>0.018809</td>\n      <td>0.018819</td>\n    </tr>\n    <tr>\n      <th>debian.org</th>\n      <td>411258</td>\n      <td>409970</td>\n      <td>89</td>\n      <td>0.018762</td>\n      <td>0.018811</td>\n    </tr>\n    <tr>\n      <th>linternaute.com</th>\n      <td>405535</td>\n      <td>395168</td>\n      <td>14</td>\n      <td>0.018501</td>\n      <td>0.018132</td>\n    </tr>\n    <tr>\n      <th>unam.mx</th>\n      <td>384003</td>\n      <td>382990</td>\n      <td>1346</td>\n      <td>0.017519</td>\n      <td>0.017573</td>\n    </tr>\n    <tr>\n      <th>yandex.ru</th>\n      <td>382268</td>\n      <td>381870</td>\n      <td>129</td>\n      <td>0.017440</td>\n      <td>0.017522</td>\n    </tr>\n    <tr>\n      <th>24tv.ua</th>\n      <td>381418</td>\n      <td>380815</td>\n      <td>45</td>\n      <td>0.017401</td>\n      <td>0.017473</td>\n    </tr>\n    <tr>\n      <th>mozilla.org</th>\n      <td>373851</td>\n      <td>372514</td>\n      <td>57</td>\n      <td>0.017056</td>\n      <td>0.017092</td>\n    </tr>\n    <tr>\n      <th>oracle.com</th>\n      <td>370664</td>\n      <td>361221</td>\n      <td>58</td>\n      <td>0.016910</td>\n      <td>0.016574</td>\n    </tr>\n    <tr>\n      <th>nsw.gov.au</th>\n      <td>368321</td>\n      <td>367498</td>\n      <td>2482</td>\n      <td>0.016803</td>\n      <td>0.016862</td>\n    </tr>\n    <tr>\n      <th>sina.com.cn</th>\n      <td>364690</td>\n      <td>363771</td>\n      
<td>349</td>\n      <td>0.016638</td>\n      <td>0.016691</td>\n    </tr>\n    <tr>\n      <th>noaa.gov</th>\n      <td>360939</td>\n      <td>360725</td>\n      <td>287</td>\n      <td>0.016467</td>\n      <td>0.016551</td>\n    </tr>\n    <tr>\n      <th>adobe.com</th>\n      <td>360877</td>\n      <td>352743</td>\n      <td>110</td>\n      <td>0.016464</td>\n      <td>0.016185</td>\n    </tr>\n    <tr>\n      <th>godaddy.com</th>\n      <td>358683</td>\n      <td>343405</td>\n      <td>431</td>\n      <td>0.016364</td>\n      <td>0.015757</td>\n    </tr>\n    <tr>\n      <th>uol.com.br</th>\n      <td>357558</td>\n      <td>356224</td>\n      <td>493</td>\n      <td>0.016312</td>\n      <td>0.016345</td>\n    </tr>\n    <tr>\n      <th>youtube.com</th>\n      <td>346960</td>\n      <td>344346</td>\n      <td>11</td>\n      <td>0.015829</td>\n      <td>0.015800</td>\n    </tr>\n    <tr>\n      <th>voanews.com</th>\n      <td>341842</td>\n      <td>340267</td>\n      <td>13</td>\n      <td>0.015595</td>\n      <td>0.015613</td>\n    </tr>\n    <tr>\n      <th>worldbank.org</th>\n      <td>340176</td>\n      <td>339529</td>\n      <td>89</td>\n      <td>0.015519</td>\n      <td>0.015579</td>\n    </tr>\n    <tr>\n      <th>hatenablog.com</th>\n      <td>338057</td>\n      <td>337969</td>\n      <td>3200</td>\n      <td>0.015423</td>\n      <td>0.015507</td>\n    </tr>\n    <tr>\n      <th>yahoo.co.jp</th>\n      <td>337128</td>\n      <td>334645</td>\n      <td>132</td>\n      <td>0.015380</td>\n      <td>0.015355</td>\n    </tr>\n    <tr>\n      <th>line.me</th>\n      <td>329069</td>\n      <td>324146</td>\n      <td>76</td>\n      <td>0.015013</td>\n      <td>0.014873</td>\n    </tr>\n    <tr>\n      <th>github.io</th>\n      <td>327863</td>\n      <td>326380</td>\n      <td>33911</td>\n      <td>0.014958</td>\n      <td>0.014975</td>\n    </tr>\n    <tr>\n      <th>yale.edu</th>\n      <td>326214</td>\n      <td>325419</td>\n      <td>858</td>\n      
<td>0.014882</td>\n      <td>0.014931</td>\n    </tr>\n    <tr>\n      <th>free.fr</th>\n      <td>322481</td>\n      <td>322134</td>\n      <td>4231</td>\n      <td>0.014712</td>\n      <td>0.014781</td>\n    </tr>\n    <tr>\n      <th>shein.com</th>\n      <td>322203</td>\n      <td>321997</td>\n      <td>45</td>\n      <td>0.014699</td>\n      <td>0.014774</td>\n    </tr>\n    <tr>\n      <th>udn.com</th>\n      <td>320357</td>\n      <td>319932</td>\n      <td>59</td>\n      <td>0.014615</td>\n      <td>0.014680</td>\n    </tr>\n    <tr>\n      <th>ning.com</th>\n      <td>313598</td>\n      <td>313032</td>\n      <td>623</td>\n      <td>0.014307</td>\n      <td>0.014363</td>\n    </tr>\n    <tr>\n      <th>github.com</th>\n      <td>301968</td>\n      <td>297839</td>\n      <td>41</td>\n      <td>0.013776</td>\n      <td>0.013666</td>\n    </tr>\n    <tr>\n      <th>wixsite.com</th>\n      <td>296575</td>\n      <td>290601</td>\n      <td>88429</td>\n      <td>0.013530</td>\n      <td>0.013334</td>\n    </tr>\n    <tr>\n      <th>substack.com</th>\n      <td>292141</td>\n      <td>287493</td>\n      <td>48941</td>\n      <td>0.013328</td>\n      <td>0.013191</td>\n    </tr>\n    <tr>\n      <th>bing.com</th>\n      <td>290203</td>\n      <td>289883</td>\n      <td>26</td>\n      <td>0.013240</td>\n      <td>0.013301</td>\n    </tr>\n    <tr>\n      <th>cornell.edu</th>\n      <td>289009</td>\n      <td>287737</td>\n      <td>796</td>\n      <td>0.013185</td>\n      <td>0.013202</td>\n    </tr>\n    <tr>\n      <th>wikidot.com</th>\n      <td>287476</td>\n      <td>287014</td>\n      <td>14203</td>\n      <td>0.013115</td>\n      <td>0.013169</td>\n    </tr>\n    <tr>\n      <th>stanford.edu</th>\n      <td>284007</td>\n      <td>283405</td>\n      <td>1627</td>\n      <td>0.012957</td>\n      <td>0.013004</td>\n    </tr>\n    <tr>\n      <th>usda.gov</th>\n      <td>281485</td>\n      <td>278602</td>\n      <td>147</td>\n      <td>0.012842</td>\n      
<td>0.012783</td>\n    </tr>\n    <tr>\n      <th>duke.edu</th>\n      <td>278884</td>\n      <td>278290</td>\n      <td>713</td>\n      <td>0.012723</td>\n      <td>0.012769</td>\n    </tr>\n    <tr>\n      <th>weebly.com</th>\n      <td>271097</td>\n      <td>266932</td>\n      <td>77340</td>\n      <td>0.012368</td>\n      <td>0.012248</td>\n    </tr>\n    <tr>\n      <th>usp.br</th>\n      <td>270931</td>\n      <td>269153</td>\n      <td>1149</td>\n      <td>0.012360</td>\n      <td>0.012350</td>\n    </tr>\n    <tr>\n      <th>impress.co.jp</th>\n      <td>269711</td>\n      <td>268720</td>\n      <td>42</td>\n      <td>0.012305</td>\n      <td>0.012330</td>\n    </tr>\n    <tr>\n      <th>salesforce.com</th>\n      <td>269408</td>\n      <td>268497</td>\n      <td>55</td>\n      <td>0.012291</td>\n      <td>0.012320</td>\n    </tr>\n    <tr>\n      <th>ca.gov</th>\n      <td>268009</td>\n      <td>266253</td>\n      <td>1132</td>\n      <td>0.012227</td>\n      <td>0.012217</td>\n    </tr>\n    <tr>\n      <th>ubc.ca</th>\n      <td>267395</td>\n      <td>266896</td>\n      <td>1574</td>\n      <td>0.012199</td>\n      <td>0.012246</td>\n    </tr>\n    <tr>\n      <th>rambler.ru</th>\n      <td>266885</td>\n      <td>266183</td>\n      <td>38</td>\n      <td>0.012176</td>\n      <td>0.012213</td>\n    </tr>\n    <tr>\n      <th>atlassian.net</th>\n      <td>265955</td>\n      <td>265004</td>\n      <td>5761</td>\n      <td>0.012133</td>\n      <td>0.012159</td>\n    </tr>\n    <tr>\n      <th>banggood.com</th>\n      <td>265607</td>\n      <td>265440</td>\n      <td>54</td>\n      <td>0.012117</td>\n      <td>0.012179</td>\n    </tr>\n    <tr>\n      <th>amazon.com</th>\n      <td>262154</td>\n      <td>254349</td>\n      <td>97</td>\n      <td>0.011960</td>\n      <td>0.011670</td>\n    </tr>\n    <tr>\n      <th>rbc.ru</th>\n      <td>261968</td>\n      <td>261621</td>\n      <td>102</td>\n      <td>0.011951</td>\n      <td>0.012004</td>\n    </tr>\n    
<tr>\n      <th>sohu.com</th>\n      <td>255494</td>\n      <td>255007</td>\n      <td>183</td>\n      <td>0.011656</td>\n      <td>0.011701</td>\n    </tr>\n    <tr>\n      <th>mathworks.com</th>\n      <td>255103</td>\n      <td>254225</td>\n      <td>29</td>\n      <td>0.011638</td>\n      <td>0.011665</td>\n    </tr>\n    <tr>\n      <th>163.com</th>\n      <td>250397</td>\n      <td>250030</td>\n      <td>535</td>\n      <td>0.011424</td>\n      <td>0.011472</td>\n    </tr>\n    <tr>\n      <th>tistory.com</th>\n      <td>249860</td>\n      <td>249825</td>\n      <td>2548</td>\n      <td>0.011399</td>\n      <td>0.011463</td>\n    </tr>\n    <tr>\n      <th>blog.jp</th>\n      <td>246779</td>\n      <td>246663</td>\n      <td>1932</td>\n      <td>0.011258</td>\n      <td>0.011318</td>\n    </tr>\n    <tr>\n      <th>muni.cz</th>\n      <td>241737</td>\n      <td>241405</td>\n      <td>562</td>\n      <td>0.011028</td>\n      <td>0.011077</td>\n    </tr>\n    <tr>\n      <th>craigslist.org</th>\n      <td>240073</td>\n      <td>239862</td>\n      <td>665</td>\n      <td>0.010953</td>\n      <td>0.011006</td>\n    </tr>\n    <tr>\n      <th>utoronto.ca</th>\n      <td>239646</td>\n      <td>239166</td>\n      <td>974</td>\n      <td>0.010933</td>\n      <td>0.010974</td>\n    </tr>\n    <tr>\n      <th>samsung.com</th>\n      <td>235545</td>\n      <td>233412</td>\n      <td>61</td>\n      <td>0.010746</td>\n      <td>0.010710</td>\n    </tr>\n    <tr>\n      <th>illinois.edu</th>\n      <td>234987</td>\n      <td>234471</td>\n      <td>1694</td>\n      <td>0.010721</td>\n      <td>0.010758</td>\n    </tr>\n    <tr>\n      <th>ndl.go.jp</th>\n      <td>233653</td>\n      <td>233325</td>\n      <td>20</td>\n      <td>0.010660</td>\n      <td>0.010706</td>\n    </tr>\n    <tr>\n      <th>cocolog-nifty.com</th>\n      <td>226030</td>\n      <td>225755</td>\n      <td>1703</td>\n      <td>0.010312</td>\n      <td>0.010358</td>\n    </tr>\n    <tr>\n      
<th>iheart.com</th>\n      <td>225832</td>\n      <td>225418</td>\n      <td>964</td>\n      <td>0.010303</td>\n      <td>0.010343</td>\n    </tr>\n    <tr>\n      <th>mpg.de</th>\n      <td>224016</td>\n      <td>223428</td>\n      <td>530</td>\n      <td>0.010220</td>\n      <td>0.010252</td>\n    </tr>\n    <tr>\n      <th>opera.com</th>\n      <td>223863</td>\n      <td>222098</td>\n      <td>28</td>\n      <td>0.010213</td>\n      <td>0.010191</td>\n    </tr>\n    <tr>\n      <th>admin.ch</th>\n      <td>223528</td>\n      <td>208997</td>\n      <td>327</td>\n      <td>0.010198</td>\n      <td>0.009590</td>\n    </tr>\n    <tr>\n      <th>appspot.com</th>\n      <td>222624</td>\n      <td>221182</td>\n      <td>1157</td>\n      <td>0.010156</td>\n      <td>0.010149</td>\n    </tr>\n    <tr>\n      <th>ubuntu.com</th>\n      <td>222331</td>\n      <td>221559</td>\n      <td>142</td>\n      <td>0.010143</td>\n      <td>0.010166</td>\n    </tr>\n    <tr>\n      <th>harvard.edu</th>\n      <td>222222</td>\n      <td>221063</td>\n      <td>754</td>\n      <td>0.010138</td>\n      <td>0.010143</td>\n    </tr>\n    <tr>\n      <th>upenn.edu</th>\n      <td>220443</td>\n      <td>219800</td>\n      <td>677</td>\n      <td>0.010057</td>\n      <td>0.010085</td>\n    </tr>\n    <tr>\n      <th>freelancer.com</th>\n      <td>220217</td>\n      <td>220088</td>\n      <td>9</td>\n      <td>0.010047</td>\n      <td>0.010098</td>\n    </tr>\n    <tr>\n      <th>shopify.com</th>\n      <td>218276</td>\n      <td>215408</td>\n      <td>20</td>\n      <td>0.009958</td>\n      <td>0.009884</td>\n    </tr>\n    <tr>\n      <th>archive.org</th>\n      <td>215667</td>\n      <td>192970</td>\n      <td>796</td>\n      <td>0.009839</td>\n      <td>0.008854</td>\n    </tr>\n    <tr>\n      <th>ibm.com</th>\n      <td>215131</td>\n      <td>213151</td>\n      <td>104</td>\n      <td>0.009815</td>\n      <td>0.009780</td>\n    </tr>\n    <tr>\n      <th>over-blog.com</th>\n      
<td>214758</td>\n      <td>214277</td>\n      <td>1719</td>\n      <td>0.009798</td>\n      <td>0.009832</td>\n    </tr>\n    <tr>\n      <th>af.mil</th>\n      <td>212886</td>\n      <td>212703</td>\n      <td>335</td>\n      <td>0.009712</td>\n      <td>0.009760</td>\n    </tr>\n    <tr>\n      <th>porsche.com</th>\n      <td>212521</td>\n      <td>211280</td>\n      <td>161</td>\n      <td>0.009696</td>\n      <td>0.009694</td>\n    </tr>\n    <tr>\n      <th>canalblog.com</th>\n      <td>210869</td>\n      <td>210328</td>\n      <td>1559</td>\n      <td>0.009620</td>\n      <td>0.009651</td>\n    </tr>\n    <tr>\n      <th>afternic.com</th>\n      <td>208966</td>\n      <td>199302</td>\n      <td>5</td>\n      <td>0.009533</td>\n      <td>0.009145</td>\n    </tr>\n    <tr>\n      <th>hotels.com</th>\n      <td>208779</td>\n      <td>208407</td>\n      <td>35</td>\n      <td>0.009525</td>\n      <td>0.009562</td>\n    </tr>\n    <tr>\n      <th>sap.com</th>\n      <td>208262</td>\n      <td>194884</td>\n      <td>48</td>\n      <td>0.009501</td>\n      <td>0.008942</td>\n    </tr>\n    <tr>\n      <th>krakow.pl</th>\n      <td>207082</td>\n      <td>206315</td>\n      <td>1214</td>\n      <td>0.009447</td>\n      <td>0.009466</td>\n    </tr>\n    <tr>\n      <th>hatenablog.jp</th>\n      <td>204606</td>\n      <td>204559</td>\n      <td>2555</td>\n      <td>0.009334</td>\n      <td>0.009386</td>\n    </tr>\n    <tr>\n      <th>usu.edu</th>\n      <td>201493</td>\n      <td>199714</td>\n      <td>84</td>\n      <td>0.009192</td>\n      <td>0.009164</td>\n    </tr>\n    <tr>\n      <th>cuni.cz</th>\n      <td>200724</td>\n      <td>199935</td>\n      <td>754</td>\n      <td>0.009157</td>\n      <td>0.009174</td>\n    </tr>\n    <tr>\n      <th>uk.com</th>\n      <td>200178</td>\n      <td>192398</td>\n      <td>5221</td>\n      <td>0.009132</td>\n      <td>0.008828</td>\n    </tr>\n    <tr>\n      <th>cloudfront.net</th>\n      <td>199005</td>\n      
<td>198042</td>\n      <td>1858</td>\n      <td>0.009079</td>\n      <td>0.009087</td>\n    </tr>\n    <tr>\n      <th>gov.ru</th>\n      <td>198296</td>\n      <td>197315</td>\n      <td>470</td>\n      <td>0.009047</td>\n      <td>0.009053</td>\n    </tr>\n    <tr>\n      <th>redhat.com</th>\n      <td>197152</td>\n      <td>195886</td>\n      <td>46</td>\n      <td>0.008994</td>\n      <td>0.008988</td>\n    </tr>\n    <tr>\n      <th>android.com</th>\n      <td>195412</td>\n      <td>189952</td>\n      <td>11</td>\n      <td>0.008915</td>\n      <td>0.008716</td>\n    </tr>\n    <tr>\n      <th>cam.ac.uk</th>\n      <td>194780</td>\n      <td>193856</td>\n      <td>846</td>\n      <td>0.008886</td>\n      <td>0.008895</td>\n    </tr>\n    <tr>\n      <th>usgs.gov</th>\n      <td>189866</td>\n      <td>189464</td>\n      <td>101</td>\n      <td>0.008662</td>\n      <td>0.008693</td>\n    </tr>\n    <tr>\n      <th>workplace.com</th>\n      <td>188902</td>\n      <td>188760</td>\n      <td>291</td>\n      <td>0.008618</td>\n      <td>0.008661</td>\n    </tr>\n    <tr>\n      <th>psu.edu</th>\n      <td>186946</td>\n      <td>183515</td>\n      <td>575</td>\n      <td>0.008529</td>\n      <td>0.008420</td>\n    </tr>\n    <tr>\n      <th>bibliocommons.com</th>\n      <td>186576</td>\n      <td>186181</td>\n      <td>335</td>\n      <td>0.008512</td>\n      <td>0.008543</td>\n    </tr>\n    <tr>\n      <th>bnf.fr</th>\n      <td>177176</td>\n      <td>177018</td>\n      <td>50</td>\n      <td>0.008083</td>\n      <td>0.008122</td>\n    </tr>\n    <tr>\n      <th>onet.pl</th>\n      <td>176630</td>\n      <td>175822</td>\n      <td>47</td>\n      <td>0.008058</td>\n      <td>0.008067</td>\n    </tr>\n    <tr>\n      <th>fedoraproject.org</th>\n      <td>176020</td>\n      <td>175738</td>\n      <td>73</td>\n      <td>0.008030</td>\n      <td>0.008063</td>\n    </tr>\n    <tr>\n      <th>nist.gov</th>\n      <td>175987</td>\n      <td>175364</td>\n      <td>88</td>\n 
     <td>0.008029</td>\n      <td>0.008046</td>\n    </tr>\n    <tr>\n      <th>un.org</th>\n      <td>175817</td>\n      <td>175067</td>\n      <td>242</td>\n      <td>0.008021</td>\n      <td>0.008033</td>\n    </tr>\n    <tr>\n      <th>hindustantimes.com</th>\n      <td>175558</td>\n      <td>174920</td>\n      <td>14</td>\n      <td>0.008009</td>\n      <td>0.008026</td>\n    </tr>\n    <tr>\n      <th>washington.edu</th>\n      <td>174322</td>\n      <td>173261</td>\n      <td>378</td>\n      <td>0.007953</td>\n      <td>0.007950</td>\n    </tr>\n    <tr>\n      <th>itmedia.co.jp</th>\n      <td>171201</td>\n      <td>170201</td>\n      <td>39</td>\n      <td>0.007810</td>\n      <td>0.007809</td>\n    </tr>\n    <tr>\n      <th>org.ru</th>\n      <td>169636</td>\n      <td>164916</td>\n      <td>466</td>\n      <td>0.007739</td>\n      <td>0.007567</td>\n    </tr>\n    <tr>\n      <th>princeton.edu</th>\n      <td>169054</td>\n      <td>167003</td>\n      <td>520</td>\n      <td>0.007713</td>\n      <td>0.007663</td>\n    </tr>\n    <tr>\n      <th>ub.edu</th>\n      <td>168922</td>\n      <td>164590</td>\n      <td>110</td>\n      <td>0.007707</td>\n      <td>0.007552</td>\n    </tr>\n    <tr>\n      <th>kayak.com</th>\n      <td>168854</td>\n      <td>168793</td>\n      <td>17</td>\n      <td>0.007703</td>\n      <td>0.007745</td>\n    </tr>\n    <tr>\n      <th>narod.ru</th>\n      <td>168468</td>\n      <td>168414</td>\n      <td>10483</td>\n      <td>0.007686</td>\n      <td>0.007727</td>\n    </tr>\n    <tr>\n      <th>kremlin.ru</th>\n      <td>166712</td>\n      <td>165787</td>\n      <td>24</td>\n      <td>0.007606</td>\n      <td>0.007607</td>\n    </tr>\n    <tr>\n      <th>ntu.edu.tw</th>\n      <td>164907</td>\n      <td>164569</td>\n      <td>519</td>\n      <td>0.007523</td>\n      <td>0.007551</td>\n    </tr>\n    <tr>\n      <th>seesaa.net</th>\n      <td>161429</td>\n      <td>160284</td>\n      <td>1984</td>\n      <td>0.007365</td>\n      
<td>0.007354</td>\n    </tr>\n    <tr>\n      <th>foursquare.com</th>\n      <td>161125</td>\n      <td>160997</td>\n      <td>21</td>\n      <td>0.007351</td>\n      <td>0.007387</td>\n    </tr>\n    <tr>\n      <th>docomo.ne.jp</th>\n      <td>156735</td>\n      <td>156026</td>\n      <td>88</td>\n      <td>0.007151</td>\n      <td>0.007159</td>\n    </tr>\n    <tr>\n      <th>archlinux.org</th>\n      <td>156131</td>\n      <td>155779</td>\n      <td>22</td>\n      <td>0.007123</td>\n      <td>0.007148</td>\n    </tr>\n    <tr>\n      <th>uefa.com</th>\n      <td>153249</td>\n      <td>152266</td>\n      <td>25</td>\n      <td>0.006991</td>\n      <td>0.006986</td>\n    </tr>\n    <tr>\n      <th>hatena.ne.jp</th>\n      <td>152722</td>\n      <td>148800</td>\n      <td>27</td>\n      <td>0.006967</td>\n      <td>0.006827</td>\n    </tr>\n    <tr>\n      <th>hypotheses.org</th>\n      <td>152269</td>\n      <td>152147</td>\n      <td>1666</td>\n      <td>0.006947</td>\n      <td>0.006981</td>\n    </tr>\n    <tr>\n      <th>yorku.ca</th>\n      <td>149121</td>\n      <td>148429</td>\n      <td>479</td>\n      <td>0.006803</td>\n      <td>0.006810</td>\n    </tr>\n    <tr>\n      <th>pchome.com.tw</th>\n      <td>148643</td>\n      <td>148497</td>\n      <td>18</td>\n      <td>0.006781</td>\n      <td>0.006814</td>\n    </tr>\n    <tr>\n      <th>army.mil</th>\n      <td>148389</td>\n      <td>147521</td>\n      <td>280</td>\n      <td>0.006770</td>\n      <td>0.006769</td>\n    </tr>\n    <tr>\n      <th>uni-heidelberg.de</th>\n      <td>147395</td>\n      <td>144396</td>\n      <td>302</td>\n      <td>0.006724</td>\n      <td>0.006625</td>\n    </tr>\n    <tr>\n      <th>wikiquote.org</th>\n      <td>146925</td>\n      <td>143298</td>\n      <td>100</td>\n      <td>0.006703</td>\n      <td>0.006575</td>\n    </tr>\n    <tr>\n      <th>umn.edu</th>\n      <td>146463</td>\n      <td>145864</td>\n      <td>1124</td>\n      <td>0.006682</td>\n      
<td>0.006693</td>\n    </tr>\n    <tr>\n      <th>intuit.com</th>\n      <td>145094</td>\n      <td>144701</td>\n      <td>85</td>\n      <td>0.006619</td>\n      <td>0.006639</td>\n    </tr>\n    <tr>\n      <th>arizona.edu</th>\n      <td>145014</td>\n      <td>142369</td>\n      <td>1228</td>\n      <td>0.006616</td>\n      <td>0.006532</td>\n    </tr>\n    <tr>\n      <th>jd.com</th>\n      <td>145013</td>\n      <td>144488</td>\n      <td>2329</td>\n      <td>0.006616</td>\n      <td>0.006630</td>\n    </tr>\n    <tr>\n      <th>ru-land.com</th>\n      <td>142630</td>\n      <td>142396</td>\n      <td>12</td>\n      <td>0.006507</td>\n      <td>0.006534</td>\n    </tr>\n    <tr>\n      <th>elpais.com</th>\n      <td>142370</td>\n      <td>140938</td>\n      <td>29</td>\n      <td>0.006495</td>\n      <td>0.006467</td>\n    </tr>\n    <tr>\n      <th>wikibooks.org</th>\n      <td>142004</td>\n      <td>139294</td>\n      <td>122</td>\n      <td>0.006478</td>\n      <td>0.006391</td>\n    </tr>\n    <tr>\n      <th>sapo.pt</th>\n      <td>141847</td>\n      <td>140980</td>\n      <td>93</td>\n      <td>0.006471</td>\n      <td>0.006469</td>\n    </tr>\n    <tr>\n      <th>chinadaily.com.cn</th>\n      <td>141828</td>\n      <td>141637</td>\n      <td>109</td>\n      <td>0.006470</td>\n      <td>0.006499</td>\n    </tr>\n    <tr>\n      <th>livejournal.com</th>\n      <td>141161</td>\n      <td>141156</td>\n      <td>1953</td>\n      <td>0.006440</td>\n      <td>0.006477</td>\n    </tr>\n    <tr>\n      <th>obozrevatel.com</th>\n      <td>141062</td>\n      <td>140643</td>\n      <td>28</td>\n      <td>0.006435</td>\n      <td>0.006453</td>\n    </tr>\n    <tr>\n      <th>hse.ru</th>\n      <td>139830</td>\n      <td>137442</td>\n      <td>479</td>\n      <td>0.006379</td>\n      <td>0.006306</td>\n    </tr>\n    <tr>\n      <th>nicovideo.jp</th>\n      <td>139786</td>\n      <td>139610</td>\n      <td>35</td>\n      <td>0.006377</td>\n      <td>0.006406</td>\n   
 </tr>\n    <tr>\n      <th>unibo.it</th>\n      <td>139536</td>\n      <td>138716</td>\n      <td>315</td>\n      <td>0.006366</td>\n      <td>0.006365</td>\n    </tr>\n    <tr>\n      <th>hateblo.jp</th>\n      <td>139234</td>\n      <td>139210</td>\n      <td>1647</td>\n      <td>0.006352</td>\n      <td>0.006387</td>\n    </tr>\n    <tr>\n      <th>globalvoices.org</th>\n      <td>138602</td>\n      <td>137090</td>\n      <td>71</td>\n      <td>0.006323</td>\n      <td>0.006290</td>\n    </tr>\n    <tr>\n      <th>utexas.edu</th>\n      <td>138577</td>\n      <td>138172</td>\n      <td>648</td>\n      <td>0.006322</td>\n      <td>0.006340</td>\n    </tr>\n    <tr>\n      <th>ceskatelevize.cz</th>\n      <td>138431</td>\n      <td>137890</td>\n      <td>17</td>\n      <td>0.006315</td>\n      <td>0.006327</td>\n    </tr>\n    <tr>\n      <th>wikinews.org</th>\n      <td>137732</td>\n      <td>135089</td>\n      <td>36</td>\n      <td>0.006284</td>\n      <td>0.006198</td>\n    </tr>\n    <tr>\n      <th>cern.ch</th>\n      <td>137615</td>\n      <td>137484</td>\n      <td>405</td>\n      <td>0.006278</td>\n      <td>0.006308</td>\n    </tr>\n    <tr>\n      <th>err.ee</th>\n      <td>137407</td>\n      <td>136960</td>\n      <td>27</td>\n      <td>0.006269</td>\n      <td>0.006284</td>\n    </tr>\n    <tr>\n      <th>google.cn</th>\n      <td>136705</td>\n      <td>133699</td>\n      <td>27</td>\n      <td>0.006237</td>\n      <td>0.006135</td>\n    </tr>\n    <tr>\n      <th>freebsd.org</th>\n      <td>136369</td>\n      <td>136163</td>\n      <td>90</td>\n      <td>0.006221</td>\n      <td>0.006248</td>\n    </tr>\n    <tr>\n      <th>elespanol.com</th>\n      <td>135672</td>\n      <td>135266</td>\n      <td>13</td>\n      <td>0.006190</td>\n      <td>0.006206</td>\n    </tr>\n    <tr>\n      <th>texas.gov</th>\n      <td>135595</td>\n      <td>134955</td>\n      <td>268</td>\n      <td>0.006186</td>\n      <td>0.006192</td>\n    </tr>\n    <tr>\n      
<th>ufsc.br</th>\n      <td>134827</td>\n      <td>132890</td>\n      <td>1690</td>\n      <td>0.006151</td>\n      <td>0.006097</td>\n    </tr>\n    <tr>\n      <th>aliyun.com</th>\n      <td>134706</td>\n      <td>132697</td>\n      <td>118</td>\n      <td>0.006146</td>\n      <td>0.006089</td>\n    </tr>\n    <tr>\n      <th>livedoor.biz</th>\n      <td>134433</td>\n      <td>134377</td>\n      <td>650</td>\n      <td>0.006133</td>\n      <td>0.006166</td>\n    </tr>\n    <tr>\n      <th>hawaii.edu</th>\n      <td>133777</td>\n      <td>133466</td>\n      <td>309</td>\n      <td>0.006103</td>\n      <td>0.006124</td>\n    </tr>\n    <tr>\n      <th>wix.com</th>\n      <td>133645</td>\n      <td>131864</td>\n      <td>40</td>\n      <td>0.006097</td>\n      <td>0.006050</td>\n    </tr>\n    <tr>\n      <th>podbean.com</th>\n      <td>132784</td>\n      <td>132449</td>\n      <td>18246</td>\n      <td>0.006058</td>\n      <td>0.006077</td>\n    </tr>\n    <tr>\n      <th>apache.org</th>\n      <td>132197</td>\n      <td>131781</td>\n      <td>359</td>\n      <td>0.006031</td>\n      <td>0.006047</td>\n    </tr>\n    <tr>\n      <th>academic.ru</th>\n      <td>132021</td>\n      <td>131925</td>\n      <td>1051</td>\n      <td>0.006023</td>\n      <td>0.006053</td>\n    </tr>\n    <tr>\n      <th>shop-pro.jp</th>\n      <td>131396</td>\n      <td>131069</td>\n      <td>3498</td>\n      <td>0.005995</td>\n      <td>0.006014</td>\n    </tr>\n    <tr>\n      <th>hugedomains.com</th>\n      <td>129845</td>\n      <td>113843</td>\n      <td>1</td>\n      <td>0.005924</td>\n      <td>0.005224</td>\n    </tr>\n    <tr>\n      <th>purdue.edu</th>\n      <td>129663</td>\n      <td>129124</td>\n      <td>232</td>\n      <td>0.005915</td>\n      <td>0.005925</td>\n    </tr>\n    <tr>\n      <th>teachable.com</th>\n      <td>129623</td>\n      <td>129400</td>\n      <td>4337</td>\n      <td>0.005914</td>\n      <td>0.005937</td>\n    </tr>\n    <tr>\n      
<th>frontiersin.org</th>\n      <td>129433</td>\n      <td>129202</td>\n      <td>13</td>\n      <td>0.005905</td>\n      <td>0.005928</td>\n    </tr>\n    <tr>\n      <th>walla.co.il</th>\n      <td>129330</td>\n      <td>129190</td>\n      <td>156</td>\n      <td>0.005900</td>\n      <td>0.005928</td>\n    </tr>\n    <tr>\n      <th>univie.ac.at</th>\n      <td>129252</td>\n      <td>128921</td>\n      <td>1235</td>\n      <td>0.005897</td>\n      <td>0.005915</td>\n    </tr>\n    <tr>\n      <th>libretexts.org</th>\n      <td>129195</td>\n      <td>127985</td>\n      <td>35</td>\n      <td>0.005894</td>\n      <td>0.005872</td>\n    </tr>\n    <tr>\n      <th>kb.se</th>\n      <td>129119</td>\n      <td>126491</td>\n      <td>42</td>\n      <td>0.005891</td>\n      <td>0.005804</td>\n    </tr>\n    <tr>\n      <th>iu.edu</th>\n      <td>128288</td>\n      <td>127998</td>\n      <td>595</td>\n      <td>0.005853</td>\n      <td>0.005873</td>\n    </tr>\n    <tr>\n      <th>siemens.com</th>\n      <td>127994</td>\n      <td>125548</td>\n      <td>82</td>\n      <td>0.005839</td>\n      <td>0.005761</td>\n    </tr>\n    <tr>\n      <th>wa.gov</th>\n      <td>127816</td>\n      <td>126643</td>\n      <td>286</td>\n      <td>0.005831</td>\n      <td>0.005811</td>\n    </tr>\n    <tr>\n      <th>dict.cc</th>\n      <td>127624</td>\n      <td>127531</td>\n      <td>202</td>\n      <td>0.005822</td>\n      <td>0.005852</td>\n    </tr>\n    <tr>\n      <th>spotify.com</th>\n      <td>127561</td>\n      <td>127167</td>\n      <td>29</td>\n      <td>0.005820</td>\n      <td>0.005835</td>\n    </tr>\n    <tr>\n      <th>azurewebsites.net</th>\n      <td>126146</td>\n      <td>125642</td>\n      <td>4420</td>\n      <td>0.005755</td>\n      <td>0.005765</td>\n    </tr>\n    <tr>\n      <th>t.me</th>\n      <td>125871</td>\n      <td>124106</td>\n      <td>2</td>\n      <td>0.005742</td>\n      <td>0.005694</td>\n    </tr>\n    <tr>\n      <th>chinaz.com</th>\n      
<td>125759</td>\n      <td>124914</td>\n      <td>61</td>\n      <td>0.005737</td>\n      <td>0.005731</td>\n    </tr>\n    <tr>\n      <th>msu.edu</th>\n      <td>125347</td>\n      <td>124969</td>\n      <td>744</td>\n      <td>0.005719</td>\n      <td>0.005734</td>\n    </tr>\n    <tr>\n      <th>iastate.edu</th>\n      <td>125018</td>\n      <td>124833</td>\n      <td>582</td>\n      <td>0.005704</td>\n      <td>0.005728</td>\n    </tr>\n    <tr>\n      <th>interfax.com.ua</th>\n      <td>124866</td>\n      <td>115330</td>\n      <td>4</td>\n      <td>0.005697</td>\n      <td>0.005292</td>\n    </tr>\n    <tr>\n      <th>ria.ru</th>\n      <td>124501</td>\n      <td>123247</td>\n      <td>28</td>\n      <td>0.005680</td>\n      <td>0.005655</td>\n    </tr>\n    <tr>\n      <th>ethz.ch</th>\n      <td>124381</td>\n      <td>123738</td>\n      <td>632</td>\n      <td>0.005674</td>\n      <td>0.005678</td>\n    </tr>\n    <tr>\n      <th>canada.ca</th>\n      <td>124356</td>\n      <td>122994</td>\n      <td>162</td>\n      <td>0.005673</td>\n      <td>0.005643</td>\n    </tr>\n    <tr>\n      <th>tradingview.com</th>\n      <td>124105</td>\n      <td>124045</td>\n      <td>21</td>\n      <td>0.005662</td>\n      <td>0.005692</td>\n    </tr>\n    <tr>\n      <th>people.com.cn</th>\n      <td>123758</td>\n      <td>123725</td>\n      <td>144</td>\n      <td>0.005646</td>\n      <td>0.005677</td>\n    </tr>\n    <tr>\n      <th>telegram.org</th>\n      <td>123527</td>\n      <td>121721</td>\n      <td>19</td>\n      <td>0.005636</td>\n      <td>0.005585</td>\n    </tr>\n    <tr>\n      <th>uscourts.gov</th>\n      <td>123424</td>\n      <td>123310</td>\n      <td>570</td>\n      <td>0.005631</td>\n      <td>0.005658</td>\n    </tr>\n    <tr>\n      <th>hu-berlin.de</th>\n      <td>122930</td>\n      <td>122309</td>\n      <td>235</td>\n      <td>0.005608</td>\n      <td>0.005612</td>\n    </tr>\n    <tr>\n      <th>sch.gr</th>\n      <td>121349</td>\n      
<td>121157</td>\n      <td>937</td>\n      <td>0.005536</td>\n      <td>0.005559</td>\n    </tr>\n    <tr>\n      <th>ufl.edu</th>\n      <td>120992</td>\n      <td>120127</td>\n      <td>1019</td>\n      <td>0.005520</td>\n      <td>0.005512</td>\n    </tr>\n    <tr>\n      <th>kit.edu</th>\n      <td>120801</td>\n      <td>120495</td>\n      <td>653</td>\n      <td>0.005511</td>\n      <td>0.005529</td>\n    </tr>\n    <tr>\n      <th>iol.pt</th>\n      <td>120231</td>\n      <td>119962</td>\n      <td>17</td>\n      <td>0.005485</td>\n      <td>0.005504</td>\n    </tr>\n    <tr>\n      <th>columbia.edu</th>\n      <td>120174</td>\n      <td>119803</td>\n      <td>478</td>\n      <td>0.005483</td>\n      <td>0.005497</td>\n    </tr>\n    <tr>\n      <th>victoriassecret.com</th>\n      <td>120050</td>\n      <td>100454</td>\n      <td>17</td>\n      <td>0.005477</td>\n      <td>0.004609</td>\n    </tr>\n    <tr>\n      <th>statcounter.com</th>\n      <td>119793</td>\n      <td>110030</td>\n      <td>73</td>\n      <td>0.005465</td>\n      <td>0.005049</td>\n    </tr>\n    <tr>\n      <th>weblio.jp</th>\n      <td>119737</td>\n      <td>119689</td>\n      <td>26</td>\n      <td>0.005463</td>\n      <td>0.005492</td>\n    </tr>\n    <tr>\n      <th>msu.ru</th>\n      <td>119653</td>\n      <td>119386</td>\n      <td>508</td>\n      <td>0.005459</td>\n      <td>0.005478</td>\n    </tr>\n    <tr>\n      <th>poznan.pl</th>\n      <td>119436</td>\n      <td>119157</td>\n      <td>711</td>\n      <td>0.005449</td>\n      <td>0.005467</td>\n    </tr>\n    <tr>\n      <th>nt.gov.au</th>\n      <td>118748</td>\n      <td>118444</td>\n      <td>55</td>\n      <td>0.005417</td>\n      <td>0.005435</td>\n    </tr>\n    <tr>\n      <th>rutgers.edu</th>\n      <td>118701</td>\n      <td>118341</td>\n      <td>1005</td>\n      <td>0.005415</td>\n      <td>0.005430</td>\n    </tr>\n    <tr>\n      <th>gouv.qc.ca</th>\n      <td>117229</td>\n      <td>116932</td>\n      
<td>976</td>\n      <td>0.005348</td>\n      <td>0.005365</td>\n    </tr>\n    <tr>\n      <th>vk.com</th>\n      <td>117035</td>\n      <td>116270</td>\n      <td>33</td>\n      <td>0.005339</td>\n      <td>0.005335</td>\n    </tr>\n    <tr>\n      <th>uab.cat</th>\n      <td>116909</td>\n      <td>116417</td>\n      <td>121</td>\n      <td>0.005334</td>\n      <td>0.005342</td>\n    </tr>\n    <tr>\n      <th>blog.hu</th>\n      <td>116747</td>\n      <td>116747</td>\n      <td>956</td>\n      <td>0.005326</td>\n      <td>0.005357</td>\n    </tr>\n    <tr>\n      <th>unlp.edu.ar</th>\n      <td>116443</td>\n      <td>116319</td>\n      <td>382</td>\n      <td>0.005312</td>\n      <td>0.005337</td>\n    </tr>\n    <tr>\n      <th>ucsb.edu</th>\n      <td>115924</td>\n      <td>115821</td>\n      <td>800</td>\n      <td>0.005289</td>\n      <td>0.005314</td>\n    </tr>\n    <tr>\n      <th>gva.es</th>\n      <td>114833</td>\n      <td>110420</td>\n      <td>218</td>\n      <td>0.005239</td>\n      <td>0.005066</td>\n    </tr>\n    <tr>\n      <th>ucla.edu</th>\n      <td>114537</td>\n      <td>114302</td>\n      <td>1042</td>\n      <td>0.005225</td>\n      <td>0.005245</td>\n    </tr>\n    <tr>\n      <th>buzzsprout.com</th>\n      <td>114484</td>\n      <td>114206</td>\n      <td>7247</td>\n      <td>0.005223</td>\n      <td>0.005240</td>\n    </tr>\n    <tr>\n      <th>trip.com</th>\n      <td>114407</td>\n      <td>114222</td>\n      <td>47</td>\n      <td>0.005219</td>\n      <td>0.005241</td>\n    </tr>\n    <tr>\n      <th>hp.com</th>\n      <td>114200</td>\n      <td>111980</td>\n      <td>74</td>\n      <td>0.005210</td>\n      <td>0.005138</td>\n    </tr>\n    <tr>\n      <th>st-andrews.ac.uk</th>\n      <td>114184</td>\n      <td>113488</td>\n      <td>400</td>\n      <td>0.005209</td>\n      <td>0.005207</td>\n    </tr>\n    <tr>\n      <th>umd.edu</th>\n      <td>113950</td>\n      <td>113627</td>\n      <td>735</td>\n      <td>0.005199</td>\n      
<td>0.005214</td>\n    </tr>\n    <tr>\n      <th>anu.edu.au</th>\n      <td>113510</td>\n      <td>112459</td>\n      <td>201</td>\n      <td>0.005179</td>\n      <td>0.005160</td>\n    </tr>\n    <tr>\n      <th>ugr.es</th>\n      <td>113389</td>\n      <td>112617</td>\n      <td>520</td>\n      <td>0.005173</td>\n      <td>0.005167</td>\n    </tr>\n    <tr>\n      <th>com.ru</th>\n      <td>113388</td>\n      <td>113118</td>\n      <td>1253</td>\n      <td>0.005173</td>\n      <td>0.005190</td>\n    </tr>\n    <tr>\n      <th>go.com</th>\n      <td>112631</td>\n      <td>112135</td>\n      <td>27</td>\n      <td>0.005138</td>\n      <td>0.005145</td>\n    </tr>\n    <tr>\n      <th>service.gov.uk</th>\n      <td>112505</td>\n      <td>112048</td>\n      <td>157</td>\n      <td>0.005133</td>\n      <td>0.005141</td>\n    </tr>\n    <tr>\n      <th>cuny.edu</th>\n      <td>112467</td>\n      <td>111833</td>\n      <td>372</td>\n      <td>0.005131</td>\n      <td>0.005131</td>\n    </tr>\n    <tr>\n      <th>vecteezy.com</th>\n      <td>111934</td>\n      <td>111508</td>\n      <td>10</td>\n      <td>0.005107</td>\n      <td>0.005116</td>\n    </tr>\n    <tr>\n      <th>colorado.edu</th>\n      <td>111630</td>\n      <td>111443</td>\n      <td>145</td>\n      <td>0.005093</td>\n      <td>0.005113</td>\n    </tr>\n    <tr>\n      <th>msk.ru</th>\n      <td>111016</td>\n      <td>110904</td>\n      <td>852</td>\n      <td>0.005065</td>\n      <td>0.005089</td>\n    </tr>\n    <tr>\n      <th>finalsite.net</th>\n      <td>110857</td>\n      <td>106064</td>\n      <td>1</td>\n      <td>0.005057</td>\n      <td>0.004867</td>\n    </tr>\n    <tr>\n      <th>garmin.com</th>\n      <td>110855</td>\n      <td>108967</td>\n      <td>37</td>\n      <td>0.005057</td>\n      <td>0.005000</td>\n    </tr>\n    <tr>\n      <th>ncsu.edu</th>\n      <td>110326</td>\n      <td>110126</td>\n      <td>480</td>\n      <td>0.005033</td>\n      <td>0.005053</td>\n    </tr>\n    <tr>\n     
 <th>cnr.it</th>\n      <td>110300</td>\n      <td>110180</td>\n      <td>679</td>\n      <td>0.005032</td>\n      <td>0.005055</td>\n    </tr>\n    <tr>\n      <th>antaranews.com</th>\n      <td>109552</td>\n      <td>109354</td>\n      <td>53</td>\n      <td>0.004998</td>\n      <td>0.005018</td>\n    </tr>\n    <tr>\n      <th>si.edu</th>\n      <td>109493</td>\n      <td>109368</td>\n      <td>92</td>\n      <td>0.004995</td>\n      <td>0.005018</td>\n    </tr>\n    <tr>\n      <th>twitch.tv</th>\n      <td>109346</td>\n      <td>109081</td>\n      <td>29</td>\n      <td>0.004989</td>\n      <td>0.005005</td>\n    </tr>\n    <tr>\n      <th>stripe.com</th>\n      <td>109324</td>\n      <td>104349</td>\n      <td>14</td>\n      <td>0.004988</td>\n      <td>0.004788</td>\n    </tr>\n    <tr>\n      <th>in.gov</th>\n      <td>109169</td>\n      <td>108470</td>\n      <td>227</td>\n      <td>0.004980</td>\n      <td>0.004977</td>\n    </tr>\n    <tr>\n      <th>atlassian.com</th>\n      <td>108972</td>\n      <td>107892</td>\n      <td>62</td>\n      <td>0.004971</td>\n      <td>0.004950</td>\n    </tr>\n    <tr>\n      <th>telegra.ph</th>\n      <td>108906</td>\n      <td>88750</td>\n      <td>1</td>\n      <td>0.004968</td>\n      <td>0.004072</td>\n    </tr>\n    <tr>\n      <th>indiana.edu</th>\n      <td>108667</td>\n      <td>108627</td>\n      <td>516</td>\n      <td>0.004958</td>\n      <td>0.004984</td>\n    </tr>\n    <tr>\n      <th>mynavi.jp</th>\n      <td>108355</td>\n      <td>104469</td>\n      <td>101</td>\n      <td>0.004943</td>\n      <td>0.004793</td>\n    </tr>\n    <tr>\n      <th>snu.ac.kr</th>\n      <td>108131</td>\n      <td>107998</td>\n      <td>641</td>\n      <td>0.004933</td>\n      <td>0.004955</td>\n    </tr>\n    <tr>\n      <th>senate.gov</th>\n      <td>108026</td>\n      <td>107174</td>\n      <td>143</td>\n      <td>0.004928</td>\n      <td>0.004918</td>\n    </tr>\n    <tr>\n      <th>uwaterloo.ca</th>\n      
<td>107902</td>\n      <td>107330</td>\n      <td>179</td>\n      <td>0.004923</td>\n      <td>0.004925</td>\n    </tr>\n    <tr>\n      <th>uni-tuebingen.de</th>\n      <td>107322</td>\n      <td>107073</td>\n      <td>158</td>\n      <td>0.004896</td>\n      <td>0.004913</td>\n    </tr>\n    <tr>\n      <th>wustl.edu</th>\n      <td>107214</td>\n      <td>106898</td>\n      <td>329</td>\n      <td>0.004891</td>\n      <td>0.004905</td>\n    </tr>\n    <tr>\n      <th>youtube-nocookie.com</th>\n      <td>107099</td>\n      <td>107097</td>\n      <td>2</td>\n      <td>0.004886</td>\n      <td>0.004914</td>\n    </tr>\n    <tr>\n      <th>diva-portal.org</th>\n      <td>107055</td>\n      <td>106975</td>\n      <td>59</td>\n      <td>0.004884</td>\n      <td>0.004908</td>\n    </tr>\n    <tr>\n      <th>temple.edu</th>\n      <td>106812</td>\n      <td>106619</td>\n      <td>142</td>\n      <td>0.004873</td>\n      <td>0.004892</td>\n    </tr>\n    <tr>\n      <th>fu-berlin.de</th>\n      <td>106807</td>\n      <td>106130</td>\n      <td>159</td>\n      <td>0.004873</td>\n      <td>0.004870</td>\n    </tr>\n    <tr>\n      <th>tfrrs.org</th>\n      <td>106528</td>\n      <td>106426</td>\n      <td>15</td>\n      <td>0.004860</td>\n      <td>0.004883</td>\n    </tr>\n    <tr>\n      <th>china.com</th>\n      <td>106380</td>\n      <td>106368</td>\n      <td>88</td>\n      <td>0.004853</td>\n      <td>0.004881</td>\n    </tr>\n    <tr>\n      <th>nrw.de</th>\n      <td>105906</td>\n      <td>105651</td>\n      <td>497</td>\n      <td>0.004832</td>\n      <td>0.004848</td>\n    </tr>\n    <tr>\n      <th>gta5-mods.com</th>\n      <td>105667</td>\n      <td>105666</td>\n      <td>29</td>\n      <td>0.004821</td>\n      <td>0.004848</td>\n    </tr>\n    <tr>\n      <th>icm.edu.pl</th>\n      <td>105520</td>\n      <td>105455</td>\n      <td>60</td>\n      <td>0.004814</td>\n      <td>0.004839</td>\n    </tr>\n    <tr>\n      <th>unsplash.com</th>\n      <td>105481</td>\n 
     <td>105329</td>\n      <td>5</td>\n      <td>0.004812</td>\n      <td>0.004833</td>\n    </tr>\n    <tr>\n      <th>mn.gov</th>\n      <td>105422</td>\n      <td>103707</td>\n      <td>99</td>\n      <td>0.004810</td>\n      <td>0.004758</td>\n    </tr>\n    <tr>\n      <th>uc.pt</th>\n      <td>105280</td>\n      <td>105161</td>\n      <td>217</td>\n      <td>0.004803</td>\n      <td>0.004825</td>\n    </tr>\n    <tr>\n      <th>as.com</th>\n      <td>105211</td>\n      <td>104799</td>\n      <td>16</td>\n      <td>0.004800</td>\n      <td>0.004809</td>\n    </tr>\n    <tr>\n      <th>semrush.com</th>\n      <td>104758</td>\n      <td>104554</td>\n      <td>27</td>\n      <td>0.004779</td>\n      <td>0.004797</td>\n    </tr>\n    <tr>\n      <th>ucm.es</th>\n      <td>104610</td>\n      <td>104499</td>\n      <td>129</td>\n      <td>0.004772</td>\n      <td>0.004795</td>\n    </tr>\n    <tr>\n      <th>uni-bonn.de</th>\n      <td>103889</td>\n      <td>103325</td>\n      <td>330</td>\n      <td>0.004740</td>\n      <td>0.004741</td>\n    </tr>\n    <tr>\n      <th>khanacademy.org</th>\n      <td>102880</td>\n      <td>102824</td>\n      <td>72</td>\n      <td>0.004694</td>\n      <td>0.004718</td>\n    </tr>\n    <tr>\n      <th>uchile.cl</th>\n      <td>102048</td>\n      <td>101328</td>\n      <td>439</td>\n      <td>0.004656</td>\n      <td>0.004649</td>\n    </tr>\n    <tr>\n      <th>uni-lj.si</th>\n      <td>101688</td>\n      <td>101468</td>\n      <td>295</td>\n      <td>0.004639</td>\n      <td>0.004656</td>\n    </tr>\n    <tr>\n      <th>playstation.com</th>\n      <td>100986</td>\n      <td>100545</td>\n      <td>27</td>\n      <td>0.004607</td>\n      <td>0.004613</td>\n    </tr>\n    <tr>\n      <th>www.gov.uk</th>\n      <td>100841</td>\n      <td>86913</td>\n      <td>1</td>\n      <td>0.004601</td>\n      <td>0.003988</td>\n    </tr>\n    <tr>\n      <th>tufts.edu</th>\n      <td>100834</td>\n      <td>100733</td>\n      <td>181</td>\n      
<td>0.004600</td>\n      <td>0.004622</td>\n    </tr>\n    <tr>\n      <th>vt.edu</th>\n      <td>100787</td>\n      <td>100512</td>\n      <td>724</td>\n      <td>0.004598</td>\n      <td>0.004612</td>\n    </tr>\n    <tr>\n      <th>espn.com</th>\n      <td>100310</td>\n      <td>100261</td>\n      <td>14</td>\n      <td>0.004576</td>\n      <td>0.004600</td>\n    </tr>\n    <tr>\n      <th>unb.br</th>\n      <td>99998</td>\n      <td>98047</td>\n      <td>518</td>\n      <td>0.004562</td>\n      <td>0.004499</td>\n    </tr>\n    <tr>\n      <th>legistar.com</th>\n      <td>99369</td>\n      <td>99178</td>\n      <td>301</td>\n      <td>0.004533</td>\n      <td>0.004551</td>\n    </tr>\n    <tr>\n      <th>tableau.com</th>\n      <td>99086</td>\n      <td>98757</td>\n      <td>25</td>\n      <td>0.004520</td>\n      <td>0.004531</td>\n    </tr>\n    <tr>\n      <th>unc.edu</th>\n      <td>98952</td>\n      <td>98190</td>\n      <td>890</td>\n      <td>0.004514</td>\n      <td>0.004505</td>\n    </tr>\n    <tr>\n      <th>ugent.be</th>\n      <td>98657</td>\n      <td>98449</td>\n      <td>428</td>\n      <td>0.004501</td>\n      <td>0.004517</td>\n    </tr>\n    <tr>\n      <th>bme.hu</th>\n      <td>98566</td>\n      <td>98374</td>\n      <td>433</td>\n      <td>0.004497</td>\n      <td>0.004514</td>\n    </tr>\n    <tr>\n      <th>virginia.gov</th>\n      <td>98549</td>\n      <td>98099</td>\n      <td>255</td>\n      <td>0.004496</td>\n      <td>0.004501</td>\n    </tr>\n    <tr>\n      <th>herokuapp.com</th>\n      <td>98514</td>\n      <td>98382</td>\n      <td>952</td>\n      <td>0.004494</td>\n      <td>0.004514</td>\n    </tr>\n    <tr>\n      <th>mhlw.go.jp</th>\n      <td>98477</td>\n      <td>98306</td>\n      <td>113</td>\n      <td>0.004493</td>\n      <td>0.004511</td>\n    </tr>\n    <tr>\n      <th>house.gov</th>\n      <td>97918</td>\n      <td>97761</td>\n      <td>556</td>\n      <td>0.004467</td>\n      <td>0.004486</td>\n    </tr>\n    <tr>\n 
     <th>sld.cu</th>\n      <td>97726</td>\n      <td>97147</td>\n      <td>374</td>\n      <td>0.004458</td>\n      <td>0.004457</td>\n    </tr>\n    <tr>\n      <th>er.ru</th>\n      <td>97698</td>\n      <td>97662</td>\n      <td>108</td>\n      <td>0.004457</td>\n      <td>0.004481</td>\n    </tr>\n    <tr>\n      <th>yandex.com</th>\n      <td>97588</td>\n      <td>97572</td>\n      <td>50</td>\n      <td>0.004452</td>\n      <td>0.004477</td>\n    </tr>\n    <tr>\n      <th>hubspot.com</th>\n      <td>96608</td>\n      <td>95539</td>\n      <td>48</td>\n      <td>0.004407</td>\n      <td>0.004384</td>\n    </tr>\n    <tr>\n      <th>mediaset.it</th>\n      <td>96126</td>\n      <td>95897</td>\n      <td>20</td>\n      <td>0.004385</td>\n      <td>0.004400</td>\n    </tr>\n    <tr>\n      <th>gamer.com.tw</th>\n      <td>95688</td>\n      <td>94963</td>\n      <td>15</td>\n      <td>0.004365</td>\n      <td>0.004357</td>\n    </tr>\n    <tr>\n      <th>lodz.pl</th>\n      <td>95520</td>\n      <td>94803</td>\n      <td>542</td>\n      <td>0.004358</td>\n      <td>0.004350</td>\n    </tr>\n    <tr>\n      <th>idnes.cz</th>\n      <td>95322</td>\n      <td>94714</td>\n      <td>254</td>\n      <td>0.004349</td>\n      <td>0.004346</td>\n    </tr>\n    <tr>\n      <th>perfil.com</th>\n      <td>95285</td>\n      <td>95218</td>\n      <td>19</td>\n      <td>0.004347</td>\n      <td>0.004369</td>\n    </tr>\n    <tr>\n      <th>steampowered.com</th>\n      <td>95192</td>\n      <td>94231</td>\n      <td>6</td>\n      <td>0.004343</td>\n      <td>0.004324</td>\n    </tr>\n    <tr>\n      <th>byu.edu</th>\n      <td>95053</td>\n      <td>94826</td>\n      <td>598</td>\n      <td>0.004336</td>\n      <td>0.004351</td>\n    </tr>\n    <tr>\n      <th>trend.az</th>\n      <td>94932</td>\n      <td>94290</td>\n      <td>8</td>\n      <td>0.004331</td>\n      <td>0.004326</td>\n    </tr>\n    <tr>\n      <th>news12.com</th>\n      <td>94828</td>\n      <td>94716</td>\n    
  <td>10</td>\n      <td>0.004326</td>\n      <td>0.004346</td>\n    </tr>\n    <tr>\n      <th>nyu.edu</th>\n      <td>94586</td>\n      <td>94087</td>\n      <td>217</td>\n      <td>0.004315</td>\n      <td>0.004317</td>\n    </tr>\n    <tr>\n      <th>ufrj.br</th>\n      <td>94573</td>\n      <td>94166</td>\n      <td>460</td>\n      <td>0.004315</td>\n      <td>0.004321</td>\n    </tr>\n    <tr>\n      <th>hessen.de</th>\n      <td>93833</td>\n      <td>93660</td>\n      <td>462</td>\n      <td>0.004281</td>\n      <td>0.004297</td>\n    </tr>\n    <tr>\n      <th>rozhlas.cz</th>\n      <td>93814</td>\n      <td>91265</td>\n      <td>59</td>\n      <td>0.004280</td>\n      <td>0.004188</td>\n    </tr>\n    <tr>\n      <th>marketscreener.com</th>\n      <td>93667</td>\n      <td>93460</td>\n      <td>16</td>\n      <td>0.004273</td>\n      <td>0.004288</td>\n    </tr>\n    <tr>\n      <th>panasonic.com</th>\n      <td>93506</td>\n      <td>91828</td>\n      <td>126</td>\n      <td>0.004266</td>\n      <td>0.004213</td>\n    </tr>\n    <tr>\n      <th>eclipse.org</th>\n      <td>93444</td>\n      <td>93094</td>\n      <td>28</td>\n      <td>0.004263</td>\n      <td>0.004271</td>\n    </tr>\n    <tr>\n      <th>habr.com</th>\n      <td>93308</td>\n      <td>92803</td>\n      <td>17</td>\n      <td>0.004257</td>\n      <td>0.004258</td>\n    </tr>\n    <tr>\n      <th>sky.it</th>\n      <td>92865</td>\n      <td>92393</td>\n      <td>24</td>\n      <td>0.004237</td>\n      <td>0.004239</td>\n    </tr>\n    <tr>\n      <th>yahoo.com</th>\n      <td>92858</td>\n      <td>92806</td>\n      <td>31</td>\n      <td>0.004236</td>\n      <td>0.004258</td>\n    </tr>\n    <tr>\n      <th>ccm.net</th>\n      <td>92836</td>\n      <td>92822</td>\n      <td>12</td>\n      <td>0.004235</td>\n      <td>0.004259</td>\n    </tr>\n    <tr>\n      <th>interia.pl</th>\n      <td>92398</td>\n      <td>91704</td>\n      <td>30</td>\n      <td>0.004215</td>\n      <td>0.004208</td>\n    
</tr>\n    <tr>\n      <th>donga.com</th>\n      <td>92349</td>\n      <td>91715</td>\n      <td>30</td>\n      <td>0.004213</td>\n      <td>0.004208</td>\n    </tr>\n    <tr>\n      <th>omeka.net</th>\n      <td>92144</td>\n      <td>92135</td>\n      <td>588</td>\n      <td>0.004204</td>\n      <td>0.004227</td>\n    </tr>\n    <tr>\n      <th>tum.de</th>\n      <td>91848</td>\n      <td>91303</td>\n      <td>405</td>\n      <td>0.004190</td>\n      <td>0.004189</td>\n    </tr>\n    <tr>\n      <th>dartmouth.edu</th>\n      <td>91743</td>\n      <td>91555</td>\n      <td>204</td>\n      <td>0.004185</td>\n      <td>0.004201</td>\n    </tr>\n    <tr>\n      <th>unicamp.br</th>\n      <td>91535</td>\n      <td>89742</td>\n      <td>424</td>\n      <td>0.004176</td>\n      <td>0.004118</td>\n    </tr>\n    <tr>\n      <th>ndtv.com</th>\n      <td>91292</td>\n      <td>90452</td>\n      <td>17</td>\n      <td>0.004165</td>\n      <td>0.004150</td>\n    </tr>\n    <tr>\n      <th>exlibrisgroup.com</th>\n      <td>91113</td>\n      <td>91065</td>\n      <td>594</td>\n      <td>0.004157</td>\n      <td>0.004178</td>\n    </tr>\n    <tr>\n      <th>cnrs.fr</th>\n      <td>90737</td>\n      <td>90519</td>\n      <td>636</td>\n      <td>0.004140</td>\n      <td>0.004153</td>\n    </tr>\n    <tr>\n      <th>talent.com</th>\n      <td>90686</td>\n      <td>90661</td>\n      <td>79</td>\n      <td>0.004137</td>\n      <td>0.004160</td>\n    </tr>\n    <tr>\n      <th>usc.edu</th>\n      <td>90661</td>\n      <td>89752</td>\n      <td>424</td>\n      <td>0.004136</td>\n      <td>0.004118</td>\n    </tr>\n    <tr>\n      <th>wolfram.com</th>\n      <td>90448</td>\n      <td>90131</td>\n      <td>26</td>\n      <td>0.004126</td>\n      <td>0.004136</td>\n    </tr>\n    <tr>\n      <th>vietnamplus.vn</th>\n      <td>90343</td>\n      <td>90339</td>\n      <td>22</td>\n      <td>0.004122</td>\n      <td>0.004145</td>\n    </tr>\n    <tr>\n      <th>osu.edu</th>\n      
<td>90339</td>\n      <td>89923</td>\n      <td>666</td>\n      <td>0.004121</td>\n      <td>0.004126</td>\n    </tr>\n    <tr>\n      <th>tvbs.com.tw</th>\n      <td>89948</td>\n      <td>87014</td>\n      <td>23</td>\n      <td>0.004104</td>\n      <td>0.003993</td>\n    </tr>\n    <tr>\n      <th>ulisboa.pt</th>\n      <td>89861</td>\n      <td>89579</td>\n      <td>461</td>\n      <td>0.004100</td>\n      <td>0.004110</td>\n    </tr>\n    <tr>\n      <th>cbsnews.com</th>\n      <td>89782</td>\n      <td>88627</td>\n      <td>5</td>\n      <td>0.004096</td>\n      <td>0.004067</td>\n    </tr>\n    <tr>\n      <th>hpe.com</th>\n      <td>89568</td>\n      <td>88860</td>\n      <td>66</td>\n      <td>0.004086</td>\n      <td>0.004077</td>\n    </tr>\n    <tr>\n      <th>uni-hamburg.de</th>\n      <td>89347</td>\n      <td>89114</td>\n      <td>378</td>\n      <td>0.004076</td>\n      <td>0.004089</td>\n    </tr>\n    <tr>\n      <th>baidu.com</th>\n      <td>89198</td>\n      <td>88939</td>\n      <td>227</td>\n      <td>0.004069</td>\n      <td>0.004081</td>\n    </tr>\n    <tr>\n      <th>blic.rs</th>\n      <td>88958</td>\n      <td>88458</td>\n      <td>11</td>\n      <td>0.004058</td>\n      <td>0.004059</td>\n    </tr>\n    <tr>\n      <th>cnet.com</th>\n      <td>88922</td>\n      <td>87014</td>\n      <td>7</td>\n      <td>0.004057</td>\n      <td>0.003993</td>\n    </tr>\n    <tr>\n      <th>bsky.app</th>\n      <td>88672</td>\n      <td>88198</td>\n      <td>12</td>\n      <td>0.004045</td>\n      <td>0.004047</td>\n    </tr>\n    <tr>\n      <th>arcgis.com</th>\n      <td>88660</td>\n      <td>87772</td>\n      <td>4837</td>\n      <td>0.004045</td>\n      <td>0.004027</td>\n    </tr>\n    <tr>\n      <th>fau.de</th>\n      <td>88500</td>\n      <td>88032</td>\n      <td>611</td>\n      <td>0.004038</td>\n      <td>0.004039</td>\n    </tr>\n    <tr>\n      <th>bayern.de</th>\n      <td>88332</td>\n      <td>87681</td>\n      <td>531</td>\n      
<td>0.004030</td>\n      <td>0.004023</td>\n    </tr>\n    <tr>\n      <th>office.com</th>\n      <td>88093</td>\n      <td>87989</td>\n      <td>16</td>\n      <td>0.004019</td>\n      <td>0.004037</td>\n    </tr>\n    <tr>\n      <th>virginia.edu</th>\n      <td>87929</td>\n      <td>87533</td>\n      <td>407</td>\n      <td>0.004011</td>\n      <td>0.004016</td>\n    </tr>\n    <tr>\n      <th>odoo.com</th>\n      <td>87662</td>\n      <td>87247</td>\n      <td>3812</td>\n      <td>0.003999</td>\n      <td>0.004003</td>\n    </tr>\n    <tr>\n      <th>net.ru</th>\n      <td>87030</td>\n      <td>86554</td>\n      <td>357</td>\n      <td>0.003970</td>\n      <td>0.003971</td>\n    </tr>\n    <tr>\n      <th>burberry.com</th>\n      <td>86877</td>\n      <td>84116</td>\n      <td>50</td>\n      <td>0.003963</td>\n      <td>0.003860</td>\n    </tr>\n    <tr>\n      <th>virgilio.it</th>\n      <td>86506</td>\n      <td>86275</td>\n      <td>15</td>\n      <td>0.003947</td>\n      <td>0.003959</td>\n    </tr>\n    <tr>\n      <th>justice.gc.ca</th>\n      <td>86354</td>\n      <td>86287</td>\n      <td>12</td>\n      <td>0.003940</td>\n      <td>0.003959</td>\n    </tr>\n    <tr>\n      <th>toyota.com</th>\n      <td>86236</td>\n      <td>86120</td>\n      <td>22</td>\n      <td>0.003934</td>\n      <td>0.003951</td>\n    </tr>\n    <tr>\n      <th>main.jp</th>\n      <td>86187</td>\n      <td>86150</td>\n      <td>1311</td>\n      <td>0.003932</td>\n      <td>0.003953</td>\n    </tr>\n    <tr>\n      <th>unistra.fr</th>\n      <td>85898</td>\n      <td>85665</td>\n      <td>564</td>\n      <td>0.003919</td>\n      <td>0.003931</td>\n    </tr>\n    <tr>\n      <th>ucsd.edu</th>\n      <td>85896</td>\n      <td>85466</td>\n      <td>1258</td>\n      <td>0.003919</td>\n      <td>0.003921</td>\n    </tr>\n    <tr>\n      <th>rezdy.com</th>\n      <td>85840</td>\n      <td>85801</td>\n      <td>712</td>\n      <td>0.003916</td>\n      <td>0.003937</td>\n    </tr>\n    
<tr>\n      <th>vercel.app</th>\n      <td>85412</td>\n      <td>85029</td>\n      <td>8191</td>\n      <td>0.003897</td>\n      <td>0.003901</td>\n    </tr>\n    <tr>\n      <th>uba.ar</th>\n      <td>85351</td>\n      <td>85130</td>\n      <td>447</td>\n      <td>0.003894</td>\n      <td>0.003906</td>\n    </tr>\n    <tr>\n      <th>fao.org</th>\n      <td>85271</td>\n      <td>84854</td>\n      <td>63</td>\n      <td>0.003890</td>\n      <td>0.003893</td>\n    </tr>\n    <tr>\n      <th>uv.es</th>\n      <td>84994</td>\n      <td>84825</td>\n      <td>359</td>\n      <td>0.003878</td>\n      <td>0.003892</td>\n    </tr>\n    <tr>\n      <th>developpement-durable.gouv.fr</th>\n      <td>84745</td>\n      <td>84579</td>\n      <td>174</td>\n      <td>0.003866</td>\n      <td>0.003881</td>\n    </tr>\n    <tr>\n      <th>imgur.com</th>\n      <td>84684</td>\n      <td>84604</td>\n      <td>12</td>\n      <td>0.003863</td>\n      <td>0.003882</td>\n    </tr>\n    <tr>\n      <th>maryland.gov</th>\n      <td>84194</td>\n      <td>83739</td>\n      <td>198</td>\n      <td>0.003841</td>\n      <td>0.003842</td>\n    </tr>\n    <tr>\n      <th>rs-online.com</th>\n      <td>84124</td>\n      <td>82058</td>\n      <td>34</td>\n      <td>0.003838</td>\n      <td>0.003765</td>\n    </tr>\n    <tr>\n      <th>rediff.com</th>\n      <td>84034</td>\n      <td>83746</td>\n      <td>45</td>\n      <td>0.003834</td>\n      <td>0.003843</td>\n    </tr>\n    <tr>\n      <th>us.es</th>\n      <td>83814</td>\n      <td>83745</td>\n      <td>179</td>\n      <td>0.003824</td>\n      <td>0.003843</td>\n    </tr>\n    <tr>\n      <th>keizai.biz</th>\n      <td>83773</td>\n      <td>83173</td>\n      <td>162</td>\n      <td>0.003822</td>\n      <td>0.003816</td>\n    </tr>\n    <tr>\n      <th>overdrive.com</th>\n      <td>83740</td>\n      <td>83642</td>\n      <td>1100</td>\n      <td>0.003820</td>\n      <td>0.003838</td>\n    </tr>\n    <tr>\n      <th>unesp.br</th>\n      
<td>83690</td>\n      <td>83411</td>\n      <td>153</td>\n      <td>0.003818</td>\n      <td>0.003827</td>\n    </tr>\n    <tr>\n      <th>wikileaks.org</th>\n      <td>83572</td>\n      <td>83221</td>\n      <td>17</td>\n      <td>0.003813</td>\n      <td>0.003818</td>\n    </tr>\n    <tr>\n      <th>prnewswire.com</th>\n      <td>83352</td>\n      <td>83167</td>\n      <td>13</td>\n      <td>0.003803</td>\n      <td>0.003816</td>\n    </tr>\n    <tr>\n      <th>upc.edu</th>\n      <td>83141</td>\n      <td>82510</td>\n      <td>527</td>\n      <td>0.003793</td>\n      <td>0.003786</td>\n    </tr>\n    <tr>\n      <th>17173.com</th>\n      <td>83054</td>\n      <td>82565</td>\n      <td>259</td>\n      <td>0.003789</td>\n      <td>0.003788</td>\n    </tr>\n    <tr>\n      <th>archives.gov</th>\n      <td>82767</td>\n      <td>82576</td>\n      <td>49</td>\n      <td>0.003776</td>\n      <td>0.003789</td>\n    </tr>\n    <tr>\n      <th>dmm.com</th>\n      <td>82693</td>\n      <td>82537</td>\n      <td>77</td>\n      <td>0.003773</td>\n      <td>0.003787</td>\n    </tr>\n    <tr>\n      <th>aps.org</th>\n      <td>82561</td>\n      <td>81104</td>\n      <td>17</td>\n      <td>0.003767</td>\n      <td>0.003721</td>\n    </tr>\n    <tr>\n      <th>culture.gouv.fr</th>\n      <td>82529</td>\n      <td>81646</td>\n      <td>51</td>\n      <td>0.003765</td>\n      <td>0.003746</td>\n    </tr>\n    <tr>\n      <th>copernicus.org</th>\n      <td>82287</td>\n      <td>82099</td>\n      <td>66</td>\n      <td>0.003754</td>\n      <td>0.003767</td>\n    </tr>\n    <tr>\n      <th>ilsole24ore.com</th>\n      <td>82263</td>\n      <td>82138</td>\n      <td>181</td>\n      <td>0.003753</td>\n      <td>0.003769</td>\n    </tr>\n    <tr>\n      <th>utah.edu</th>\n      <td>82262</td>\n      <td>81571</td>\n      <td>737</td>\n      <td>0.003753</td>\n      <td>0.003743</td>\n    </tr>\n    <tr>\n      <th>helsinki.fi</th>\n      <td>82168</td>\n      <td>82016</td>\n      
<td>75</td>\n      <td>0.003749</td>\n      <td>0.003763</td>\n    </tr>\n    <tr>\n      <th>issuu.com</th>\n      <td>81791</td>\n      <td>81601</td>\n      <td>2</td>\n      <td>0.003731</td>\n      <td>0.003744</td>\n    </tr>\n    <tr>\n      <th>u-tokyo.ac.jp</th>\n      <td>81733</td>\n      <td>81674</td>\n      <td>448</td>\n      <td>0.003729</td>\n      <td>0.003747</td>\n    </tr>\n    <tr>\n      <th>unt.edu</th>\n      <td>81704</td>\n      <td>72232</td>\n      <td>193</td>\n      <td>0.003727</td>\n      <td>0.003314</td>\n    </tr>\n    <tr>\n      <th>vice.com</th>\n      <td>81700</td>\n      <td>81134</td>\n      <td>10</td>\n      <td>0.003727</td>\n      <td>0.003723</td>\n    </tr>\n    <tr>\n      <th>uni-stuttgart.de</th>\n      <td>81570</td>\n      <td>81290</td>\n      <td>320</td>\n      <td>0.003721</td>\n      <td>0.003730</td>\n    </tr>\n    <tr>\n      <th>dnevnik.hr</th>\n      <td>81382</td>\n      <td>80739</td>\n      <td>20</td>\n      <td>0.003713</td>\n      <td>0.003705</td>\n    </tr>\n    <tr>\n      <th>ibiblio.org</th>\n      <td>81361</td>\n      <td>81352</td>\n      <td>9</td>\n      <td>0.003712</td>\n      <td>0.003733</td>\n    </tr>\n    <tr>\n      <th>lenovo.com</th>\n      <td>80932</td>\n      <td>80274</td>\n      <td>60</td>\n      <td>0.003692</td>\n      <td>0.003683</td>\n    </tr>\n    <tr>\n      <th>gov.sk</th>\n      <td>80624</td>\n      <td>80342</td>\n      <td>147</td>\n      <td>0.003678</td>\n      <td>0.003686</td>\n    </tr>\n    <tr>\n      <th>ucf.edu</th>\n      <td>80453</td>\n      <td>80191</td>\n      <td>296</td>\n      <td>0.003670</td>\n      <td>0.003679</td>\n    </tr>\n    <tr>\n      <th>excite.co.jp</th>\n      <td>80390</td>\n      <td>78966</td>\n      <td>20</td>\n      <td>0.003668</td>\n      <td>0.003623</td>\n    </tr>\n    <tr>\n      <th>uq.edu.au</th>\n      <td>80350</td>\n      <td>80146</td>\n      <td>218</td>\n      <td>0.003666</td>\n      <td>0.003677</td>\n   
 </tr>\n    <tr>\n      <th>niedersachsen.de</th>\n      <td>80186</td>\n      <td>79702</td>\n      <td>309</td>\n      <td>0.003658</td>\n      <td>0.003657</td>\n    </tr>\n    <tr>\n      <th>biglobe.ne.jp</th>\n      <td>80083</td>\n      <td>79885</td>\n      <td>101</td>\n      <td>0.003654</td>\n      <td>0.003665</td>\n    </tr>\n    <tr>\n      <th>uniroma1.it</th>\n      <td>79767</td>\n      <td>78666</td>\n      <td>391</td>\n      <td>0.003639</td>\n      <td>0.003609</td>\n    </tr>\n    <tr>\n      <th>facebook.com</th>\n      <td>79393</td>\n      <td>79073</td>\n      <td>10</td>\n      <td>0.003622</td>\n      <td>0.003628</td>\n    </tr>\n    <tr>\n      <th>overheid.nl</th>\n      <td>79325</td>\n      <td>76302</td>\n      <td>47</td>\n      <td>0.003619</td>\n      <td>0.003501</td>\n    </tr>\n    <tr>\n      <th>uiowa.edu</th>\n      <td>79278</td>\n      <td>78991</td>\n      <td>783</td>\n      <td>0.003617</td>\n      <td>0.003624</td>\n    </tr>\n    <tr>\n      <th>uber.com</th>\n      <td>79259</td>\n      <td>78016</td>\n      <td>20</td>\n      <td>0.003616</td>\n      <td>0.003580</td>\n    </tr>\n    <tr>\n      <th>unl.pt</th>\n      <td>79069</td>\n      <td>78927</td>\n      <td>299</td>\n      <td>0.003607</td>\n      <td>0.003621</td>\n    </tr>\n    <tr>\n      <th>uni-goettingen.de</th>\n      <td>78863</td>\n      <td>78512</td>\n      <td>239</td>\n      <td>0.003598</td>\n      <td>0.003602</td>\n    </tr>\n    <tr>\n      <th>uni-muenchen.de</th>\n      <td>78782</td>\n      <td>78726</td>\n      <td>519</td>\n      <td>0.003594</td>\n      <td>0.003612</td>\n    </tr>\n    <tr>\n      <th>rtp.pt</th>\n      <td>78512</td>\n      <td>76754</td>\n      <td>20</td>\n      <td>0.003582</td>\n      <td>0.003522</td>\n    </tr>\n    <tr>\n      <th>akipress.org</th>\n      <td>78423</td>\n      <td>78399</td>\n      <td>29</td>\n      <td>0.003578</td>\n      <td>0.003597</td>\n    </tr>\n    <tr>\n      
<th>unimelb.edu.au</th>\n      <td>78419</td>\n      <td>78407</td>\n      <td>114</td>\n      <td>0.003578</td>\n      <td>0.003598</td>\n    </tr>\n    <tr>\n      <th>krymr.com</th>\n      <td>78276</td>\n      <td>78122</td>\n      <td>3</td>\n      <td>0.003571</td>\n      <td>0.003585</td>\n    </tr>\n    <tr>\n      <th>bg.ac.rs</th>\n      <td>78252</td>\n      <td>78007</td>\n      <td>523</td>\n      <td>0.003570</td>\n      <td>0.003579</td>\n    </tr>\n    <tr>\n      <th>rbc.ua</th>\n      <td>78249</td>\n      <td>78210</td>\n      <td>16</td>\n      <td>0.003570</td>\n      <td>0.003589</td>\n    </tr>\n    <tr>\n      <th>icrt.cu</th>\n      <td>78194</td>\n      <td>78182</td>\n      <td>58</td>\n      <td>0.003567</td>\n      <td>0.003587</td>\n    </tr>\n    <tr>\n      <th>unifr.ch</th>\n      <td>78091</td>\n      <td>77679</td>\n      <td>38</td>\n      <td>0.003563</td>\n      <td>0.003564</td>\n    </tr>\n    <tr>\n      <th>sputniknews.ru</th>\n      <td>77854</td>\n      <td>77590</td>\n      <td>9</td>\n      <td>0.003552</td>\n      <td>0.003560</td>\n    </tr>\n    <tr>\n      <th>miami.edu</th>\n      <td>77729</td>\n      <td>77401</td>\n      <td>497</td>\n      <td>0.003546</td>\n      <td>0.003551</td>\n    </tr>\n    <tr>\n      <th>bncollege.com</th>\n      <td>77409</td>\n      <td>77328</td>\n      <td>458</td>\n      <td>0.003532</td>\n      <td>0.003548</td>\n    </tr>\n    <tr>\n      <th>sinica.edu.tw</th>\n      <td>77283</td>\n      <td>77189</td>\n      <td>266</td>\n      <td>0.003526</td>\n      <td>0.003542</td>\n    </tr>\n    <tr>\n      <th>jotform.com</th>\n      <td>77248</td>\n      <td>77045</td>\n      <td>1041</td>\n      <td>0.003524</td>\n      <td>0.003535</td>\n    </tr>\n    <tr>\n      <th>metu.edu.tr</th>\n      <td>77021</td>\n      <td>76986</td>\n      <td>427</td>\n      <td>0.003514</td>\n      <td>0.003532</td>\n    </tr>\n    <tr>\n      <th>uw.edu.pl</th>\n      <td>76960</td>\n      
<td>76519</td>\n      <td>648</td>\n      <td>0.003511</td>\n      <td>0.003511</td>\n    </tr>\n    <tr>\n      <th>neocities.org</th>\n      <td>76874</td>\n      <td>76667</td>\n      <td>11076</td>\n      <td>0.003507</td>\n      <td>0.003518</td>\n    </tr>\n    <tr>\n      <th>hatenadiary.jp</th>\n      <td>76628</td>\n      <td>76616</td>\n      <td>692</td>\n      <td>0.003496</td>\n      <td>0.003515</td>\n    </tr>\n    <tr>\n      <th>rp.pl</th>\n      <td>76273</td>\n      <td>75855</td>\n      <td>40</td>\n      <td>0.003480</td>\n      <td>0.003480</td>\n    </tr>\n    <tr>\n      <th>gov.bc.ca</th>\n      <td>76125</td>\n      <td>75975</td>\n      <td>143</td>\n      <td>0.003473</td>\n      <td>0.003486</td>\n    </tr>\n    <tr>\n      <th>statcan.gc.ca</th>\n      <td>75890</td>\n      <td>75577</td>\n      <td>18</td>\n      <td>0.003462</td>\n      <td>0.003468</td>\n    </tr>\n    <tr>\n      <th>pp.ua</th>\n      <td>75844</td>\n      <td>75736</td>\n      <td>613</td>\n      <td>0.003460</td>\n      <td>0.003475</td>\n    </tr>\n    <tr>\n      <th>libreoffice.org</th>\n      <td>75742</td>\n      <td>75678</td>\n      <td>68</td>\n      <td>0.003455</td>\n      <td>0.003472</td>\n    </tr>\n    <tr>\n      <th>uni-bremen.de</th>\n      <td>75569</td>\n      <td>75134</td>\n      <td>199</td>\n      <td>0.003448</td>\n      <td>0.003447</td>\n    </tr>\n    <tr>\n      <th>birdeye.com</th>\n      <td>75497</td>\n      <td>74654</td>\n      <td>6</td>\n      <td>0.003444</td>\n      <td>0.003425</td>\n    </tr>\n    <tr>\n      <th>ifeng.com</th>\n      <td>75485</td>\n      <td>75359</td>\n      <td>383</td>\n      <td>0.003444</td>\n      <td>0.003458</td>\n    </tr>\n    <tr>\n      <th>gov.si</th>\n      <td>75406</td>\n      <td>75239</td>\n      <td>70</td>\n      <td>0.003440</td>\n      <td>0.003452</td>\n    </tr>\n    <tr>\n      <th>unl.edu</th>\n      <td>75403</td>\n      <td>75214</td>\n      <td>580</td>\n      
<td>0.003440</td>\n      <td>0.003451</td>\n    </tr>\n    <tr>\n      <th>check24.de</th>\n      <td>75355</td>\n      <td>74878</td>\n      <td>49</td>\n      <td>0.003438</td>\n      <td>0.003436</td>\n    </tr>\n    <tr>\n      <th>w3.org</th>\n      <td>75325</td>\n      <td>74994</td>\n      <td>14</td>\n      <td>0.003436</td>\n      <td>0.003441</td>\n    </tr>\n    <tr>\n      <th>pitt.edu</th>\n      <td>75288</td>\n      <td>74730</td>\n      <td>920</td>\n      <td>0.003435</td>\n      <td>0.003429</td>\n    </tr>\n    <tr>\n      <th>cbssports.com</th>\n      <td>75278</td>\n      <td>74175</td>\n      <td>31</td>\n      <td>0.003434</td>\n      <td>0.003403</td>\n    </tr>\n    <tr>\n      <th>aljazeera.com</th>\n      <td>75185</td>\n      <td>73504</td>\n      <td>8</td>\n      <td>0.003430</td>\n      <td>0.003373</td>\n    </tr>\n    <tr>\n      <th>detik.com</th>\n      <td>75140</td>\n      <td>75020</td>\n      <td>28</td>\n      <td>0.003428</td>\n      <td>0.003442</td>\n    </tr>\n    <tr>\n      <th>aladin.co.kr</th>\n      <td>75123</td>\n      <td>74931</td>\n      <td>14</td>\n      <td>0.003427</td>\n      <td>0.003438</td>\n    </tr>\n    <tr>\n      <th>bundestag.de</th>\n      <td>74854</td>\n      <td>74581</td>\n      <td>13</td>\n      <td>0.003415</td>\n      <td>0.003422</td>\n    </tr>\n    <tr>\n      <th>ucr.ac.cr</th>\n      <td>74786</td>\n      <td>74713</td>\n      <td>389</td>\n      <td>0.003412</td>\n      <td>0.003428</td>\n    </tr>\n    <tr>\n      <th>utah.gov</th>\n      <td>74737</td>\n      <td>74535</td>\n      <td>376</td>\n      <td>0.003410</td>\n      <td>0.003420</td>\n    </tr>\n    <tr>\n      <th>uzh.ch</th>\n      <td>74643</td>\n      <td>74365</td>\n      <td>746</td>\n      <td>0.003405</td>\n      <td>0.003412</td>\n    </tr>\n    <tr>\n      <th>answers.com</th>\n      <td>74640</td>\n      <td>74629</td>\n      <td>8</td>\n      <td>0.003405</td>\n      <td>0.003424</td>\n    </tr>\n    <tr>\n    
  <th>kommersant.ru</th>\n      <td>74549</td>\n      <td>74500</td>\n      <td>18</td>\n      <td>0.003401</td>\n      <td>0.003418</td>\n    </tr>\n    <tr>\n      <th>cancer.gov</th>\n      <td>74495</td>\n      <td>74235</td>\n      <td>89</td>\n      <td>0.003399</td>\n      <td>0.003406</td>\n    </tr>\n    <tr>\n      <th>ettoday.net</th>\n      <td>74306</td>\n      <td>74207</td>\n      <td>31</td>\n      <td>0.003390</td>\n      <td>0.003405</td>\n    </tr>\n    <tr>\n      <th>huaweicloud.com</th>\n      <td>74287</td>\n      <td>74267</td>\n      <td>51</td>\n      <td>0.003389</td>\n      <td>0.003408</td>\n    </tr>\n    <tr>\n      <th>rug.nl</th>\n      <td>74179</td>\n      <td>73665</td>\n      <td>95</td>\n      <td>0.003384</td>\n      <td>0.003380</td>\n    </tr>\n    <tr>\n      <th>cisco.com</th>\n      <td>74100</td>\n      <td>71722</td>\n      <td>103</td>\n      <td>0.003381</td>\n      <td>0.003291</td>\n    </tr>\n    <tr>\n      <th>freshdesk.com</th>\n      <td>73672</td>\n      <td>73272</td>\n      <td>2846</td>\n      <td>0.003361</td>\n      <td>0.003362</td>\n    </tr>\n    <tr>\n      <th>newsru.com</th>\n      <td>73106</td>\n      <td>73019</td>\n      <td>6</td>\n      <td>0.003335</td>\n      <td>0.003350</td>\n    </tr>\n    <tr>\n      <th>uct.ac.za</th>\n      <td>73056</td>\n      <td>72591</td>\n      <td>141</td>\n      <td>0.003333</td>\n      <td>0.003331</td>\n    </tr>\n    <tr>\n      <th>correiobraziliense.com.br</th>\n      <td>73027</td>\n      <td>72934</td>\n      <td>13</td>\n      <td>0.003332</td>\n      <td>0.003346</td>\n    </tr>\n    <tr>\n      <th>jst.go.jp</th>\n      <td>72982</td>\n      <td>72752</td>\n      <td>33</td>\n      <td>0.003330</td>\n      <td>0.003338</td>\n    </tr>\n    <tr>\n      <th>ut.ac.ir</th>\n      <td>72668</td>\n      <td>72516</td>\n      <td>299</td>\n      <td>0.003315</td>\n      <td>0.003327</td>\n    </tr>\n    <tr>\n      <th>gatech.edu</th>\n      <td>72204</td>\n 
     <td>72071</td>\n      <td>736</td>\n      <td>0.003294</td>\n      <td>0.003307</td>\n    </tr>\n    <tr>\n      <th>vlex.com</th>\n      <td>72158</td>\n      <td>72070</td>\n      <td>78</td>\n      <td>0.003292</td>\n      <td>0.003307</td>\n    </tr>\n    <tr>\n      <th>chess-results.com</th>\n      <td>72013</td>\n      <td>71993</td>\n      <td>5</td>\n      <td>0.003285</td>\n      <td>0.003303</td>\n    </tr>\n    <tr>\n      <th>iprima.cz</th>\n      <td>71968</td>\n      <td>71915</td>\n      <td>12</td>\n      <td>0.003283</td>\n      <td>0.003300</td>\n    </tr>\n    <tr>\n      <th>wroc.pl</th>\n      <td>71833</td>\n      <td>71619</td>\n      <td>548</td>\n      <td>0.003277</td>\n      <td>0.003286</td>\n    </tr>\n    <tr>\n      <th>globo.com</th>\n      <td>71818</td>\n      <td>71578</td>\n      <td>47</td>\n      <td>0.003276</td>\n      <td>0.003284</td>\n    </tr>\n    <tr>\n      <th>unipd.it</th>\n      <td>71800</td>\n      <td>71563</td>\n      <td>408</td>\n      <td>0.003276</td>\n      <td>0.003284</td>\n    </tr>\n    <tr>\n      <th>tyc.edu.tw</th>\n      <td>71731</td>\n      <td>71475</td>\n      <td>331</td>\n      <td>0.003272</td>\n      <td>0.003280</td>\n    </tr>\n    <tr>\n      <th>acer.com</th>\n      <td>71666</td>\n      <td>71327</td>\n      <td>22</td>\n      <td>0.003270</td>\n      <td>0.003273</td>\n    </tr>\n    <tr>\n      <th>timesnownews.com</th>\n      <td>71304</td>\n      <td>71223</td>\n      <td>11</td>\n      <td>0.003253</td>\n      <td>0.003268</td>\n    </tr>\n    <tr>\n      <th>churchofjesuschrist.org</th>\n      <td>71219</td>\n      <td>70737</td>\n      <td>94</td>\n      <td>0.003249</td>\n      <td>0.003246</td>\n    </tr>\n    <tr>\n      <th>walmart.com</th>\n      <td>71135</td>\n      <td>70609</td>\n      <td>38</td>\n      <td>0.003245</td>\n      <td>0.003240</td>\n    </tr>\n    <tr>\n      <th>stlouisfed.org</th>\n      <td>71127</td>\n      <td>71079</td>\n      <td>17</td>\n     
 <td>0.003245</td>\n      <td>0.003261</td>\n    </tr>\n    <tr>\n      <th>twitcasting.tv</th>\n      <td>70963</td>\n      <td>70681</td>\n      <td>38</td>\n      <td>0.003237</td>\n      <td>0.003243</td>\n    </tr>\n    <tr>\n      <th>ku.edu</th>\n      <td>70829</td>\n      <td>70683</td>\n      <td>608</td>\n      <td>0.003231</td>\n      <td>0.003243</td>\n    </tr>\n    <tr>\n      <th>chinanews.com.cn</th>\n      <td>70809</td>\n      <td>70462</td>\n      <td>39</td>\n      <td>0.003230</td>\n      <td>0.003233</td>\n    </tr>\n    <tr>\n      <th>lublin.pl</th>\n      <td>70809</td>\n      <td>70721</td>\n      <td>585</td>\n      <td>0.003230</td>\n      <td>0.003245</td>\n    </tr>\n    <tr>\n      <th>praca.gov.pl</th>\n      <td>70655</td>\n      <td>70598</td>\n      <td>378</td>\n      <td>0.003223</td>\n      <td>0.003239</td>\n    </tr>\n    <tr>\n      <th>indiamart.com</th>\n      <td>70203</td>\n      <td>70148</td>\n      <td>14</td>\n      <td>0.003203</td>\n      <td>0.003219</td>\n    </tr>\n    <tr>\n      <th>fifa.com</th>\n      <td>70062</td>\n      <td>69257</td>\n      <td>32</td>\n      <td>0.003196</td>\n      <td>0.003178</td>\n    </tr>\n    <tr>\n      <th>adelaide.edu.au</th>\n      <td>69949</td>\n      <td>66322</td>\n      <td>47</td>\n      <td>0.003191</td>\n      <td>0.003043</td>\n    </tr>\n    <tr>\n      <th>business-gazeta.ru</th>\n      <td>69908</td>\n      <td>69715</td>\n      <td>14</td>\n      <td>0.003189</td>\n      <td>0.003199</td>\n    </tr>\n    <tr>\n      <th>nvidia.com</th>\n      <td>69859</td>\n      <td>68334</td>\n      <td>53</td>\n      <td>0.003187</td>\n      <td>0.003135</td>\n    </tr>\n    <tr>\n      <th>shueisha.co.jp</th>\n      <td>69850</td>\n      <td>68877</td>\n      <td>53</td>\n      <td>0.003187</td>\n      <td>0.003160</td>\n    </tr>\n    <tr>\n      <th>moe.edu.tw</th>\n      <td>69805</td>\n      <td>69763</td>\n      <td>40</td>\n      <td>0.003185</td>\n      
<td>0.003201</td>\n    </tr>\n    <tr>\n      <th>finalfantasyxiv.com</th>\n      <td>69804</td>\n      <td>69783</td>\n      <td>16</td>\n      <td>0.003185</td>\n      <td>0.003202</td>\n    </tr>\n    <tr>\n      <th>epfl.ch</th>\n      <td>69568</td>\n      <td>68638</td>\n      <td>213</td>\n      <td>0.003174</td>\n      <td>0.003149</td>\n    </tr>\n    <tr>\n      <th>nd.edu</th>\n      <td>69561</td>\n      <td>68584</td>\n      <td>123</td>\n      <td>0.003173</td>\n      <td>0.003147</td>\n    </tr>\n    <tr>\n      <th>ifixit.com</th>\n      <td>69486</td>\n      <td>69383</td>\n      <td>18</td>\n      <td>0.003170</td>\n      <td>0.003184</td>\n    </tr>\n    <tr>\n      <th>discord.com</th>\n      <td>69437</td>\n      <td>67340</td>\n      <td>5</td>\n      <td>0.003168</td>\n      <td>0.003090</td>\n    </tr>\n    <tr>\n      <th>kde.org</th>\n      <td>69415</td>\n      <td>69246</td>\n      <td>73</td>\n      <td>0.003167</td>\n      <td>0.003177</td>\n    </tr>\n    <tr>\n      <th>caixin.com</th>\n      <td>69160</td>\n      <td>68865</td>\n      <td>332</td>\n      <td>0.003155</td>\n      <td>0.003160</td>\n    </tr>\n    <tr>\n      <th>foxnews.com</th>\n      <td>69150</td>\n      <td>68965</td>\n      <td>14</td>\n      <td>0.003155</td>\n      <td>0.003164</td>\n    </tr>\n    <tr>\n      <th>r-project.org</th>\n      <td>69077</td>\n      <td>68861</td>\n      <td>113</td>\n      <td>0.003151</td>\n      <td>0.003160</td>\n    </tr>\n    <tr>\n      <th>hudl.com</th>\n      <td>69017</td>\n      <td>68782</td>\n      <td>61</td>\n      <td>0.003149</td>\n      <td>0.003156</td>\n    </tr>\n    <tr>\n      <th>ucdavis.edu</th>\n      <td>69002</td>\n      <td>68828</td>\n      <td>581</td>\n      <td>0.003148</td>\n      <td>0.003158</td>\n    </tr>\n    <tr>\n      <th>uservoice.com</th>\n      <td>68975</td>\n      <td>68808</td>\n      <td>230</td>\n      <td>0.003147</td>\n      <td>0.003157</td>\n    </tr>\n    <tr>\n      
<th>informator.ua</th>\n      <td>68851</td>\n      <td>68794</td>\n      <td>16</td>\n      <td>0.003141</td>\n      <td>0.003157</td>\n    </tr>\n  </tbody>\n</table>"
  },
  {
    "path": "plots/domains.md",
    "content": "---\nlayout: table\ntable_include: domains-top-500.html\ntable_sortlist: \"{sortList: [[1,1]]}\"\ntable_searcher: \"Filter for domain names\"\n---\n\nTop-500 Registered Domains of the Latest Main Crawl\n===================================================\n\nThe table below shows the top 500 registered domains (in terms of page captures) of the last main/monthly crawl\n({{ site.latest_crawl }}). The underlying data is also provided in CSV format; see [domains-top-500.csv](./domains-top-500.csv).\n\nNote that the ranking by page captures only partially corresponds to the importance of domains, as the\ncrawler respects robots.txt and tries hard not to overload web servers. Domains that rank highly by importance tend to be\nunderrepresented. If you're looking for a list of domain or host names ranked by PageRank or harmonic centrality,\nconsider using one of the [webgraph datasets](https://github.com/commoncrawl/cc-webgraph#exploring-webgraph-data-sets)\ninstead.\n"
  },
  {
    "path": "plots/languages-top-200.html",
    "content": "<table border=\"1\" class=\"dataframe tablesorter tablepercentage iso639-3-language\">\n  <thead>\n    <tr style=\"text-align: right;\">\n      <th>crawl</th>\n      <th>CC-MAIN-2026-08</th>\n      <th>CC-MAIN-2026-12</th>\n      <th>CC-MAIN-2026-17</th>\n    </tr>\n    <tr>\n      <th>language</th>\n      <th></th>\n      <th></th>\n      <th></th>\n    </tr>\n  </thead>\n  <tbody>\n    <tr>\n      <th>&lt;unknown&gt;</th>\n      <td>3.1475</td>\n      <td>3.0996</td>\n      <td>3.1136</td>\n    </tr>\n    <tr>\n      <th>aar</th>\n      <td>0.0001</td>\n      <td>0.0001</td>\n      <td>0.0001</td>\n    </tr>\n    <tr>\n      <th>abk</th>\n      <td>0.0007</td>\n      <td>0.0006</td>\n      <td>0.0006</td>\n    </tr>\n    <tr>\n      <th>afr</th>\n      <td>0.0073</td>\n      <td>0.0091</td>\n      <td>0.0083</td>\n    </tr>\n    <tr>\n      <th>aka</th>\n      <td>0.0003</td>\n      <td>0.0002</td>\n      <td>0.0002</td>\n    </tr>\n    <tr>\n      <th>amh</th>\n      <td>0.0040</td>\n      <td>0.0039</td>\n      <td>0.0045</td>\n    </tr>\n    <tr>\n      <th>ara</th>\n      <td>0.6367</td>\n      <td>0.6522</td>\n      <td>0.6598</td>\n    </tr>\n    <tr>\n      <th>asm</th>\n      <td>0.0029</td>\n      <td>0.0038</td>\n      <td>0.0036</td>\n    </tr>\n    <tr>\n      <th>aym</th>\n      <td>0.0001</td>\n      <td>0.0001</td>\n      <td>0.0001</td>\n    </tr>\n    <tr>\n      <th>aze</th>\n      <td>0.0568</td>\n      <td>0.0605</td>\n      <td>0.0609</td>\n    </tr>\n    <tr>\n      <th>bak</th>\n      <td>0.0035</td>\n      <td>0.0046</td>\n      <td>0.0018</td>\n    </tr>\n    <tr>\n      <th>bel</th>\n      <td>0.0158</td>\n      <td>0.0180</td>\n      <td>0.0165</td>\n    </tr>\n    <tr>\n      <th>ben</th>\n      <td>0.1038</td>\n      <td>0.1097</td>\n      <td>0.1140</td>\n    </tr>\n    <tr>\n      <th>bih</th>\n      <td>0.0007</td>\n      <td>0.0009</td>\n      <td>0.0008</td>\n    </tr>\n    <tr>\n      <th>bis</th>\n      
<td>0.0002</td>\n      <td>0.0001</td>\n      <td>0.0001</td>\n    </tr>\n    <tr>\n      <th>bod</th>\n      <td>0.0013</td>\n      <td>0.0015</td>\n      <td>0.0012</td>\n    </tr>\n    <tr>\n      <th>bos</th>\n      <td>0.0543</td>\n      <td>0.0617</td>\n      <td>0.0615</td>\n    </tr>\n    <tr>\n      <th>bre</th>\n      <td>0.0032</td>\n      <td>0.0021</td>\n      <td>0.0028</td>\n    </tr>\n    <tr>\n      <th>bul</th>\n      <td>0.2639</td>\n      <td>0.2711</td>\n      <td>0.2639</td>\n    </tr>\n    <tr>\n      <th>cat</th>\n      <td>0.2073</td>\n      <td>0.2088</td>\n      <td>0.2010</td>\n    </tr>\n    <tr>\n      <th>ceb</th>\n      <td>0.0022</td>\n      <td>0.0021</td>\n      <td>0.0020</td>\n    </tr>\n    <tr>\n      <th>ces</th>\n      <td>1.1228</td>\n      <td>1.1453</td>\n      <td>1.1493</td>\n    </tr>\n    <tr>\n      <th>chr</th>\n      <td>0.0000</td>\n      <td>0.0000</td>\n      <td>0.0000</td>\n    </tr>\n    <tr>\n      <th>cos</th>\n      <td>0.0028</td>\n      <td>0.0027</td>\n      <td>0.0028</td>\n    </tr>\n    <tr>\n      <th>crs</th>\n      <td>0.0001</td>\n      <td>0.0001</td>\n      <td>0.0001</td>\n    </tr>\n    <tr>\n      <th>cym</th>\n      <td>0.0104</td>\n      <td>0.0108</td>\n      <td>0.0113</td>\n    </tr>\n    <tr>\n      <th>dan</th>\n      <td>0.4901</td>\n      <td>0.5249</td>\n      <td>0.5324</td>\n    </tr>\n    <tr>\n      <th>deu</th>\n      <td>5.7651</td>\n      <td>5.9818</td>\n      <td>5.9033</td>\n    </tr>\n    <tr>\n      <th>div</th>\n      <td>0.0023</td>\n      <td>0.0023</td>\n      <td>0.0024</td>\n    </tr>\n    <tr>\n      <th>dzo</th>\n      <td>0.0001</td>\n      <td>0.0001</td>\n      <td>0.0001</td>\n    </tr>\n    <tr>\n      <th>ell</th>\n      <td>0.5054</td>\n      <td>0.5494</td>\n      <td>0.5787</td>\n    </tr>\n    <tr>\n      <th>eng</th>\n      <td>42.6029</td>\n      <td>41.0588</td>\n      <td>41.0204</td>\n    </tr>\n    <tr>\n      <th>epo</th>\n      
<td>0.0107</td>\n      <td>0.0104</td>\n      <td>0.0082</td>\n    </tr>\n    <tr>\n      <th>est</th>\n      <td>0.1371</td>\n      <td>0.1444</td>\n      <td>0.1417</td>\n    </tr>\n    <tr>\n      <th>eus</th>\n      <td>0.0416</td>\n      <td>0.0393</td>\n      <td>0.0406</td>\n    </tr>\n    <tr>\n      <th>fao</th>\n      <td>0.0048</td>\n      <td>0.0054</td>\n      <td>0.0053</td>\n    </tr>\n    <tr>\n      <th>fas</th>\n      <td>0.8777</td>\n      <td>0.1982</td>\n      <td>0.2286</td>\n    </tr>\n    <tr>\n      <th>fij</th>\n      <td>0.0001</td>\n      <td>0.0001</td>\n      <td>0.0001</td>\n    </tr>\n    <tr>\n      <th>fin</th>\n      <td>0.3425</td>\n      <td>0.3705</td>\n      <td>0.3833</td>\n    </tr>\n    <tr>\n      <th>fra</th>\n      <td>4.4567</td>\n      <td>4.6052</td>\n      <td>4.7551</td>\n    </tr>\n    <tr>\n      <th>fry</th>\n      <td>0.0027</td>\n      <td>0.0026</td>\n      <td>0.0020</td>\n    </tr>\n    <tr>\n      <th>gla</th>\n      <td>0.0019</td>\n      <td>0.0018</td>\n      <td>0.0019</td>\n    </tr>\n    <tr>\n      <th>gle</th>\n      <td>0.0065</td>\n      <td>0.0069</td>\n      <td>0.0071</td>\n    </tr>\n    <tr>\n      <th>glg</th>\n      <td>0.0358</td>\n      <td>0.0325</td>\n      <td>0.0325</td>\n    </tr>\n    <tr>\n      <th>glv</th>\n      <td>0.0006</td>\n      <td>0.0005</td>\n      <td>0.0006</td>\n    </tr>\n    <tr>\n      <th>got</th>\n      <td>0.0000</td>\n      <td>0.0000</td>\n      <td>0.0000</td>\n    </tr>\n    <tr>\n      <th>grn</th>\n      <td>0.0009</td>\n      <td>0.0007</td>\n      <td>0.0008</td>\n    </tr>\n    <tr>\n      <th>guj</th>\n      <td>0.0115</td>\n      <td>0.0126</td>\n      <td>0.0129</td>\n    </tr>\n    <tr>\n      <th>hat</th>\n      <td>0.0028</td>\n      <td>0.0025</td>\n      <td>0.0022</td>\n    </tr>\n    <tr>\n      <th>hau</th>\n      <td>0.0033</td>\n      <td>0.0040</td>\n      <td>0.0036</td>\n    </tr>\n    <tr>\n      <th>haw</th>\n      <td>0.0008</td>\n   
   <td>0.0007</td>\n      <td>0.0007</td>\n    </tr>\n    <tr>\n      <th>heb</th>\n      <td>0.2303</td>\n      <td>0.2369</td>\n      <td>0.2608</td>\n    </tr>\n    <tr>\n      <th>hin</th>\n      <td>0.2106</td>\n      <td>0.2175</td>\n      <td>0.2259</td>\n    </tr>\n    <tr>\n      <th>hmn</th>\n      <td>0.0007</td>\n      <td>0.0007</td>\n      <td>0.0007</td>\n    </tr>\n    <tr>\n      <th>hrv</th>\n      <td>0.1937</td>\n      <td>0.2144</td>\n      <td>0.2178</td>\n    </tr>\n    <tr>\n      <th>hun</th>\n      <td>0.4952</td>\n      <td>0.5299</td>\n      <td>0.5477</td>\n    </tr>\n    <tr>\n      <th>hye</th>\n      <td>0.0323</td>\n      <td>0.0344</td>\n      <td>0.0327</td>\n    </tr>\n    <tr>\n      <th>ibo</th>\n      <td>0.0013</td>\n      <td>0.0011</td>\n      <td>0.0012</td>\n    </tr>\n    <tr>\n      <th>iku</th>\n      <td>0.0003</td>\n      <td>0.0004</td>\n      <td>0.0005</td>\n    </tr>\n    <tr>\n      <th>ile</th>\n      <td>0.0004</td>\n      <td>0.0004</td>\n      <td>0.0003</td>\n    </tr>\n    <tr>\n      <th>ina</th>\n      <td>0.0007</td>\n      <td>0.0006</td>\n      <td>0.0007</td>\n    </tr>\n    <tr>\n      <th>ind</th>\n      <td>1.0059</td>\n      <td>1.0993</td>\n      <td>1.2181</td>\n    </tr>\n    <tr>\n      <th>ipk</th>\n      <td>0.0001</td>\n      <td>0.0001</td>\n      <td>0.0001</td>\n    </tr>\n    <tr>\n      <th>isl</th>\n      <td>0.0395</td>\n      <td>0.0383</td>\n      <td>0.0347</td>\n    </tr>\n    <tr>\n      <th>ita</th>\n      <td>2.2823</td>\n      <td>2.3823</td>\n      <td>2.3284</td>\n    </tr>\n    <tr>\n      <th>jav</th>\n      <td>0.0030</td>\n      <td>0.0036</td>\n      <td>0.0035</td>\n    </tr>\n    <tr>\n      <th>jpn</th>\n      <td>5.6591</td>\n      <td>5.7207</td>\n      <td>5.1572</td>\n    </tr>\n    <tr>\n      <th>kal</th>\n      <td>0.0011</td>\n      <td>0.0011</td>\n      <td>0.0009</td>\n    </tr>\n    <tr>\n      <th>kan</th>\n      <td>0.0193</td>\n      
<td>0.0179</td>\n      <td>0.0177</td>\n    </tr>\n    <tr>\n      <th>kas</th>\n      <td>0.0000</td>\n      <td>0.0000</td>\n      <td>0.0000</td>\n    </tr>\n    <tr>\n      <th>kat</th>\n      <td>0.0429</td>\n      <td>0.0460</td>\n      <td>0.0448</td>\n    </tr>\n    <tr>\n      <th>kaz</th>\n      <td>0.0387</td>\n      <td>0.0380</td>\n      <td>0.0355</td>\n    </tr>\n    <tr>\n      <th>kha</th>\n      <td>0.0003</td>\n      <td>0.0003</td>\n      <td>0.0003</td>\n    </tr>\n    <tr>\n      <th>khm</th>\n      <td>0.0095</td>\n      <td>0.0094</td>\n      <td>0.0106</td>\n    </tr>\n    <tr>\n      <th>kin</th>\n      <td>0.0022</td>\n      <td>0.0028</td>\n      <td>0.0028</td>\n    </tr>\n    <tr>\n      <th>kir</th>\n      <td>0.0113</td>\n      <td>0.0127</td>\n      <td>0.0113</td>\n    </tr>\n    <tr>\n      <th>kor</th>\n      <td>0.8145</td>\n      <td>0.8378</td>\n      <td>0.8230</td>\n    </tr>\n    <tr>\n      <th>kur</th>\n      <td>0.0066</td>\n      <td>0.0065</td>\n      <td>0.0068</td>\n    </tr>\n    <tr>\n      <th>lao</th>\n      <td>0.0042</td>\n      <td>0.0042</td>\n      <td>0.0058</td>\n    </tr>\n    <tr>\n      <th>lat</th>\n      <td>0.1018</td>\n      <td>0.1016</td>\n      <td>0.1172</td>\n    </tr>\n    <tr>\n      <th>lav</th>\n      <td>0.0855</td>\n      <td>0.0918</td>\n      <td>0.0921</td>\n    </tr>\n    <tr>\n      <th>lif</th>\n      <td>0.0000</td>\n      <td>0.0000</td>\n      <td>0.0000</td>\n    </tr>\n    <tr>\n      <th>lin</th>\n      <td>0.0004</td>\n      <td>0.0004</td>\n      <td>0.0003</td>\n    </tr>\n    <tr>\n      <th>lit</th>\n      <td>0.1693</td>\n      <td>0.1757</td>\n      <td>0.1753</td>\n    </tr>\n    <tr>\n      <th>ltz</th>\n      <td>0.0034</td>\n      <td>0.0040</td>\n      <td>0.0035</td>\n    </tr>\n    <tr>\n      <th>lug</th>\n      <td>0.0003</td>\n      <td>0.0002</td>\n      <td>0.0002</td>\n    </tr>\n    <tr>\n      <th>mal</th>\n      <td>0.0275</td>\n      <td>0.0276</td>\n   
   <td>0.0255</td>\n    </tr>\n    <tr>\n      <th>mar</th>\n      <td>0.0314</td>\n      <td>0.0314</td>\n      <td>0.0315</td>\n    </tr>\n    <tr>\n      <th>mfe</th>\n      <td>0.0002</td>\n      <td>0.0002</td>\n      <td>0.0001</td>\n    </tr>\n    <tr>\n      <th>mkd</th>\n      <td>0.0342</td>\n      <td>0.0397</td>\n      <td>0.0410</td>\n    </tr>\n    <tr>\n      <th>mlg</th>\n      <td>0.0056</td>\n      <td>0.0053</td>\n      <td>0.0056</td>\n    </tr>\n    <tr>\n      <th>mlt</th>\n      <td>0.0029</td>\n      <td>0.0031</td>\n      <td>0.0034</td>\n    </tr>\n    <tr>\n      <th>mon</th>\n      <td>0.0154</td>\n      <td>0.0161</td>\n      <td>0.0151</td>\n    </tr>\n    <tr>\n      <th>mri</th>\n      <td>0.0012</td>\n      <td>0.0012</td>\n      <td>0.0014</td>\n    </tr>\n    <tr>\n      <th>msa</th>\n      <td>0.0787</td>\n      <td>0.0824</td>\n      <td>0.0839</td>\n    </tr>\n    <tr>\n      <th>mya</th>\n      <td>0.0178</td>\n      <td>0.0168</td>\n      <td>0.0164</td>\n    </tr>\n    <tr>\n      <th>nau</th>\n      <td>0.0000</td>\n      <td>0.0000</td>\n      <td>0.0000</td>\n    </tr>\n    <tr>\n      <th>nep</th>\n      <td>0.0533</td>\n      <td>0.0529</td>\n      <td>0.0626</td>\n    </tr>\n    <tr>\n      <th>nld</th>\n      <td>1.6783</td>\n      <td>1.8094</td>\n      <td>1.8420</td>\n    </tr>\n    <tr>\n      <th>nno</th>\n      <td>0.0139</td>\n      <td>0.0146</td>\n      <td>0.0147</td>\n    </tr>\n    <tr>\n      <th>nor</th>\n      <td>0.3060</td>\n      <td>0.3370</td>\n      <td>0.3405</td>\n    </tr>\n    <tr>\n      <th>nso</th>\n      <td>0.0001</td>\n      <td>0.0001</td>\n      <td>0.0001</td>\n    </tr>\n    <tr>\n      <th>nya</th>\n      <td>0.0007</td>\n      <td>0.0007</td>\n      <td>0.0007</td>\n    </tr>\n    <tr>\n      <th>oci</th>\n      <td>0.0036</td>\n      <td>0.0040</td>\n      <td>0.0038</td>\n    </tr>\n    <tr>\n      <th>ori</th>\n      <td>0.0071</td>\n      <td>0.0071</td>\n      
<td>0.0073</td>\n    </tr>\n    <tr>\n      <th>orm</th>\n      <td>0.0009</td>\n      <td>0.0006</td>\n      <td>0.0006</td>\n    </tr>\n    <tr>\n      <th>pan</th>\n      <td>0.0076</td>\n      <td>0.0091</td>\n      <td>0.0095</td>\n    </tr>\n    <tr>\n      <th>pol</th>\n      <td>1.9012</td>\n      <td>2.0425</td>\n      <td>2.0935</td>\n    </tr>\n    <tr>\n      <th>por</th>\n      <td>2.4098</td>\n      <td>2.5268</td>\n      <td>2.5116</td>\n    </tr>\n    <tr>\n      <th>pus</th>\n      <td>0.0044</td>\n      <td>0.0042</td>\n      <td>0.0040</td>\n    </tr>\n    <tr>\n      <th>que</th>\n      <td>0.0011</td>\n      <td>0.0008</td>\n      <td>0.0010</td>\n    </tr>\n    <tr>\n      <th>roh</th>\n      <td>0.0014</td>\n      <td>0.0017</td>\n      <td>0.0018</td>\n    </tr>\n    <tr>\n      <th>ron</th>\n      <td>0.4662</td>\n      <td>0.5622</td>\n      <td>0.6064</td>\n    </tr>\n    <tr>\n      <th>run</th>\n      <td>0.0001</td>\n      <td>0.0001</td>\n      <td>0.0001</td>\n    </tr>\n    <tr>\n      <th>rus</th>\n      <td>6.1577</td>\n      <td>6.4899</td>\n      <td>6.5262</td>\n    </tr>\n    <tr>\n      <th>sag</th>\n      <td>0.0016</td>\n      <td>0.0007</td>\n      <td>0.0006</td>\n    </tr>\n    <tr>\n      <th>san</th>\n      <td>0.0052</td>\n      <td>0.0037</td>\n      <td>0.0038</td>\n    </tr>\n    <tr>\n      <th>sco</th>\n      <td>0.0007</td>\n      <td>0.0007</td>\n      <td>0.0007</td>\n    </tr>\n    <tr>\n      <th>sin</th>\n      <td>0.0099</td>\n      <td>0.0095</td>\n      <td>0.0099</td>\n    </tr>\n    <tr>\n      <th>slk</th>\n      <td>0.3924</td>\n      <td>0.4072</td>\n      <td>0.4118</td>\n    </tr>\n    <tr>\n      <th>slv</th>\n      <td>0.1229</td>\n      <td>0.1450</td>\n      <td>0.1535</td>\n    </tr>\n    <tr>\n      <th>smo</th>\n      <td>0.0007</td>\n      <td>0.0008</td>\n      <td>0.0008</td>\n    </tr>\n    <tr>\n      <th>sna</th>\n      <td>0.0008</td>\n      <td>0.0009</td>\n      <td>0.0008</td>\n   
 </tr>\n    <tr>\n      <th>snd</th>\n      <td>0.0024</td>\n      <td>0.0017</td>\n      <td>0.0020</td>\n    </tr>\n    <tr>\n      <th>som</th>\n      <td>0.0051</td>\n      <td>0.0056</td>\n      <td>0.0058</td>\n    </tr>\n    <tr>\n      <th>sot</th>\n      <td>0.0006</td>\n      <td>0.0006</td>\n      <td>0.0007</td>\n    </tr>\n    <tr>\n      <th>spa</th>\n      <td>4.4682</td>\n      <td>4.6581</td>\n      <td>4.7324</td>\n    </tr>\n    <tr>\n      <th>sqi</th>\n      <td>0.0499</td>\n      <td>0.0525</td>\n      <td>0.0511</td>\n    </tr>\n    <tr>\n      <th>srp</th>\n      <td>0.2306</td>\n      <td>0.2658</td>\n      <td>0.2610</td>\n    </tr>\n    <tr>\n      <th>ssw</th>\n      <td>0.0000</td>\n      <td>0.0000</td>\n      <td>0.0000</td>\n    </tr>\n    <tr>\n      <th>sun</th>\n      <td>0.0019</td>\n      <td>0.0017</td>\n      <td>0.0015</td>\n    </tr>\n    <tr>\n      <th>sux</th>\n      <td>0.0000</td>\n      <td>0.0000</td>\n      <td>0.0000</td>\n    </tr>\n    <tr>\n      <th>swa</th>\n      <td>0.0126</td>\n      <td>0.0140</td>\n      <td>0.0123</td>\n    </tr>\n    <tr>\n      <th>swe</th>\n      <td>0.6517</td>\n      <td>0.7275</td>\n      <td>0.7308</td>\n    </tr>\n    <tr>\n      <th>syr</th>\n      <td>0.0003</td>\n      <td>0.0003</td>\n      <td>0.0003</td>\n    </tr>\n    <tr>\n      <th>tam</th>\n      <td>0.0468</td>\n      <td>0.0487</td>\n      <td>0.0464</td>\n    </tr>\n    <tr>\n      <th>tat</th>\n      <td>0.0082</td>\n      <td>0.0089</td>\n      <td>0.0071</td>\n    </tr>\n    <tr>\n      <th>tel</th>\n      <td>0.0215</td>\n      <td>0.0250</td>\n      <td>0.0226</td>\n    </tr>\n    <tr>\n      <th>tgk</th>\n      <td>0.0064</td>\n      <td>0.0070</td>\n      <td>0.0067</td>\n    </tr>\n    <tr>\n      <th>tgl</th>\n      <td>0.0098</td>\n      <td>0.0097</td>\n      <td>0.0103</td>\n    </tr>\n    <tr>\n      <th>tha</th>\n      <td>0.3740</td>\n      <td>0.3727</td>\n      <td>0.3940</td>\n    </tr>\n    <tr>\n  
    <th>tir</th>\n      <td>0.0007</td>\n      <td>0.0006</td>\n      <td>0.0012</td>\n    </tr>\n    <tr>\n      <th>ton</th>\n      <td>0.0001</td>\n      <td>0.0001</td>\n      <td>0.0001</td>\n    </tr>\n    <tr>\n      <th>tsn</th>\n      <td>0.0003</td>\n      <td>0.0001</td>\n      <td>0.0002</td>\n    </tr>\n    <tr>\n      <th>tso</th>\n      <td>0.0001</td>\n      <td>0.0001</td>\n      <td>0.0001</td>\n    </tr>\n    <tr>\n      <th>tuk</th>\n      <td>0.0039</td>\n      <td>0.0041</td>\n      <td>0.0036</td>\n    </tr>\n    <tr>\n      <th>tur</th>\n      <td>1.1616</td>\n      <td>1.2224</td>\n      <td>1.2985</td>\n    </tr>\n    <tr>\n      <th>uig</th>\n      <td>0.0018</td>\n      <td>0.0017</td>\n      <td>0.0022</td>\n    </tr>\n    <tr>\n      <th>ukr</th>\n      <td>0.6678</td>\n      <td>0.7152</td>\n      <td>0.8012</td>\n    </tr>\n    <tr>\n      <th>urd</th>\n      <td>0.0321</td>\n      <td>0.0314</td>\n      <td>0.0322</td>\n    </tr>\n    <tr>\n      <th>uzb</th>\n      <td>0.0254</td>\n      <td>0.0258</td>\n      <td>0.0247</td>\n    </tr>\n    <tr>\n      <th>ven</th>\n      <td>0.0000</td>\n      <td>0.0000</td>\n      <td>0.0000</td>\n    </tr>\n    <tr>\n      <th>vie</th>\n      <td>1.0294</td>\n      <td>1.0914</td>\n      <td>1.1284</td>\n    </tr>\n    <tr>\n      <th>vol</th>\n      <td>0.0008</td>\n      <td>0.0015</td>\n      <td>0.0014</td>\n    </tr>\n    <tr>\n      <th>war</th>\n      <td>0.0019</td>\n      <td>0.0022</td>\n      <td>0.0020</td>\n    </tr>\n    <tr>\n      <th>wol</th>\n      <td>0.0003</td>\n      <td>0.0002</td>\n      <td>0.0002</td>\n    </tr>\n    <tr>\n      <th>xho</th>\n      <td>0.0009</td>\n      <td>0.0009</td>\n      <td>0.0009</td>\n    </tr>\n    <tr>\n      <th>yid</th>\n      <td>0.0022</td>\n      <td>0.0019</td>\n      <td>0.0017</td>\n    </tr>\n    <tr>\n      <th>yor</th>\n      <td>0.0015</td>\n      <td>0.0017</td>\n      <td>0.0016</td>\n    </tr>\n    <tr>\n      <th>zha</th>\n  
    <td>0.0001</td>\n      <td>0.0001</td>\n      <td>0.0001</td>\n    </tr>\n    <tr>\n      <th>zho</th>\n      <td>4.9960</td>\n      <td>4.9855</td>\n      <td>4.8564</td>\n    </tr>\n    <tr>\n      <th>zul</th>\n      <td>0.0012</td>\n      <td>0.0012</td>\n      <td>0.0014</td>\n    </tr>\n  </tbody>\n</table>"
  },
  {
    "path": "plots/languages.csv",
    "content": "crawl,primary_language,pages,urls,%pages/crawl\nCC-MAIN-2008-2009,<unknown>,1798158091,1798158091,100.0000\nCC-MAIN-2009-2010,<unknown>,2863495211,2863495211,100.0000\nCC-MAIN-2012,<unknown>,3828539877,3828539877,100.0000\nCC-MAIN-2013-20,<unknown>,1796098643,1796098643,100.0000\nCC-MAIN-2013-48,<unknown>,2245773667,2245773667,100.0000\nCC-MAIN-2014-10,<unknown>,2301223474,2301223474,100.0000\nCC-MAIN-2014-15,<unknown>,2641371316,2641371316,100.0000\nCC-MAIN-2014-23,<unknown>,3608720876,3608720876,100.0000\nCC-MAIN-2014-35,<unknown>,2870692423,2870692423,100.0000\nCC-MAIN-2014-41,<unknown>,2979743543,2979743543,100.0000\nCC-MAIN-2014-42,<unknown>,3722131678,3722131678,100.0000\nCC-MAIN-2014-49,<unknown>,1948510433,1948510433,100.0000\nCC-MAIN-2014-52,<unknown>,2085977207,2085977207,100.0000\nCC-MAIN-2015-06,<unknown>,1826024103,1826024103,100.0000\nCC-MAIN-2015-11,<unknown>,1837196089,1837196089,100.0000\nCC-MAIN-2015-14,<unknown>,1646697534,1646697534,100.0000\nCC-MAIN-2015-18,<unknown>,2115818059,2115818059,100.0000\nCC-MAIN-2015-22,<unknown>,2015461448,2015461448,100.0000\nCC-MAIN-2015-27,<unknown>,1675619098,1675619098,100.0000\nCC-MAIN-2015-32,<unknown>,1815492409,1815492409,100.0000\nCC-MAIN-2015-35,<unknown>,1848022475,1848022475,100.0000\nCC-MAIN-2015-40,<unknown>,1321987379,1321987379,100.0000\nCC-MAIN-2015-48,<unknown>,1824170527,1824170527,100.0000\nCC-MAIN-2016-07,<unknown>,1733285122,1733285122,100.0000\nCC-MAIN-2016-18,<unknown>,1335046923,1335046923,100.0000\nCC-MAIN-2016-22,<unknown>,1466220798,1466220798,100.0000\nCC-MAIN-2016-26,<unknown>,1236815660,1236815660,100.0000\nCC-MAIN-2016-30,<unknown>,1737322304,1737322304,100.0000\nCC-MAIN-2016-36,<unknown>,1611613090,1611613090,100.0000\nCC-MAIN-2016-40,<unknown>,1722656393,1722656393,100.0000\nCC-MAIN-2016-44,<unknown>,3254976731,3254976731,100.0000\nCC-MAIN-2016-50,<unknown>,2866282390,2866282390,100.0000\nCC-MAIN-2017-04,<unknown>,3146498026,3146498026,100.0000\nCC-MAIN-2017-09,<unkn
own>,3084366662,3084366662,100.0000\nCC-MAIN-2017-13,<unknown>,3070720576,3070720576,100.0000\nCC-MAIN-2017-17,<unknown>,2942930482,2942930482,100.0000\nCC-MAIN-2017-22,<unknown>,2967293699,2967293699,100.0000\nCC-MAIN-2017-26,<unknown>,3165214086,3165214086,100.0000\nCC-MAIN-2017-30,<unknown>,2892213652,2892213652,100.0000\nCC-MAIN-2017-34,<unknown>,3280080910,3280080910,100.0000\nCC-MAIN-2017-39,<unknown>,3017180563,3017180563,100.0000\nCC-MAIN-2017-43,<unknown>,3650430218,3650430218,100.0000\nCC-MAIN-2017-47,<unknown>,3204943573,3204943573,100.0000\nCC-MAIN-2017-51,<unknown>,2914004423,2914004423,100.0000\nCC-MAIN-2018-05,<unknown>,3464537205,3464537205,100.0000\nCC-MAIN-2018-09,<unknown>,3488463319,3488463319,100.0000\nCC-MAIN-2018-13,<unknown>,3232738018,3232738018,100.0000\nCC-MAIN-2018-17,<unknown>,3101353989,3101353989,100.0000\nCC-MAIN-2018-22,<unknown>,2788388007,2788388007,100.0000\nCC-MAIN-2018-26,<unknown>,3069414247,3069414247,100.0000\nCC-MAIN-2018-30,<unknown>,3263958200,3263958200,100.0000\nCC-MAIN-2018-34,<unknown>,157758948,157758948,5.8727\nCC-MAIN-2018-34,aar,4172,4075,0.0002\nCC-MAIN-2018-34,abk,5174,5159,0.0002\nCC-MAIN-2018-34,afr,193831,192242,0.0072\nCC-MAIN-2018-34,aka,1644,1618,0.0001\nCC-MAIN-2018-34,amh,56720,55636,0.0021\nCC-MAIN-2018-34,ara,17967089,17869351,0.6688\nCC-MAIN-2018-34,asm,11618,11574,0.0004\nCC-MAIN-2018-34,aym,2094,2035,0.0001\nCC-MAIN-2018-34,aze,912585,908581,0.0340\nCC-MAIN-2018-34,bak,31433,31403,0.0012\nCC-MAIN-2018-34,bel,319114,318354,0.0119\nCC-MAIN-2018-34,ben,1219353,1211074,0.0454\nCC-MAIN-2018-34,bih,14331,14306,0.0005\nCC-MAIN-2018-34,bis,3615,3541,0.0001\nCC-MAIN-2018-34,blu,18001,17954,0.0007\nCC-MAIN-2018-34,bod,29019,28966,0.0011\nCC-MAIN-2018-34,bos,753829,750650,0.0281\nCC-MAIN-2018-34,bre,35508,35321,0.0013\nCC-MAIN-2018-34,bul,7003816,6953217,0.2607\nCC-MAIN-2018-34,cat,4579395,4524579,0.1705\nCC-MAIN-2018-34,ceb,30629,30517,0.0011\nCC-MAIN-2018-34,ces,27345500,26862578,1.0180\nCC-MAIN-2018-34,chr,1
025,1024,0.0000\nCC-MAIN-2018-34,cos,35549,34961,0.0013\nCC-MAIN-2018-34,crs,2426,2302,0.0001\nCC-MAIN-2018-34,cym,163654,162032,0.0061\nCC-MAIN-2018-34,dan,9785256,9668039,0.3643\nCC-MAIN-2018-34,deu,133628300,131239485,4.9744\nCC-MAIN-2018-34,div,17735,17682,0.0007\nCC-MAIN-2018-34,dzo,1458,1454,0.0001\nCC-MAIN-2018-34,ell,12867678,12715916,0.4790\nCC-MAIN-2018-34,eng,1178882529,1161432337,43.8846\nCC-MAIN-2018-34,epo,108185,107733,0.0040\nCC-MAIN-2018-34,est,2630460,2594857,0.0979\nCC-MAIN-2018-34,eus,486668,482025,0.0181\nCC-MAIN-2018-34,fao,70997,70082,0.0026\nCC-MAIN-2018-34,fas,17018457,16910062,0.6335\nCC-MAIN-2018-34,fij,1909,1835,0.0001\nCC-MAIN-2018-34,fin,9495654,9354604,0.3535\nCC-MAIN-2018-34,fra,116138883,114663620,4.3233\nCC-MAIN-2018-34,fry,55862,55517,0.0021\nCC-MAIN-2018-34,gla,37507,37148,0.0014\nCC-MAIN-2018-34,gle,98063,97520,0.0037\nCC-MAIN-2018-34,glg,590232,584495,0.0220\nCC-MAIN-2018-34,glv,7558,7322,0.0003\nCC-MAIN-2018-34,got,365,362,0.0000\nCC-MAIN-2018-34,grn,22870,22638,0.0009\nCC-MAIN-2018-34,guj,131636,130973,0.0049\nCC-MAIN-2018-34,hat,32878,32777,0.0012\nCC-MAIN-2018-34,hau,40559,39861,0.0015\nCC-MAIN-2018-34,haw,6343,6252,0.0002\nCC-MAIN-2018-34,heb,4313879,4253840,0.1606\nCC-MAIN-2018-34,hin,1842721,1820540,0.0686\nCC-MAIN-2018-34,hrv,3592632,3566053,0.1337\nCC-MAIN-2018-34,hun,13034954,12907032,0.4852\nCC-MAIN-2018-34,hye,605141,601248,0.0225\nCC-MAIN-2018-34,ibo,4039,4008,0.0002\nCC-MAIN-2018-34,iku,3339,3325,0.0001\nCC-MAIN-2018-34,ile,7297,7170,0.0003\nCC-MAIN-2018-34,ina,19138,18902,0.0007\nCC-MAIN-2018-34,ind,19876418,19670480,0.7399\nCC-MAIN-2018-34,ipk,1804,1789,0.0001\nCC-MAIN-2018-34,isl,820455,812901,0.0305\nCC-MAIN-2018-34,ita,52747492,51973301,1.9636\nCC-MAIN-2018-34,jav,31469,31373,0.0012\nCC-MAIN-2018-34,jpn,143535898,142054611,5.3432\nCC-MAIN-2018-34,kal,15871,15599,0.0006\nCC-MAIN-2018-34,kan,159102,158465,0.0059\nCC-MAIN-2018-34,kas,29,27,0.0000\nCC-MAIN-2018-34,kat,674943,671871,0.0251\nCC-MAIN-2018-34,kaz,3611
23,359208,0.0134\nCC-MAIN-2018-34,kha,4984,4894,0.0002\nCC-MAIN-2018-34,khm,131955,130977,0.0049\nCC-MAIN-2018-34,kin,46300,46030,0.0017\nCC-MAIN-2018-34,kir,85309,85151,0.0032\nCC-MAIN-2018-34,kor,15020842,14834806,0.5592\nCC-MAIN-2018-34,kur,108778,108578,0.0040\nCC-MAIN-2018-34,lao,50900,50380,0.0019\nCC-MAIN-2018-34,lat,889401,881361,0.0331\nCC-MAIN-2018-34,lav,1943967,1926190,0.0724\nCC-MAIN-2018-34,lif,154,153,0.0000\nCC-MAIN-2018-34,lin,4101,4002,0.0002\nCC-MAIN-2018-34,lit,3453793,3410139,0.1286\nCC-MAIN-2018-34,ltz,53532,52895,0.0020\nCC-MAIN-2018-34,lug,3238,3187,0.0001\nCC-MAIN-2018-34,mal,343153,341324,0.0128\nCC-MAIN-2018-34,mar,189570,188817,0.0071\nCC-MAIN-2018-34,mfe,2795,2746,0.0001\nCC-MAIN-2018-34,mkd,441705,439487,0.0164\nCC-MAIN-2018-34,mlg,54122,53786,0.0020\nCC-MAIN-2018-34,mlt,49657,49369,0.0018\nCC-MAIN-2018-34,mon,323068,321689,0.0120\nCC-MAIN-2018-34,mri,14624,14350,0.0005\nCC-MAIN-2018-34,msa,2649378,2630915,0.0986\nCC-MAIN-2018-34,mya,213473,211957,0.0079\nCC-MAIN-2018-34,nau,1136,1097,0.0000\nCC-MAIN-2018-34,nep,291069,289491,0.0108\nCC-MAIN-2018-34,nld,36731598,36107045,1.3674\nCC-MAIN-2018-34,nno,330421,327453,0.0123\nCC-MAIN-2018-34,nor,7832173,7742445,0.2916\nCC-MAIN-2018-34,nso,1773,1756,0.0001\nCC-MAIN-2018-34,nya,12319,12231,0.0005\nCC-MAIN-2018-34,oci,65026,64723,0.0024\nCC-MAIN-2018-34,ori,45911,45820,0.0017\nCC-MAIN-2018-34,orm,8171,8078,0.0003\nCC-MAIN-2018-34,pan,78659,78380,0.0029\nCC-MAIN-2018-34,pol,44687229,44215001,1.6635\nCC-MAIN-2018-34,por,53220076,52581446,1.9811\nCC-MAIN-2018-34,pus,58627,58489,0.0022\nCC-MAIN-2018-34,que,8365,8226,0.0003\nCC-MAIN-2018-34,roh,33940,33733,0.0013\nCC-MAIN-2018-34,ron,13747709,13617648,0.5118\nCC-MAIN-2018-34,run,3306,3266,0.0001\nCC-MAIN-2018-34,rus,240333312,238711598,8.9466\nCC-MAIN-2018-34,sag,942,937,0.0000\nCC-MAIN-2018-34,san,44718,44187,0.0017\nCC-MAIN-2018-34,sco,20593,20284,0.0008\nCC-MAIN-2018-34,sin,142130,141543,0.0053\nCC-MAIN-2018-34,slk,6087516,6007171,0.2266\nCC-MAIN-
2018-34,slv,2575104,2537138,0.0959\nCC-MAIN-2018-34,smo,7501,7437,0.0003\nCC-MAIN-2018-34,sna,8638,8544,0.0003\nCC-MAIN-2018-34,snd,12222,12194,0.0005\nCC-MAIN-2018-34,som,113834,113229,0.0042\nCC-MAIN-2018-34,sot,6194,6089,0.0002\nCC-MAIN-2018-34,spa,109410457,107990412,4.0729\nCC-MAIN-2018-34,sqi,760210,756686,0.0283\nCC-MAIN-2018-34,srp,3909562,3881981,0.1455\nCC-MAIN-2018-34,ssw,1289,1191,0.0000\nCC-MAIN-2018-34,sun,13950,13856,0.0005\nCC-MAIN-2018-34,sux,69,69,0.0000\nCC-MAIN-2018-34,swa,168171,166712,0.0063\nCC-MAIN-2018-34,swe,19418339,19204473,0.7229\nCC-MAIN-2018-34,syr,8729,8694,0.0003\nCC-MAIN-2018-34,tam,802423,797970,0.0299\nCC-MAIN-2018-34,tat,129074,128570,0.0048\nCC-MAIN-2018-34,tel,221312,220453,0.0082\nCC-MAIN-2018-34,tgk,62896,62629,0.0023\nCC-MAIN-2018-34,tgl,209645,209005,0.0078\nCC-MAIN-2018-34,tha,8536698,8473274,0.3178\nCC-MAIN-2018-34,tir,16925,16899,0.0006\nCC-MAIN-2018-34,ton,2350,2318,0.0001\nCC-MAIN-2018-34,tsn,3082,3015,0.0001\nCC-MAIN-2018-34,tso,1755,1705,0.0001\nCC-MAIN-2018-34,tuk,22202,22056,0.0008\nCC-MAIN-2018-34,tur,23422436,23182246,0.8719\nCC-MAIN-2018-34,uig,22912,22866,0.0009\nCC-MAIN-2018-34,ukr,9779432,9720315,0.3640\nCC-MAIN-2018-34,urd,532730,530336,0.0198\nCC-MAIN-2018-34,uzb,249163,248049,0.0093\nCC-MAIN-2018-34,ven,657,638,0.0000\nCC-MAIN-2018-34,vie,20055433,19903903,0.7466\nCC-MAIN-2018-34,vol,14232,14073,0.0005\nCC-MAIN-2018-34,war,54391,54016,0.0020\nCC-MAIN-2018-34,wol,3034,2973,0.0001\nCC-MAIN-2018-34,xho,8948,8569,0.0003\nCC-MAIN-2018-34,yid,33273,33192,0.0012\nCC-MAIN-2018-34,yor,8676,8637,0.0003\nCC-MAIN-2018-34,zha,1255,1215,0.0000\nCC-MAIN-2018-34,zho,113531714,113023462,4.2263\nCC-MAIN-2018-34,zul,11065,10976,0.0004\nCC-MAIN-2018-39,<unknown>,58844901,58844901,2.0711\nCC-MAIN-2018-39,aar,5473,5384,0.0002\nCC-MAIN-2018-39,abk,5305,5295,0.0002\nCC-MAIN-2018-39,afr,261174,259528,0.0092\nCC-MAIN-2018-39,aka,1047,1017,0.0000\nCC-MAIN-2018-39,amh,66663,66160,0.0023\nCC-MAIN-2018-39,ara,23546366,23291771,0.8287\n
CC-MAIN-2018-39,asm,14134,14097,0.0005\nCC-MAIN-2018-39,aym,2325,2274,0.0001\nCC-MAIN-2018-39,aze,1123380,1119529,0.0395\nCC-MAIN-2018-39,bak,28165,28142,0.0010\nCC-MAIN-2018-39,bel,410998,408044,0.0145\nCC-MAIN-2018-39,ben,2316537,2243702,0.0815\nCC-MAIN-2018-39,bih,16527,16347,0.0006\nCC-MAIN-2018-39,bis,2782,2712,0.0001\nCC-MAIN-2018-39,blu,18145,17961,0.0006\nCC-MAIN-2018-39,bod,28726,28655,0.0010\nCC-MAIN-2018-39,bos,929888,923498,0.0327\nCC-MAIN-2018-39,bre,38067,37867,0.0013\nCC-MAIN-2018-39,bul,8396141,8338873,0.2955\nCC-MAIN-2018-39,cat,5063726,5012326,0.1782\nCC-MAIN-2018-39,ceb,37808,37733,0.0013\nCC-MAIN-2018-39,ces,29773412,29431604,1.0479\nCC-MAIN-2018-39,chr,1397,1396,0.0000\nCC-MAIN-2018-39,cos,38972,38397,0.0014\nCC-MAIN-2018-39,crs,3112,3058,0.0001\nCC-MAIN-2018-39,cym,175388,174068,0.0062\nCC-MAIN-2018-39,dan,10943101,10803399,0.3852\nCC-MAIN-2018-39,deu,146175979,144276394,5.1449\nCC-MAIN-2018-39,div,29884,29223,0.0011\nCC-MAIN-2018-39,dzo,1237,1233,0.0000\nCC-MAIN-2018-39,ell,14243392,14119800,0.5013\nCC-MAIN-2018-39,eng,1280182051,1262729057,45.0579\nCC-MAIN-2018-39,epo,129726,129235,0.0046\nCC-MAIN-2018-39,est,3145632,3078262,0.1107\nCC-MAIN-2018-39,eus,551653,547068,0.0194\nCC-MAIN-2018-39,fao,70858,69338,0.0025\nCC-MAIN-2018-39,fas,18484101,18361761,0.6506\nCC-MAIN-2018-39,fij,2293,2233,0.0001\nCC-MAIN-2018-39,fin,10652974,10512276,0.3749\nCC-MAIN-2018-39,fra,130936850,129466954,4.6085\nCC-MAIN-2018-39,fry,42206,41970,0.0015\nCC-MAIN-2018-39,gla,33590,32944,0.0012\nCC-MAIN-2018-39,gle,104784,104279,0.0037\nCC-MAIN-2018-39,glg,652585,647610,0.0230\nCC-MAIN-2018-39,glv,7925,7704,0.0003\nCC-MAIN-2018-39,got,755,753,0.0000\nCC-MAIN-2018-39,grn,26098,25850,0.0009\nCC-MAIN-2018-39,guj,268034,259259,0.0094\nCC-MAIN-2018-39,hat,38571,38478,0.0014\nCC-MAIN-2018-39,hau,45679,44657,0.0016\nCC-MAIN-2018-39,haw,6214,6115,0.0002\nCC-MAIN-2018-39,heb,4775015,4706645,0.1681\nCC-MAIN-2018-39,hin,3014813,2954232,0.1061\nCC-MAIN-2018-39,hrv,4089187,4060382,0.1
439\nCC-MAIN-2018-39,hun,14482004,14362487,0.5097\nCC-MAIN-2018-39,hye,817747,806877,0.0288\nCC-MAIN-2018-39,ibo,4646,4628,0.0002\nCC-MAIN-2018-39,iku,4290,4270,0.0002\nCC-MAIN-2018-39,ile,9210,9102,0.0003\nCC-MAIN-2018-39,ina,21030,20850,0.0007\nCC-MAIN-2018-39,ind,21105983,20905174,0.7429\nCC-MAIN-2018-39,ipk,2642,2632,0.0001\nCC-MAIN-2018-39,isl,872738,861426,0.0307\nCC-MAIN-2018-39,ita,58924031,58260997,2.0739\nCC-MAIN-2018-39,jav,34621,34527,0.0012\nCC-MAIN-2018-39,jpn,156919435,155729928,5.5230\nCC-MAIN-2018-39,kal,16185,15890,0.0006\nCC-MAIN-2018-39,kan,374252,362325,0.0132\nCC-MAIN-2018-39,kas,74,72,0.0000\nCC-MAIN-2018-39,kat,878521,874082,0.0309\nCC-MAIN-2018-39,kaz,421258,414291,0.0148\nCC-MAIN-2018-39,kha,6503,6411,0.0002\nCC-MAIN-2018-39,khm,183198,176086,0.0064\nCC-MAIN-2018-39,kin,55908,52696,0.0020\nCC-MAIN-2018-39,kir,170206,169153,0.0060\nCC-MAIN-2018-39,kor,16888642,16780060,0.5944\nCC-MAIN-2018-39,kur,125804,125061,0.0044\nCC-MAIN-2018-39,lao,104226,103445,0.0037\nCC-MAIN-2018-39,lat,918789,911274,0.0323\nCC-MAIN-2018-39,lav,2267255,2243863,0.0798\nCC-MAIN-2018-39,lif,203,200,0.0000\nCC-MAIN-2018-39,lin,4636,4566,0.0002\nCC-MAIN-2018-39,lit,4050448,3995729,0.1426\nCC-MAIN-2018-39,ltz,60446,59821,0.0021\nCC-MAIN-2018-39,lug,6897,6845,0.0002\nCC-MAIN-2018-39,mal,684358,663901,0.0241\nCC-MAIN-2018-39,mar,364901,330580,0.0128\nCC-MAIN-2018-39,mfe,2559,2511,0.0001\nCC-MAIN-2018-39,mkd,576716,570376,0.0203\nCC-MAIN-2018-39,mlg,69368,68497,0.0024\nCC-MAIN-2018-39,mlt,65261,64433,0.0023\nCC-MAIN-2018-39,mon,385985,383892,0.0136\nCC-MAIN-2018-39,mri,15827,15651,0.0006\nCC-MAIN-2018-39,msa,2829844,2817663,0.0996\nCC-MAIN-2018-39,mya,357586,352523,0.0126\nCC-MAIN-2018-39,nau,1052,1020,0.0000\nCC-MAIN-2018-39,nep,366409,364210,0.0129\nCC-MAIN-2018-39,nld,40992049,40468601,1.4428\nCC-MAIN-2018-39,nno,387215,383098,0.0136\nCC-MAIN-2018-39,nor,8572354,8458655,0.3017\nCC-MAIN-2018-39,nso,12504,12491,0.0004\nCC-MAIN-2018-39,nya,11564,11478,0.0004\nCC-MAIN-2018-39
,oci,62217,61941,0.0022\nCC-MAIN-2018-39,ori,74475,72827,0.0026\nCC-MAIN-2018-39,orm,7540,7444,0.0003\nCC-MAIN-2018-39,pan,125438,114586,0.0044\nCC-MAIN-2018-39,pol,47931208,47490515,1.6870\nCC-MAIN-2018-39,por,57804447,57212159,2.0345\nCC-MAIN-2018-39,pus,112333,106719,0.0040\nCC-MAIN-2018-39,que,22200,22096,0.0008\nCC-MAIN-2018-39,roh,31146,30912,0.0011\nCC-MAIN-2018-39,ron,15424255,15294875,0.5429\nCC-MAIN-2018-39,run,3966,3921,0.0001\nCC-MAIN-2018-39,rus,261423303,259910412,9.2012\nCC-MAIN-2018-39,sag,782,777,0.0000\nCC-MAIN-2018-39,san,57625,57369,0.0020\nCC-MAIN-2018-39,sco,22260,21985,0.0008\nCC-MAIN-2018-39,sin,196037,193379,0.0069\nCC-MAIN-2018-39,slk,6955199,6878393,0.2448\nCC-MAIN-2018-39,slv,2976912,2947343,0.1048\nCC-MAIN-2018-39,smo,14343,14272,0.0005\nCC-MAIN-2018-39,sna,11159,10610,0.0004\nCC-MAIN-2018-39,snd,50761,42899,0.0018\nCC-MAIN-2018-39,som,136716,135034,0.0048\nCC-MAIN-2018-39,sot,7811,7721,0.0003\nCC-MAIN-2018-39,spa,124112999,122557038,4.3683\nCC-MAIN-2018-39,sqi,980564,953791,0.0345\nCC-MAIN-2018-39,srp,4534019,4493095,0.1596\nCC-MAIN-2018-39,ssw,1238,1197,0.0000\nCC-MAIN-2018-39,sun,17175,17125,0.0006\nCC-MAIN-2018-39,sux,141,141,0.0000\nCC-MAIN-2018-39,swa,209199,205969,0.0074\nCC-MAIN-2018-39,swe,21120431,20849808,0.7434\nCC-MAIN-2018-39,syr,11514,11457,0.0004\nCC-MAIN-2018-39,tam,1454180,1420041,0.0512\nCC-MAIN-2018-39,tat,193388,192717,0.0068\nCC-MAIN-2018-39,tel,482809,472617,0.0170\nCC-MAIN-2018-39,tgk,132565,132035,0.0047\nCC-MAIN-2018-39,tgl,193633,190758,0.0068\nCC-MAIN-2018-39,tha,8253600,8193071,0.2905\nCC-MAIN-2018-39,tir,11698,11610,0.0004\nCC-MAIN-2018-39,ton,3305,3278,0.0001\nCC-MAIN-2018-39,tsn,23974,23922,0.0008\nCC-MAIN-2018-39,tso,2358,2317,0.0001\nCC-MAIN-2018-39,tuk,39655,39527,0.0014\nCC-MAIN-2018-39,tur,27018865,26762334,0.9510\nCC-MAIN-2018-39,uig,19837,19801,0.0007\nCC-MAIN-2018-39,ukr,11360127,11289655,0.3998\nCC-MAIN-2018-39,urd,960786,938765,0.0338\nCC-MAIN-2018-39,uzb,313334,311677,0.0110\nCC-MAIN-2018-39,ven
,666,650,0.0000\nCC-MAIN-2018-39,vie,21243376,21109045,0.7477\nCC-MAIN-2018-39,vol,17323,17196,0.0006\nCC-MAIN-2018-39,war,61664,61239,0.0022\nCC-MAIN-2018-39,wol,2986,2920,0.0001\nCC-MAIN-2018-39,xho,26922,26495,0.0009\nCC-MAIN-2018-39,yid,38471,38160,0.0014\nCC-MAIN-2018-39,yor,10500,10470,0.0004\nCC-MAIN-2018-39,zha,1814,1784,0.0001\nCC-MAIN-2018-39,zho,129632990,129097780,4.5626\nCC-MAIN-2018-39,zul,21464,21393,0.0008\nCC-MAIN-2018-43,<unknown>,140402705,140402705,4.6158\nCC-MAIN-2018-43,aar,4872,4763,0.0002\nCC-MAIN-2018-43,abk,5974,5963,0.0002\nCC-MAIN-2018-43,afr,221168,219907,0.0073\nCC-MAIN-2018-43,aka,1082,1045,0.0000\nCC-MAIN-2018-43,amh,53482,53165,0.0018\nCC-MAIN-2018-43,ara,22560241,22451064,0.7417\nCC-MAIN-2018-43,asm,13601,13475,0.0004\nCC-MAIN-2018-43,aym,2189,2132,0.0001\nCC-MAIN-2018-43,aze,1119839,1115170,0.0368\nCC-MAIN-2018-43,bak,31510,31478,0.0010\nCC-MAIN-2018-43,bel,389551,387762,0.0128\nCC-MAIN-2018-43,ben,1636669,1628672,0.0538\nCC-MAIN-2018-43,bih,14293,14246,0.0005\nCC-MAIN-2018-43,bis,3302,3232,0.0001\nCC-MAIN-2018-43,blu,19277,19228,0.0006\nCC-MAIN-2018-43,bod,35723,35619,0.0012\nCC-MAIN-2018-43,bos,948243,944639,0.0312\nCC-MAIN-2018-43,bre,39577,39330,0.0013\nCC-MAIN-2018-43,bul,8362157,8294722,0.2749\nCC-MAIN-2018-43,cat,5176059,5123260,0.1702\nCC-MAIN-2018-43,ceb,44977,44903,0.0015\nCC-MAIN-2018-43,ces,30950822,30544331,1.0175\nCC-MAIN-2018-43,chr,1330,1328,0.0000\nCC-MAIN-2018-43,cos,43405,42969,0.0014\nCC-MAIN-2018-43,crs,2226,2170,0.0001\nCC-MAIN-2018-43,cym,203962,202310,0.0067\nCC-MAIN-2018-43,dan,11336692,11203459,0.3727\nCC-MAIN-2018-43,deu,151934809,149743486,4.9949\nCC-MAIN-2018-43,div,36547,36471,0.0012\nCC-MAIN-2018-43,dzo,1685,1681,0.0001\nCC-MAIN-2018-43,ell,14863656,14742221,0.4886\nCC-MAIN-2018-43,eng,1311380573,1294592847,43.1122\nCC-MAIN-2018-43,epo,132827,132317,0.0044\nCC-MAIN-2018-43,est,3119637,3085366,0.1026\nCC-MAIN-2018-43,eus,575282,570039,0.0189\nCC-MAIN-2018-43,fao,82953,82077,0.0027\nCC-MAIN-2018-43,fas,
20521752,20363566,0.6747\nCC-MAIN-2018-43,fij,2145,2015,0.0001\nCC-MAIN-2018-43,fin,10358990,10238313,0.3406\nCC-MAIN-2018-43,fra,136090811,134017942,4.4740\nCC-MAIN-2018-43,fry,74499,74154,0.0024\nCC-MAIN-2018-43,gla,37701,37043,0.0012\nCC-MAIN-2018-43,gle,103301,102746,0.0034\nCC-MAIN-2018-43,glg,670052,663245,0.0220\nCC-MAIN-2018-43,glv,8427,8193,0.0003\nCC-MAIN-2018-43,got,1027,1025,0.0000\nCC-MAIN-2018-43,grn,25528,25226,0.0008\nCC-MAIN-2018-43,guj,167118,166397,0.0055\nCC-MAIN-2018-43,hat,39439,39229,0.0013\nCC-MAIN-2018-43,hau,38791,37390,0.0013\nCC-MAIN-2018-43,haw,6804,6728,0.0002\nCC-MAIN-2018-43,heb,4796987,4734122,0.1577\nCC-MAIN-2018-43,hin,2237424,2223011,0.0736\nCC-MAIN-2018-43,hrv,4331744,4301291,0.1424\nCC-MAIN-2018-43,hun,15436878,15314779,0.5075\nCC-MAIN-2018-43,hye,750036,745915,0.0247\nCC-MAIN-2018-43,ibo,4840,4816,0.0002\nCC-MAIN-2018-43,iku,4843,4825,0.0002\nCC-MAIN-2018-43,ile,8613,8503,0.0003\nCC-MAIN-2018-43,ina,22987,22786,0.0008\nCC-MAIN-2018-43,ind,22917168,22755378,0.7534\nCC-MAIN-2018-43,ipk,4505,4283,0.0001\nCC-MAIN-2018-43,isl,848293,838544,0.0279\nCC-MAIN-2018-43,ita,59958938,59248557,1.9712\nCC-MAIN-2018-43,jav,36872,36789,0.0012\nCC-MAIN-2018-43,jpn,164699835,163294150,5.4146\nCC-MAIN-2018-43,kal,15682,15331,0.0005\nCC-MAIN-2018-43,kan,226352,225400,0.0074\nCC-MAIN-2018-43,kas,22,20,0.0000\nCC-MAIN-2018-43,kat,836485,832203,0.0275\nCC-MAIN-2018-43,kaz,443616,440368,0.0146\nCC-MAIN-2018-43,kha,5828,5720,0.0002\nCC-MAIN-2018-43,khm,153324,151963,0.0050\nCC-MAIN-2018-43,kin,51494,50625,0.0017\nCC-MAIN-2018-43,kir,114031,113833,0.0037\nCC-MAIN-2018-43,kor,18346237,18263754,0.6031\nCC-MAIN-2018-43,kur,129228,128946,0.0042\nCC-MAIN-2018-43,lao,66004,65644,0.0022\nCC-MAIN-2018-43,lat,984088,975296,0.0324\nCC-MAIN-2018-43,lav,2189928,2168391,0.0720\nCC-MAIN-2018-43,lif,186,183,0.0000\nCC-MAIN-2018-43,lin,4738,4655,0.0002\nCC-MAIN-2018-43,lit,4124369,4071614,0.1356\nCC-MAIN-2018-43,ltz,59804,59120,0.0020\nCC-MAIN-2018-43,lug,3403,3357,0.00
01\nCC-MAIN-2018-43,mal,421923,419624,0.0139\nCC-MAIN-2018-43,mar,283297,253172,0.0093\nCC-MAIN-2018-43,mfe,2977,2917,0.0001\nCC-MAIN-2018-43,mkd,542325,539655,0.0178\nCC-MAIN-2018-43,mlg,58503,58212,0.0019\nCC-MAIN-2018-43,mlt,53837,53565,0.0018\nCC-MAIN-2018-43,mon,399472,396079,0.0131\nCC-MAIN-2018-43,mri,21604,21046,0.0007\nCC-MAIN-2018-43,msa,2935856,2923393,0.0965\nCC-MAIN-2018-43,mya,259516,258698,0.0085\nCC-MAIN-2018-43,nau,1078,1045,0.0000\nCC-MAIN-2018-43,nep,365099,363823,0.0120\nCC-MAIN-2018-43,nld,42540738,41882253,1.3985\nCC-MAIN-2018-43,nno,391354,386058,0.0129\nCC-MAIN-2018-43,nor,8902292,8795013,0.2927\nCC-MAIN-2018-43,nso,4468,4451,0.0001\nCC-MAIN-2018-43,nya,10096,9997,0.0003\nCC-MAIN-2018-43,oci,57487,57179,0.0019\nCC-MAIN-2018-43,ori,66538,66452,0.0022\nCC-MAIN-2018-43,orm,8101,7969,0.0003\nCC-MAIN-2018-43,pan,96035,95730,0.0032\nCC-MAIN-2018-43,pol,51628822,51107900,1.6973\nCC-MAIN-2018-43,por,59355355,58778355,1.9513\nCC-MAIN-2018-43,pus,67676,67508,0.0022\nCC-MAIN-2018-43,que,15012,14889,0.0005\nCC-MAIN-2018-43,roh,40796,40558,0.0013\nCC-MAIN-2018-43,ron,15881874,15750505,0.5221\nCC-MAIN-2018-43,run,3723,3685,0.0001\nCC-MAIN-2018-43,rus,284290628,282424337,9.3462\nCC-MAIN-2018-43,sag,283,278,0.0000\nCC-MAIN-2018-43,san,54603,54321,0.0018\nCC-MAIN-2018-43,sco,20495,20174,0.0007\nCC-MAIN-2018-43,sin,169147,168594,0.0056\nCC-MAIN-2018-43,slk,7199295,7109809,0.2367\nCC-MAIN-2018-43,slv,2926196,2898321,0.0962\nCC-MAIN-2018-43,smo,7042,6993,0.0002\nCC-MAIN-2018-43,sna,10424,10328,0.0003\nCC-MAIN-2018-43,snd,16195,16144,0.0005\nCC-MAIN-2018-43,som,132377,131814,0.0044\nCC-MAIN-2018-43,sot,7579,7492,0.0002\nCC-MAIN-2018-43,spa,124288219,123042239,4.0860\nCC-MAIN-2018-43,sqi,932811,924019,0.0307\nCC-MAIN-2018-43,srp,4617991,4587795,0.1518\nCC-MAIN-2018-43,ssw,1418,1373,0.0000\nCC-MAIN-2018-43,sun,15334,15280,0.0005\nCC-MAIN-2018-43,sux,99,98,0.0000\nCC-MAIN-2018-43,swa,203285,202092,0.0067\nCC-MAIN-2018-43,swe,22283449,22028674,0.7326\nCC-MAIN-2018-43
,syr,12681,12635,0.0004\nCC-MAIN-2018-43,tam,948012,943318,0.0312\nCC-MAIN-2018-43,tat,169003,168418,0.0056\nCC-MAIN-2018-43,tel,279905,278769,0.0092\nCC-MAIN-2018-43,tgk,97818,97650,0.0032\nCC-MAIN-2018-43,tgl,193991,193200,0.0064\nCC-MAIN-2018-43,tha,8947278,8884873,0.2941\nCC-MAIN-2018-43,tir,18921,18822,0.0006\nCC-MAIN-2018-43,ton,2155,2132,0.0001\nCC-MAIN-2018-43,tsn,8179,8107,0.0003\nCC-MAIN-2018-43,tso,2069,1996,0.0001\nCC-MAIN-2018-43,tuk,26950,26807,0.0009\nCC-MAIN-2018-43,tur,26970950,26701765,0.8867\nCC-MAIN-2018-43,uig,24132,24070,0.0008\nCC-MAIN-2018-43,ukr,12251460,12154920,0.4028\nCC-MAIN-2018-43,urd,658000,655307,0.0216\nCC-MAIN-2018-43,uzb,325374,323814,0.0107\nCC-MAIN-2018-43,ven,640,624,0.0000\nCC-MAIN-2018-43,vie,23250258,23088890,0.7644\nCC-MAIN-2018-43,vol,17298,17132,0.0006\nCC-MAIN-2018-43,war,60876,60358,0.0020\nCC-MAIN-2018-43,wol,3148,3084,0.0001\nCC-MAIN-2018-43,xho,15451,15153,0.0005\nCC-MAIN-2018-43,yid,46708,46381,0.0015\nCC-MAIN-2018-43,yor,10333,10306,0.0003\nCC-MAIN-2018-43,zha,1365,1331,0.0000\nCC-MAIN-2018-43,zho,158122717,157483503,5.1984\nCC-MAIN-2018-43,zul,12063,11993,0.0004\nCC-MAIN-2018-47,<unknown>,87938725,87938725,3.3227\nCC-MAIN-2018-47,aar,4533,4366,0.0002\nCC-MAIN-2018-47,abk,4801,4787,0.0002\nCC-MAIN-2018-47,afr,293729,292148,0.0111\nCC-MAIN-2018-47,aka,1717,1687,0.0001\nCC-MAIN-2018-47,amh,54966,54298,0.0021\nCC-MAIN-2018-47,ara,20668279,20564011,0.7809\nCC-MAIN-2018-47,asm,12560,12365,0.0005\nCC-MAIN-2018-47,aym,2244,2181,0.0001\nCC-MAIN-2018-47,aze,993984,990102,0.0376\nCC-MAIN-2018-47,bak,32668,32638,0.0012\nCC-MAIN-2018-47,bel,358096,355257,0.0135\nCC-MAIN-2018-47,ben,1924862,1917316,0.0727\nCC-MAIN-2018-47,bih,13384,13013,0.0005\nCC-MAIN-2018-47,bis,2932,2786,0.0001\nCC-MAIN-2018-47,blu,19058,18972,0.0007\nCC-MAIN-2018-47,bod,23455,23237,0.0009\nCC-MAIN-2018-47,bos,808370,804597,0.0305\nCC-MAIN-2018-47,bre,32061,31821,0.0012\nCC-MAIN-2018-47,bul,7662594,7588885,0.2895\nCC-MAIN-2018-47,cat,4287581,4235199,0.1620\
nCC-MAIN-2018-47,ceb,29765,29672,0.0011\nCC-MAIN-2018-47,ces,26656758,26325821,1.0072\nCC-MAIN-2018-47,chr,836,832,0.0000\nCC-MAIN-2018-47,cos,37661,37028,0.0014\nCC-MAIN-2018-47,crs,2347,2276,0.0001\nCC-MAIN-2018-47,cym,159670,157898,0.0060\nCC-MAIN-2018-47,dan,10394977,10245791,0.3928\nCC-MAIN-2018-47,deu,132237656,129821485,4.9966\nCC-MAIN-2018-47,div,38065,37947,0.0014\nCC-MAIN-2018-47,dzo,868,860,0.0000\nCC-MAIN-2018-47,ell,12539906,12421211,0.4738\nCC-MAIN-2018-47,eng,1154728121,1137824732,43.6311\nCC-MAIN-2018-47,epo,114207,113272,0.0043\nCC-MAIN-2018-47,est,2790985,2756656,0.1055\nCC-MAIN-2018-47,eus,471820,467623,0.0178\nCC-MAIN-2018-47,fao,62790,62163,0.0024\nCC-MAIN-2018-47,fas,17566335,17418204,0.6637\nCC-MAIN-2018-47,fij,2274,2196,0.0001\nCC-MAIN-2018-47,fin,9796557,9668892,0.3702\nCC-MAIN-2018-47,fra,120054567,118234263,4.5362\nCC-MAIN-2018-47,fry,45998,45413,0.0017\nCC-MAIN-2018-47,gla,40979,40323,0.0015\nCC-MAIN-2018-47,gle,102154,101464,0.0039\nCC-MAIN-2018-47,glg,560122,554207,0.0212\nCC-MAIN-2018-47,glv,8001,7731,0.0003\nCC-MAIN-2018-47,got,655,645,0.0000\nCC-MAIN-2018-47,grn,23622,23085,0.0009\nCC-MAIN-2018-47,guj,217392,216715,0.0082\nCC-MAIN-2018-47,hat,30491,30375,0.0012\nCC-MAIN-2018-47,hau,35059,34613,0.0013\nCC-MAIN-2018-47,haw,8519,8393,0.0003\nCC-MAIN-2018-47,heb,4730177,4651703,0.1787\nCC-MAIN-2018-47,hin,2678015,2656595,0.1012\nCC-MAIN-2018-47,hrv,3829762,3796526,0.1447\nCC-MAIN-2018-47,hun,14106399,13969705,0.5330\nCC-MAIN-2018-47,hye,722051,717478,0.0273\nCC-MAIN-2018-47,ibo,6065,6026,0.0002\nCC-MAIN-2018-47,iku,3824,3794,0.0001\nCC-MAIN-2018-47,ile,10813,10657,0.0004\nCC-MAIN-2018-47,ina,18708,18462,0.0007\nCC-MAIN-2018-47,ind,20444991,20274722,0.7725\nCC-MAIN-2018-47,ipk,2519,2460,0.0001\nCC-MAIN-2018-47,isl,795036,785588,0.0300\nCC-MAIN-2018-47,ita,53898112,53057380,2.0365\nCC-MAIN-2018-47,jav,35740,35618,0.0014\nCC-MAIN-2018-47,jpn,147812347,146337305,5.5851\nCC-MAIN-2018-47,kal,16051,15758,0.0006\nCC-MAIN-2018-47,kan,335130,33445
6,0.0127\nCC-MAIN-2018-47,kas,182,177,0.0000\nCC-MAIN-2018-47,kat,681276,674684,0.0257\nCC-MAIN-2018-47,kaz,427895,424184,0.0162\nCC-MAIN-2018-47,kha,8280,8172,0.0003\nCC-MAIN-2018-47,khm,165802,165064,0.0063\nCC-MAIN-2018-47,kin,44327,44023,0.0017\nCC-MAIN-2018-47,kir,148353,147954,0.0056\nCC-MAIN-2018-47,kor,15393324,15320431,0.5816\nCC-MAIN-2018-47,kur,102722,102494,0.0039\nCC-MAIN-2018-47,lao,74426,74137,0.0028\nCC-MAIN-2018-47,lat,1007319,997169,0.0381\nCC-MAIN-2018-47,lav,1920836,1900469,0.0726\nCC-MAIN-2018-47,lif,184,183,0.0000\nCC-MAIN-2018-47,lin,5412,5310,0.0002\nCC-MAIN-2018-47,lit,3885013,3823705,0.1468\nCC-MAIN-2018-47,ltz,59799,58990,0.0023\nCC-MAIN-2018-47,lug,6394,6337,0.0002\nCC-MAIN-2018-47,mal,609293,607821,0.0230\nCC-MAIN-2018-47,mar,356383,347718,0.0135\nCC-MAIN-2018-47,mfe,3580,3503,0.0001\nCC-MAIN-2018-47,mkd,507318,504270,0.0192\nCC-MAIN-2018-47,mlg,67878,67571,0.0026\nCC-MAIN-2018-47,mlt,55665,55410,0.0021\nCC-MAIN-2018-47,mon,372104,370464,0.0141\nCC-MAIN-2018-47,mri,22025,21789,0.0008\nCC-MAIN-2018-47,msa,2301093,2290620,0.0869\nCC-MAIN-2018-47,mya,257888,257155,0.0097\nCC-MAIN-2018-47,nau,1598,1551,0.0001\nCC-MAIN-2018-47,nep,338290,336900,0.0128\nCC-MAIN-2018-47,nld,39617772,38915836,1.4969\nCC-MAIN-2018-47,nno,334365,330422,0.0126\nCC-MAIN-2018-47,nor,7963150,7859056,0.3009\nCC-MAIN-2018-47,nso,1767,1750,0.0001\nCC-MAIN-2018-47,nya,14260,14163,0.0005\nCC-MAIN-2018-47,oci,51951,51452,0.0020\nCC-MAIN-2018-47,ori,67903,67790,0.0026\nCC-MAIN-2018-47,orm,8087,7970,0.0003\nCC-MAIN-2018-47,pan,111566,110903,0.0042\nCC-MAIN-2018-47,pol,43573234,43123030,1.6464\nCC-MAIN-2018-47,por,52368242,51836029,1.9787\nCC-MAIN-2018-47,pus,94752,94587,0.0036\nCC-MAIN-2018-47,que,8490,8352,0.0003\nCC-MAIN-2018-47,roh,33931,33636,0.0013\nCC-MAIN-2018-47,ron,13786089,13655823,0.5209\nCC-MAIN-2018-47,run,3559,3512,0.0001\nCC-MAIN-2018-47,rus,255272365,253464610,9.6454\nCC-MAIN-2018-47,sag,381,376,0.0000\nCC-MAIN-2018-47,san,62436,62099,0.0024\nCC-MAIN-2018-47,s
co,20218,19899,0.0008\nCC-MAIN-2018-47,sin,157164,156784,0.0059\nCC-MAIN-2018-47,slk,6442141,6355480,0.2434\nCC-MAIN-2018-47,slv,2663991,2637589,0.1007\nCC-MAIN-2018-47,smo,14022,13940,0.0005\nCC-MAIN-2018-47,sna,9350,9266,0.0004\nCC-MAIN-2018-47,snd,41813,41584,0.0016\nCC-MAIN-2018-47,som,124964,124337,0.0047\nCC-MAIN-2018-47,sot,8207,8092,0.0003\nCC-MAIN-2018-47,spa,109715592,108427511,4.1456\nCC-MAIN-2018-47,sqi,841907,836159,0.0318\nCC-MAIN-2018-47,srp,4040837,4004304,0.1527\nCC-MAIN-2018-47,ssw,1303,1237,0.0000\nCC-MAIN-2018-47,sun,15229,15123,0.0006\nCC-MAIN-2018-47,sux,98,98,0.0000\nCC-MAIN-2018-47,swa,157164,156685,0.0059\nCC-MAIN-2018-47,swe,19943091,19701462,0.7535\nCC-MAIN-2018-47,syr,9858,9786,0.0004\nCC-MAIN-2018-47,tam,1251200,1247517,0.0473\nCC-MAIN-2018-47,tat,138341,137429,0.0052\nCC-MAIN-2018-47,tel,432629,430568,0.0163\nCC-MAIN-2018-47,tgk,87700,87583,0.0033\nCC-MAIN-2018-47,tgl,176644,176051,0.0067\nCC-MAIN-2018-47,tha,7860020,7810827,0.2970\nCC-MAIN-2018-47,tir,10048,10025,0.0004\nCC-MAIN-2018-47,ton,2000,1972,0.0001\nCC-MAIN-2018-47,tsn,3405,3330,0.0001\nCC-MAIN-2018-47,tso,2640,2597,0.0001\nCC-MAIN-2018-47,tuk,36209,36003,0.0014\nCC-MAIN-2018-47,tur,24237166,23981899,0.9158\nCC-MAIN-2018-47,uig,18315,18221,0.0007\nCC-MAIN-2018-47,ukr,10580819,10504924,0.3998\nCC-MAIN-2018-47,urd,642550,640794,0.0243\nCC-MAIN-2018-47,uzb,268327,266760,0.0101\nCC-MAIN-2018-47,ven,982,955,0.0000\nCC-MAIN-2018-47,vie,20399254,20233938,0.7708\nCC-MAIN-2018-47,vol,23671,23458,0.0009\nCC-MAIN-2018-47,war,58213,57624,0.0022\nCC-MAIN-2018-47,wol,2915,2831,0.0001\nCC-MAIN-2018-47,xho,12253,11908,0.0005\nCC-MAIN-2018-47,yid,32179,32030,0.0012\nCC-MAIN-2018-47,yor,9801,9762,0.0004\nCC-MAIN-2018-47,zha,1407,1365,0.0001\nCC-MAIN-2018-47,zho,130515854,129869269,4.9315\nCC-MAIN-2018-47,zul,12598,12487,0.0005\nCC-MAIN-2018-51,<unknown>,101049798,101049798,3.1935\nCC-MAIN-2018-51,aar,6992,6858,0.0002\nCC-MAIN-2018-51,abk,5187,5174,0.0002\nCC-MAIN-2018-51,afr,275397,272816,0.008
7\nCC-MAIN-2018-51,aka,1541,1504,0.0000\nCC-MAIN-2018-51,amh,59747,59446,0.0019\nCC-MAIN-2018-51,ara,22453066,22353107,0.7096\nCC-MAIN-2018-51,asm,12596,12325,0.0004\nCC-MAIN-2018-51,aym,4174,4083,0.0001\nCC-MAIN-2018-51,aze,1149739,1145102,0.0363\nCC-MAIN-2018-51,bak,30664,30583,0.0010\nCC-MAIN-2018-51,bel,405228,402359,0.0128\nCC-MAIN-2018-51,ben,1729839,1724421,0.0547\nCC-MAIN-2018-51,bih,15064,14890,0.0005\nCC-MAIN-2018-51,bis,5523,5433,0.0002\nCC-MAIN-2018-51,blu,25825,25768,0.0008\nCC-MAIN-2018-51,bod,38327,38262,0.0012\nCC-MAIN-2018-51,bos,964526,959643,0.0305\nCC-MAIN-2018-51,bre,42077,41818,0.0013\nCC-MAIN-2018-51,bul,8750728,8675970,0.2766\nCC-MAIN-2018-51,cat,5468792,5397284,0.1728\nCC-MAIN-2018-51,ceb,42006,41908,0.0013\nCC-MAIN-2018-51,ces,33459667,33047325,1.0574\nCC-MAIN-2018-51,chr,1520,1519,0.0000\nCC-MAIN-2018-51,cos,51864,51124,0.0016\nCC-MAIN-2018-51,crs,2634,2549,0.0001\nCC-MAIN-2018-51,cym,214791,212365,0.0068\nCC-MAIN-2018-51,dan,12559481,12369741,0.3969\nCC-MAIN-2018-51,deu,171757423,168820088,5.4281\nCC-MAIN-2018-51,div,30921,30734,0.0010\nCC-MAIN-2018-51,dzo,1287,1282,0.0000\nCC-MAIN-2018-51,ell,14700064,14568257,0.4646\nCC-MAIN-2018-51,eng,1394067798,1374809417,44.0568\nCC-MAIN-2018-51,epo,138989,138356,0.0044\nCC-MAIN-2018-51,est,3373001,3330293,0.1066\nCC-MAIN-2018-51,eus,658905,652211,0.0208\nCC-MAIN-2018-51,fao,90072,89304,0.0028\nCC-MAIN-2018-51,fas,21032161,20885569,0.6647\nCC-MAIN-2018-51,fij,2702,2628,0.0001\nCC-MAIN-2018-51,fin,11396463,11226970,0.3602\nCC-MAIN-2018-51,fra,142700548,140771850,4.5098\nCC-MAIN-2018-51,fry,76678,76237,0.0024\nCC-MAIN-2018-51,gla,38950,38492,0.0012\nCC-MAIN-2018-51,gle,121195,120202,0.0038\nCC-MAIN-2018-51,glg,729788,719560,0.0231\nCC-MAIN-2018-51,glv,9388,9055,0.0003\nCC-MAIN-2018-51,got,582,582,0.0000\nCC-MAIN-2018-51,grn,19956,19553,0.0006\nCC-MAIN-2018-51,guj,197872,197032,0.0063\nCC-MAIN-2018-51,hat,44925,44829,0.0014\nCC-MAIN-2018-51,hau,43910,43518,0.0014\nCC-MAIN-2018-51,haw,10667,10510,0.0003
\nCC-MAIN-2018-51,heb,5341664,5256397,0.1688\nCC-MAIN-2018-51,hin,2588852,2569889,0.0818\nCC-MAIN-2018-51,hrv,4558445,4524120,0.1441\nCC-MAIN-2018-51,hun,16117907,15968310,0.5094\nCC-MAIN-2018-51,hye,782785,778512,0.0247\nCC-MAIN-2018-51,ibo,5167,5135,0.0002\nCC-MAIN-2018-51,iku,5162,5119,0.0002\nCC-MAIN-2018-51,ile,11003,10789,0.0003\nCC-MAIN-2018-51,ina,21037,20737,0.0007\nCC-MAIN-2018-51,ind,22958101,22783179,0.7255\nCC-MAIN-2018-51,ipk,2300,2274,0.0001\nCC-MAIN-2018-51,isl,917178,906849,0.0290\nCC-MAIN-2018-51,ita,68072953,67118124,2.1513\nCC-MAIN-2018-51,jav,39729,39462,0.0013\nCC-MAIN-2018-51,jpn,170080108,168634995,5.3751\nCC-MAIN-2018-51,kal,21269,20919,0.0007\nCC-MAIN-2018-51,kan,232344,231416,0.0073\nCC-MAIN-2018-51,kas,38,36,0.0000\nCC-MAIN-2018-51,kat,979221,972548,0.0309\nCC-MAIN-2018-51,kaz,442122,440137,0.0140\nCC-MAIN-2018-51,kha,10597,10449,0.0003\nCC-MAIN-2018-51,khm,164425,163878,0.0052\nCC-MAIN-2018-51,kin,50182,49708,0.0016\nCC-MAIN-2018-51,kir,109071,108764,0.0034\nCC-MAIN-2018-51,kor,18735338,18646657,0.5921\nCC-MAIN-2018-51,kur,136990,136536,0.0043\nCC-MAIN-2018-51,lao,74237,74006,0.0023\nCC-MAIN-2018-51,lat,1225355,1210880,0.0387\nCC-MAIN-2018-51,lav,2478010,2451429,0.0783\nCC-MAIN-2018-51,lif,189,189,0.0000\nCC-MAIN-2018-51,lin,5636,5503,0.0002\nCC-MAIN-2018-51,lit,4473120,4408691,0.1414\nCC-MAIN-2018-51,ltz,70272,69190,0.0022\nCC-MAIN-2018-51,lug,3835,3693,0.0001\nCC-MAIN-2018-51,mal,410247,408583,0.0130\nCC-MAIN-2018-51,mar,270763,268289,0.0086\nCC-MAIN-2018-51,mfe,3762,3683,0.0001\nCC-MAIN-2018-51,mkd,568511,564800,0.0180\nCC-MAIN-2018-51,mlg,63523,63214,0.0020\nCC-MAIN-2018-51,mlt,59421,58967,0.0019\nCC-MAIN-2018-51,mon,399731,394715,0.0126\nCC-MAIN-2018-51,mri,16633,16265,0.0005\nCC-MAIN-2018-51,msa,2751134,2734914,0.0869\nCC-MAIN-2018-51,mya,260809,260105,0.0082\nCC-MAIN-2018-51,nau,2054,2007,0.0001\nCC-MAIN-2018-51,nep,386403,384940,0.0122\nCC-MAIN-2018-51,nld,51750681,50795973,1.6355\nCC-MAIN-2018-51,nno,421570,415173,0.0133\nCC-MAI
N-2018-51,nor,9441579,9320501,0.2984\nCC-MAIN-2018-51,nso,13775,13753,0.0004\nCC-MAIN-2018-51,nya,9408,9297,0.0003\nCC-MAIN-2018-51,oci,61649,60933,0.0019\nCC-MAIN-2018-51,ori,70061,70007,0.0022\nCC-MAIN-2018-51,orm,10587,10399,0.0003\nCC-MAIN-2018-51,pan,97136,96820,0.0031\nCC-MAIN-2018-51,pol,52810863,52254731,1.6690\nCC-MAIN-2018-51,por,62632790,62008236,1.9794\nCC-MAIN-2018-51,pus,66481,66222,0.0021\nCC-MAIN-2018-51,que,25854,25687,0.0008\nCC-MAIN-2018-51,roh,42152,41786,0.0013\nCC-MAIN-2018-51,ron,16352239,16209726,0.5168\nCC-MAIN-2018-51,run,3943,3887,0.0001\nCC-MAIN-2018-51,rus,283481265,281641787,8.9589\nCC-MAIN-2018-51,sag,712,707,0.0000\nCC-MAIN-2018-51,san,65734,65407,0.0021\nCC-MAIN-2018-51,sco,25132,24698,0.0008\nCC-MAIN-2018-51,sin,167001,166172,0.0053\nCC-MAIN-2018-51,slk,8231472,8130369,0.2601\nCC-MAIN-2018-51,slv,3195058,3159468,0.1010\nCC-MAIN-2018-51,smo,8633,8540,0.0003\nCC-MAIN-2018-51,sna,9862,9767,0.0003\nCC-MAIN-2018-51,snd,15895,15837,0.0005\nCC-MAIN-2018-51,som,132969,132417,0.0042\nCC-MAIN-2018-51,sot,8108,7982,0.0003\nCC-MAIN-2018-51,spa,130579509,129119778,4.1267\nCC-MAIN-2018-51,sqi,878582,870689,0.0278\nCC-MAIN-2018-51,srp,4803731,4760057,0.1518\nCC-MAIN-2018-51,ssw,3035,2974,0.0001\nCC-MAIN-2018-51,sun,19109,19033,0.0006\nCC-MAIN-2018-51,sux,142,142,0.0000\nCC-MAIN-2018-51,swa,227062,225776,0.0072\nCC-MAIN-2018-51,swe,23893466,23598466,0.7551\nCC-MAIN-2018-51,syr,12541,12456,0.0004\nCC-MAIN-2018-51,tam,943157,937890,0.0298\nCC-MAIN-2018-51,tat,197963,197286,0.0063\nCC-MAIN-2018-51,tel,285466,284560,0.0090\nCC-MAIN-2018-51,tgk,113893,113758,0.0036\nCC-MAIN-2018-51,tgl,217071,216561,0.0069\nCC-MAIN-2018-51,tha,9065937,9000602,0.2865\nCC-MAIN-2018-51,tir,14878,14839,0.0005\nCC-MAIN-2018-51,ton,2327,2293,0.0001\nCC-MAIN-2018-51,tsn,24884,24796,0.0008\nCC-MAIN-2018-51,tso,3531,3464,0.0001\nCC-MAIN-2018-51,tuk,28504,28311,0.0009\nCC-MAIN-2018-51,tur,27553326,27281904,0.8708\nCC-MAIN-2018-51,uig,25002,24877,0.0008\nCC-MAIN-2018-51,ukr,122024
32,12122676,0.3856\nCC-MAIN-2018-51,urd,744204,741698,0.0235\nCC-MAIN-2018-51,uzb,312391,311110,0.0099\nCC-MAIN-2018-51,ven,1762,1732,0.0001\nCC-MAIN-2018-51,vie,22967366,22812746,0.7258\nCC-MAIN-2018-51,vol,18192,17957,0.0006\nCC-MAIN-2018-51,war,75145,74423,0.0024\nCC-MAIN-2018-51,wol,3459,3354,0.0001\nCC-MAIN-2018-51,xho,29520,29189,0.0009\nCC-MAIN-2018-51,yid,38237,38126,0.0012\nCC-MAIN-2018-51,yor,10741,10682,0.0003\nCC-MAIN-2018-51,zha,1529,1489,0.0000\nCC-MAIN-2018-51,zho,163796048,162978648,5.1765\nCC-MAIN-2018-51,zul,22213,22109,0.0007\nCC-MAIN-2019-04,<unknown>,84023781,84023781,2.9077\nCC-MAIN-2019-04,aar,4461,4371,0.0002\nCC-MAIN-2019-04,abk,5135,5129,0.0002\nCC-MAIN-2019-04,afr,271244,270003,0.0094\nCC-MAIN-2019-04,aka,1003,977,0.0000\nCC-MAIN-2019-04,amh,62222,61834,0.0022\nCC-MAIN-2019-04,ara,22019160,21908605,0.7620\nCC-MAIN-2019-04,asm,18416,18304,0.0006\nCC-MAIN-2019-04,aym,2484,2415,0.0001\nCC-MAIN-2019-04,aze,1090643,1085625,0.0377\nCC-MAIN-2019-04,bak,25632,25593,0.0009\nCC-MAIN-2019-04,bel,481995,480891,0.0167\nCC-MAIN-2019-04,ben,1861325,1854711,0.0644\nCC-MAIN-2019-04,bih,13334,13303,0.0005\nCC-MAIN-2019-04,bis,3242,3171,0.0001\nCC-MAIN-2019-04,blu,29812,29761,0.0010\nCC-MAIN-2019-04,bod,27662,27591,0.0010\nCC-MAIN-2019-04,bos,947495,944021,0.0328\nCC-MAIN-2019-04,bre,35007,34841,0.0012\nCC-MAIN-2019-04,bul,8255118,8202713,0.2857\nCC-MAIN-2019-04,cat,5039715,4991844,0.1744\nCC-MAIN-2019-04,ceb,33742,33648,0.0012\nCC-MAIN-2019-04,ces,30434242,30182751,1.0532\nCC-MAIN-2019-04,chr,949,948,0.0000\nCC-MAIN-2019-04,cos,45782,45279,0.0016\nCC-MAIN-2019-04,crs,1945,1886,0.0001\nCC-MAIN-2019-04,cym,188427,186266,0.0065\nCC-MAIN-2019-04,dan,11688576,11564933,0.4045\nCC-MAIN-2019-04,deu,157897489,156095482,5.4641\nCC-MAIN-2019-04,div,39471,39192,0.0014\nCC-MAIN-2019-04,dzo,1425,1422,0.0000\nCC-MAIN-2019-04,ell,14365850,14268772,0.4971\nCC-MAIN-2019-04,eng,1261630435,1247295383,43.6592\nCC-MAIN-2019-04,epo,115956,115449,0.0040\nCC-MAIN-2019-04,est,320615
1,3176103,0.1109\nCC-MAIN-2019-04,eus,605927,601315,0.0210\nCC-MAIN-2019-04,fao,78069,77547,0.0027\nCC-MAIN-2019-04,fas,20492650,20360834,0.7092\nCC-MAIN-2019-04,fij,2048,1976,0.0001\nCC-MAIN-2019-04,fin,11125710,10997726,0.3850\nCC-MAIN-2019-04,fra,135009344,133645038,4.6720\nCC-MAIN-2019-04,fry,51626,51156,0.0018\nCC-MAIN-2019-04,gla,33340,32955,0.0012\nCC-MAIN-2019-04,gle,110221,109497,0.0038\nCC-MAIN-2019-04,glg,655155,650138,0.0227\nCC-MAIN-2019-04,glv,13533,13282,0.0005\nCC-MAIN-2019-04,got,408,407,0.0000\nCC-MAIN-2019-04,grn,15205,14958,0.0005\nCC-MAIN-2019-04,guj,202086,200143,0.0070\nCC-MAIN-2019-04,hat,41975,41889,0.0015\nCC-MAIN-2019-04,hau,32074,31841,0.0011\nCC-MAIN-2019-04,haw,8160,8063,0.0003\nCC-MAIN-2019-04,heb,5525237,5448106,0.1912\nCC-MAIN-2019-04,hin,2787484,2770363,0.0965\nCC-MAIN-2019-04,hrv,4370790,4342231,0.1513\nCC-MAIN-2019-04,hun,15400963,15292794,0.5330\nCC-MAIN-2019-04,hye,750220,746756,0.0260\nCC-MAIN-2019-04,ibo,6759,6725,0.0002\nCC-MAIN-2019-04,iku,4011,3956,0.0001\nCC-MAIN-2019-04,ile,9466,9349,0.0003\nCC-MAIN-2019-04,ina,20074,19882,0.0007\nCC-MAIN-2019-04,ind,22316326,22115139,0.7723\nCC-MAIN-2019-04,ipk,3398,3291,0.0001\nCC-MAIN-2019-04,isl,854569,844165,0.0296\nCC-MAIN-2019-04,ita,64132863,63525797,2.2193\nCC-MAIN-2019-04,jav,25703,25603,0.0009\nCC-MAIN-2019-04,jpn,150258880,149164371,5.1998\nCC-MAIN-2019-04,kal,16070,15695,0.0006\nCC-MAIN-2019-04,kan,260694,259206,0.0090\nCC-MAIN-2019-04,kas,108,106,0.0000\nCC-MAIN-2019-04,kat,776919,772951,0.0269\nCC-MAIN-2019-04,kaz,451909,449588,0.0156\nCC-MAIN-2019-04,kha,6330,6199,0.0002\nCC-MAIN-2019-04,khm,170181,169542,0.0059\nCC-MAIN-2019-04,kin,44887,44563,0.0016\nCC-MAIN-2019-04,kir,136533,136312,0.0047\nCC-MAIN-2019-04,kor,18239723,18137186,0.6312\nCC-MAIN-2019-04,kur,134087,133642,0.0046\nCC-MAIN-2019-04,lao,74728,73622,0.0026\nCC-MAIN-2019-04,lat,1088474,1081353,0.0377\nCC-MAIN-2019-04,lav,2251308,2230257,0.0779\nCC-MAIN-2019-04,lif,172,164,0.0000\nCC-MAIN-2019-04,lin,4644,4541,0.
0002\nCC-MAIN-2019-04,lit,4203112,4160229,0.1455\nCC-MAIN-2019-04,ltz,64257,63455,0.0022\nCC-MAIN-2019-04,lug,5973,5920,0.0002\nCC-MAIN-2019-04,mal,516351,513982,0.0179\nCC-MAIN-2019-04,mar,323873,321606,0.0112\nCC-MAIN-2019-04,mfe,2658,2552,0.0001\nCC-MAIN-2019-04,mkd,563573,561158,0.0195\nCC-MAIN-2019-04,mlg,61277,60391,0.0021\nCC-MAIN-2019-04,mlt,64811,64600,0.0022\nCC-MAIN-2019-04,mon,426512,422233,0.0148\nCC-MAIN-2019-04,mri,18487,18109,0.0006\nCC-MAIN-2019-04,msa,2675105,2658527,0.0926\nCC-MAIN-2019-04,mya,273644,272478,0.0095\nCC-MAIN-2019-04,nau,1095,1060,0.0000\nCC-MAIN-2019-04,nep,391538,390520,0.0135\nCC-MAIN-2019-04,nld,48931563,48343220,1.6933\nCC-MAIN-2019-04,nno,376293,372640,0.0130\nCC-MAIN-2019-04,nor,8765650,8682060,0.3033\nCC-MAIN-2019-04,nso,4462,4447,0.0002\nCC-MAIN-2019-04,nya,8536,8451,0.0003\nCC-MAIN-2019-04,oci,53938,53639,0.0019\nCC-MAIN-2019-04,ori,70584,70535,0.0024\nCC-MAIN-2019-04,orm,9151,9025,0.0003\nCC-MAIN-2019-04,pan,112520,112266,0.0039\nCC-MAIN-2019-04,pol,50838289,50416172,1.7593\nCC-MAIN-2019-04,por,60013787,59509590,2.0768\nCC-MAIN-2019-04,pus,81925,81540,0.0028\nCC-MAIN-2019-04,que,14735,14621,0.0005\nCC-MAIN-2019-04,roh,39953,39685,0.0014\nCC-MAIN-2019-04,ron,15812114,15710776,0.5472\nCC-MAIN-2019-04,run,3055,3020,0.0001\nCC-MAIN-2019-04,rus,252592014,251146147,8.7410\nCC-MAIN-2019-04,sag,327,322,0.0000\nCC-MAIN-2019-04,san,60631,58774,0.0021\nCC-MAIN-2019-04,sco,19680,19359,0.0007\nCC-MAIN-2019-04,sin,178614,178033,0.0062\nCC-MAIN-2019-04,slk,8008639,7938349,0.2771\nCC-MAIN-2019-04,slv,3137831,3112349,0.1086\nCC-MAIN-2019-04,smo,11126,11047,0.0004\nCC-MAIN-2019-04,sna,10460,10399,0.0004\nCC-MAIN-2019-04,snd,21462,21442,0.0007\nCC-MAIN-2019-04,som,135383,134967,0.0047\nCC-MAIN-2019-04,sot,8537,8451,0.0003\nCC-MAIN-2019-04,spa,124236357,123134957,4.2992\nCC-MAIN-2019-04,sqi,919585,916269,0.0318\nCC-MAIN-2019-04,srp,4592038,4563898,0.1589\nCC-MAIN-2019-04,ssw,2364,2323,0.0001\nCC-MAIN-2019-04,sun,16231,16165,0.0006\nCC-MAIN-20
19-04,sux,81,81,0.0000\nCC-MAIN-2019-04,swa,187625,186975,0.0065\nCC-MAIN-2019-04,swe,22570856,22367582,0.7811\nCC-MAIN-2019-04,syr,12629,12457,0.0004\nCC-MAIN-2019-04,tam,1142995,1138136,0.0396\nCC-MAIN-2019-04,tat,143824,143426,0.0050\nCC-MAIN-2019-04,tel,339096,337551,0.0117\nCC-MAIN-2019-04,tgk,102134,101967,0.0035\nCC-MAIN-2019-04,tgl,184448,184049,0.0064\nCC-MAIN-2019-04,tha,8982275,8925311,0.3108\nCC-MAIN-2019-04,tir,11704,11675,0.0004\nCC-MAIN-2019-04,ton,1592,1567,0.0001\nCC-MAIN-2019-04,tsn,8351,8297,0.0003\nCC-MAIN-2019-04,tso,2987,2950,0.0001\nCC-MAIN-2019-04,tuk,31072,30917,0.0011\nCC-MAIN-2019-04,tur,26490733,26228193,0.9167\nCC-MAIN-2019-04,uig,18488,18431,0.0006\nCC-MAIN-2019-04,ukr,10974360,10905799,0.3798\nCC-MAIN-2019-04,urd,640313,636304,0.0222\nCC-MAIN-2019-04,uzb,302312,300868,0.0105\nCC-MAIN-2019-04,ven,1533,1517,0.0001\nCC-MAIN-2019-04,vie,22537844,22400399,0.7799\nCC-MAIN-2019-04,vol,13875,13707,0.0005\nCC-MAIN-2019-04,war,63248,62821,0.0022\nCC-MAIN-2019-04,wol,4204,4144,0.0001\nCC-MAIN-2019-04,xho,18732,18461,0.0006\nCC-MAIN-2019-04,yid,35625,35574,0.0012\nCC-MAIN-2019-04,yor,9988,9953,0.0003\nCC-MAIN-2019-04,zha,1423,1380,0.0000\nCC-MAIN-2019-04,zho,143722702,143003949,4.9736\nCC-MAIN-2019-04,zul,19126,19015,0.0007\nCC-MAIN-2019-09,<unknown>,104159947,104159947,3.5748\nCC-MAIN-2019-09,aar,6787,6687,0.0002\nCC-MAIN-2019-09,abk,5867,5862,0.0002\nCC-MAIN-2019-09,afr,261126,259648,0.0090\nCC-MAIN-2019-09,aka,2285,1990,0.0001\nCC-MAIN-2019-09,amh,55800,55173,0.0019\nCC-MAIN-2019-09,ara,16518534,16407338,0.5669\nCC-MAIN-2019-09,asm,14183,14118,0.0005\nCC-MAIN-2019-09,aym,4151,3931,0.0001\nCC-MAIN-2019-09,aze,1124673,1120192,0.0386\nCC-MAIN-2019-09,bak,30907,30844,0.0011\nCC-MAIN-2019-09,bel,373872,372883,0.0128\nCC-MAIN-2019-09,ben,1833215,1813167,0.0629\nCC-MAIN-2019-09,bih,13913,13841,0.0005\nCC-MAIN-2019-09,bis,4330,4246,0.0001\nCC-MAIN-2019-09,blu,21463,21337,0.0007\nCC-MAIN-2019-09,bod,37213,36935,0.0013\nCC-MAIN-2019-09,bos,902944,898962,
0.0310\nCC-MAIN-2019-09,bre,40415,40186,0.0014\nCC-MAIN-2019-09,bul,7636776,7584997,0.2621\nCC-MAIN-2019-09,cat,5322176,5268685,0.1827\nCC-MAIN-2019-09,ceb,26742,26611,0.0009\nCC-MAIN-2019-09,ces,31239927,30935489,1.0722\nCC-MAIN-2019-09,chr,886,883,0.0000\nCC-MAIN-2019-09,cos,48720,48272,0.0017\nCC-MAIN-2019-09,crs,2904,2845,0.0001\nCC-MAIN-2019-09,cym,197839,195915,0.0068\nCC-MAIN-2019-09,dan,12393961,12253160,0.4254\nCC-MAIN-2019-09,deu,165522495,163616824,5.6808\nCC-MAIN-2019-09,div,34351,34271,0.0012\nCC-MAIN-2019-09,dzo,1329,1323,0.0000\nCC-MAIN-2019-09,ell,14212728,14110142,0.4878\nCC-MAIN-2019-09,eng,1257255357,1242094925,43.1493\nCC-MAIN-2019-09,epo,125376,124748,0.0043\nCC-MAIN-2019-09,est,3124198,3089967,0.1072\nCC-MAIN-2019-09,eus,671567,665178,0.0230\nCC-MAIN-2019-09,fao,91800,90935,0.0032\nCC-MAIN-2019-09,fas,17676199,17542166,0.6067\nCC-MAIN-2019-09,fij,2703,2641,0.0001\nCC-MAIN-2019-09,fin,10579294,10448208,0.3631\nCC-MAIN-2019-09,fra,134005589,132563077,4.5991\nCC-MAIN-2019-09,fry,51181,50306,0.0018\nCC-MAIN-2019-09,gla,46881,46283,0.0016\nCC-MAIN-2019-09,gle,106249,105649,0.0036\nCC-MAIN-2019-09,glg,690211,685516,0.0237\nCC-MAIN-2019-09,glv,10003,9576,0.0003\nCC-MAIN-2019-09,got,374,374,0.0000\nCC-MAIN-2019-09,grn,22415,22204,0.0008\nCC-MAIN-2019-09,guj,201343,198993,0.0069\nCC-MAIN-2019-09,hat,34582,34510,0.0012\nCC-MAIN-2019-09,hau,34322,34125,0.0012\nCC-MAIN-2019-09,haw,10115,10034,0.0003\nCC-MAIN-2019-09,heb,5695219,5611221,0.1955\nCC-MAIN-2019-09,hin,2647191,2629788,0.0909\nCC-MAIN-2019-09,hrv,4415480,4386478,0.1515\nCC-MAIN-2019-09,hun,14930074,14808234,0.5124\nCC-MAIN-2019-09,hye,796318,792198,0.0273\nCC-MAIN-2019-09,ibo,4341,4327,0.0001\nCC-MAIN-2019-09,iku,4707,4667,0.0002\nCC-MAIN-2019-09,ile,10970,10849,0.0004\nCC-MAIN-2019-09,ina,18997,18794,0.0007\nCC-MAIN-2019-09,ind,22375932,22193292,0.7679\nCC-MAIN-2019-09,ipk,2426,2394,0.0001\nCC-MAIN-2019-09,isl,896392,888217,0.0308\nCC-MAIN-2019-09,ita,67382711,66741425,2.3126\nCC-MAIN-2019-09,ja
v,33397,33286,0.0011\nCC-MAIN-2019-09,jpn,153253941,152258335,5.2597\nCC-MAIN-2019-09,kal,23814,23517,0.0008\nCC-MAIN-2019-09,kan,222004,220480,0.0076\nCC-MAIN-2019-09,kas,147,145,0.0000\nCC-MAIN-2019-09,kat,908984,903623,0.0312\nCC-MAIN-2019-09,kaz,455525,453080,0.0156\nCC-MAIN-2019-09,kha,8176,8071,0.0003\nCC-MAIN-2019-09,khm,187166,186074,0.0064\nCC-MAIN-2019-09,kin,53394,52861,0.0018\nCC-MAIN-2019-09,kir,108414,107842,0.0037\nCC-MAIN-2019-09,kor,19672830,19398122,0.6752\nCC-MAIN-2019-09,kur,137523,136946,0.0047\nCC-MAIN-2019-09,lao,66052,65774,0.0023\nCC-MAIN-2019-09,lat,1339699,1331260,0.0460\nCC-MAIN-2019-09,lav,2424232,2403536,0.0832\nCC-MAIN-2019-09,lif,102,99,0.0000\nCC-MAIN-2019-09,lin,5299,5121,0.0002\nCC-MAIN-2019-09,lit,4051070,4017609,0.1390\nCC-MAIN-2019-09,ltz,75679,74887,0.0026\nCC-MAIN-2019-09,lug,6666,6606,0.0002\nCC-MAIN-2019-09,mal,512418,510027,0.0176\nCC-MAIN-2019-09,mar,301201,299494,0.0103\nCC-MAIN-2019-09,mfe,3505,3453,0.0001\nCC-MAIN-2019-09,mkd,603130,599421,0.0207\nCC-MAIN-2019-09,mlg,55769,54981,0.0019\nCC-MAIN-2019-09,mlt,57687,57464,0.0020\nCC-MAIN-2019-09,mon,388396,386275,0.0133\nCC-MAIN-2019-09,mri,16895,16505,0.0006\nCC-MAIN-2019-09,msa,2316962,2303759,0.0795\nCC-MAIN-2019-09,mya,249669,248874,0.0086\nCC-MAIN-2019-09,nau,1422,1383,0.0000\nCC-MAIN-2019-09,nep,412024,409997,0.0141\nCC-MAIN-2019-09,nld,50691873,50042293,1.7398\nCC-MAIN-2019-09,nno,414433,408925,0.0142\nCC-MAIN-2019-09,nor,8926612,8830688,0.3064\nCC-MAIN-2019-09,nso,1989,1976,0.0001\nCC-MAIN-2019-09,nya,8453,8371,0.0003\nCC-MAIN-2019-09,oci,59220,58108,0.0020\nCC-MAIN-2019-09,ori,76488,75804,0.0026\nCC-MAIN-2019-09,orm,10334,10116,0.0004\nCC-MAIN-2019-09,pan,116135,114670,0.0040\nCC-MAIN-2019-09,pol,49895840,49488417,1.7124\nCC-MAIN-2019-09,por,57708722,57232264,1.9806\nCC-MAIN-2019-09,pus,85185,84815,0.0029\nCC-MAIN-2019-09,que,10079,9966,0.0003\nCC-MAIN-2019-09,roh,40558,40131,0.0014\nCC-MAIN-2019-09,ron,15519822,15402751,0.5326\nCC-MAIN-2019-09,run,4005,3967,0.0001
\nCC-MAIN-2019-09,rus,250143382,248453629,8.5850\nCC-MAIN-2019-09,sag,978,973,0.0000\nCC-MAIN-2019-09,san,64458,64101,0.0022\nCC-MAIN-2019-09,sco,23792,23517,0.0008\nCC-MAIN-2019-09,sin,177247,176386,0.0061\nCC-MAIN-2019-09,slk,8097406,8024389,0.2779\nCC-MAIN-2019-09,slv,3242552,3214142,0.1113\nCC-MAIN-2019-09,smo,9614,9553,0.0003\nCC-MAIN-2019-09,sna,8022,7944,0.0003\nCC-MAIN-2019-09,snd,24732,21920,0.0008\nCC-MAIN-2019-09,som,144227,143765,0.0049\nCC-MAIN-2019-09,sot,6763,6676,0.0002\nCC-MAIN-2019-09,spa,121644988,120522909,4.1749\nCC-MAIN-2019-09,sqi,887157,882495,0.0304\nCC-MAIN-2019-09,srp,4842388,4806920,0.1662\nCC-MAIN-2019-09,ssw,2162,2115,0.0001\nCC-MAIN-2019-09,sun,16336,16141,0.0006\nCC-MAIN-2019-09,sux,117,116,0.0000\nCC-MAIN-2019-09,swa,180072,178515,0.0062\nCC-MAIN-2019-09,swe,22327984,22095586,0.7663\nCC-MAIN-2019-09,syr,13576,13521,0.0005\nCC-MAIN-2019-09,tam,1042166,1036812,0.0358\nCC-MAIN-2019-09,tat,158125,157636,0.0054\nCC-MAIN-2019-09,tel,357135,355636,0.0123\nCC-MAIN-2019-09,tgk,98021,97827,0.0034\nCC-MAIN-2019-09,tgl,173038,172408,0.0059\nCC-MAIN-2019-09,tha,8831222,8776560,0.3031\nCC-MAIN-2019-09,tir,15114,15000,0.0005\nCC-MAIN-2019-09,ton,2303,2287,0.0001\nCC-MAIN-2019-09,tsn,4020,3970,0.0001\nCC-MAIN-2019-09,tso,2444,2403,0.0001\nCC-MAIN-2019-09,tuk,34580,34438,0.0012\nCC-MAIN-2019-09,tur,26206309,25963531,0.8994\nCC-MAIN-2019-09,uig,24465,24329,0.0008\nCC-MAIN-2019-09,ukr,11227085,11144157,0.3853\nCC-MAIN-2019-09,urd,563004,559388,0.0193\nCC-MAIN-2019-09,uzb,324100,322896,0.0111\nCC-MAIN-2019-09,ven,1496,1473,0.0001\nCC-MAIN-2019-09,vie,21591514,21466343,0.7410\nCC-MAIN-2019-09,vol,14607,14433,0.0005\nCC-MAIN-2019-09,war,69042,68558,0.0024\nCC-MAIN-2019-09,wol,3403,3340,0.0001\nCC-MAIN-2019-09,xho,11985,11755,0.0004\nCC-MAIN-2019-09,yid,35338,35201,0.0012\nCC-MAIN-2019-09,yor,8426,8407,0.0003\nCC-MAIN-2019-09,zha,1392,1362,0.0000\nCC-MAIN-2019-09,zho,153566522,152968363,5.2704\nCC-MAIN-2019-09,zul,12697,12613,0.0004\nCC-MAIN-2019-13,<unkno
wn>,78140100,78140100,3.0408\nCC-MAIN-2019-13,aar,6344,6289,0.0002\nCC-MAIN-2019-13,abk,3133,3124,0.0001\nCC-MAIN-2019-13,afr,232763,231628,0.0091\nCC-MAIN-2019-13,aka,2617,2587,0.0001\nCC-MAIN-2019-13,amh,50549,50241,0.0020\nCC-MAIN-2019-13,ara,13906571,13819108,0.5412\nCC-MAIN-2019-13,asm,16500,16468,0.0006\nCC-MAIN-2019-13,aym,1854,1827,0.0001\nCC-MAIN-2019-13,aze,925916,921259,0.0360\nCC-MAIN-2019-13,bak,18810,18793,0.0007\nCC-MAIN-2019-13,bel,294131,293093,0.0114\nCC-MAIN-2019-13,ben,1369029,1362342,0.0533\nCC-MAIN-2019-13,bih,11139,11048,0.0004\nCC-MAIN-2019-13,bis,3211,3120,0.0001\nCC-MAIN-2019-13,blu,12665,12649,0.0005\nCC-MAIN-2019-13,bod,26047,25978,0.0010\nCC-MAIN-2019-13,bos,778387,772137,0.0303\nCC-MAIN-2019-13,bre,29557,29386,0.0012\nCC-MAIN-2019-13,bul,6546870,6495873,0.2548\nCC-MAIN-2019-13,cat,4711245,4662605,0.1833\nCC-MAIN-2019-13,ceb,20211,20181,0.0008\nCC-MAIN-2019-13,ces,27426608,27152340,1.0673\nCC-MAIN-2019-13,chr,673,673,0.0000\nCC-MAIN-2019-13,cos,36711,36425,0.0014\nCC-MAIN-2019-13,crs,2485,2456,0.0001\nCC-MAIN-2019-13,cym,168809,166938,0.0066\nCC-MAIN-2019-13,dan,10855848,10726275,0.4225\nCC-MAIN-2019-13,deu,146479255,144653258,5.7003\nCC-MAIN-2019-13,div,28337,28275,0.0011\nCC-MAIN-2019-13,dzo,884,879,0.0000\nCC-MAIN-2019-13,ell,12629590,12543850,0.4915\nCC-MAIN-2019-13,eng,1116378406,1102436383,43.4442\nCC-MAIN-2019-13,epo,103889,103539,0.0040\nCC-MAIN-2019-13,est,2717261,2687017,0.1057\nCC-MAIN-2019-13,eus,568631,563345,0.0221\nCC-MAIN-2019-13,fao,77242,76860,0.0030\nCC-MAIN-2019-13,fas,15380578,15264531,0.5985\nCC-MAIN-2019-13,fij,2206,2177,0.0001\nCC-MAIN-2019-13,fin,9193809,9073630,0.3578\nCC-MAIN-2019-13,fra,120134058,118802639,4.6751\nCC-MAIN-2019-13,fry,44584,44298,0.0017\nCC-MAIN-2019-13,gla,42559,42391,0.0017\nCC-MAIN-2019-13,gle,93025,92123,0.0036\nCC-MAIN-2019-13,glg,617835,612496,0.0240\nCC-MAIN-2019-13,glv,6315,6212,0.0002\nCC-MAIN-2019-13,got,259,258,0.0000\nCC-MAIN-2019-13,grn,17019,16758,0.0007\nCC-MAIN-2019-13,guj,17258
8,171521,0.0067\nCC-MAIN-2019-13,hat,24749,24688,0.0010\nCC-MAIN-2019-13,hau,40995,40825,0.0016\nCC-MAIN-2019-13,haw,6648,6607,0.0003\nCC-MAIN-2019-13,heb,5137262,5067042,0.1999\nCC-MAIN-2019-13,hin,2247449,2233597,0.0875\nCC-MAIN-2019-13,hrv,3911576,3883495,0.1522\nCC-MAIN-2019-13,hun,13032075,12927914,0.5071\nCC-MAIN-2019-13,hye,636163,633230,0.0248\nCC-MAIN-2019-13,ibo,4553,4541,0.0002\nCC-MAIN-2019-13,iku,5062,4984,0.0002\nCC-MAIN-2019-13,ile,8409,8350,0.0003\nCC-MAIN-2019-13,ina,16030,15926,0.0006\nCC-MAIN-2019-13,ind,18516052,18378744,0.7206\nCC-MAIN-2019-13,ipk,2242,2182,0.0001\nCC-MAIN-2019-13,isl,793865,786996,0.0309\nCC-MAIN-2019-13,ita,60630732,60003305,2.3595\nCC-MAIN-2019-13,jav,24734,24681,0.0010\nCC-MAIN-2019-13,jpn,131044910,130118271,5.0997\nCC-MAIN-2019-13,kal,18745,18453,0.0007\nCC-MAIN-2019-13,kan,173416,173028,0.0067\nCC-MAIN-2019-13,kas,97,95,0.0000\nCC-MAIN-2019-13,kat,724381,719725,0.0282\nCC-MAIN-2019-13,kaz,406799,404454,0.0158\nCC-MAIN-2019-13,kha,6158,6117,0.0002\nCC-MAIN-2019-13,khm,153218,152633,0.0060\nCC-MAIN-2019-13,kin,50959,50781,0.0020\nCC-MAIN-2019-13,kir,86962,86369,0.0034\nCC-MAIN-2019-13,kor,15425958,15350196,0.6003\nCC-MAIN-2019-13,kur,122797,122412,0.0048\nCC-MAIN-2019-13,lao,62871,62754,0.0024\nCC-MAIN-2019-13,lat,1244446,1235715,0.0484\nCC-MAIN-2019-13,lav,2089694,2067269,0.0813\nCC-MAIN-2019-13,lif,86,82,0.0000\nCC-MAIN-2019-13,lin,5221,5071,0.0002\nCC-MAIN-2019-13,lit,3573041,3539370,0.1390\nCC-MAIN-2019-13,ltz,60461,59689,0.0024\nCC-MAIN-2019-13,lug,5196,5158,0.0002\nCC-MAIN-2019-13,mal,375160,372966,0.0146\nCC-MAIN-2019-13,mar,253131,252083,0.0099\nCC-MAIN-2019-13,mfe,3723,3693,0.0001\nCC-MAIN-2019-13,mkd,518631,516321,0.0202\nCC-MAIN-2019-13,mlg,46118,45817,0.0018\nCC-MAIN-2019-13,mlt,45522,45375,0.0018\nCC-MAIN-2019-13,mon,327731,326308,0.0128\nCC-MAIN-2019-13,mri,24385,24154,0.0009\nCC-MAIN-2019-13,msa,1881323,1867997,0.0732\nCC-MAIN-2019-13,mya,225428,224927,0.0088\nCC-MAIN-2019-13,nau,1580,1565,0.0001\nCC-MAIN-201
9-13,nep,335057,333701,0.0130\nCC-MAIN-2019-13,nld,46213908,45607909,1.7984\nCC-MAIN-2019-13,nno,363794,360362,0.0142\nCC-MAIN-2019-13,nor,8031934,7939407,0.3126\nCC-MAIN-2019-13,nso,7144,7142,0.0003\nCC-MAIN-2019-13,nya,10042,10013,0.0004\nCC-MAIN-2019-13,oci,48304,47708,0.0019\nCC-MAIN-2019-13,ori,57892,57709,0.0023\nCC-MAIN-2019-13,orm,8449,8356,0.0003\nCC-MAIN-2019-13,pan,88740,88137,0.0035\nCC-MAIN-2019-13,pol,43979837,43599839,1.7115\nCC-MAIN-2019-13,por,51550216,51098879,2.0061\nCC-MAIN-2019-13,pus,62833,62492,0.0024\nCC-MAIN-2019-13,que,17411,17361,0.0007\nCC-MAIN-2019-13,roh,41741,41550,0.0016\nCC-MAIN-2019-13,ron,13543560,13433446,0.5271\nCC-MAIN-2019-13,run,3033,3013,0.0001\nCC-MAIN-2019-13,rus,210211463,208583331,8.1804\nCC-MAIN-2019-13,sag,307,303,0.0000\nCC-MAIN-2019-13,san,56926,56689,0.0022\nCC-MAIN-2019-13,sco,18314,18132,0.0007\nCC-MAIN-2019-13,sin,153609,153085,0.0060\nCC-MAIN-2019-13,slk,7263065,7198000,0.2826\nCC-MAIN-2019-13,slv,2863773,2838461,0.1114\nCC-MAIN-2019-13,smo,8237,8083,0.0003\nCC-MAIN-2019-13,sna,7434,7387,0.0003\nCC-MAIN-2019-13,snd,11547,11377,0.0004\nCC-MAIN-2019-13,som,114788,114492,0.0045\nCC-MAIN-2019-13,sot,6700,6668,0.0003\nCC-MAIN-2019-13,spa,107305345,106231258,4.1758\nCC-MAIN-2019-13,sqi,728731,725108,0.0284\nCC-MAIN-2019-13,srp,4102790,4075338,0.1597\nCC-MAIN-2019-13,ssw,1128,1107,0.0000\nCC-MAIN-2019-13,sun,12740,12654,0.0005\nCC-MAIN-2019-13,sux,153,153,0.0000\nCC-MAIN-2019-13,swa,172194,171182,0.0067\nCC-MAIN-2019-13,swe,19025105,18808584,0.7404\nCC-MAIN-2019-13,syr,12234,12203,0.0005\nCC-MAIN-2019-13,tam,826726,823095,0.0322\nCC-MAIN-2019-13,tat,134953,134569,0.0053\nCC-MAIN-2019-13,tel,266736,265891,0.0104\nCC-MAIN-2019-13,tgk,98933,98812,0.0039\nCC-MAIN-2019-13,tgl,129980,129523,0.0051\nCC-MAIN-2019-13,tha,7951434,7903620,0.3094\nCC-MAIN-2019-13,tir,12950,12862,0.0005\nCC-MAIN-2019-13,ton,1837,1831,0.0001\nCC-MAIN-2019-13,tsn,13914,13883,0.0005\nCC-MAIN-2019-13,tso,2055,2041,0.0001\nCC-MAIN-2019-13,tuk,26178,26074
,0.0010\nCC-MAIN-2019-13,tur,22729810,22504262,0.8845\nCC-MAIN-2019-13,uig,15895,15853,0.0006\nCC-MAIN-2019-13,ukr,9220813,9160927,0.3588\nCC-MAIN-2019-13,urd,457336,454979,0.0178\nCC-MAIN-2019-13,uzb,268227,266880,0.0104\nCC-MAIN-2019-13,ven,760,756,0.0000\nCC-MAIN-2019-13,vie,18846887,18726949,0.7334\nCC-MAIN-2019-13,vol,12039,11962,0.0005\nCC-MAIN-2019-13,war,46628,46257,0.0018\nCC-MAIN-2019-13,wol,2910,2879,0.0001\nCC-MAIN-2019-13,xho,23194,23117,0.0009\nCC-MAIN-2019-13,yid,26548,26495,0.0010\nCC-MAIN-2019-13,yor,5676,5663,0.0002\nCC-MAIN-2019-13,zha,1371,1348,0.0001\nCC-MAIN-2019-13,zho,157814842,157016563,6.1414\nCC-MAIN-2019-13,zul,18878,18844,0.0007\nCC-MAIN-2019-18,<unknown>,64919822,64919822,2.5991\nCC-MAIN-2019-18,aar,5271,5214,0.0002\nCC-MAIN-2019-18,abk,6382,6351,0.0003\nCC-MAIN-2019-18,afr,274845,273460,0.0110\nCC-MAIN-2019-18,aka,976,944,0.0000\nCC-MAIN-2019-18,amh,44000,43854,0.0018\nCC-MAIN-2019-18,ara,13377863,13296649,0.5356\nCC-MAIN-2019-18,asm,19121,18933,0.0008\nCC-MAIN-2019-18,aym,2259,2200,0.0001\nCC-MAIN-2019-18,aze,873335,868718,0.0350\nCC-MAIN-2019-18,bak,30229,30168,0.0012\nCC-MAIN-2019-18,bel,391018,382960,0.0157\nCC-MAIN-2019-18,ben,1447573,1441407,0.0580\nCC-MAIN-2019-18,bih,16291,16122,0.0007\nCC-MAIN-2019-18,bis,3237,3192,0.0001\nCC-MAIN-2019-18,blu,8330,8306,0.0003\nCC-MAIN-2019-18,bod,32915,32838,0.0013\nCC-MAIN-2019-18,bos,743754,739580,0.0298\nCC-MAIN-2019-18,bre,54883,54659,0.0022\nCC-MAIN-2019-18,bul,6458941,6409004,0.2586\nCC-MAIN-2019-18,cat,5368892,5313824,0.2149\nCC-MAIN-2019-18,ceb,61906,61831,0.0025\nCC-MAIN-2019-18,ces,26029228,25770626,1.0421\nCC-MAIN-2019-18,chr,1932,1924,0.0001\nCC-MAIN-2019-18,cos,51858,51477,0.0021\nCC-MAIN-2019-18,crs,1961,1936,0.0001\nCC-MAIN-2019-18,cym,200107,198207,0.0080\nCC-MAIN-2019-18,dan,10592708,10474873,0.4241\nCC-MAIN-2019-18,deu,142123628,140458001,5.6899\nCC-MAIN-2019-18,div,30365,30185,0.0012\nCC-MAIN-2019-18,dzo,1087,1086,0.0000\nCC-MAIN-2019-18,ell,12389584,12304050,0.4960\nCC-MAIN
-2019-18,eng,1126498542,1112968124,45.0993\nCC-MAIN-2019-18,epo,175915,175270,0.0070\nCC-MAIN-2019-18,est,2577951,2547713,0.1032\nCC-MAIN-2019-18,eus,694207,687711,0.0278\nCC-MAIN-2019-18,fao,83585,83248,0.0033\nCC-MAIN-2019-18,fas,16788470,16654095,0.6721\nCC-MAIN-2019-18,fij,2072,2046,0.0001\nCC-MAIN-2019-18,fin,9200065,9087741,0.3683\nCC-MAIN-2019-18,fra,117801928,116566409,4.7162\nCC-MAIN-2019-18,fry,61981,61670,0.0025\nCC-MAIN-2019-18,gla,39889,39721,0.0016\nCC-MAIN-2019-18,gle,94719,94125,0.0038\nCC-MAIN-2019-18,glg,768634,763157,0.0308\nCC-MAIN-2019-18,glv,8946,8820,0.0004\nCC-MAIN-2019-18,got,664,658,0.0000\nCC-MAIN-2019-18,grn,17568,17374,0.0007\nCC-MAIN-2019-18,guj,167504,165946,0.0067\nCC-MAIN-2019-18,hat,26185,26092,0.0010\nCC-MAIN-2019-18,hau,30026,29879,0.0012\nCC-MAIN-2019-18,haw,31597,31535,0.0013\nCC-MAIN-2019-18,heb,5027075,4962291,0.2013\nCC-MAIN-2019-18,hin,2548508,2531990,0.1020\nCC-MAIN-2019-18,hrv,3766831,3740907,0.1508\nCC-MAIN-2019-18,hun,12249577,12152560,0.4904\nCC-MAIN-2019-18,hye,783034,779302,0.0313\nCC-MAIN-2019-18,ibo,4252,4236,0.0002\nCC-MAIN-2019-18,iku,4829,4757,0.0002\nCC-MAIN-2019-18,ile,9227,9150,0.0004\nCC-MAIN-2019-18,ina,19176,19037,0.0008\nCC-MAIN-2019-18,ind,18141533,18000985,0.7263\nCC-MAIN-2019-18,ipk,2961,2909,0.0001\nCC-MAIN-2019-18,isl,764799,758704,0.0306\nCC-MAIN-2019-18,ita,59655365,59028304,2.3883\nCC-MAIN-2019-18,jav,41317,41156,0.0017\nCC-MAIN-2019-18,jpn,122166512,121243648,4.8909\nCC-MAIN-2019-18,kal,22532,21845,0.0009\nCC-MAIN-2019-18,kan,179943,179339,0.0072\nCC-MAIN-2019-18,kas,65,62,0.0000\nCC-MAIN-2019-18,kat,902365,895342,0.0361\nCC-MAIN-2019-18,kaz,430626,426406,0.0172\nCC-MAIN-2019-18,kha,6142,6108,0.0002\nCC-MAIN-2019-18,khm,158457,157827,0.0063\nCC-MAIN-2019-18,kin,39020,38901,0.0016\nCC-MAIN-2019-18,kir,86052,85689,0.0034\nCC-MAIN-2019-18,kor,14315020,14252279,0.5731\nCC-MAIN-2019-18,kur,114590,114346,0.0046\nCC-MAIN-2019-18,lao,53287,52869,0.0021\nCC-MAIN-2019-18,lat,1313616,1305286,0.0526\nCC-MAIN-
2019-18,lav,1994260,1976006,0.0798\nCC-MAIN-2019-18,lif,76,70,0.0000\nCC-MAIN-2019-18,lin,6060,5983,0.0002\nCC-MAIN-2019-18,lit,3404213,3376872,0.1363\nCC-MAIN-2019-18,ltz,85987,85004,0.0034\nCC-MAIN-2019-18,lug,5593,5548,0.0002\nCC-MAIN-2019-18,mal,424629,423052,0.0170\nCC-MAIN-2019-18,mar,276720,273508,0.0111\nCC-MAIN-2019-18,mfe,2994,2970,0.0001\nCC-MAIN-2019-18,mkd,532153,529748,0.0213\nCC-MAIN-2019-18,mlg,61035,60833,0.0024\nCC-MAIN-2019-18,mlt,45015,44785,0.0018\nCC-MAIN-2019-18,mon,327261,326179,0.0131\nCC-MAIN-2019-18,mri,19479,19268,0.0008\nCC-MAIN-2019-18,msa,2082000,2071049,0.0834\nCC-MAIN-2019-18,mya,211890,211075,0.0085\nCC-MAIN-2019-18,nau,1575,1566,0.0001\nCC-MAIN-2019-18,nep,348520,347363,0.0140\nCC-MAIN-2019-18,nld,45296904,44753978,1.8135\nCC-MAIN-2019-18,nno,401045,397375,0.0161\nCC-MAIN-2019-18,nor,7582636,7503398,0.3036\nCC-MAIN-2019-18,nso,5002,4997,0.0002\nCC-MAIN-2019-18,nya,7599,7560,0.0003\nCC-MAIN-2019-18,oci,101504,100912,0.0041\nCC-MAIN-2019-18,ori,64163,64066,0.0026\nCC-MAIN-2019-18,orm,7534,7438,0.0003\nCC-MAIN-2019-18,pan,105655,105346,0.0042\nCC-MAIN-2019-18,pol,41415680,41053683,1.6581\nCC-MAIN-2019-18,por,49315667,48893638,1.9743\nCC-MAIN-2019-18,pus,69194,68914,0.0028\nCC-MAIN-2019-18,que,15926,15830,0.0006\nCC-MAIN-2019-18,roh,39056,38798,0.0016\nCC-MAIN-2019-18,ron,13095211,12990298,0.5243\nCC-MAIN-2019-18,run,3195,3184,0.0001\nCC-MAIN-2019-18,rus,197363158,195657929,7.9014\nCC-MAIN-2019-18,sag,467,463,0.0000\nCC-MAIN-2019-18,san,65249,64934,0.0026\nCC-MAIN-2019-18,sco,18292,18078,0.0007\nCC-MAIN-2019-18,sin,151417,150704,0.0061\nCC-MAIN-2019-18,slk,6935702,6870946,0.2777\nCC-MAIN-2019-18,slv,2752095,2728768,0.1102\nCC-MAIN-2019-18,smo,6878,6704,0.0003\nCC-MAIN-2019-18,sna,8599,8458,0.0003\nCC-MAIN-2019-18,snd,19516,19467,0.0008\nCC-MAIN-2019-18,som,105468,105176,0.0042\nCC-MAIN-2019-18,sot,7186,7160,0.0003\nCC-MAIN-2019-18,spa,104483041,103481426,4.1830\nCC-MAIN-2019-18,sqi,818881,814207,0.0328\nCC-MAIN-2019-18,srp,4122179,4095
568,0.1650\nCC-MAIN-2019-18,ssw,1482,1456,0.0001\nCC-MAIN-2019-18,sun,18089,18027,0.0007\nCC-MAIN-2019-18,sux,291,291,0.0000\nCC-MAIN-2019-18,swa,157613,156385,0.0063\nCC-MAIN-2019-18,swe,18519476,18318392,0.7414\nCC-MAIN-2019-18,syr,10255,10224,0.0004\nCC-MAIN-2019-18,tam,879425,875602,0.0352\nCC-MAIN-2019-18,tat,154930,153936,0.0062\nCC-MAIN-2019-18,tel,329498,328505,0.0132\nCC-MAIN-2019-18,tgk,88899,88736,0.0036\nCC-MAIN-2019-18,tgl,133085,132266,0.0053\nCC-MAIN-2019-18,tha,7536535,7490872,0.3017\nCC-MAIN-2019-18,tir,9907,9879,0.0004\nCC-MAIN-2019-18,ton,3192,3181,0.0001\nCC-MAIN-2019-18,tsn,5422,5398,0.0002\nCC-MAIN-2019-18,tso,2720,2703,0.0001\nCC-MAIN-2019-18,tuk,33913,33814,0.0014\nCC-MAIN-2019-18,tur,20646846,20448999,0.8266\nCC-MAIN-2019-18,uig,19639,19369,0.0008\nCC-MAIN-2019-18,ukr,9045935,8988451,0.3622\nCC-MAIN-2019-18,urd,501965,499722,0.0201\nCC-MAIN-2019-18,uzb,340052,338407,0.0136\nCC-MAIN-2019-18,ven,1039,1031,0.0000\nCC-MAIN-2019-18,vie,16818166,16702450,0.6733\nCC-MAIN-2019-18,vol,25759,25635,0.0010\nCC-MAIN-2019-18,war,96563,95919,0.0039\nCC-MAIN-2019-18,wol,3423,3383,0.0001\nCC-MAIN-2019-18,xho,12271,12118,0.0005\nCC-MAIN-2019-18,yid,34589,34433,0.0014\nCC-MAIN-2019-18,yor,13409,13364,0.0005\nCC-MAIN-2019-18,zha,2057,2027,0.0001\nCC-MAIN-2019-18,zho,134706960,133812654,5.3930\nCC-MAIN-2019-18,zul,10183,10137,0.0004\nCC-MAIN-2019-22,<unknown>,76808733,76808733,2.8663\nCC-MAIN-2019-22,aar,4076,3999,0.0002\nCC-MAIN-2019-22,abk,6809,6749,0.0003\nCC-MAIN-2019-22,afr,295406,293719,0.0110\nCC-MAIN-2019-22,aka,2193,2180,0.0001\nCC-MAIN-2019-22,amh,55625,55460,0.0021\nCC-MAIN-2019-22,ara,15199232,15085384,0.5672\nCC-MAIN-2019-22,asm,19122,18963,0.0007\nCC-MAIN-2019-22,aym,2450,2425,0.0001\nCC-MAIN-2019-22,aze,1109561,1104216,0.0414\nCC-MAIN-2019-22,bak,37239,37158,0.0014\nCC-MAIN-2019-22,bel,401793,395877,0.0150\nCC-MAIN-2019-22,ben,1580240,1569919,0.0590\nCC-MAIN-2019-22,bih,13484,13409,0.0005\nCC-MAIN-2019-22,bis,3666,3628,0.0001\nCC-MAIN-2019-22,blu,
7865,7845,0.0003\nCC-MAIN-2019-22,bod,40949,40836,0.0015\nCC-MAIN-2019-22,bos,960899,957291,0.0359\nCC-MAIN-2019-22,bre,73274,73046,0.0027\nCC-MAIN-2019-22,bul,6963681,6907211,0.2599\nCC-MAIN-2019-22,cat,5325659,5274819,0.1987\nCC-MAIN-2019-22,ceb,53237,53145,0.0020\nCC-MAIN-2019-22,ces,29176532,28885374,1.0888\nCC-MAIN-2019-22,chr,1131,1127,0.0000\nCC-MAIN-2019-22,cos,54732,54445,0.0020\nCC-MAIN-2019-22,crs,2512,2483,0.0001\nCC-MAIN-2019-22,cym,216814,214728,0.0081\nCC-MAIN-2019-22,dan,11536209,11405899,0.4305\nCC-MAIN-2019-22,deu,146721176,145040829,5.4752\nCC-MAIN-2019-22,div,31638,31488,0.0012\nCC-MAIN-2019-22,dzo,1043,1036,0.0000\nCC-MAIN-2019-22,ell,13789980,13692862,0.5146\nCC-MAIN-2019-22,eng,1176031248,1161556713,43.8859\nCC-MAIN-2019-22,epo,156921,156361,0.0059\nCC-MAIN-2019-22,est,2826004,2785621,0.1055\nCC-MAIN-2019-22,eus,679221,674336,0.0253\nCC-MAIN-2019-22,fao,94213,93662,0.0035\nCC-MAIN-2019-22,fas,16517823,16386364,0.6164\nCC-MAIN-2019-22,fij,2485,2473,0.0001\nCC-MAIN-2019-22,fin,10486175,10373147,0.3913\nCC-MAIN-2019-22,fra,123149130,121883683,4.5956\nCC-MAIN-2019-22,fry,64116,63752,0.0024\nCC-MAIN-2019-22,gla,31633,31486,0.0012\nCC-MAIN-2019-22,gle,112313,111497,0.0042\nCC-MAIN-2019-22,glg,801632,795362,0.0299\nCC-MAIN-2019-22,glv,10418,10312,0.0004\nCC-MAIN-2019-22,got,353,352,0.0000\nCC-MAIN-2019-22,grn,17856,17706,0.0007\nCC-MAIN-2019-22,guj,175101,174071,0.0065\nCC-MAIN-2019-22,hat,27612,27444,0.0010\nCC-MAIN-2019-22,hau,35573,35356,0.0013\nCC-MAIN-2019-22,haw,24902,24847,0.0009\nCC-MAIN-2019-22,heb,5825655,5753838,0.2174\nCC-MAIN-2019-22,hin,2371102,2356415,0.0885\nCC-MAIN-2019-22,hrv,4223425,4195325,0.1576\nCC-MAIN-2019-22,hun,13756652,13639969,0.5134\nCC-MAIN-2019-22,hye,791044,786741,0.0295\nCC-MAIN-2019-22,ibo,4504,4491,0.0002\nCC-MAIN-2019-22,iku,4950,4839,0.0002\nCC-MAIN-2019-22,ile,8969,8870,0.0003\nCC-MAIN-2019-22,ina,16695,16587,0.0006\nCC-MAIN-2019-22,ind,20103106,19960836,0.7502\nCC-MAIN-2019-22,ipk,3779,3668,0.0001\nCC-MAIN-2019-
22,isl,894834,886670,0.0334\nCC-MAIN-2019-22,ita,63073590,62451978,2.3537\nCC-MAIN-2019-22,jav,39594,39510,0.0015\nCC-MAIN-2019-22,jpn,128776829,127866093,4.8056\nCC-MAIN-2019-22,kal,22083,21594,0.0008\nCC-MAIN-2019-22,kan,193530,192525,0.0072\nCC-MAIN-2019-22,kas,181,179,0.0000\nCC-MAIN-2019-22,kat,918319,912172,0.0343\nCC-MAIN-2019-22,kaz,490730,485849,0.0183\nCC-MAIN-2019-22,kha,7324,7279,0.0003\nCC-MAIN-2019-22,khm,178073,177198,0.0066\nCC-MAIN-2019-22,kin,49752,49563,0.0019\nCC-MAIN-2019-22,kir,104885,104122,0.0039\nCC-MAIN-2019-22,kor,17184062,17114736,0.6413\nCC-MAIN-2019-22,kur,159442,158881,0.0059\nCC-MAIN-2019-22,lao,58293,58129,0.0022\nCC-MAIN-2019-22,lat,1415397,1407616,0.0528\nCC-MAIN-2019-22,lav,2352809,2328978,0.0878\nCC-MAIN-2019-22,lif,75,72,0.0000\nCC-MAIN-2019-22,lin,10788,10734,0.0004\nCC-MAIN-2019-22,lit,3692291,3655825,0.1378\nCC-MAIN-2019-22,ltz,83362,82809,0.0031\nCC-MAIN-2019-22,lug,5672,5645,0.0002\nCC-MAIN-2019-22,mal,436962,435118,0.0163\nCC-MAIN-2019-22,mar,271582,269549,0.0101\nCC-MAIN-2019-22,mfe,4786,4756,0.0002\nCC-MAIN-2019-22,mkd,559105,556549,0.0209\nCC-MAIN-2019-22,mlg,85516,85306,0.0032\nCC-MAIN-2019-22,mlt,61055,60126,0.0023\nCC-MAIN-2019-22,mon,383666,381746,0.0143\nCC-MAIN-2019-22,mri,23321,23187,0.0009\nCC-MAIN-2019-22,msa,2230274,2215469,0.0832\nCC-MAIN-2019-22,mya,233106,231969,0.0087\nCC-MAIN-2019-22,nau,1285,1277,0.0000\nCC-MAIN-2019-22,nep,387569,385876,0.0145\nCC-MAIN-2019-22,nld,46976839,46418546,1.7530\nCC-MAIN-2019-22,nno,473468,468656,0.0177\nCC-MAIN-2019-22,nor,8464168,8376237,0.3159\nCC-MAIN-2019-22,nso,3068,3063,0.0001\nCC-MAIN-2019-22,nya,6825,6795,0.0003\nCC-MAIN-2019-22,oci,79887,79501,0.0030\nCC-MAIN-2019-22,ori,59129,58821,0.0022\nCC-MAIN-2019-22,orm,9790,9755,0.0004\nCC-MAIN-2019-22,pan,115230,114891,0.0043\nCC-MAIN-2019-22,pol,46013071,45602836,1.7171\nCC-MAIN-2019-22,por,55799887,55291409,2.0823\nCC-MAIN-2019-22,pus,66987,66533,0.0025\nCC-MAIN-2019-22,que,14390,14326,0.0005\nCC-MAIN-2019-22,roh,42926,425
59,0.0016\nCC-MAIN-2019-22,ron,14739014,14620017,0.5500\nCC-MAIN-2019-22,run,3164,3033,0.0001\nCC-MAIN-2019-22,rus,204497763,202945048,7.6312\nCC-MAIN-2019-22,sag,624,616,0.0000\nCC-MAIN-2019-22,san,82748,82274,0.0031\nCC-MAIN-2019-22,sco,21681,21497,0.0008\nCC-MAIN-2019-22,sin,160183,159211,0.0060\nCC-MAIN-2019-22,slk,7435183,7365934,0.2775\nCC-MAIN-2019-22,slv,3014570,2990493,0.1125\nCC-MAIN-2019-22,smo,6823,6755,0.0003\nCC-MAIN-2019-22,sna,7171,7134,0.0003\nCC-MAIN-2019-22,snd,15542,15159,0.0006\nCC-MAIN-2019-22,som,112336,112142,0.0042\nCC-MAIN-2019-22,sot,5872,5831,0.0002\nCC-MAIN-2019-22,spa,111600476,110554741,4.1646\nCC-MAIN-2019-22,sqi,880183,874033,0.0328\nCC-MAIN-2019-22,srp,4519351,4486229,0.1686\nCC-MAIN-2019-22,ssw,1496,1473,0.0001\nCC-MAIN-2019-22,sun,18041,17978,0.0007\nCC-MAIN-2019-22,sux,105,104,0.0000\nCC-MAIN-2019-22,swa,163992,163372,0.0061\nCC-MAIN-2019-22,swe,20260671,20048415,0.7561\nCC-MAIN-2019-22,syr,12870,12836,0.0005\nCC-MAIN-2019-22,tam,947182,941186,0.0353\nCC-MAIN-2019-22,tat,151893,150978,0.0057\nCC-MAIN-2019-22,tel,348949,346812,0.0130\nCC-MAIN-2019-22,tgk,76483,75847,0.0029\nCC-MAIN-2019-22,tgl,118937,118103,0.0044\nCC-MAIN-2019-22,tha,8112677,8065415,0.3027\nCC-MAIN-2019-22,tir,10395,10297,0.0004\nCC-MAIN-2019-22,ton,7433,7419,0.0003\nCC-MAIN-2019-22,tsn,3530,3502,0.0001\nCC-MAIN-2019-22,tso,3655,3642,0.0001\nCC-MAIN-2019-22,tuk,27846,27766,0.0010\nCC-MAIN-2019-22,tur,24206433,23974536,0.9033\nCC-MAIN-2019-22,uig,23652,23599,0.0009\nCC-MAIN-2019-22,ukr,9985263,9915607,0.3726\nCC-MAIN-2019-22,urd,492207,489294,0.0184\nCC-MAIN-2019-22,uzb,354782,353463,0.0132\nCC-MAIN-2019-22,ven,1164,1160,0.0000\nCC-MAIN-2019-22,vie,19951410,19808533,0.7445\nCC-MAIN-2019-22,vol,30098,30028,0.0011\nCC-MAIN-2019-22,war,70213,69854,0.0026\nCC-MAIN-2019-22,wol,4488,4462,0.0002\nCC-MAIN-2019-22,xho,10489,10397,0.0004\nCC-MAIN-2019-22,yid,28167,28099,0.0011\nCC-MAIN-2019-22,yor,12441,12420,0.0005\nCC-MAIN-2019-22,zha,1925,1905,0.0001\nCC-MAIN-2019-22,zho
,175824791,174877419,6.5612\nCC-MAIN-2019-22,zul,12511,12463,0.0005\nCC-MAIN-2019-26,<unknown>,65217832,65217832,2.5139\nCC-MAIN-2019-26,aar,5112,5103,0.0002\nCC-MAIN-2019-26,abk,7395,7373,0.0003\nCC-MAIN-2019-26,afr,302657,301291,0.0117\nCC-MAIN-2019-26,aka,1713,1707,0.0001\nCC-MAIN-2019-26,amh,46746,46577,0.0018\nCC-MAIN-2019-26,ara,15095896,14982902,0.5819\nCC-MAIN-2019-26,asm,21920,21428,0.0008\nCC-MAIN-2019-26,aym,2237,2223,0.0001\nCC-MAIN-2019-26,aze,1207039,1201260,0.0465\nCC-MAIN-2019-26,bak,41039,40639,0.0016\nCC-MAIN-2019-26,bel,479240,474936,0.0185\nCC-MAIN-2019-26,ben,1609470,1602058,0.0620\nCC-MAIN-2019-26,bih,17170,16907,0.0007\nCC-MAIN-2019-26,bis,3109,3038,0.0001\nCC-MAIN-2019-26,blu,13058,13007,0.0005\nCC-MAIN-2019-26,bod,36705,36603,0.0014\nCC-MAIN-2019-26,bos,1020413,1014289,0.0393\nCC-MAIN-2019-26,bre,76741,76063,0.0030\nCC-MAIN-2019-26,bul,7736509,7678881,0.2982\nCC-MAIN-2019-26,cat,6034995,5986717,0.2326\nCC-MAIN-2019-26,ceb,49642,49598,0.0019\nCC-MAIN-2019-26,ces,27555314,27319717,1.0622\nCC-MAIN-2019-26,chr,2156,2153,0.0001\nCC-MAIN-2019-26,cos,57207,56553,0.0022\nCC-MAIN-2019-26,crs,2171,2152,0.0001\nCC-MAIN-2019-26,cym,254878,252735,0.0098\nCC-MAIN-2019-26,dan,11107254,11006910,0.4281\nCC-MAIN-2019-26,deu,142567712,141265463,5.4955\nCC-MAIN-2019-26,div,34581,34208,0.0013\nCC-MAIN-2019-26,dzo,1160,1106,0.0000\nCC-MAIN-2019-26,ell,14104880,14016735,0.5437\nCC-MAIN-2019-26,eng,1147050796,1134805773,44.2149\nCC-MAIN-2019-26,epo,240746,239515,0.0093\nCC-MAIN-2019-26,est,3410099,3366708,0.1314\nCC-MAIN-2019-26,eus,852266,847309,0.0329\nCC-MAIN-2019-26,fao,110095,108587,0.0042\nCC-MAIN-2019-26,fas,16274469,16154685,0.6273\nCC-MAIN-2019-26,fij,4903,4878,0.0002\nCC-MAIN-2019-26,fin,10254537,10159685,0.3953\nCC-MAIN-2019-26,fra,121707598,120666583,4.6914\nCC-MAIN-2019-26,fry,72113,71417,0.0028\nCC-MAIN-2019-26,gla,32479,32297,0.0013\nCC-MAIN-2019-26,gle,141589,140111,0.0055\nCC-MAIN-2019-26,glg,955471,948956,0.0368\nCC-MAIN-2019-26,glv,13054,12941,0.
0005\nCC-MAIN-2019-26,got,1004,899,0.0000\nCC-MAIN-2019-26,grn,25547,25260,0.0010\nCC-MAIN-2019-26,guj,194378,193778,0.0075\nCC-MAIN-2019-26,hat,33098,32947,0.0013\nCC-MAIN-2019-26,hau,34917,34513,0.0013\nCC-MAIN-2019-26,haw,11863,11740,0.0005\nCC-MAIN-2019-26,heb,6372290,6309708,0.2456\nCC-MAIN-2019-26,hin,2614767,2594735,0.1008\nCC-MAIN-2019-26,hrv,4774876,4742153,0.1841\nCC-MAIN-2019-26,hun,13441481,13343894,0.5181\nCC-MAIN-2019-26,hye,925712,920432,0.0357\nCC-MAIN-2019-26,ibo,5673,5573,0.0002\nCC-MAIN-2019-26,iku,5937,5818,0.0002\nCC-MAIN-2019-26,ile,10192,10154,0.0004\nCC-MAIN-2019-26,ina,20051,19956,0.0008\nCC-MAIN-2019-26,ind,19091802,18949091,0.7359\nCC-MAIN-2019-26,ipk,2853,2707,0.0001\nCC-MAIN-2019-26,isl,974316,966535,0.0376\nCC-MAIN-2019-26,ita,61991136,61489798,2.3895\nCC-MAIN-2019-26,jav,48169,47465,0.0019\nCC-MAIN-2019-26,jpn,124539626,123793292,4.8006\nCC-MAIN-2019-26,kal,28059,27785,0.0011\nCC-MAIN-2019-26,kan,227760,226411,0.0088\nCC-MAIN-2019-26,kas,55,53,0.0000\nCC-MAIN-2019-26,kat,1076510,1070121,0.0415\nCC-MAIN-2019-26,kaz,567573,563847,0.0219\nCC-MAIN-2019-26,kha,5414,5378,0.0002\nCC-MAIN-2019-26,khm,185207,184483,0.0071\nCC-MAIN-2019-26,kin,48538,48263,0.0019\nCC-MAIN-2019-26,kir,117795,117347,0.0045\nCC-MAIN-2019-26,kor,17365914,17301003,0.6694\nCC-MAIN-2019-26,kur,166891,166136,0.0064\nCC-MAIN-2019-26,lao,71005,70515,0.0027\nCC-MAIN-2019-26,lat,1365745,1361039,0.0526\nCC-MAIN-2019-26,lav,2597236,2571412,0.1001\nCC-MAIN-2019-26,lif,71,68,0.0000\nCC-MAIN-2019-26,lin,6305,6273,0.0002\nCC-MAIN-2019-26,lit,4354391,4315586,0.1678\nCC-MAIN-2019-26,ltz,97952,97376,0.0038\nCC-MAIN-2019-26,lug,5775,5717,0.0002\nCC-MAIN-2019-26,mal,470784,468797,0.0181\nCC-MAIN-2019-26,mar,283313,279491,0.0109\nCC-MAIN-2019-26,mfe,2111,2092,0.0001\nCC-MAIN-2019-26,mkd,609850,607214,0.0235\nCC-MAIN-2019-26,mlg,100670,100274,0.0039\nCC-MAIN-2019-26,mlt,68571,67734,0.0026\nCC-MAIN-2019-26,mon,442849,440306,0.0171\nCC-MAIN-2019-26,mri,25693,24508,0.0010\nCC-MAIN-2019-26,m
sa,2556637,2544734,0.0985\nCC-MAIN-2019-26,mya,265270,263997,0.0102\nCC-MAIN-2019-26,nau,1229,1224,0.0000\nCC-MAIN-2019-26,nep,439210,435737,0.0169\nCC-MAIN-2019-26,nld,47294840,46876955,1.8231\nCC-MAIN-2019-26,nno,502753,498542,0.0194\nCC-MAIN-2019-26,nor,8321082,8237737,0.3207\nCC-MAIN-2019-26,nso,4467,4464,0.0002\nCC-MAIN-2019-26,nya,7006,6971,0.0003\nCC-MAIN-2019-26,oci,109053,108780,0.0042\nCC-MAIN-2019-26,ori,59459,59181,0.0023\nCC-MAIN-2019-26,orm,9834,9813,0.0004\nCC-MAIN-2019-26,pan,130611,130034,0.0050\nCC-MAIN-2019-26,pol,45222162,44880747,1.7432\nCC-MAIN-2019-26,por,55433875,55012622,2.1368\nCC-MAIN-2019-26,pus,76589,76175,0.0030\nCC-MAIN-2019-26,que,17244,17190,0.0007\nCC-MAIN-2019-26,roh,43529,43001,0.0017\nCC-MAIN-2019-26,ron,14573050,14472683,0.5617\nCC-MAIN-2019-26,run,2345,2288,0.0001\nCC-MAIN-2019-26,rus,191788563,190501902,7.3928\nCC-MAIN-2019-26,sag,700,641,0.0000\nCC-MAIN-2019-26,san,71707,71283,0.0028\nCC-MAIN-2019-26,sco,17896,17801,0.0007\nCC-MAIN-2019-26,sin,178899,177582,0.0069\nCC-MAIN-2019-26,slk,7285906,7231411,0.2808\nCC-MAIN-2019-26,slv,3538652,3509565,0.1364\nCC-MAIN-2019-26,smo,6721,6634,0.0003\nCC-MAIN-2019-26,sna,8706,8628,0.0003\nCC-MAIN-2019-26,snd,17299,16974,0.0007\nCC-MAIN-2019-26,som,107616,106972,0.0041\nCC-MAIN-2019-26,sot,6016,5967,0.0002\nCC-MAIN-2019-26,spa,110112628,109230348,4.2445\nCC-MAIN-2019-26,sqi,971263,966264,0.0374\nCC-MAIN-2019-26,srp,5160170,5118520,0.1989\nCC-MAIN-2019-26,ssw,1326,1283,0.0001\nCC-MAIN-2019-26,sun,25889,25541,0.0010\nCC-MAIN-2019-26,sux,103,103,0.0000\nCC-MAIN-2019-26,swa,188288,186523,0.0073\nCC-MAIN-2019-26,swe,20277986,20102011,0.7816\nCC-MAIN-2019-26,syr,12735,12447,0.0005\nCC-MAIN-2019-26,tam,1047595,1039067,0.0404\nCC-MAIN-2019-26,tat,166960,165736,0.0064\nCC-MAIN-2019-26,tel,370118,368109,0.0143\nCC-MAIN-2019-26,tgk,120733,119718,0.0047\nCC-MAIN-2019-26,tgl,149218,148761,0.0058\nCC-MAIN-2019-26,tha,7917976,7873392,0.3052\nCC-MAIN-2019-26,tir,14044,13945,0.0005\nCC-MAIN-2019-26,ton,652
1,6462,0.0003\nCC-MAIN-2019-26,tsn,2862,2839,0.0001\nCC-MAIN-2019-26,tso,2722,2670,0.0001\nCC-MAIN-2019-26,tuk,37139,36729,0.0014\nCC-MAIN-2019-26,tur,22451004,22265410,0.8654\nCC-MAIN-2019-26,uig,24193,24042,0.0009\nCC-MAIN-2019-26,ukr,9748202,9694131,0.3758\nCC-MAIN-2019-26,urd,582398,578310,0.0224\nCC-MAIN-2019-26,uzb,426456,424292,0.0164\nCC-MAIN-2019-26,ven,1042,1040,0.0000\nCC-MAIN-2019-26,vie,18782670,18650626,0.7240\nCC-MAIN-2019-26,vol,45359,45052,0.0017\nCC-MAIN-2019-26,war,115176,114605,0.0044\nCC-MAIN-2019-26,wol,4561,4335,0.0002\nCC-MAIN-2019-26,xho,12237,11999,0.0005\nCC-MAIN-2019-26,yid,46405,46150,0.0018\nCC-MAIN-2019-26,yor,19523,19089,0.0008\nCC-MAIN-2019-26,zha,2576,2559,0.0001\nCC-MAIN-2019-26,zho,156054302,155017345,6.0154\nCC-MAIN-2019-26,zul,13920,13742,0.0005\nCC-MAIN-2019-30,<unknown>,54968397,54968397,2.1184\nCC-MAIN-2019-30,aar,3825,3811,0.0001\nCC-MAIN-2019-30,abk,7664,7577,0.0003\nCC-MAIN-2019-30,afr,306076,304325,0.0118\nCC-MAIN-2019-30,aka,1395,1373,0.0001\nCC-MAIN-2019-30,amh,56367,56116,0.0022\nCC-MAIN-2019-30,ara,15511534,15402082,0.5978\nCC-MAIN-2019-30,asm,22173,22129,0.0009\nCC-MAIN-2019-30,aym,3123,3102,0.0001\nCC-MAIN-2019-30,aze,1257204,1249854,0.0485\nCC-MAIN-2019-30,bak,38487,38457,0.0015\nCC-MAIN-2019-30,bel,486451,483188,0.0187\nCC-MAIN-2019-30,ben,1820196,1810492,0.0701\nCC-MAIN-2019-30,bih,14000,13953,0.0005\nCC-MAIN-2019-30,bis,3405,3378,0.0001\nCC-MAIN-2019-30,blu,8053,8029,0.0003\nCC-MAIN-2019-30,bod,39610,39576,0.0015\nCC-MAIN-2019-30,bos,1074547,1067769,0.0414\nCC-MAIN-2019-30,bre,80949,80369,0.0031\nCC-MAIN-2019-30,bul,6914449,6860877,0.2665\nCC-MAIN-2019-30,cat,6249946,6197978,0.2409\nCC-MAIN-2019-30,ceb,62761,62704,0.0024\nCC-MAIN-2019-30,ces,26516378,26288081,1.0219\nCC-MAIN-2019-30,chr,1529,1486,0.0001\nCC-MAIN-2019-30,cos,52695,52288,0.0020\nCC-MAIN-2019-30,crs,2159,2143,0.0001\nCC-MAIN-2019-30,cym,258725,256504,0.0100\nCC-MAIN-2019-30,dan,10918467,10815405,0.4208\nCC-MAIN-2019-30,deu,141898712,140472077,5.468
6\nCC-MAIN-2019-30,div,37055,36661,0.0014\nCC-MAIN-2019-30,dzo,1153,1148,0.0000\nCC-MAIN-2019-30,ell,14199997,14113437,0.5472\nCC-MAIN-2019-30,eng,1156022925,1143473951,44.5516\nCC-MAIN-2019-30,epo,227992,226585,0.0088\nCC-MAIN-2019-30,est,3448265,3408713,0.1329\nCC-MAIN-2019-30,eus,834259,829061,0.0322\nCC-MAIN-2019-30,fao,110830,110180,0.0043\nCC-MAIN-2019-30,fas,15668724,15548142,0.6039\nCC-MAIN-2019-30,fij,2237,2181,0.0001\nCC-MAIN-2019-30,fin,10332056,10235216,0.3982\nCC-MAIN-2019-30,fra,121802722,120661050,4.6941\nCC-MAIN-2019-30,fry,74795,74511,0.0029\nCC-MAIN-2019-30,gla,32251,32172,0.0012\nCC-MAIN-2019-30,gle,128944,127681,0.0050\nCC-MAIN-2019-30,glg,985627,980200,0.0380\nCC-MAIN-2019-30,glv,8410,8357,0.0003\nCC-MAIN-2019-30,got,398,398,0.0000\nCC-MAIN-2019-30,grn,23565,23435,0.0009\nCC-MAIN-2019-30,guj,222280,221538,0.0086\nCC-MAIN-2019-30,hat,36147,36002,0.0014\nCC-MAIN-2019-30,hau,35461,35086,0.0014\nCC-MAIN-2019-30,haw,7639,7601,0.0003\nCC-MAIN-2019-30,heb,6840139,6773693,0.2636\nCC-MAIN-2019-30,hin,2973493,2956131,0.1146\nCC-MAIN-2019-30,hrv,5038754,5006272,0.1942\nCC-MAIN-2019-30,hun,13052667,12956545,0.5030\nCC-MAIN-2019-30,hye,941006,935359,0.0363\nCC-MAIN-2019-30,ibo,8215,8145,0.0003\nCC-MAIN-2019-30,iku,5131,4939,0.0002\nCC-MAIN-2019-30,ile,8449,8389,0.0003\nCC-MAIN-2019-30,ina,15955,15816,0.0006\nCC-MAIN-2019-30,ind,19965548,19799218,0.7694\nCC-MAIN-2019-30,ipk,3313,3177,0.0001\nCC-MAIN-2019-30,isl,1009642,999515,0.0389\nCC-MAIN-2019-30,ita,61455724,60912253,2.3684\nCC-MAIN-2019-30,jav,46605,46501,0.0018\nCC-MAIN-2019-30,jpn,121452791,120649489,4.6806\nCC-MAIN-2019-30,kal,22884,22704,0.0009\nCC-MAIN-2019-30,kan,256042,254877,0.0099\nCC-MAIN-2019-30,kas,119,117,0.0000\nCC-MAIN-2019-30,kat,1084317,1078234,0.0418\nCC-MAIN-2019-30,kaz,595471,591741,0.0229\nCC-MAIN-2019-30,kha,5310,5289,0.0002\nCC-MAIN-2019-30,khm,213656,212400,0.0082\nCC-MAIN-2019-30,kin,55545,55204,0.0021\nCC-MAIN-2019-30,kir,122421,121978,0.0047\nCC-MAIN-2019-30,kor,17352160,172843
88,0.6687\nCC-MAIN-2019-30,kur,185442,184376,0.0071\nCC-MAIN-2019-30,lao,79528,79345,0.0031\nCC-MAIN-2019-30,lat,1377408,1371001,0.0531\nCC-MAIN-2019-30,lav,2746020,2720858,0.1058\nCC-MAIN-2019-30,lif,69,63,0.0000\nCC-MAIN-2019-30,lin,7329,7245,0.0003\nCC-MAIN-2019-30,lit,4543327,4505372,0.1751\nCC-MAIN-2019-30,ltz,96479,95990,0.0037\nCC-MAIN-2019-30,lug,7077,7054,0.0003\nCC-MAIN-2019-30,mal,528146,526121,0.0204\nCC-MAIN-2019-30,mar,330550,327327,0.0127\nCC-MAIN-2019-30,mfe,2420,2404,0.0001\nCC-MAIN-2019-30,mkd,594815,591333,0.0229\nCC-MAIN-2019-30,mlg,111117,110786,0.0043\nCC-MAIN-2019-30,mlt,70332,69944,0.0027\nCC-MAIN-2019-30,mon,459913,458165,0.0177\nCC-MAIN-2019-30,mri,19994,19872,0.0008\nCC-MAIN-2019-30,msa,2854469,2841218,0.1100\nCC-MAIN-2019-30,mya,270266,268077,0.0104\nCC-MAIN-2019-30,nau,926,918,0.0000\nCC-MAIN-2019-30,nep,461349,458486,0.0178\nCC-MAIN-2019-30,nld,46065049,45627827,1.7753\nCC-MAIN-2019-30,nno,530697,527416,0.0205\nCC-MAIN-2019-30,nor,8224705,8142274,0.3170\nCC-MAIN-2019-30,nso,2928,2927,0.0001\nCC-MAIN-2019-30,nya,5944,5924,0.0002\nCC-MAIN-2019-30,oci,88909,88366,0.0034\nCC-MAIN-2019-30,ori,66629,66421,0.0026\nCC-MAIN-2019-30,orm,8057,7980,0.0003\nCC-MAIN-2019-30,pan,139781,139468,0.0054\nCC-MAIN-2019-30,pol,43657009,43294585,1.6825\nCC-MAIN-2019-30,por,55124567,54702179,2.1244\nCC-MAIN-2019-30,pus,81661,81074,0.0031\nCC-MAIN-2019-30,que,16524,16479,0.0006\nCC-MAIN-2019-30,roh,43428,43213,0.0017\nCC-MAIN-2019-30,ron,14544386,14404970,0.5605\nCC-MAIN-2019-30,run,3154,3112,0.0001\nCC-MAIN-2019-30,rus,187313322,185983399,7.2188\nCC-MAIN-2019-30,sag,389,386,0.0000\nCC-MAIN-2019-30,san,78061,77036,0.0030\nCC-MAIN-2019-30,sco,19489,19388,0.0008\nCC-MAIN-2019-30,sin,181923,180424,0.0070\nCC-MAIN-2019-30,slk,9059482,8975432,0.3491\nCC-MAIN-2019-30,slv,3744338,3713254,0.1443\nCC-MAIN-2019-30,smo,5953,5916,0.0002\nCC-MAIN-2019-30,sna,5392,5322,0.0002\nCC-MAIN-2019-30,snd,19804,19602,0.0008\nCC-MAIN-2019-30,som,112597,112225,0.0043\nCC-MAIN-2019-30,s
ot,7375,7340,0.0003\nCC-MAIN-2019-30,spa,110378985,109447590,4.2539\nCC-MAIN-2019-30,sqi,1006128,999821,0.0388\nCC-MAIN-2019-30,srp,5429577,5387301,0.2092\nCC-MAIN-2019-30,ssw,1131,1113,0.0000\nCC-MAIN-2019-30,sun,25024,24987,0.0010\nCC-MAIN-2019-30,sux,282,282,0.0000\nCC-MAIN-2019-30,swa,190391,188950,0.0073\nCC-MAIN-2019-30,swe,19968488,19795903,0.7696\nCC-MAIN-2019-30,syr,13352,13253,0.0005\nCC-MAIN-2019-30,tam,1103131,1096482,0.0425\nCC-MAIN-2019-30,tat,163163,162280,0.0063\nCC-MAIN-2019-30,tel,422345,420418,0.0163\nCC-MAIN-2019-30,tgk,117968,116923,0.0045\nCC-MAIN-2019-30,tgl,138195,137358,0.0053\nCC-MAIN-2019-30,tha,8015518,7968735,0.3089\nCC-MAIN-2019-30,tir,10788,10772,0.0004\nCC-MAIN-2019-30,ton,5026,5018,0.0002\nCC-MAIN-2019-30,tsn,2530,2511,0.0001\nCC-MAIN-2019-30,tso,2383,2372,0.0001\nCC-MAIN-2019-30,tuk,29240,28988,0.0011\nCC-MAIN-2019-30,tur,22944535,22753782,0.8843\nCC-MAIN-2019-30,uig,25712,25670,0.0010\nCC-MAIN-2019-30,ukr,9562669,9508321,0.3685\nCC-MAIN-2019-30,urd,622680,618720,0.0240\nCC-MAIN-2019-30,uzb,444323,442098,0.0171\nCC-MAIN-2019-30,ven,660,656,0.0000\nCC-MAIN-2019-30,vie,18935668,18802563,0.7298\nCC-MAIN-2019-30,vol,41489,41349,0.0016\nCC-MAIN-2019-30,war,89568,89106,0.0035\nCC-MAIN-2019-30,wol,4547,4488,0.0002\nCC-MAIN-2019-30,xho,9956,9847,0.0004\nCC-MAIN-2019-30,yid,42924,42778,0.0017\nCC-MAIN-2019-30,yor,19659,19593,0.0008\nCC-MAIN-2019-30,zha,1922,1888,0.0001\nCC-MAIN-2019-30,zho,165765190,164654228,6.3884\nCC-MAIN-2019-30,zul,16333,16252,0.0006\nCC-MAIN-2019-35,<unknown>,62831863,62831863,2.1264\nCC-MAIN-2019-35,aar,6559,6539,0.0002\nCC-MAIN-2019-35,abk,9564,9527,0.0003\nCC-MAIN-2019-35,afr,382169,379374,0.0129\nCC-MAIN-2019-35,aka,3151,3139,0.0001\nCC-MAIN-2019-35,amh,65352,64818,0.0022\nCC-MAIN-2019-35,ara,17504547,17378999,0.5924\nCC-MAIN-2019-35,asm,24728,24366,0.0008\nCC-MAIN-2019-35,aym,2797,2717,0.0001\nCC-MAIN-2019-35,aze,1647494,1634852,0.0558\nCC-MAIN-2019-35,bak,55516,55084,0.0019\nCC-MAIN-2019-35,bel,619317,615160,0.02
10\nCC-MAIN-2019-35,ben,2084218,2073448,0.0705\nCC-MAIN-2019-35,bih,18683,18585,0.0006\nCC-MAIN-2019-35,bis,4800,4776,0.0002\nCC-MAIN-2019-35,blu,17361,17300,0.0006\nCC-MAIN-2019-35,bod,58961,58538,0.0020\nCC-MAIN-2019-35,bos,1291253,1284451,0.0437\nCC-MAIN-2019-35,bre,100532,99895,0.0034\nCC-MAIN-2019-35,bul,9496020,9418204,0.3214\nCC-MAIN-2019-35,cat,7606578,7539523,0.2574\nCC-MAIN-2019-35,ceb,48967,48876,0.0017\nCC-MAIN-2019-35,ces,29382886,29112639,0.9944\nCC-MAIN-2019-35,chr,2183,2157,0.0001\nCC-MAIN-2019-35,cos,74283,73365,0.0025\nCC-MAIN-2019-35,crs,3013,2993,0.0001\nCC-MAIN-2019-35,cym,331498,328203,0.0112\nCC-MAIN-2019-35,dan,12394596,12267781,0.4195\nCC-MAIN-2019-35,deu,158429329,156777845,5.3617\nCC-MAIN-2019-35,div,43983,43489,0.0015\nCC-MAIN-2019-35,dzo,1766,1757,0.0001\nCC-MAIN-2019-35,ell,16566999,16468642,0.5607\nCC-MAIN-2019-35,eng,1292878331,1278892583,43.7547\nCC-MAIN-2019-35,epo,280281,279149,0.0095\nCC-MAIN-2019-35,est,4502008,4449448,0.1524\nCC-MAIN-2019-35,eus,1140247,1129139,0.0386\nCC-MAIN-2019-35,fao,149512,147986,0.0051\nCC-MAIN-2019-35,fas,17145084,16998729,0.5802\nCC-MAIN-2019-35,fij,2819,2805,0.0001\nCC-MAIN-2019-35,fin,11285948,11180186,0.3819\nCC-MAIN-2019-35,fra,131391269,130158607,4.4467\nCC-MAIN-2019-35,fry,85997,85470,0.0029\nCC-MAIN-2019-35,gla,42174,42071,0.0014\nCC-MAIN-2019-35,gle,166863,165727,0.0056\nCC-MAIN-2019-35,glg,1295075,1287480,0.0438\nCC-MAIN-2019-35,glv,13887,13612,0.0005\nCC-MAIN-2019-35,got,842,842,0.0000\nCC-MAIN-2019-35,grn,30760,30573,0.0010\nCC-MAIN-2019-35,guj,234146,233137,0.0079\nCC-MAIN-2019-35,hat,39476,39095,0.0013\nCC-MAIN-2019-35,hau,45025,44184,0.0015\nCC-MAIN-2019-35,haw,16145,16056,0.0005\nCC-MAIN-2019-35,heb,8485369,8394303,0.2872\nCC-MAIN-2019-35,hin,3348636,3329319,0.1133\nCC-MAIN-2019-35,hrv,6491656,6445970,0.2197\nCC-MAIN-2019-35,hun,15046166,14920769,0.5092\nCC-MAIN-2019-35,hye,1186635,1179094,0.0402\nCC-MAIN-2019-35,ibo,8918,8899,0.0003\nCC-MAIN-2019-35,iku,6086,5973,0.0002\nCC-MAIN-2019-35,
ile,15892,15834,0.0005\nCC-MAIN-2019-35,ina,25553,25176,0.0009\nCC-MAIN-2019-35,ind,22023338,21869459,0.7453\nCC-MAIN-2019-35,ipk,3234,3154,0.0001\nCC-MAIN-2019-35,isl,1214372,1203740,0.0411\nCC-MAIN-2019-35,ita,67221480,66646603,2.2750\nCC-MAIN-2019-35,jav,63296,62937,0.0021\nCC-MAIN-2019-35,jpn,139528882,138521544,4.7221\nCC-MAIN-2019-35,kal,32344,32189,0.0011\nCC-MAIN-2019-35,kan,272659,271059,0.0092\nCC-MAIN-2019-35,kas,118,118,0.0000\nCC-MAIN-2019-35,kat,1694317,1684275,0.0573\nCC-MAIN-2019-35,kaz,795183,790524,0.0269\nCC-MAIN-2019-35,kha,7775,7737,0.0003\nCC-MAIN-2019-35,khm,270607,269363,0.0092\nCC-MAIN-2019-35,kin,70553,70255,0.0024\nCC-MAIN-2019-35,kir,179155,178232,0.0061\nCC-MAIN-2019-35,kor,21727555,21639546,0.7353\nCC-MAIN-2019-35,kur,222034,220448,0.0075\nCC-MAIN-2019-35,lao,97920,97753,0.0033\nCC-MAIN-2019-35,lat,1640157,1634713,0.0555\nCC-MAIN-2019-35,lav,3788677,3749139,0.1282\nCC-MAIN-2019-35,lif,103,99,0.0000\nCC-MAIN-2019-35,lin,7873,7647,0.0003\nCC-MAIN-2019-35,lit,7163994,7108937,0.2424\nCC-MAIN-2019-35,ltz,133785,133138,0.0045\nCC-MAIN-2019-35,lug,6138,6112,0.0002\nCC-MAIN-2019-35,mal,559007,556878,0.0189\nCC-MAIN-2019-35,mar,369499,365303,0.0125\nCC-MAIN-2019-35,mfe,3501,3489,0.0001\nCC-MAIN-2019-35,mkd,724867,720720,0.0245\nCC-MAIN-2019-35,mlg,124795,124512,0.0042\nCC-MAIN-2019-35,mlt,92613,92208,0.0031\nCC-MAIN-2019-35,mon,572133,569556,0.0194\nCC-MAIN-2019-35,mri,30441,29612,0.0010\nCC-MAIN-2019-35,msa,3865219,3845733,0.1308\nCC-MAIN-2019-35,mya,312765,311298,0.0106\nCC-MAIN-2019-35,nau,1581,1569,0.0001\nCC-MAIN-2019-35,nep,515003,509932,0.0174\nCC-MAIN-2019-35,nld,50669864,50170902,1.7148\nCC-MAIN-2019-35,nno,609346,605016,0.0206\nCC-MAIN-2019-35,nor,9242653,9151578,0.3128\nCC-MAIN-2019-35,nso,5075,4974,0.0002\nCC-MAIN-2019-35,nya,7717,7688,0.0003\nCC-MAIN-2019-35,oci,133670,132604,0.0045\nCC-MAIN-2019-35,ori,76262,76057,0.0026\nCC-MAIN-2019-35,orm,14042,13979,0.0005\nCC-MAIN-2019-35,pan,151982,151653,0.0051\nCC-MAIN-2019-35,pol,49960876,
49534904,1.6908\nCC-MAIN-2019-35,por,59847290,59377082,2.0254\nCC-MAIN-2019-35,pus,101096,99850,0.0034\nCC-MAIN-2019-35,que,25930,25416,0.0009\nCC-MAIN-2019-35,roh,52376,52062,0.0018\nCC-MAIN-2019-35,ron,15980971,15864497,0.5408\nCC-MAIN-2019-35,run,4109,4081,0.0001\nCC-MAIN-2019-35,rus,202885815,201433206,6.8662\nCC-MAIN-2019-35,sag,943,938,0.0000\nCC-MAIN-2019-35,san,87598,87261,0.0030\nCC-MAIN-2019-35,sco,20668,20452,0.0007\nCC-MAIN-2019-35,sin,205682,204681,0.0070\nCC-MAIN-2019-35,slk,8667750,8592287,0.2933\nCC-MAIN-2019-35,slv,4894132,4851557,0.1656\nCC-MAIN-2019-35,smo,9409,9352,0.0003\nCC-MAIN-2019-35,sna,8025,7972,0.0003\nCC-MAIN-2019-35,snd,23453,23201,0.0008\nCC-MAIN-2019-35,som,116646,116240,0.0039\nCC-MAIN-2019-35,sot,8328,8294,0.0003\nCC-MAIN-2019-35,spa,120401300,119404190,4.0747\nCC-MAIN-2019-35,sqi,1286790,1278582,0.0435\nCC-MAIN-2019-35,srp,6969493,6915503,0.2359\nCC-MAIN-2019-35,ssw,2081,2010,0.0001\nCC-MAIN-2019-35,sun,36989,36715,0.0013\nCC-MAIN-2019-35,sux,127,127,0.0000\nCC-MAIN-2019-35,swa,229577,228616,0.0078\nCC-MAIN-2019-35,swe,22340045,22158289,0.7561\nCC-MAIN-2019-35,syr,14978,14851,0.0005\nCC-MAIN-2019-35,tam,1251112,1242357,0.0423\nCC-MAIN-2019-35,tat,195867,194231,0.0066\nCC-MAIN-2019-35,tel,470202,468667,0.0159\nCC-MAIN-2019-35,tgk,143676,143199,0.0049\nCC-MAIN-2019-35,tgl,177521,176477,0.0060\nCC-MAIN-2019-35,tha,9297938,9243272,0.3147\nCC-MAIN-2019-35,tir,21278,21143,0.0007\nCC-MAIN-2019-35,ton,5816,5805,0.0002\nCC-MAIN-2019-35,tsn,4084,4035,0.0001\nCC-MAIN-2019-35,tso,2783,2765,0.0001\nCC-MAIN-2019-35,tuk,46256,45827,0.0016\nCC-MAIN-2019-35,tur,25573772,25355058,0.8655\nCC-MAIN-2019-35,uig,33801,33473,0.0011\nCC-MAIN-2019-35,ukr,10918335,10848960,0.3695\nCC-MAIN-2019-35,urd,707840,703466,0.0240\nCC-MAIN-2019-35,uzb,554293,551295,0.0188\nCC-MAIN-2019-35,ven,1103,1098,0.0000\nCC-MAIN-2019-35,vie,22485123,22325274,0.7610\nCC-MAIN-2019-35,vol,41343,41247,0.0014\nCC-MAIN-2019-35,war,134263,133849,0.0045\nCC-MAIN-2019-35,wol,5712,5673,0.
0002\nCC-MAIN-2019-35,xho,12128,12014,0.0004\nCC-MAIN-2019-35,yid,63174,62211,0.0021\nCC-MAIN-2019-35,yor,19851,19803,0.0007\nCC-MAIN-2019-35,zha,2608,2573,0.0001\nCC-MAIN-2019-35,zho,235739707,234353838,7.9781\nCC-MAIN-2019-35,zul,24652,24545,0.0008\nCC-MAIN-2019-39,<unknown>,77754022,77754022,3.0360\nCC-MAIN-2019-39,aar,3440,3424,0.0001\nCC-MAIN-2019-39,abk,8505,8486,0.0003\nCC-MAIN-2019-39,afr,371052,369209,0.0145\nCC-MAIN-2019-39,aka,1359,1355,0.0001\nCC-MAIN-2019-39,amh,61223,60906,0.0024\nCC-MAIN-2019-39,ara,15912537,15795605,0.6213\nCC-MAIN-2019-39,asm,21316,21210,0.0008\nCC-MAIN-2019-39,aym,3125,3070,0.0001\nCC-MAIN-2019-39,aze,1646943,1637276,0.0643\nCC-MAIN-2019-39,bak,50870,50710,0.0020\nCC-MAIN-2019-39,bel,617101,612656,0.0241\nCC-MAIN-2019-39,ben,2010097,1997005,0.0785\nCC-MAIN-2019-39,bih,12642,12595,0.0005\nCC-MAIN-2019-39,bis,3952,3928,0.0002\nCC-MAIN-2019-39,blu,14065,14025,0.0005\nCC-MAIN-2019-39,bod,57531,57500,0.0022\nCC-MAIN-2019-39,bos,1258498,1252016,0.0491\nCC-MAIN-2019-39,bre,88076,87870,0.0034\nCC-MAIN-2019-39,bul,7212237,7162213,0.2816\nCC-MAIN-2019-39,cat,7372520,7315741,0.2879\nCC-MAIN-2019-39,ceb,61772,61690,0.0024\nCC-MAIN-2019-39,ces,26290352,25993646,1.0265\nCC-MAIN-2019-39,chr,1631,1629,0.0001\nCC-MAIN-2019-39,cos,57491,57272,0.0022\nCC-MAIN-2019-39,crs,2672,2608,0.0001\nCC-MAIN-2019-39,cym,320654,318793,0.0125\nCC-MAIN-2019-39,dan,10752796,10653202,0.4199\nCC-MAIN-2019-39,deu,133325568,132145333,5.2059\nCC-MAIN-2019-39,div,41094,40899,0.0016\nCC-MAIN-2019-39,dzo,1761,1761,0.0001\nCC-MAIN-2019-39,ell,14451189,14375162,0.5643\nCC-MAIN-2019-39,eng,1125378295,1113867957,43.9418\nCC-MAIN-2019-39,epo,278691,277770,0.0109\nCC-MAIN-2019-39,est,4631189,4584537,0.1808\nCC-MAIN-2019-39,eus,1135159,1118993,0.0443\nCC-MAIN-2019-39,fao,144313,143569,0.0056\nCC-MAIN-2019-39,fas,13832049,13716723,0.5401\nCC-MAIN-2019-39,fij,1884,1873,0.0001\nCC-MAIN-2019-39,fin,10110565,10016135,0.3948\nCC-MAIN-2019-39,fra,113807749,112839604,4.4438\nCC-MAIN-2019-
39,fry,77361,77150,0.0030\nCC-MAIN-2019-39,gla,34286,34233,0.0013\nCC-MAIN-2019-39,gle,164417,163440,0.0064\nCC-MAIN-2019-39,glg,1301286,1293148,0.0508\nCC-MAIN-2019-39,glv,9625,9606,0.0004\nCC-MAIN-2019-39,got,621,620,0.0000\nCC-MAIN-2019-39,grn,26705,26562,0.0010\nCC-MAIN-2019-39,guj,224047,223285,0.0087\nCC-MAIN-2019-39,hat,33901,33757,0.0013\nCC-MAIN-2019-39,hau,43297,42839,0.0017\nCC-MAIN-2019-39,haw,15405,15380,0.0006\nCC-MAIN-2019-39,heb,8402090,8325412,0.3281\nCC-MAIN-2019-39,hin,3067766,3054043,0.1198\nCC-MAIN-2019-39,hrv,6409001,6365202,0.2502\nCC-MAIN-2019-39,hun,13241006,13146198,0.5170\nCC-MAIN-2019-39,hye,1163147,1155842,0.0454\nCC-MAIN-2019-39,ibo,8357,8316,0.0003\nCC-MAIN-2019-39,iku,4724,4646,0.0002\nCC-MAIN-2019-39,ile,10290,10253,0.0004\nCC-MAIN-2019-39,ina,20538,20502,0.0008\nCC-MAIN-2019-39,ind,18932863,18805346,0.7393\nCC-MAIN-2019-39,ipk,3520,3454,0.0001\nCC-MAIN-2019-39,isl,1257667,1244814,0.0491\nCC-MAIN-2019-39,ita,57544414,57125584,2.2469\nCC-MAIN-2019-39,jav,51502,51375,0.0020\nCC-MAIN-2019-39,jpn,118155238,117319333,4.6135\nCC-MAIN-2019-39,kal,34712,34509,0.0014\nCC-MAIN-2019-39,kan,295226,293651,0.0115\nCC-MAIN-2019-39,kas,133,133,0.0000\nCC-MAIN-2019-39,kat,1521406,1515278,0.0594\nCC-MAIN-2019-39,kaz,774529,766792,0.0302\nCC-MAIN-2019-39,kha,6983,6975,0.0003\nCC-MAIN-2019-39,khm,241401,240647,0.0094\nCC-MAIN-2019-39,kin,66999,66636,0.0026\nCC-MAIN-2019-39,kir,153121,152536,0.0060\nCC-MAIN-2019-39,kor,19045934,18968952,0.7437\nCC-MAIN-2019-39,kur,223083,222085,0.0087\nCC-MAIN-2019-39,lao,91163,91030,0.0036\nCC-MAIN-2019-39,lat,1372976,1368967,0.0536\nCC-MAIN-2019-39,lav,3896311,3859418,0.1521\nCC-MAIN-2019-39,lif,80,74,0.0000\nCC-MAIN-2019-39,lin,6804,6700,0.0003\nCC-MAIN-2019-39,lit,6621720,6572143,0.2586\nCC-MAIN-2019-39,ltz,124982,124480,0.0049\nCC-MAIN-2019-39,lug,5516,5507,0.0002\nCC-MAIN-2019-39,mal,510133,508616,0.0199\nCC-MAIN-2019-39,mar,354041,346792,0.0138\nCC-MAIN-2019-39,mfe,2258,2249,0.0001\nCC-MAIN-2019-39,mkd,621391,6178
10,0.0243\nCC-MAIN-2019-39,mlg,131605,131261,0.0051\nCC-MAIN-2019-39,mlt,85230,84724,0.0033\nCC-MAIN-2019-39,mon,576917,574625,0.0225\nCC-MAIN-2019-39,mri,33485,33267,0.0013\nCC-MAIN-2019-39,msa,3630315,3613723,0.1418\nCC-MAIN-2019-39,mya,289854,288232,0.0113\nCC-MAIN-2019-39,nau,1260,1254,0.0000\nCC-MAIN-2019-39,nep,472479,469169,0.0184\nCC-MAIN-2019-39,nld,43150308,42789747,1.6849\nCC-MAIN-2019-39,nno,637168,633138,0.0249\nCC-MAIN-2019-39,nor,8278280,8197040,0.3232\nCC-MAIN-2019-39,nso,3279,3279,0.0001\nCC-MAIN-2019-39,nya,9084,9062,0.0004\nCC-MAIN-2019-39,oci,108560,108290,0.0042\nCC-MAIN-2019-39,ori,66397,66188,0.0026\nCC-MAIN-2019-39,orm,9432,9373,0.0004\nCC-MAIN-2019-39,pan,151926,151555,0.0059\nCC-MAIN-2019-39,pol,43819116,43455187,1.7110\nCC-MAIN-2019-39,por,54582139,54160714,2.1312\nCC-MAIN-2019-39,pus,94664,93803,0.0037\nCC-MAIN-2019-39,que,20750,20711,0.0008\nCC-MAIN-2019-39,roh,45431,45127,0.0018\nCC-MAIN-2019-39,ron,13825332,13737402,0.5398\nCC-MAIN-2019-39,run,2561,2533,0.0001\nCC-MAIN-2019-39,rus,169974819,168634495,6.6369\nCC-MAIN-2019-39,sag,360,359,0.0000\nCC-MAIN-2019-39,san,88850,87372,0.0035\nCC-MAIN-2019-39,sco,17673,17629,0.0007\nCC-MAIN-2019-39,sin,189130,188553,0.0074\nCC-MAIN-2019-39,slk,11609076,11507250,0.4533\nCC-MAIN-2019-39,slv,4882334,4844652,0.1906\nCC-MAIN-2019-39,smo,11512,11460,0.0004\nCC-MAIN-2019-39,sna,6863,6831,0.0003\nCC-MAIN-2019-39,snd,20674,20424,0.0008\nCC-MAIN-2019-39,som,102300,101935,0.0040\nCC-MAIN-2019-39,sot,10372,10308,0.0004\nCC-MAIN-2019-39,spa,102973860,102171592,4.0207\nCC-MAIN-2019-39,sqi,1230728,1221901,0.0481\nCC-MAIN-2019-39,srp,6878145,6825316,0.2686\nCC-MAIN-2019-39,ssw,1231,1171,0.0000\nCC-MAIN-2019-39,sun,35219,35081,0.0014\nCC-MAIN-2019-39,sux,46,46,0.0000\nCC-MAIN-2019-39,swa,227183,225522,0.0089\nCC-MAIN-2019-39,swe,19867660,19722766,0.7758\nCC-MAIN-2019-39,syr,15664,15617,0.0006\nCC-MAIN-2019-39,tam,1173244,1166632,0.0458\nCC-MAIN-2019-39,tat,177692,176281,0.0069\nCC-MAIN-2019-39,tel,447660,445909,0
.0175\nCC-MAIN-2019-39,tgk,137324,136860,0.0054\nCC-MAIN-2019-39,tgl,165636,164904,0.0065\nCC-MAIN-2019-39,tha,8010553,7964062,0.3128\nCC-MAIN-2019-39,tir,18014,17915,0.0007\nCC-MAIN-2019-39,ton,3661,3659,0.0001\nCC-MAIN-2019-39,tsn,4050,4035,0.0002\nCC-MAIN-2019-39,tso,1890,1886,0.0001\nCC-MAIN-2019-39,tuk,43263,43042,0.0017\nCC-MAIN-2019-39,tur,22192037,22009890,0.8665\nCC-MAIN-2019-39,uig,38585,38481,0.0015\nCC-MAIN-2019-39,ukr,9462650,9400688,0.3695\nCC-MAIN-2019-39,urd,664951,660108,0.0260\nCC-MAIN-2019-39,uzb,548941,544205,0.0214\nCC-MAIN-2019-39,ven,1250,1249,0.0000\nCC-MAIN-2019-39,vie,18359382,18231675,0.7169\nCC-MAIN-2019-39,vol,45940,45894,0.0018\nCC-MAIN-2019-39,war,91962,91695,0.0036\nCC-MAIN-2019-39,wol,5241,5200,0.0002\nCC-MAIN-2019-39,xho,10501,10471,0.0004\nCC-MAIN-2019-39,yid,58291,57875,0.0023\nCC-MAIN-2019-39,yor,24429,24361,0.0010\nCC-MAIN-2019-39,zha,2340,2327,0.0001\nCC-MAIN-2019-39,zho,175896132,174677752,6.8681\nCC-MAIN-2019-39,zul,26061,25979,0.0010\nCC-MAIN-2019-43,<unknown>,68333048,68333048,2.2634\nCC-MAIN-2019-43,aar,7786,7758,0.0003\nCC-MAIN-2019-43,abk,9861,9852,0.0003\nCC-MAIN-2019-43,afr,452935,448626,0.0150\nCC-MAIN-2019-43,aka,3024,3020,0.0001\nCC-MAIN-2019-43,amh,70282,69982,0.0023\nCC-MAIN-2019-43,ara,17576335,17429378,0.5822\nCC-MAIN-2019-43,asm,30001,29907,0.0010\nCC-MAIN-2019-43,aym,4041,4010,0.0001\nCC-MAIN-2019-43,aze,1708469,1698734,0.0566\nCC-MAIN-2019-43,bak,51459,51417,0.0017\nCC-MAIN-2019-43,bel,691940,681225,0.0229\nCC-MAIN-2019-43,ben,2220766,2207269,0.0736\nCC-MAIN-2019-43,bih,17504,17423,0.0006\nCC-MAIN-2019-43,bis,3217,3204,0.0001\nCC-MAIN-2019-43,blu,18882,18805,0.0006\nCC-MAIN-2019-43,bod,59359,58921,0.0020\nCC-MAIN-2019-43,bos,1336565,1331236,0.0443\nCC-MAIN-2019-43,bre,95532,95296,0.0032\nCC-MAIN-2019-43,bul,9302605,9234047,0.3081\nCC-MAIN-2019-43,cat,8485099,8433420,0.2811\nCC-MAIN-2019-43,ceb,65435,65390,0.0022\nCC-MAIN-2019-43,ces,30132506,29779035,0.9981\nCC-MAIN-2019-43,chr,2060,2058,0.0001\nCC-MAIN-2019-
43,cos,74630,74280,0.0025\nCC-MAIN-2019-43,crs,2290,2283,0.0001\nCC-MAIN-2019-43,cym,356110,354302,0.0118\nCC-MAIN-2019-43,dan,12537046,12415225,0.4153\nCC-MAIN-2019-43,deu,160518300,159044911,5.3169\nCC-MAIN-2019-43,div,40632,40472,0.0013\nCC-MAIN-2019-43,dzo,2167,2164,0.0001\nCC-MAIN-2019-43,ell,16458228,16354367,0.5451\nCC-MAIN-2019-43,eng,1305246368,1292378111,43.2339\nCC-MAIN-2019-43,epo,327182,326219,0.0108\nCC-MAIN-2019-43,est,5337746,5261123,0.1768\nCC-MAIN-2019-43,eus,1168007,1154094,0.0387\nCC-MAIN-2019-43,fao,146045,145110,0.0048\nCC-MAIN-2019-43,fas,15433238,15280448,0.5112\nCC-MAIN-2019-43,fij,1672,1663,0.0001\nCC-MAIN-2019-43,fin,11636400,11538478,0.3854\nCC-MAIN-2019-43,fra,130838304,129636658,4.3338\nCC-MAIN-2019-43,fry,96243,96061,0.0032\nCC-MAIN-2019-43,gla,41348,41253,0.0014\nCC-MAIN-2019-43,gle,185548,184641,0.0061\nCC-MAIN-2019-43,glg,1302858,1296261,0.0432\nCC-MAIN-2019-43,glv,10541,10445,0.0003\nCC-MAIN-2019-43,got,709,708,0.0000\nCC-MAIN-2019-43,grn,28275,28129,0.0009\nCC-MAIN-2019-43,guj,306958,304871,0.0102\nCC-MAIN-2019-43,hat,42246,42091,0.0014\nCC-MAIN-2019-43,hau,51728,51232,0.0017\nCC-MAIN-2019-43,haw,18889,18816,0.0006\nCC-MAIN-2019-43,heb,8299022,8232275,0.2749\nCC-MAIN-2019-43,hin,3863882,3840845,0.1280\nCC-MAIN-2019-43,hrv,7033244,6984687,0.2330\nCC-MAIN-2019-43,hun,15538830,15416126,0.5147\nCC-MAIN-2019-43,hye,1252851,1242119,0.0415\nCC-MAIN-2019-43,ibo,12650,12580,0.0004\nCC-MAIN-2019-43,iku,4871,4836,0.0002\nCC-MAIN-2019-43,ile,11244,11203,0.0004\nCC-MAIN-2019-43,ina,24968,24848,0.0008\nCC-MAIN-2019-43,ind,21183230,21035431,0.7017\nCC-MAIN-2019-43,ipk,2498,2474,0.0001\nCC-MAIN-2019-43,isl,1262710,1247981,0.0418\nCC-MAIN-2019-43,ita,68033611,67520341,2.2535\nCC-MAIN-2019-43,jav,63555,63365,0.0021\nCC-MAIN-2019-43,jpn,139070396,138108858,4.6064\nCC-MAIN-2019-43,kal,33384,33256,0.0011\nCC-MAIN-2019-43,kan,363952,359597,0.0121\nCC-MAIN-2019-43,kas,30,30,0.0000\nCC-MAIN-2019-43,kat,1586882,1578363,0.0526\nCC-MAIN-2019-43,kaz,876068,8
69001,0.0290\nCC-MAIN-2019-43,kha,4909,4891,0.0002\nCC-MAIN-2019-43,khm,267902,266781,0.0089\nCC-MAIN-2019-43,kin,76687,76497,0.0025\nCC-MAIN-2019-43,kir,179829,179252,0.0060\nCC-MAIN-2019-43,kor,23313095,23230908,0.7722\nCC-MAIN-2019-43,kur,224845,222772,0.0074\nCC-MAIN-2019-43,lao,109727,109283,0.0036\nCC-MAIN-2019-43,lat,1607792,1602180,0.0533\nCC-MAIN-2019-43,lav,4073657,4038949,0.1349\nCC-MAIN-2019-43,lif,84,81,0.0000\nCC-MAIN-2019-43,lin,8671,8652,0.0003\nCC-MAIN-2019-43,lit,7276534,7217618,0.2410\nCC-MAIN-2019-43,ltz,135673,134811,0.0045\nCC-MAIN-2019-43,lug,6758,6748,0.0002\nCC-MAIN-2019-43,mal,599035,597216,0.0198\nCC-MAIN-2019-43,mar,393313,389995,0.0130\nCC-MAIN-2019-43,mfe,1793,1789,0.0001\nCC-MAIN-2019-43,mkd,677479,674235,0.0224\nCC-MAIN-2019-43,mlg,135837,135345,0.0045\nCC-MAIN-2019-43,mlt,94256,93310,0.0031\nCC-MAIN-2019-43,mon,595935,592000,0.0197\nCC-MAIN-2019-43,mri,42271,41954,0.0014\nCC-MAIN-2019-43,msa,3911189,3898893,0.1296\nCC-MAIN-2019-43,mya,330804,329835,0.0110\nCC-MAIN-2019-43,nau,1179,1175,0.0000\nCC-MAIN-2019-43,nep,483046,478546,0.0160\nCC-MAIN-2019-43,nld,49949567,49524950,1.6545\nCC-MAIN-2019-43,nno,691983,686550,0.0229\nCC-MAIN-2019-43,nor,9175833,9100714,0.3039\nCC-MAIN-2019-43,nso,3819,3809,0.0001\nCC-MAIN-2019-43,nya,11113,11059,0.0004\nCC-MAIN-2019-43,oci,133003,132489,0.0044\nCC-MAIN-2019-43,ori,74605,74447,0.0025\nCC-MAIN-2019-43,orm,12149,12126,0.0004\nCC-MAIN-2019-43,pan,187797,187080,0.0062\nCC-MAIN-2019-43,pol,51213677,50794424,1.6964\nCC-MAIN-2019-43,por,60860932,60381112,2.0159\nCC-MAIN-2019-43,pus,92733,91228,0.0031\nCC-MAIN-2019-43,que,24083,23981,0.0008\nCC-MAIN-2019-43,roh,52501,52254,0.0017\nCC-MAIN-2019-43,ron,15610094,15499622,0.5171\nCC-MAIN-2019-43,run,2709,2678,0.0001\nCC-MAIN-2019-43,rus,196189482,194709242,6.4984\nCC-MAIN-2019-43,sag,402,402,0.0000\nCC-MAIN-2019-43,san,114002,113623,0.0038\nCC-MAIN-2019-43,sco,16681,16615,0.0006\nCC-MAIN-2019-43,sin,190504,190065,0.0063\nCC-MAIN-2019-43,slk,10168566,10068344,
0.3368\nCC-MAIN-2019-43,slv,5364438,5327100,0.1777\nCC-MAIN-2019-43,smo,11439,11375,0.0004\nCC-MAIN-2019-43,sna,6610,6566,0.0002\nCC-MAIN-2019-43,snd,23096,22647,0.0008\nCC-MAIN-2019-43,som,110226,109827,0.0037\nCC-MAIN-2019-43,sot,12493,12479,0.0004\nCC-MAIN-2019-43,spa,120487115,119569914,3.9909\nCC-MAIN-2019-43,sqi,1292384,1285434,0.0428\nCC-MAIN-2019-43,srp,7761339,7699471,0.2571\nCC-MAIN-2019-43,ssw,1353,1339,0.0000\nCC-MAIN-2019-43,sun,35085,34877,0.0012\nCC-MAIN-2019-43,sux,67,67,0.0000\nCC-MAIN-2019-43,swa,224861,223087,0.0074\nCC-MAIN-2019-43,swe,22524695,22358918,0.7461\nCC-MAIN-2019-43,syr,13808,13671,0.0005\nCC-MAIN-2019-43,tam,1426462,1418179,0.0472\nCC-MAIN-2019-43,tat,178430,177742,0.0059\nCC-MAIN-2019-43,tel,614525,612127,0.0204\nCC-MAIN-2019-43,tgk,156283,156012,0.0052\nCC-MAIN-2019-43,tgl,199991,199369,0.0066\nCC-MAIN-2019-43,tha,10740949,10658331,0.3558\nCC-MAIN-2019-43,tir,17327,17285,0.0006\nCC-MAIN-2019-43,ton,3620,3615,0.0001\nCC-MAIN-2019-43,tsn,7824,7769,0.0003\nCC-MAIN-2019-43,tso,2288,2277,0.0001\nCC-MAIN-2019-43,tuk,45642,45284,0.0015\nCC-MAIN-2019-43,tur,24893179,24674579,0.8245\nCC-MAIN-2019-43,uig,48941,48837,0.0016\nCC-MAIN-2019-43,ukr,10796779,10730673,0.3576\nCC-MAIN-2019-43,urd,796106,791571,0.0264\nCC-MAIN-2019-43,uzb,588841,585363,0.0195\nCC-MAIN-2019-43,ven,1186,1185,0.0000\nCC-MAIN-2019-43,vie,22317510,22157832,0.7392\nCC-MAIN-2019-43,vol,43663,43583,0.0014\nCC-MAIN-2019-43,war,118778,118537,0.0039\nCC-MAIN-2019-43,wol,4537,4447,0.0002\nCC-MAIN-2019-43,xho,11708,11684,0.0004\nCC-MAIN-2019-43,yid,74865,74382,0.0025\nCC-MAIN-2019-43,yor,21854,21817,0.0007\nCC-MAIN-2019-43,zha,2585,2550,0.0001\nCC-MAIN-2019-43,zho,277288657,275925883,9.1847\nCC-MAIN-2019-43,zul,30158,30126,0.0010\nCC-MAIN-2019-47,<unknown>,59006038,59006038,2.2777\nCC-MAIN-2019-47,aar,3628,3596,0.0001\nCC-MAIN-2019-47,abk,9589,9580,0.0004\nCC-MAIN-2019-47,afr,350120,347784,0.0135\nCC-MAIN-2019-47,aka,2579,2574,0.0001\nCC-MAIN-2019-47,amh,58221,57131,0.0022\nCC-MAI
N-2019-47,ara,14804478,14663359,0.5715\nCC-MAIN-2019-47,asm,20308,20172,0.0008\nCC-MAIN-2019-47,aym,2163,2129,0.0001\nCC-MAIN-2019-47,aze,1610581,1601745,0.0622\nCC-MAIN-2019-47,bak,49231,49053,0.0019\nCC-MAIN-2019-47,bel,635345,628111,0.0245\nCC-MAIN-2019-47,ben,1961358,1950536,0.0757\nCC-MAIN-2019-47,bih,14153,14109,0.0005\nCC-MAIN-2019-47,bis,4031,4019,0.0002\nCC-MAIN-2019-47,blu,15436,15290,0.0006\nCC-MAIN-2019-47,bod,65214,63886,0.0025\nCC-MAIN-2019-47,bos,1294356,1285167,0.0500\nCC-MAIN-2019-47,bre,80313,80143,0.0031\nCC-MAIN-2019-47,bul,7054467,6999684,0.2723\nCC-MAIN-2019-47,cat,8020183,7954317,0.3096\nCC-MAIN-2019-47,ceb,101306,101232,0.0039\nCC-MAIN-2019-47,ces,26229802,25953564,1.0125\nCC-MAIN-2019-47,chr,1657,1657,0.0001\nCC-MAIN-2019-47,cos,55999,55478,0.0022\nCC-MAIN-2019-47,crs,1531,1522,0.0001\nCC-MAIN-2019-47,cym,305406,303217,0.0118\nCC-MAIN-2019-47,dan,11277322,11161328,0.4353\nCC-MAIN-2019-47,deu,138414426,137054192,5.3430\nCC-MAIN-2019-47,div,39843,39730,0.0015\nCC-MAIN-2019-47,dzo,1968,1962,0.0001\nCC-MAIN-2019-47,ell,14436897,14318391,0.5573\nCC-MAIN-2019-47,eng,1133575107,1121843398,43.7573\nCC-MAIN-2019-47,epo,270148,269151,0.0104\nCC-MAIN-2019-47,est,5173046,5089521,0.1997\nCC-MAIN-2019-47,eus,1175365,1157629,0.0454\nCC-MAIN-2019-47,fao,134852,133903,0.0052\nCC-MAIN-2019-47,fas,12483575,12362944,0.4819\nCC-MAIN-2019-47,fij,1601,1596,0.0001\nCC-MAIN-2019-47,fin,10469258,10356745,0.4041\nCC-MAIN-2019-47,fra,114075636,113027439,4.4035\nCC-MAIN-2019-47,fry,77948,77797,0.0030\nCC-MAIN-2019-47,gla,32682,32560,0.0013\nCC-MAIN-2019-47,gle,159862,158785,0.0062\nCC-MAIN-2019-47,glg,1213361,1205161,0.0468\nCC-MAIN-2019-47,glv,8074,8049,0.0003\nCC-MAIN-2019-47,got,633,633,0.0000\nCC-MAIN-2019-47,grn,23338,23280,0.0009\nCC-MAIN-2019-47,guj,212946,212158,0.0082\nCC-MAIN-2019-47,hat,35564,35407,0.0014\nCC-MAIN-2019-47,hau,44360,43330,0.0017\nCC-MAIN-2019-47,haw,14723,14662,0.0006\nCC-MAIN-2019-47,heb,8500549,8423669,0.3281\nCC-MAIN-2019-47,hin,2916418,290
3068,0.1126\nCC-MAIN-2019-47,hrv,6684142,6634036,0.2580\nCC-MAIN-2019-47,hun,13133660,13028248,0.5070\nCC-MAIN-2019-47,hye,1119629,1109096,0.0432\nCC-MAIN-2019-47,ibo,8663,8654,0.0003\nCC-MAIN-2019-47,iku,4325,4230,0.0002\nCC-MAIN-2019-47,ile,7564,7545,0.0003\nCC-MAIN-2019-47,ina,20152,20128,0.0008\nCC-MAIN-2019-47,ind,19453652,19313802,0.7509\nCC-MAIN-2019-47,ipk,2049,1993,0.0001\nCC-MAIN-2019-47,isl,1369351,1343619,0.0529\nCC-MAIN-2019-47,ita,59227849,58742978,2.2863\nCC-MAIN-2019-47,jav,54359,54275,0.0021\nCC-MAIN-2019-47,jpn,116548182,115801570,4.4989\nCC-MAIN-2019-47,kal,30163,30014,0.0012\nCC-MAIN-2019-47,kan,255037,253485,0.0098\nCC-MAIN-2019-47,kas,169,169,0.0000\nCC-MAIN-2019-47,kat,1480979,1471309,0.0572\nCC-MAIN-2019-47,kaz,792486,786829,0.0306\nCC-MAIN-2019-47,kha,5541,5530,0.0002\nCC-MAIN-2019-47,khm,222440,215984,0.0086\nCC-MAIN-2019-47,kin,45074,44463,0.0017\nCC-MAIN-2019-47,kir,164449,163149,0.0063\nCC-MAIN-2019-47,kor,19183876,19094013,0.7405\nCC-MAIN-2019-47,kur,197628,195816,0.0076\nCC-MAIN-2019-47,lao,94707,89953,0.0037\nCC-MAIN-2019-47,lat,1471809,1467180,0.0568\nCC-MAIN-2019-47,lav,3883884,3847910,0.1499\nCC-MAIN-2019-47,lif,87,84,0.0000\nCC-MAIN-2019-47,lin,9785,9762,0.0004\nCC-MAIN-2019-47,lit,6831762,6771843,0.2637\nCC-MAIN-2019-47,ltz,118015,117447,0.0046\nCC-MAIN-2019-47,lug,5982,5959,0.0002\nCC-MAIN-2019-47,mal,466942,465039,0.0180\nCC-MAIN-2019-47,mar,384760,373063,0.0149\nCC-MAIN-2019-47,mfe,2990,2986,0.0001\nCC-MAIN-2019-47,mkd,586068,581247,0.0226\nCC-MAIN-2019-47,mlg,97267,96938,0.0038\nCC-MAIN-2019-47,mlt,87827,87096,0.0034\nCC-MAIN-2019-47,mon,578247,575033,0.0223\nCC-MAIN-2019-47,mri,44826,44595,0.0017\nCC-MAIN-2019-47,msa,3846716,3830890,0.1485\nCC-MAIN-2019-47,mya,295187,291042,0.0114\nCC-MAIN-2019-47,nau,769,765,0.0000\nCC-MAIN-2019-47,nep,446020,442664,0.0172\nCC-MAIN-2019-47,nld,44994077,44559785,1.7368\nCC-MAIN-2019-47,nno,619647,615705,0.0239\nCC-MAIN-2019-47,nor,10267404,10156647,0.3963\nCC-MAIN-2019-47,nso,2643,2641,0.000
1\nCC-MAIN-2019-47,nya,10938,10905,0.0004\nCC-MAIN-2019-47,oci,87497,87316,0.0034\nCC-MAIN-2019-47,ori,54731,54551,0.0021\nCC-MAIN-2019-47,orm,8367,7900,0.0003\nCC-MAIN-2019-47,pan,142683,141559,0.0055\nCC-MAIN-2019-47,pol,42461664,42074241,1.6391\nCC-MAIN-2019-47,por,55667619,55248827,2.1488\nCC-MAIN-2019-47,pus,84142,81940,0.0032\nCC-MAIN-2019-47,que,22529,22508,0.0009\nCC-MAIN-2019-47,roh,37059,36603,0.0014\nCC-MAIN-2019-47,ron,13907287,13792901,0.5368\nCC-MAIN-2019-47,run,1646,1606,0.0001\nCC-MAIN-2019-47,rus,170119732,168785073,6.5668\nCC-MAIN-2019-47,sag,462,462,0.0000\nCC-MAIN-2019-47,san,97235,96924,0.0038\nCC-MAIN-2019-47,sco,13227,13181,0.0005\nCC-MAIN-2019-47,sin,181532,180619,0.0070\nCC-MAIN-2019-47,slk,8606040,8536130,0.3322\nCC-MAIN-2019-47,slv,5274864,5229429,0.2036\nCC-MAIN-2019-47,smo,13785,13764,0.0005\nCC-MAIN-2019-47,sna,5934,5895,0.0002\nCC-MAIN-2019-47,snd,20590,20542,0.0008\nCC-MAIN-2019-47,som,88997,88349,0.0034\nCC-MAIN-2019-47,sot,8959,8922,0.0003\nCC-MAIN-2019-47,spa,107090805,106237308,4.1338\nCC-MAIN-2019-47,sqi,1203304,1195407,0.0464\nCC-MAIN-2019-47,srp,7397358,7330937,0.2855\nCC-MAIN-2019-47,ssw,691,687,0.0000\nCC-MAIN-2019-47,sun,31491,31287,0.0012\nCC-MAIN-2019-47,sux,89,88,0.0000\nCC-MAIN-2019-47,swa,197843,196247,0.0076\nCC-MAIN-2019-47,swe,19844757,19668411,0.7660\nCC-MAIN-2019-47,syr,15170,14955,0.0006\nCC-MAIN-2019-47,tam,1150511,1145577,0.0444\nCC-MAIN-2019-47,tat,161922,160005,0.0063\nCC-MAIN-2019-47,tel,433416,431767,0.0167\nCC-MAIN-2019-47,tgk,145813,144932,0.0056\nCC-MAIN-2019-47,tgl,164480,164030,0.0063\nCC-MAIN-2019-47,tha,8743485,8688960,0.3375\nCC-MAIN-2019-47,tir,19378,17061,0.0007\nCC-MAIN-2019-47,ton,2738,2733,0.0001\nCC-MAIN-2019-47,tsn,4866,4806,0.0002\nCC-MAIN-2019-47,tso,1123,1120,0.0000\nCC-MAIN-2019-47,tuk,40225,39859,0.0016\nCC-MAIN-2019-47,tur,21779530,21594773,0.8407\nCC-MAIN-2019-47,uig,43656,43572,0.0017\nCC-MAIN-2019-47,ukr,9085067,9025850,0.3507\nCC-MAIN-2019-47,urd,683323,679104,0.0264\nCC-MAIN-2019-47
,uzb,587252,580642,0.0227\nCC-MAIN-2019-47,ven,2604,2602,0.0001\nCC-MAIN-2019-47,vie,19206124,19043596,0.7414\nCC-MAIN-2019-47,vol,36875,36856,0.0014\nCC-MAIN-2019-47,war,87816,87511,0.0034\nCC-MAIN-2019-47,wol,3942,3931,0.0002\nCC-MAIN-2019-47,xho,9192,9156,0.0004\nCC-MAIN-2019-47,yid,68904,68823,0.0027\nCC-MAIN-2019-47,yor,24269,24213,0.0009\nCC-MAIN-2019-47,zha,1415,1403,0.0001\nCC-MAIN-2019-47,zho,203704135,202699828,7.8632\nCC-MAIN-2019-47,zul,28250,28188,0.0011\nCC-MAIN-2019-51,<unknown>,49492126,49492126,2.0022\nCC-MAIN-2019-51,aar,4814,4780,0.0002\nCC-MAIN-2019-51,abk,9258,9256,0.0004\nCC-MAIN-2019-51,afr,299488,297968,0.0121\nCC-MAIN-2019-51,aka,2596,2533,0.0001\nCC-MAIN-2019-51,amh,54235,53339,0.0022\nCC-MAIN-2019-51,ara,14422661,14258503,0.5835\nCC-MAIN-2019-51,asm,23837,23690,0.0010\nCC-MAIN-2019-51,aym,1727,1724,0.0001\nCC-MAIN-2019-51,aze,1336094,1330823,0.0541\nCC-MAIN-2019-51,bak,43966,43826,0.0018\nCC-MAIN-2019-51,bel,536917,533555,0.0217\nCC-MAIN-2019-51,ben,1746829,1737822,0.0707\nCC-MAIN-2019-51,bih,15704,15680,0.0006\nCC-MAIN-2019-51,bis,2292,2284,0.0001\nCC-MAIN-2019-51,blu,12968,12193,0.0005\nCC-MAIN-2019-51,bod,50639,49881,0.0020\nCC-MAIN-2019-51,bos,1088619,1078879,0.0440\nCC-MAIN-2019-51,bre,79602,79529,0.0032\nCC-MAIN-2019-51,bul,7260164,7209376,0.2937\nCC-MAIN-2019-51,cat,6971412,6930649,0.2820\nCC-MAIN-2019-51,ceb,108330,108313,0.0044\nCC-MAIN-2019-51,ces,24906730,24670337,1.0076\nCC-MAIN-2019-51,chr,1905,1905,0.0001\nCC-MAIN-2019-51,cos,59903,59276,0.0024\nCC-MAIN-2019-51,crs,1636,1631,0.0001\nCC-MAIN-2019-51,cym,277999,276872,0.0112\nCC-MAIN-2019-51,dan,10740468,10642753,0.4345\nCC-MAIN-2019-51,deu,135336635,134103469,5.4750\nCC-MAIN-2019-51,div,37916,37835,0.0015\nCC-MAIN-2019-51,dzo,1994,1982,0.0001\nCC-MAIN-2019-51,ell,13638356,13548972,0.5517\nCC-MAIN-2019-51,eng,1077214925,1066854082,43.5783\nCC-MAIN-2019-51,epo,308225,306627,0.0125\nCC-MAIN-2019-51,est,4212472,4144041,0.1704\nCC-MAIN-2019-51,eus,939808,925134,0.0380\nCC-MAIN-2019
-51,fao,110279,109509,0.0045\nCC-MAIN-2019-51,fas,13571219,13449822,0.5490\nCC-MAIN-2019-51,fij,1617,1609,0.0001\nCC-MAIN-2019-51,fin,10083916,9992456,0.4079\nCC-MAIN-2019-51,fra,110799596,109819182,4.4824\nCC-MAIN-2019-51,fry,69413,69282,0.0028\nCC-MAIN-2019-51,gla,29825,29590,0.0012\nCC-MAIN-2019-51,gle,144460,143543,0.0058\nCC-MAIN-2019-51,glg,1041615,1038004,0.0421\nCC-MAIN-2019-51,glv,7980,7961,0.0003\nCC-MAIN-2019-51,got,839,833,0.0000\nCC-MAIN-2019-51,grn,20718,20674,0.0008\nCC-MAIN-2019-51,guj,216239,210535,0.0087\nCC-MAIN-2019-51,hat,38056,37948,0.0015\nCC-MAIN-2019-51,hau,36383,35469,0.0015\nCC-MAIN-2019-51,haw,12626,12585,0.0005\nCC-MAIN-2019-51,heb,7074132,7021695,0.2862\nCC-MAIN-2019-51,hin,2678133,2667056,0.1083\nCC-MAIN-2019-51,hrv,5481854,5443461,0.2218\nCC-MAIN-2019-51,hun,12677604,12584168,0.5129\nCC-MAIN-2019-51,hye,1011067,1005754,0.0409\nCC-MAIN-2019-51,ibo,11149,11141,0.0005\nCC-MAIN-2019-51,iku,4961,4903,0.0002\nCC-MAIN-2019-51,ile,7066,7043,0.0003\nCC-MAIN-2019-51,ina,18830,18788,0.0008\nCC-MAIN-2019-51,ind,17918044,17796989,0.7249\nCC-MAIN-2019-51,ipk,1955,1897,0.0001\nCC-MAIN-2019-51,isl,1108127,1088324,0.0448\nCC-MAIN-2019-51,ita,57018242,56588766,2.3067\nCC-MAIN-2019-51,jav,60060,60013,0.0024\nCC-MAIN-2019-51,jpn,110066223,109409645,4.4527\nCC-MAIN-2019-51,kal,23791,23519,0.0010\nCC-MAIN-2019-51,kan,229338,228744,0.0093\nCC-MAIN-2019-51,kas,39,39,0.0000\nCC-MAIN-2019-51,kat,1299361,1292769,0.0526\nCC-MAIN-2019-51,kaz,665703,661263,0.0269\nCC-MAIN-2019-51,kha,3907,3900,0.0002\nCC-MAIN-2019-51,khm,209200,205720,0.0085\nCC-MAIN-2019-51,kin,43500,42956,0.0018\nCC-MAIN-2019-51,kir,165673,165140,0.0067\nCC-MAIN-2019-51,kor,19704683,19620034,0.7971\nCC-MAIN-2019-51,kur,177474,176484,0.0072\nCC-MAIN-2019-51,lao,84977,81580,0.0034\nCC-MAIN-2019-51,lat,1449015,1444385,0.0586\nCC-MAIN-2019-51,lav,3047609,3021796,0.1233\nCC-MAIN-2019-51,lif,134,126,0.0000\nCC-MAIN-2019-51,lin,5261,5161,0.0002\nCC-MAIN-2019-51,lit,5549743,5509888,0.2245\nCC-MAIN-2019-
51,ltz,119163,118896,0.0048\nCC-MAIN-2019-51,lug,5056,4991,0.0002\nCC-MAIN-2019-51,mal,456951,455903,0.0185\nCC-MAIN-2019-51,mar,368753,363025,0.0149\nCC-MAIN-2019-51,mfe,2122,2115,0.0001\nCC-MAIN-2019-51,mkd,604594,599600,0.0245\nCC-MAIN-2019-51,mlg,98967,98757,0.0040\nCC-MAIN-2019-51,mlt,81907,81039,0.0033\nCC-MAIN-2019-51,mon,495397,491615,0.0200\nCC-MAIN-2019-51,mri,30736,30572,0.0012\nCC-MAIN-2019-51,msa,3731164,3719558,0.1509\nCC-MAIN-2019-51,mya,372723,367657,0.0151\nCC-MAIN-2019-51,nau,680,674,0.0000\nCC-MAIN-2019-51,nep,397344,394494,0.0161\nCC-MAIN-2019-51,new,2,2,0.0000\nCC-MAIN-2019-51,nld,42562272,42175613,1.7218\nCC-MAIN-2019-51,nno,566665,563658,0.0229\nCC-MAIN-2019-51,nor,8380112,8294913,0.3390\nCC-MAIN-2019-51,nso,4008,4007,0.0002\nCC-MAIN-2019-51,nya,5488,5478,0.0002\nCC-MAIN-2019-51,oci,109682,109542,0.0044\nCC-MAIN-2019-51,ori,55096,55000,0.0022\nCC-MAIN-2019-51,orm,10445,10190,0.0004\nCC-MAIN-2019-51,pan,145273,144958,0.0059\nCC-MAIN-2019-51,pol,41034937,40664763,1.6601\nCC-MAIN-2019-51,por,52296623,51937970,2.1156\nCC-MAIN-2019-51,pus,72936,71854,0.0030\nCC-MAIN-2019-51,que,22616,22606,0.0009\nCC-MAIN-2019-51,roh,32527,32395,0.0013\nCC-MAIN-2019-51,ron,13504096,13404736,0.5463\nCC-MAIN-2019-51,run,2101,2040,0.0001\nCC-MAIN-2019-51,rus,161693419,160427825,6.5412\nCC-MAIN-2019-51,sag,429,429,0.0000\nCC-MAIN-2019-51,san,73253,73122,0.0030\nCC-MAIN-2019-51,sco,12451,12413,0.0005\nCC-MAIN-2019-51,sin,166925,165946,0.0068\nCC-MAIN-2019-51,slk,7609015,7542365,0.3078\nCC-MAIN-2019-51,slv,4142345,4115473,0.1676\nCC-MAIN-2019-51,smo,7394,7362,0.0003\nCC-MAIN-2019-51,sna,5849,5835,0.0002\nCC-MAIN-2019-51,snd,18355,18249,0.0007\nCC-MAIN-2019-51,som,86738,86222,0.0035\nCC-MAIN-2019-51,sot,13972,13945,0.0006\nCC-MAIN-2019-51,spa,104514386,103709696,4.2281\nCC-MAIN-2019-51,sqi,1073284,1064910,0.0434\nCC-MAIN-2019-51,srp,6052522,5997481,0.2449\nCC-MAIN-2019-51,ssw,950,942,0.0000\nCC-MAIN-2019-51,sun,32422,32260,0.0013\nCC-MAIN-2019-51,sux,60,60,0.0000\nCC-MAIN
-2019-51,swa,188582,187670,0.0076\nCC-MAIN-2019-51,swe,19003395,18857261,0.7688\nCC-MAIN-2019-51,syr,12684,12613,0.0005\nCC-MAIN-2019-51,tam,1161279,1157454,0.0470\nCC-MAIN-2019-51,tat,152177,151463,0.0062\nCC-MAIN-2019-51,tel,425966,424373,0.0172\nCC-MAIN-2019-51,tgk,145591,144843,0.0059\nCC-MAIN-2019-51,tgl,173164,172689,0.0070\nCC-MAIN-2019-51,tha,8311885,8258065,0.3363\nCC-MAIN-2019-51,tir,21548,19673,0.0009\nCC-MAIN-2019-51,ton,2040,2040,0.0001\nCC-MAIN-2019-51,tsn,6099,5924,0.0002\nCC-MAIN-2019-51,tso,5271,5255,0.0002\nCC-MAIN-2019-51,tuk,39846,39621,0.0016\nCC-MAIN-2019-51,tur,20285234,20118855,0.8206\nCC-MAIN-2019-51,uig,34049,33997,0.0014\nCC-MAIN-2019-51,ukr,8725126,8673919,0.3530\nCC-MAIN-2019-51,urd,634200,631112,0.0257\nCC-MAIN-2019-51,uzb,502226,498676,0.0203\nCC-MAIN-2019-51,ven,695,693,0.0000\nCC-MAIN-2019-51,vie,18609154,18464444,0.7528\nCC-MAIN-2019-51,vol,34677,34645,0.0014\nCC-MAIN-2019-51,war,106468,106249,0.0043\nCC-MAIN-2019-51,wol,3987,3974,0.0002\nCC-MAIN-2019-51,xho,8147,8136,0.0003\nCC-MAIN-2019-51,yid,67168,67139,0.0027\nCC-MAIN-2019-51,yor,23812,23774,0.0010\nCC-MAIN-2019-51,zha,1911,1893,0.0001\nCC-MAIN-2019-51,zho,206893092,205955109,8.3698\nCC-MAIN-2019-51,zul,26401,26371,0.0011\nCC-MAIN-2020-05,<unknown>,55645952,55645952,1.7944\nCC-MAIN-2020-05,aar,5329,5295,0.0002\nCC-MAIN-2020-05,abk,12123,12105,0.0004\nCC-MAIN-2020-05,afr,368432,367236,0.0119\nCC-MAIN-2020-05,aka,2994,2992,0.0001\nCC-MAIN-2020-05,amh,71116,69935,0.0023\nCC-MAIN-2020-05,ara,16458287,16285429,0.5307\nCC-MAIN-2020-05,asm,26365,26247,0.0009\nCC-MAIN-2020-05,aym,3489,3476,0.0001\nCC-MAIN-2020-05,aze,1416806,1410897,0.0457\nCC-MAIN-2020-05,bak,66369,66312,0.0021\nCC-MAIN-2020-05,bel,645629,640135,0.0208\nCC-MAIN-2020-05,ben,2010455,1995427,0.0648\nCC-MAIN-2020-05,bih,21632,21450,0.0007\nCC-MAIN-2020-05,bis,3707,3702,0.0001\nCC-MAIN-2020-05,blu,13673,13070,0.0004\nCC-MAIN-2020-05,bod,61240,60782,0.0020\nCC-MAIN-2020-05,bos,1266438,1256065,0.0408\nCC-MAIN-2020-05,bre,113
478,113286,0.0037\nCC-MAIN-2020-05,bul,8641281,8579881,0.2787\nCC-MAIN-2020-05,cat,8506097,8451262,0.2743\nCC-MAIN-2020-05,ceb,94296,94275,0.0030\nCC-MAIN-2020-05,ces,32835365,32497062,1.0588\nCC-MAIN-2020-05,chr,2729,2727,0.0001\nCC-MAIN-2020-05,cos,74218,73364,0.0024\nCC-MAIN-2020-05,crs,1904,1902,0.0001\nCC-MAIN-2020-05,cym,357453,355518,0.0115\nCC-MAIN-2020-05,dan,14156742,14009506,0.4565\nCC-MAIN-2020-05,deu,175911564,174141615,5.6726\nCC-MAIN-2020-05,div,45886,45449,0.0015\nCC-MAIN-2020-05,dzo,2541,2541,0.0001\nCC-MAIN-2020-05,ell,16846663,16716385,0.5432\nCC-MAIN-2020-05,eng,1369923445,1355999659,44.1754\nCC-MAIN-2020-05,epo,302777,301985,0.0098\nCC-MAIN-2020-05,est,5034428,4974298,0.1623\nCC-MAIN-2020-05,eus,1110767,1099017,0.0358\nCC-MAIN-2020-05,fao,134233,133466,0.0043\nCC-MAIN-2020-05,fas,15776532,15621864,0.5087\nCC-MAIN-2020-05,fij,2476,2471,0.0001\nCC-MAIN-2020-05,fin,13076030,12946698,0.4217\nCC-MAIN-2020-05,fra,143760178,142413672,4.6358\nCC-MAIN-2020-05,fry,91382,91187,0.0029\nCC-MAIN-2020-05,gla,44113,44030,0.0014\nCC-MAIN-2020-05,gle,183988,182874,0.0059\nCC-MAIN-2020-05,glg,1228453,1221969,0.0396\nCC-MAIN-2020-05,glv,13717,13694,0.0004\nCC-MAIN-2020-05,got,1363,1360,0.0000\nCC-MAIN-2020-05,grn,22229,22082,0.0007\nCC-MAIN-2020-05,guj,250735,246268,0.0081\nCC-MAIN-2020-05,hat,48226,47882,0.0016\nCC-MAIN-2020-05,hau,42069,41565,0.0014\nCC-MAIN-2020-05,haw,13269,13181,0.0004\nCC-MAIN-2020-05,heb,8914615,8831167,0.2875\nCC-MAIN-2020-05,hin,3067211,3048584,0.0989\nCC-MAIN-2020-05,hrv,6448096,6395799,0.2079\nCC-MAIN-2020-05,hun,15956591,15822885,0.5145\nCC-MAIN-2020-05,hye,1149074,1142837,0.0371\nCC-MAIN-2020-05,ibo,7773,7745,0.0003\nCC-MAIN-2020-05,iku,7195,7099,0.0002\nCC-MAIN-2020-05,ile,8392,8360,0.0003\nCC-MAIN-2020-05,ina,23589,23529,0.0008\nCC-MAIN-2020-05,ind,22793912,22612403,0.7350\nCC-MAIN-2020-05,ipk,3134,3000,0.0001\nCC-MAIN-2020-05,isl,1375351,1352291,0.0444\nCC-MAIN-2020-05,ita,73303541,72700619,2.3638\nCC-MAIN-2020-05,jav,72000,71874,0.
0023\nCC-MAIN-2020-05,jpn,144490249,143586999,4.6593\nCC-MAIN-2020-05,kal,33120,32820,0.0011\nCC-MAIN-2020-05,kan,255679,253867,0.0082\nCC-MAIN-2020-05,kas,182,182,0.0000\nCC-MAIN-2020-05,kat,1455299,1446412,0.0469\nCC-MAIN-2020-05,kaz,755987,749004,0.0244\nCC-MAIN-2020-05,kha,5265,5242,0.0002\nCC-MAIN-2020-05,khm,242996,239696,0.0078\nCC-MAIN-2020-05,kin,51767,50773,0.0017\nCC-MAIN-2020-05,kir,191475,190978,0.0062\nCC-MAIN-2020-05,kor,23755322,23636221,0.7660\nCC-MAIN-2020-05,kur,214450,212469,0.0069\nCC-MAIN-2020-05,lao,95936,93829,0.0031\nCC-MAIN-2020-05,lat,2298488,2292170,0.0741\nCC-MAIN-2020-05,lav,3553784,3525174,0.1146\nCC-MAIN-2020-05,lif,53,51,0.0000\nCC-MAIN-2020-05,lin,7014,6948,0.0002\nCC-MAIN-2020-05,lit,6284863,6235115,0.2027\nCC-MAIN-2020-05,ltz,133758,133290,0.0043\nCC-MAIN-2020-05,lug,5716,5711,0.0002\nCC-MAIN-2020-05,mal,528790,524972,0.0171\nCC-MAIN-2020-05,mar,457184,452481,0.0147\nCC-MAIN-2020-05,mfe,2203,2189,0.0001\nCC-MAIN-2020-05,mkd,763911,757151,0.0246\nCC-MAIN-2020-05,mlg,114557,114340,0.0037\nCC-MAIN-2020-05,mlt,99704,98597,0.0032\nCC-MAIN-2020-05,mon,556606,551632,0.0179\nCC-MAIN-2020-05,mri,39981,39813,0.0013\nCC-MAIN-2020-05,msa,4769640,4754481,0.1538\nCC-MAIN-2020-05,mya,386261,378884,0.0125\nCC-MAIN-2020-05,nau,855,849,0.0000\nCC-MAIN-2020-05,nep,504002,498495,0.0163\nCC-MAIN-2020-05,new,17,17,0.0000\nCC-MAIN-2020-05,nld,55848187,55279057,1.8009\nCC-MAIN-2020-05,nno,665061,661169,0.0214\nCC-MAIN-2020-05,nor,10718534,10601727,0.3456\nCC-MAIN-2020-05,nso,5668,5667,0.0002\nCC-MAIN-2020-05,nya,6057,6045,0.0002\nCC-MAIN-2020-05,oci,134644,133934,0.0043\nCC-MAIN-2020-05,ori,61595,61023,0.0020\nCC-MAIN-2020-05,orm,10496,10414,0.0003\nCC-MAIN-2020-05,pan,171249,169329,0.0055\nCC-MAIN-2020-05,pol,52016828,51520866,1.6774\nCC-MAIN-2020-05,por,67169667,66652285,2.1660\nCC-MAIN-2020-05,pus,88008,87155,0.0028\nCC-MAIN-2020-05,que,33519,33490,0.0011\nCC-MAIN-2020-05,roh,41298,41086,0.0013\nCC-MAIN-2020-05,ron,16970205,16822468,0.5472\nCC-MAIN-20
20-05,run,2504,2425,0.0001\nCC-MAIN-2020-05,rus,206873420,205142957,6.6710\nCC-MAIN-2020-05,sag,739,739,0.0000\nCC-MAIN-2020-05,san,89000,88382,0.0029\nCC-MAIN-2020-05,sco,15674,15630,0.0005\nCC-MAIN-2020-05,sin,197414,195717,0.0064\nCC-MAIN-2020-05,slk,10442027,10347535,0.3367\nCC-MAIN-2020-05,slv,4943676,4904444,0.1594\nCC-MAIN-2020-05,smo,8004,7956,0.0003\nCC-MAIN-2020-05,sna,7465,7429,0.0002\nCC-MAIN-2020-05,snd,26483,26324,0.0009\nCC-MAIN-2020-05,som,107587,106970,0.0035\nCC-MAIN-2020-05,sot,10181,10160,0.0003\nCC-MAIN-2020-05,spa,133327951,132188751,4.2994\nCC-MAIN-2020-05,sqi,1182034,1172178,0.0381\nCC-MAIN-2020-05,srp,7114831,7046661,0.2294\nCC-MAIN-2020-05,ssw,1081,1076,0.0000\nCC-MAIN-2020-05,sun,38892,38801,0.0013\nCC-MAIN-2020-05,sux,47,47,0.0000\nCC-MAIN-2020-05,swa,226725,225318,0.0073\nCC-MAIN-2020-05,swe,24264337,24026639,0.7824\nCC-MAIN-2020-05,syr,11966,11930,0.0004\nCC-MAIN-2020-05,tam,1422056,1413596,0.0459\nCC-MAIN-2020-05,tat,208525,207936,0.0067\nCC-MAIN-2020-05,tel,530418,528354,0.0171\nCC-MAIN-2020-05,tgk,165441,164659,0.0053\nCC-MAIN-2020-05,tgl,202997,202384,0.0065\nCC-MAIN-2020-05,tha,10147301,10073065,0.3272\nCC-MAIN-2020-05,tir,21703,21152,0.0007\nCC-MAIN-2020-05,ton,1883,1882,0.0001\nCC-MAIN-2020-05,tsn,9267,9064,0.0003\nCC-MAIN-2020-05,tso,1998,1997,0.0001\nCC-MAIN-2020-05,tuk,43865,43556,0.0014\nCC-MAIN-2020-05,tur,25234178,25016291,0.8137\nCC-MAIN-2020-05,uig,43797,43665,0.0014\nCC-MAIN-2020-05,ukr,10767748,10693121,0.3472\nCC-MAIN-2020-05,urd,748790,740917,0.0241\nCC-MAIN-2020-05,uzb,583902,580036,0.0188\nCC-MAIN-2020-05,ven,986,985,0.0000\nCC-MAIN-2020-05,vie,23056197,22857612,0.7435\nCC-MAIN-2020-05,vol,35263,35247,0.0011\nCC-MAIN-2020-05,war,133950,133582,0.0043\nCC-MAIN-2020-05,wol,5198,5186,0.0002\nCC-MAIN-2020-05,xho,9446,9416,0.0003\nCC-MAIN-2020-05,yid,84711,84673,0.0027\nCC-MAIN-2020-05,yor,29762,29722,0.0010\nCC-MAIN-2020-05,zha,2433,2429,0.0001\nCC-MAIN-2020-05,zho,222817090,221713019,7.1851\nCC-MAIN-2020-05,zul,18963,18
947,0.0006\nCC-MAIN-2020-10,<unknown>,60503588,60503588,2.3005\nCC-MAIN-2020-10,aar,3660,3609,0.0001\nCC-MAIN-2020-10,abk,7648,7639,0.0003\nCC-MAIN-2020-10,afr,275550,274518,0.0105\nCC-MAIN-2020-10,aka,2266,2259,0.0001\nCC-MAIN-2020-10,amh,48896,48756,0.0019\nCC-MAIN-2020-10,ara,15037318,14908782,0.5718\nCC-MAIN-2020-10,asm,20591,20529,0.0008\nCC-MAIN-2020-10,aym,1891,1875,0.0001\nCC-MAIN-2020-10,aze,1265345,1258932,0.0481\nCC-MAIN-2020-10,bak,30998,30974,0.0012\nCC-MAIN-2020-10,bel,480513,478298,0.0183\nCC-MAIN-2020-10,ben,1739875,1731729,0.0662\nCC-MAIN-2020-10,bih,10513,10479,0.0004\nCC-MAIN-2020-10,bis,3994,3986,0.0002\nCC-MAIN-2020-10,blu,8732,8715,0.0003\nCC-MAIN-2020-10,bod,38148,38078,0.0015\nCC-MAIN-2020-10,bos,1023585,1017694,0.0389\nCC-MAIN-2020-10,bre,63495,63424,0.0024\nCC-MAIN-2020-10,bul,7536516,7489505,0.2866\nCC-MAIN-2020-10,cat,6835332,6789173,0.2599\nCC-MAIN-2020-10,ceb,69004,68957,0.0026\nCC-MAIN-2020-10,ces,26633610,26360218,1.0127\nCC-MAIN-2020-10,chr,1018,1018,0.0000\nCC-MAIN-2020-10,cos,53059,52756,0.0020\nCC-MAIN-2020-10,crs,1797,1784,0.0001\nCC-MAIN-2020-10,cym,271819,270220,0.0103\nCC-MAIN-2020-10,dan,11558013,11448900,0.4395\nCC-MAIN-2020-10,deu,146413965,144955802,5.5671\nCC-MAIN-2020-10,div,42264,42130,0.0016\nCC-MAIN-2020-10,dzo,1931,1931,0.0001\nCC-MAIN-2020-10,ell,14037484,13951839,0.5338\nCC-MAIN-2020-10,eng,1118115804,1107143745,42.5145\nCC-MAIN-2020-10,epo,236993,236087,0.0090\nCC-MAIN-2020-10,est,4181864,4146203,0.1590\nCC-MAIN-2020-10,eus,905164,892917,0.0344\nCC-MAIN-2020-10,fao,104915,104403,0.0040\nCC-MAIN-2020-10,fas,13904753,13791278,0.5287\nCC-MAIN-2020-10,fij,2292,2286,0.0001\nCC-MAIN-2020-10,fin,10220564,10128103,0.3886\nCC-MAIN-2020-10,fra,118484916,117418841,4.5052\nCC-MAIN-2020-10,fry,71067,70795,0.0027\nCC-MAIN-2020-10,gla,29254,29200,0.0011\nCC-MAIN-2020-10,gle,151843,151114,0.0058\nCC-MAIN-2020-10,glg,1028924,1023395,0.0391\nCC-MAIN-2020-10,glv,8905,8893,0.0003\nCC-MAIN-2020-10,got,488,488,0.0000\nCC-MAIN-2020-10,g
rn,18055,18010,0.0007\nCC-MAIN-2020-10,guj,214455,212922,0.0082\nCC-MAIN-2020-10,hat,30642,30565,0.0012\nCC-MAIN-2020-10,hau,36656,36381,0.0014\nCC-MAIN-2020-10,haw,11025,10947,0.0004\nCC-MAIN-2020-10,heb,7314034,7249240,0.2781\nCC-MAIN-2020-10,hin,2763801,2750502,0.1051\nCC-MAIN-2020-10,hrv,5391539,5353124,0.2050\nCC-MAIN-2020-10,hun,13354650,13260690,0.5078\nCC-MAIN-2020-10,hye,1003257,996839,0.0381\nCC-MAIN-2020-10,ibo,9798,9775,0.0004\nCC-MAIN-2020-10,iku,4529,4496,0.0002\nCC-MAIN-2020-10,ile,6953,6932,0.0003\nCC-MAIN-2020-10,ina,14817,14787,0.0006\nCC-MAIN-2020-10,ind,18548274,18417578,0.7053\nCC-MAIN-2020-10,ipk,1803,1753,0.0001\nCC-MAIN-2020-10,isl,1032749,1016227,0.0393\nCC-MAIN-2020-10,ita,60334400,59887626,2.2941\nCC-MAIN-2020-10,jav,43988,43902,0.0017\nCC-MAIN-2020-10,jpn,127916585,127209550,4.8638\nCC-MAIN-2020-10,kal,31176,31049,0.0012\nCC-MAIN-2020-10,kan,238471,237765,0.0091\nCC-MAIN-2020-10,kas,48,48,0.0000\nCC-MAIN-2020-10,kat,1236605,1230662,0.0470\nCC-MAIN-2020-10,kaz,629113,624032,0.0239\nCC-MAIN-2020-10,kha,5731,5696,0.0002\nCC-MAIN-2020-10,khm,210690,209540,0.0080\nCC-MAIN-2020-10,kin,39644,39418,0.0015\nCC-MAIN-2020-10,kir,155210,154803,0.0059\nCC-MAIN-2020-10,kor,21573992,21484980,0.8203\nCC-MAIN-2020-10,kur,177993,176991,0.0068\nCC-MAIN-2020-10,lao,66561,66419,0.0025\nCC-MAIN-2020-10,lat,2244102,2237163,0.0853\nCC-MAIN-2020-10,lav,3019922,2991653,0.1148\nCC-MAIN-2020-10,lif,93,81,0.0000\nCC-MAIN-2020-10,lin,5540,5525,0.0002\nCC-MAIN-2020-10,lit,5104984,5063899,0.1941\nCC-MAIN-2020-10,ltz,101000,100442,0.0038\nCC-MAIN-2020-10,lug,5041,5031,0.0002\nCC-MAIN-2020-10,mal,467927,466196,0.0178\nCC-MAIN-2020-10,mar,336359,331764,0.0128\nCC-MAIN-2020-10,mfe,1797,1777,0.0001\nCC-MAIN-2020-10,mkd,640830,636787,0.0244\nCC-MAIN-2020-10,mlg,87184,86971,0.0033\nCC-MAIN-2020-10,mlt,76101,75635,0.0029\nCC-MAIN-2020-10,mon,467069,465029,0.0178\nCC-MAIN-2020-10,mri,25250,25107,0.0010\nCC-MAIN-2020-10,msa,2924636,2914712,0.1112\nCC-MAIN-2020-10,mya,279283,27835
5,0.0106\nCC-MAIN-2020-10,nau,842,838,0.0000\nCC-MAIN-2020-10,nep,402348,400601,0.0153\nCC-MAIN-2020-10,new,143,143,0.0000\nCC-MAIN-2020-10,nld,45605800,45149637,1.7341\nCC-MAIN-2020-10,nno,467648,464680,0.0178\nCC-MAIN-2020-10,nor,8481407,8397581,0.3225\nCC-MAIN-2020-10,nso,1506,1506,0.0001\nCC-MAIN-2020-10,nya,5870,5845,0.0002\nCC-MAIN-2020-10,oci,81748,81539,0.0031\nCC-MAIN-2020-10,ori,50360,50305,0.0019\nCC-MAIN-2020-10,orm,6171,6145,0.0002\nCC-MAIN-2020-10,pan,140450,140042,0.0053\nCC-MAIN-2020-10,pol,44433331,44041494,1.6895\nCC-MAIN-2020-10,por,56209517,55818467,2.1373\nCC-MAIN-2020-10,pus,66230,65816,0.0025\nCC-MAIN-2020-10,que,14404,14392,0.0005\nCC-MAIN-2020-10,roh,57381,57217,0.0022\nCC-MAIN-2020-10,ron,14701420,14585188,0.5590\nCC-MAIN-2020-10,run,2637,2499,0.0001\nCC-MAIN-2020-10,rus,172689286,171413054,6.5662\nCC-MAIN-2020-10,sag,269,269,0.0000\nCC-MAIN-2020-10,san,76372,76150,0.0029\nCC-MAIN-2020-10,sco,15105,15064,0.0006\nCC-MAIN-2020-10,sin,162640,161606,0.0062\nCC-MAIN-2020-10,slk,9273024,9193341,0.3526\nCC-MAIN-2020-10,slv,4251296,4216265,0.1616\nCC-MAIN-2020-10,smo,6348,6295,0.0002\nCC-MAIN-2020-10,sna,5506,5483,0.0002\nCC-MAIN-2020-10,snd,19617,19424,0.0007\nCC-MAIN-2020-10,som,90578,90257,0.0034\nCC-MAIN-2020-10,sot,8677,8665,0.0003\nCC-MAIN-2020-10,spa,108486095,107655963,4.1250\nCC-MAIN-2020-10,sqi,1020332,1014739,0.0388\nCC-MAIN-2020-10,srp,5893693,5842853,0.2241\nCC-MAIN-2020-10,ssw,908,901,0.0000\nCC-MAIN-2020-10,sun,25289,25184,0.0010\nCC-MAIN-2020-10,sux,59,59,0.0000\nCC-MAIN-2020-10,swa,159676,158730,0.0061\nCC-MAIN-2020-10,swe,19768541,19590266,0.7517\nCC-MAIN-2020-10,syr,13657,13629,0.0005\nCC-MAIN-2020-10,tam,1104975,1101554,0.0420\nCC-MAIN-2020-10,tat,141742,141549,0.0054\nCC-MAIN-2020-10,tel,413879,411613,0.0157\nCC-MAIN-2020-10,tgk,116464,115951,0.0044\nCC-MAIN-2020-10,tgl,142301,141635,0.0054\nCC-MAIN-2020-10,tha,8605611,8555705,0.3272\nCC-MAIN-2020-10,tir,14656,14552,0.0006\nCC-MAIN-2020-10,ton,1666,1665,0.0001\nCC-MAIN-2020-10,
tsn,8221,8139,0.0003\nCC-MAIN-2020-10,tso,892,887,0.0000\nCC-MAIN-2020-10,tuk,35154,34976,0.0013\nCC-MAIN-2020-10,tur,22131882,21961070,0.8415\nCC-MAIN-2020-10,uig,40811,40789,0.0016\nCC-MAIN-2020-10,ukr,9529640,9472936,0.3623\nCC-MAIN-2020-10,urd,546223,543099,0.0208\nCC-MAIN-2020-10,uzb,442071,439981,0.0168\nCC-MAIN-2020-10,ven,909,908,0.0000\nCC-MAIN-2020-10,vie,18745307,18602585,0.7128\nCC-MAIN-2020-10,vol,40221,40206,0.0015\nCC-MAIN-2020-10,war,74135,73716,0.0028\nCC-MAIN-2020-10,wol,4105,4081,0.0002\nCC-MAIN-2020-10,xho,9492,9471,0.0004\nCC-MAIN-2020-10,yid,40171,40152,0.0015\nCC-MAIN-2020-10,yor,17654,17616,0.0007\nCC-MAIN-2020-10,zha,989,986,0.0000\nCC-MAIN-2020-10,zho,235369023,234400870,8.9495\nCC-MAIN-2020-10,zul,14561,14531,0.0006\nCC-MAIN-2020-16,<unknown>,71244517,71244517,2.4684\nCC-MAIN-2020-16,aar,5490,5465,0.0002\nCC-MAIN-2020-16,abk,10823,10742,0.0004\nCC-MAIN-2020-16,afr,328015,325528,0.0114\nCC-MAIN-2020-16,aka,2083,2080,0.0001\nCC-MAIN-2020-16,amh,62258,61707,0.0022\nCC-MAIN-2020-16,ara,14435760,14299264,0.5002\nCC-MAIN-2020-16,asm,21231,21150,0.0007\nCC-MAIN-2020-16,aym,2463,2426,0.0001\nCC-MAIN-2020-16,aze,1512092,1503381,0.0524\nCC-MAIN-2020-16,bak,38231,38154,0.0013\nCC-MAIN-2020-16,bel,558764,555934,0.0194\nCC-MAIN-2020-16,ben,1975279,1965598,0.0684\nCC-MAIN-2020-16,bih,17543,17482,0.0006\nCC-MAIN-2020-16,bis,4014,4006,0.0001\nCC-MAIN-2020-16,blu,12796,12731,0.0004\nCC-MAIN-2020-16,bod,49211,49133,0.0017\nCC-MAIN-2020-16,bos,1179747,1172228,0.0409\nCC-MAIN-2020-16,bre,86762,86680,0.0030\nCC-MAIN-2020-16,bul,9612951,9544222,0.3331\nCC-MAIN-2020-16,cat,8351137,8288880,0.2893\nCC-MAIN-2020-16,ceb,43089,43058,0.0015\nCC-MAIN-2020-16,ces,30801759,30524936,1.0672\nCC-MAIN-2020-16,chr,1919,1917,0.0001\nCC-MAIN-2020-16,cos,68960,68757,0.0024\nCC-MAIN-2020-16,crs,2571,2566,0.0001\nCC-MAIN-2020-16,cym,351053,349226,0.0122\nCC-MAIN-2020-16,dan,13740381,13620149,0.4761\nCC-MAIN-2020-16,deu,166238267,164574249,5.7597\nCC-MAIN-2020-16,div,45236,45103,0.
0016\nCC-MAIN-2020-16,dzo,2734,2734,0.0001\nCC-MAIN-2020-16,ell,14808881,14709957,0.5131\nCC-MAIN-2020-16,eng,1230417570,1218716211,42.6305\nCC-MAIN-2020-16,epo,230860,230127,0.0080\nCC-MAIN-2020-16,est,5327221,5281549,0.1846\nCC-MAIN-2020-16,eus,1119061,1106835,0.0388\nCC-MAIN-2020-16,fao,141616,140989,0.0049\nCC-MAIN-2020-16,fas,15222785,15079555,0.5274\nCC-MAIN-2020-16,fij,2828,2824,0.0001\nCC-MAIN-2020-16,fin,11976219,11867022,0.4149\nCC-MAIN-2020-16,fra,131318453,130153919,4.5498\nCC-MAIN-2020-16,fry,87041,86656,0.0030\nCC-MAIN-2020-16,gla,40618,40556,0.0014\nCC-MAIN-2020-16,gle,194966,194094,0.0068\nCC-MAIN-2020-16,glg,1287185,1278885,0.0446\nCC-MAIN-2020-16,glv,13488,13467,0.0005\nCC-MAIN-2020-16,got,1143,1141,0.0000\nCC-MAIN-2020-16,grn,21078,21005,0.0007\nCC-MAIN-2020-16,guj,214031,211151,0.0074\nCC-MAIN-2020-16,hat,37796,37638,0.0013\nCC-MAIN-2020-16,hau,38690,38184,0.0013\nCC-MAIN-2020-16,haw,11135,11116,0.0004\nCC-MAIN-2020-16,heb,9387313,9303276,0.3252\nCC-MAIN-2020-16,hin,2942743,2922709,0.1020\nCC-MAIN-2020-16,hrv,6816983,6768352,0.2362\nCC-MAIN-2020-16,hun,14822754,14704298,0.5136\nCC-MAIN-2020-16,hye,1099670,1091914,0.0381\nCC-MAIN-2020-16,ibo,10903,10882,0.0004\nCC-MAIN-2020-16,iku,6850,6584,0.0002\nCC-MAIN-2020-16,ile,7481,7441,0.0003\nCC-MAIN-2020-16,ina,22485,22419,0.0008\nCC-MAIN-2020-16,ind,20893943,20759962,0.7239\nCC-MAIN-2020-16,ipk,2879,2824,0.0001\nCC-MAIN-2020-16,isl,1362473,1347351,0.0472\nCC-MAIN-2020-16,ita,67800294,67273336,2.3491\nCC-MAIN-2020-16,jav,60922,60877,0.0021\nCC-MAIN-2020-16,jpn,138240687,137395531,4.7897\nCC-MAIN-2020-16,kal,34441,34126,0.0012\nCC-MAIN-2020-16,kan,221715,220832,0.0077\nCC-MAIN-2020-16,kas,170,170,0.0000\nCC-MAIN-2020-16,kat,1427407,1418578,0.0495\nCC-MAIN-2020-16,kaz,733396,727659,0.0254\nCC-MAIN-2020-16,kha,5074,5047,0.0002\nCC-MAIN-2020-16,khm,212589,210426,0.0074\nCC-MAIN-2020-16,kin,40637,39978,0.0014\nCC-MAIN-2020-16,kir,177649,176853,0.0062\nCC-MAIN-2020-16,kor,21135259,21030198,0.7323\nCC-MAIN-202
0-16,kur,196377,195668,0.0068\nCC-MAIN-2020-16,lao,75607,75425,0.0026\nCC-MAIN-2020-16,lat,2831907,2825904,0.0981\nCC-MAIN-2020-16,lav,3963519,3929578,0.1373\nCC-MAIN-2020-16,lif,91,88,0.0000\nCC-MAIN-2020-16,lin,8273,8236,0.0003\nCC-MAIN-2020-16,lit,6689226,6639914,0.2318\nCC-MAIN-2020-16,ltz,131785,131116,0.0046\nCC-MAIN-2020-16,lug,5544,5538,0.0002\nCC-MAIN-2020-16,mal,467474,464669,0.0162\nCC-MAIN-2020-16,mar,359720,353471,0.0125\nCC-MAIN-2020-16,mfe,1785,1761,0.0001\nCC-MAIN-2020-16,mkd,677425,670514,0.0235\nCC-MAIN-2020-16,mlg,89412,89110,0.0031\nCC-MAIN-2020-16,mlt,85188,84466,0.0030\nCC-MAIN-2020-16,mon,564131,561293,0.0195\nCC-MAIN-2020-16,mri,29842,29731,0.0010\nCC-MAIN-2020-16,msa,3400462,3388050,0.1178\nCC-MAIN-2020-16,mya,320266,318973,0.0111\nCC-MAIN-2020-16,nau,972,963,0.0000\nCC-MAIN-2020-16,nep,452768,449910,0.0157\nCC-MAIN-2020-16,new,134,134,0.0000\nCC-MAIN-2020-16,nld,54367712,53868986,1.8837\nCC-MAIN-2020-16,nno,606854,602421,0.0210\nCC-MAIN-2020-16,nor,9906047,9800595,0.3432\nCC-MAIN-2020-16,nso,3609,3608,0.0001\nCC-MAIN-2020-16,nya,7932,7893,0.0003\nCC-MAIN-2020-16,oci,90794,90593,0.0031\nCC-MAIN-2020-16,ori,52457,52306,0.0018\nCC-MAIN-2020-16,orm,7404,7346,0.0003\nCC-MAIN-2020-16,pan,156527,155611,0.0054\nCC-MAIN-2020-16,pol,49702960,49220902,1.7221\nCC-MAIN-2020-16,por,61266196,60810740,2.1227\nCC-MAIN-2020-16,pus,73107,72824,0.0025\nCC-MAIN-2020-16,que,24375,24354,0.0008\nCC-MAIN-2020-16,roh,59012,58315,0.0020\nCC-MAIN-2020-16,ron,16257101,16135211,0.5633\nCC-MAIN-2020-16,run,2603,2544,0.0001\nCC-MAIN-2020-16,rus,199942773,198403710,6.9275\nCC-MAIN-2020-16,sag,642,641,0.0000\nCC-MAIN-2020-16,san,86167,85240,0.0030\nCC-MAIN-2020-16,sco,17013,16950,0.0006\nCC-MAIN-2020-16,sin,188617,187889,0.0065\nCC-MAIN-2020-16,slk,9174966,9097865,0.3179\nCC-MAIN-2020-16,slv,5546977,5498855,0.1922\nCC-MAIN-2020-16,smo,13218,13183,0.0005\nCC-MAIN-2020-16,sna,6416,6395,0.0002\nCC-MAIN-2020-16,snd,27355,27031,0.0009\nCC-MAIN-2020-16,som,83116,82915,0.0029\nCC-
MAIN-2020-16,sot,10523,10472,0.0004\nCC-MAIN-2020-16,spa,117914699,116962092,4.0854\nCC-MAIN-2020-16,sqi,1127669,1117139,0.0391\nCC-MAIN-2020-16,srp,7367299,7299423,0.2553\nCC-MAIN-2020-16,ssw,931,920,0.0000\nCC-MAIN-2020-16,sun,33933,33831,0.0012\nCC-MAIN-2020-16,sux,68,68,0.0000\nCC-MAIN-2020-16,swa,209738,208795,0.0073\nCC-MAIN-2020-16,swe,22532769,22320809,0.7807\nCC-MAIN-2020-16,syr,13787,13741,0.0005\nCC-MAIN-2020-16,tam,1167799,1161729,0.0405\nCC-MAIN-2020-16,tat,158963,158308,0.0055\nCC-MAIN-2020-16,tel,459063,457431,0.0159\nCC-MAIN-2020-16,tgk,149242,148836,0.0052\nCC-MAIN-2020-16,tgl,185565,184297,0.0064\nCC-MAIN-2020-16,tha,8689641,8638234,0.3011\nCC-MAIN-2020-16,tir,21962,21815,0.0008\nCC-MAIN-2020-16,ton,1559,1557,0.0001\nCC-MAIN-2020-16,tsn,7815,7719,0.0003\nCC-MAIN-2020-16,tso,1674,1671,0.0001\nCC-MAIN-2020-16,tuk,44290,43825,0.0015\nCC-MAIN-2020-16,tur,23667840,23489426,0.8200\nCC-MAIN-2020-16,uig,48316,48286,0.0017\nCC-MAIN-2020-16,ukr,10500589,10431554,0.3638\nCC-MAIN-2020-16,urd,586551,582863,0.0203\nCC-MAIN-2020-16,uzb,533137,529383,0.0185\nCC-MAIN-2020-16,ven,897,896,0.0000\nCC-MAIN-2020-16,vie,20920807,20755700,0.7248\nCC-MAIN-2020-16,vol,40440,40426,0.0014\nCC-MAIN-2020-16,war,89806,89480,0.0031\nCC-MAIN-2020-16,wol,6096,5961,0.0002\nCC-MAIN-2020-16,xho,10810,10771,0.0004\nCC-MAIN-2020-16,yid,52359,52297,0.0018\nCC-MAIN-2020-16,yor,26003,25898,0.0009\nCC-MAIN-2020-16,zha,2307,2302,0.0001\nCC-MAIN-2020-16,zho,220824816,219789633,7.6510\nCC-MAIN-2020-16,zul,16098,16063,0.0006\nCC-MAIN-2020-24,<unknown>,59522517,59522517,2.1541\nCC-MAIN-2020-24,aar,4052,4033,0.0001\nCC-MAIN-2020-24,abk,11740,11622,0.0004\nCC-MAIN-2020-24,afr,330192,328554,0.0119\nCC-MAIN-2020-24,aka,1279,1277,0.0000\nCC-MAIN-2020-24,amh,71308,70031,0.0026\nCC-MAIN-2020-24,ara,17114822,16958396,0.6194\nCC-MAIN-2020-24,asm,25309,25132,0.0009\nCC-MAIN-2020-24,aym,3288,3276,0.0001\nCC-MAIN-2020-24,aze,1900176,1886016,0.0688\nCC-MAIN-2020-24,bak,39525,39440,0.0014\nCC-MAIN-2020-24,bel
,574835,572045,0.0208\nCC-MAIN-2020-24,ben,2419440,2405804,0.0876\nCC-MAIN-2020-24,bih,15301,15210,0.0006\nCC-MAIN-2020-24,bis,2827,2819,0.0001\nCC-MAIN-2020-24,blu,13256,13130,0.0005\nCC-MAIN-2020-24,bod,47323,47085,0.0017\nCC-MAIN-2020-24,bos,1366077,1355912,0.0494\nCC-MAIN-2020-24,bre,88161,88039,0.0032\nCC-MAIN-2020-24,bul,10532681,10450125,0.3812\nCC-MAIN-2020-24,cat,8383654,8300665,0.3034\nCC-MAIN-2020-24,ceb,67152,67096,0.0024\nCC-MAIN-2020-24,ces,27496656,27218572,0.9951\nCC-MAIN-2020-24,chr,1657,1650,0.0001\nCC-MAIN-2020-24,cos,65437,64959,0.0024\nCC-MAIN-2020-24,crs,1454,1440,0.0001\nCC-MAIN-2020-24,cym,358027,355514,0.0130\nCC-MAIN-2020-24,dan,12667055,12532685,0.4584\nCC-MAIN-2020-24,deu,153641053,152029948,5.5602\nCC-MAIN-2020-24,div,56900,56497,0.0021\nCC-MAIN-2020-24,dzo,2255,2245,0.0001\nCC-MAIN-2020-24,ell,15737142,15633814,0.5695\nCC-MAIN-2020-24,eng,1169681402,1158419660,42.3306\nCC-MAIN-2020-24,epo,233927,232751,0.0085\nCC-MAIN-2020-24,est,5525446,5468351,0.2000\nCC-MAIN-2020-24,eus,1183303,1170173,0.0428\nCC-MAIN-2020-24,fao,149680,148965,0.0054\nCC-MAIN-2020-24,fas,16313340,16158829,0.5904\nCC-MAIN-2020-24,fij,1829,1826,0.0001\nCC-MAIN-2020-24,fin,11085491,10972289,0.4012\nCC-MAIN-2020-24,fra,121895645,120724482,4.4114\nCC-MAIN-2020-24,fry,87467,86784,0.0032\nCC-MAIN-2020-24,gla,38827,38730,0.0014\nCC-MAIN-2020-24,gle,176890,176086,0.0064\nCC-MAIN-2020-24,glg,1336937,1326431,0.0484\nCC-MAIN-2020-24,glv,10239,10219,0.0004\nCC-MAIN-2020-24,got,511,510,0.0000\nCC-MAIN-2020-24,grn,18842,18764,0.0007\nCC-MAIN-2020-24,guj,240732,239494,0.0087\nCC-MAIN-2020-24,hat,47150,46972,0.0017\nCC-MAIN-2020-24,hau,44070,43694,0.0016\nCC-MAIN-2020-24,haw,10562,10522,0.0004\nCC-MAIN-2020-24,heb,9210954,9111088,0.3333\nCC-MAIN-2020-24,hin,3220515,3201225,0.1165\nCC-MAIN-2020-24,hrv,7537696,7476703,0.2728\nCC-MAIN-2020-24,hun,14698987,14580467,0.5320\nCC-MAIN-2020-24,hye,1250331,1240743,0.0452\nCC-MAIN-2020-24,ibo,10707,10616,0.0004\nCC-MAIN-2020-24,iku,5458,5416,0.
0002\nCC-MAIN-2020-24,ile,6967,6945,0.0003\nCC-MAIN-2020-24,ina,23236,23199,0.0008\nCC-MAIN-2020-24,ind,20976956,20822901,0.7592\nCC-MAIN-2020-24,ipk,2818,2785,0.0001\nCC-MAIN-2020-24,isl,1340623,1325752,0.0485\nCC-MAIN-2020-24,ita,64524138,63986214,2.3351\nCC-MAIN-2020-24,jav,64295,64112,0.0023\nCC-MAIN-2020-24,jpn,130184339,129381159,4.7113\nCC-MAIN-2020-24,kal,35763,35635,0.0013\nCC-MAIN-2020-24,kan,256935,256043,0.0093\nCC-MAIN-2020-24,kas,73,73,0.0000\nCC-MAIN-2020-24,kat,1679469,1668548,0.0608\nCC-MAIN-2020-24,kaz,834844,827576,0.0302\nCC-MAIN-2020-24,kha,4256,4208,0.0002\nCC-MAIN-2020-24,khm,264498,262276,0.0096\nCC-MAIN-2020-24,kin,51116,50870,0.0018\nCC-MAIN-2020-24,kir,201272,200187,0.0073\nCC-MAIN-2020-24,kor,23669451,23555716,0.8566\nCC-MAIN-2020-24,kur,225476,224008,0.0082\nCC-MAIN-2020-24,lao,78060,77873,0.0028\nCC-MAIN-2020-24,lat,3086138,3078040,0.1117\nCC-MAIN-2020-24,lav,4241005,4194240,0.1535\nCC-MAIN-2020-24,lif,33,33,0.0000\nCC-MAIN-2020-24,lin,10888,10874,0.0004\nCC-MAIN-2020-24,lit,7476366,7403577,0.2706\nCC-MAIN-2020-24,ltz,123480,122852,0.0045\nCC-MAIN-2020-24,lug,7841,7833,0.0003\nCC-MAIN-2020-24,mal,565127,562141,0.0205\nCC-MAIN-2020-24,mar,382408,378979,0.0138\nCC-MAIN-2020-24,mfe,1537,1523,0.0001\nCC-MAIN-2020-24,mkd,758678,751658,0.0275\nCC-MAIN-2020-24,mlg,99536,98707,0.0036\nCC-MAIN-2020-24,mlt,96806,96062,0.0035\nCC-MAIN-2020-24,mon,637849,634559,0.0231\nCC-MAIN-2020-24,mri,29848,29614,0.0011\nCC-MAIN-2020-24,msa,3421758,3402987,0.1238\nCC-MAIN-2020-24,mya,321637,319789,0.0116\nCC-MAIN-2020-24,nau,784,780,0.0000\nCC-MAIN-2020-24,nep,573108,570259,0.0207\nCC-MAIN-2020-24,new,35,35,0.0000\nCC-MAIN-2020-24,nld,49465307,48966039,1.7901\nCC-MAIN-2020-24,nno,569052,564860,0.0206\nCC-MAIN-2020-24,nor,9607000,9505300,0.3477\nCC-MAIN-2020-24,nso,2822,2820,0.0001\nCC-MAIN-2020-24,nya,9466,9353,0.0003\nCC-MAIN-2020-24,oci,94354,94148,0.0034\nCC-MAIN-2020-24,ori,73753,73623,0.0027\nCC-MAIN-2020-24,orm,9466,9418,0.0003\nCC-MAIN-2020-24,pan,180389
,179395,0.0065\nCC-MAIN-2020-24,pol,48887354,48426507,1.7692\nCC-MAIN-2020-24,por,61701683,61201707,2.2330\nCC-MAIN-2020-24,pus,88491,87979,0.0032\nCC-MAIN-2020-24,que,21987,21950,0.0008\nCC-MAIN-2020-24,roh,60995,60619,0.0022\nCC-MAIN-2020-24,ron,16710263,16566620,0.6047\nCC-MAIN-2020-24,run,2036,2017,0.0001\nCC-MAIN-2020-24,rus,187203158,185664898,6.7749\nCC-MAIN-2020-24,sag,215,215,0.0000\nCC-MAIN-2020-24,san,91713,90965,0.0033\nCC-MAIN-2020-24,sco,16105,16032,0.0006\nCC-MAIN-2020-24,sin,218721,217823,0.0079\nCC-MAIN-2020-24,slk,8478284,8393563,0.3068\nCC-MAIN-2020-24,slv,6047717,5991722,0.2189\nCC-MAIN-2020-24,smo,12501,12441,0.0005\nCC-MAIN-2020-24,sna,11340,11309,0.0004\nCC-MAIN-2020-24,snd,32387,32030,0.0012\nCC-MAIN-2020-24,som,131440,131132,0.0048\nCC-MAIN-2020-24,sot,12014,11985,0.0004\nCC-MAIN-2020-24,spa,116398487,115413676,4.2124\nCC-MAIN-2020-24,sqi,1405955,1395006,0.0509\nCC-MAIN-2020-24,srp,8018632,7942717,0.2902\nCC-MAIN-2020-24,ssw,877,867,0.0000\nCC-MAIN-2020-24,sun,31378,31301,0.0011\nCC-MAIN-2020-24,sux,54,54,0.0000\nCC-MAIN-2020-24,swa,218490,216709,0.0079\nCC-MAIN-2020-24,swe,21206534,21004796,0.7675\nCC-MAIN-2020-24,syr,13918,13880,0.0005\nCC-MAIN-2020-24,tam,1243762,1236052,0.0450\nCC-MAIN-2020-24,tat,177078,176080,0.0064\nCC-MAIN-2020-24,tel,508632,506893,0.0184\nCC-MAIN-2020-24,tgk,159129,158341,0.0058\nCC-MAIN-2020-24,tgl,181878,180776,0.0066\nCC-MAIN-2020-24,tha,9687735,9630067,0.3506\nCC-MAIN-2020-24,tir,17860,17763,0.0006\nCC-MAIN-2020-24,ton,2212,2207,0.0001\nCC-MAIN-2020-24,tsn,8242,8180,0.0003\nCC-MAIN-2020-24,tso,1108,1104,0.0000\nCC-MAIN-2020-24,tuk,49715,49390,0.0018\nCC-MAIN-2020-24,tur,25741844,25509041,0.9316\nCC-MAIN-2020-24,uig,49260,49211,0.0018\nCC-MAIN-2020-24,ukr,10659848,10578042,0.3858\nCC-MAIN-2020-24,urd,679744,675428,0.0246\nCC-MAIN-2020-24,uzb,603528,598649,0.0218\nCC-MAIN-2020-24,ven,837,833,0.0000\nCC-MAIN-2020-24,vie,21271407,21090462,0.7698\nCC-MAIN-2020-24,vol,32095,32037,0.0012\nCC-MAIN-2020-24,war,86726,8638
6,0.0031\nCC-MAIN-2020-24,wol,3825,3809,0.0001\nCC-MAIN-2020-24,xho,13127,13078,0.0005\nCC-MAIN-2020-24,yid,55047,54870,0.0020\nCC-MAIN-2020-24,yor,24771,24705,0.0009\nCC-MAIN-2020-24,zha,1390,1387,0.0001\nCC-MAIN-2020-24,zho,212049832,210986221,7.6740\nCC-MAIN-2020-24,zul,22856,22780,0.0008\nCC-MAIN-2020-29,<unknown>,63590044,63590044,2.0221\nCC-MAIN-2020-29,aar,7388,7365,0.0002\nCC-MAIN-2020-29,abk,14542,14509,0.0005\nCC-MAIN-2020-29,afr,360165,358420,0.0115\nCC-MAIN-2020-29,aka,1735,1734,0.0001\nCC-MAIN-2020-29,amh,75810,75382,0.0024\nCC-MAIN-2020-29,ara,17504649,17360788,0.5566\nCC-MAIN-2020-29,asm,31211,30972,0.0010\nCC-MAIN-2020-29,aym,3559,3518,0.0001\nCC-MAIN-2020-29,aze,1717594,1704907,0.0546\nCC-MAIN-2020-29,bak,43940,43874,0.0014\nCC-MAIN-2020-29,bel,613169,608149,0.0195\nCC-MAIN-2020-29,ben,2375508,2361414,0.0755\nCC-MAIN-2020-29,bih,19497,19431,0.0006\nCC-MAIN-2020-29,bis,4705,4689,0.0001\nCC-MAIN-2020-29,blu,13117,13078,0.0004\nCC-MAIN-2020-29,bod,45564,45203,0.0014\nCC-MAIN-2020-29,bos,1307757,1299363,0.0416\nCC-MAIN-2020-29,bre,111971,111313,0.0036\nCC-MAIN-2020-29,bul,9966938,9893159,0.3169\nCC-MAIN-2020-29,cat,8541397,8459164,0.2716\nCC-MAIN-2020-29,ceb,56322,56255,0.0018\nCC-MAIN-2020-29,ces,33361996,33004462,1.0609\nCC-MAIN-2020-29,chr,2497,2488,0.0001\nCC-MAIN-2020-29,cos,73184,72981,0.0023\nCC-MAIN-2020-29,crs,1790,1784,0.0001\nCC-MAIN-2020-29,cym,389405,386938,0.0124\nCC-MAIN-2020-29,dan,14525853,14362935,0.4619\nCC-MAIN-2020-29,deu,178821800,176844138,5.6864\nCC-MAIN-2020-29,div,63813,63497,0.0020\nCC-MAIN-2020-29,dzo,2981,2977,0.0001\nCC-MAIN-2020-29,ell,17770175,17646972,0.5651\nCC-MAIN-2020-29,eng,1365003279,1350855247,43.4060\nCC-MAIN-2020-29,epo,264844,264245,0.0084\nCC-MAIN-2020-29,est,5187786,5139644,0.1650\nCC-MAIN-2020-29,eus,1196958,1184072,0.0381\nCC-MAIN-2020-29,fao,146747,145516,0.0047\nCC-MAIN-2020-29,fas,18018863,17844047,0.5730\nCC-MAIN-2020-29,fij,2577,2568,0.0001\nCC-MAIN-2020-29,fin,13128533,12975146,0.4175\nCC-MAIN-2020-29
,fra,146145276,144582780,4.6473\nCC-MAIN-2020-29,fry,90083,89663,0.0029\nCC-MAIN-2020-29,gla,41175,41102,0.0013\nCC-MAIN-2020-29,gle,211996,210996,0.0067\nCC-MAIN-2020-29,glg,1319199,1311973,0.0419\nCC-MAIN-2020-29,glv,14663,14643,0.0005\nCC-MAIN-2020-29,got,1523,1521,0.0000\nCC-MAIN-2020-29,grn,21379,21257,0.0007\nCC-MAIN-2020-29,guj,253841,252377,0.0081\nCC-MAIN-2020-29,hat,50066,49810,0.0016\nCC-MAIN-2020-29,hau,44682,44527,0.0014\nCC-MAIN-2020-29,haw,11336,11299,0.0004\nCC-MAIN-2020-29,heb,9412872,9311587,0.2993\nCC-MAIN-2020-29,hin,3292090,3271915,0.1047\nCC-MAIN-2020-29,hrv,7176613,7113663,0.2282\nCC-MAIN-2020-29,hun,16880313,16726242,0.5368\nCC-MAIN-2020-29,hye,1239058,1232107,0.0394\nCC-MAIN-2020-29,ibo,12168,12141,0.0004\nCC-MAIN-2020-29,iku,7588,7487,0.0002\nCC-MAIN-2020-29,ile,9336,9314,0.0003\nCC-MAIN-2020-29,ina,20849,20769,0.0007\nCC-MAIN-2020-29,ind,23828411,23630283,0.7577\nCC-MAIN-2020-29,ipk,3818,3752,0.0001\nCC-MAIN-2020-29,isl,1356607,1345210,0.0431\nCC-MAIN-2020-29,ita,76451976,75756294,2.4311\nCC-MAIN-2020-29,jav,73033,72765,0.0023\nCC-MAIN-2020-29,jpn,152383698,151328615,4.8457\nCC-MAIN-2020-29,kal,38872,38622,0.0012\nCC-MAIN-2020-29,kan,281719,280232,0.0090\nCC-MAIN-2020-29,kas,173,173,0.0000\nCC-MAIN-2020-29,kat,1545937,1537976,0.0492\nCC-MAIN-2020-29,kaz,797359,789940,0.0254\nCC-MAIN-2020-29,kha,4532,4507,0.0001\nCC-MAIN-2020-29,khm,256433,255065,0.0082\nCC-MAIN-2020-29,kin,51005,50558,0.0016\nCC-MAIN-2020-29,kir,175501,174824,0.0056\nCC-MAIN-2020-29,kor,24847663,24731924,0.7901\nCC-MAIN-2020-29,kur,212256,209573,0.0067\nCC-MAIN-2020-29,lao,82873,82440,0.0026\nCC-MAIN-2020-29,lat,4715922,4707491,0.1500\nCC-MAIN-2020-29,lav,3890462,3851516,0.1237\nCC-MAIN-2020-29,lif,50,48,0.0000\nCC-MAIN-2020-29,lin,7363,7342,0.0002\nCC-MAIN-2020-29,lit,6613586,6553506,0.2103\nCC-MAIN-2020-29,ltz,131446,130960,0.0042\nCC-MAIN-2020-29,lug,7198,7119,0.0002\nCC-MAIN-2020-29,mal,577713,575424,0.0184\nCC-MAIN-2020-29,mar,426899,422752,0.0136\nCC-MAIN-2020-29,mfe
,1678,1653,0.0001\nCC-MAIN-2020-29,mkd,830348,823511,0.0264\nCC-MAIN-2020-29,mlg,112371,111827,0.0036\nCC-MAIN-2020-29,mlt,106684,104412,0.0034\nCC-MAIN-2020-29,mon,598791,596581,0.0190\nCC-MAIN-2020-29,mri,35170,34812,0.0011\nCC-MAIN-2020-29,msa,3843511,3825665,0.1222\nCC-MAIN-2020-29,mya,380205,377967,0.0121\nCC-MAIN-2020-29,nau,954,948,0.0000\nCC-MAIN-2020-29,nep,571095,566551,0.0182\nCC-MAIN-2020-29,new,2,2,0.0000\nCC-MAIN-2020-29,nld,57480843,56860419,1.8278\nCC-MAIN-2020-29,nno,615734,611557,0.0196\nCC-MAIN-2020-29,nor,11067991,10937732,0.3520\nCC-MAIN-2020-29,nso,4109,4103,0.0001\nCC-MAIN-2020-29,nya,8293,8226,0.0003\nCC-MAIN-2020-29,oci,105689,105434,0.0034\nCC-MAIN-2020-29,ori,72858,72397,0.0023\nCC-MAIN-2020-29,orm,10201,10176,0.0003\nCC-MAIN-2020-29,pan,148652,147391,0.0047\nCC-MAIN-2020-29,pol,55398038,54846611,1.7616\nCC-MAIN-2020-29,por,68380096,67802053,2.1744\nCC-MAIN-2020-29,pus,92074,91430,0.0029\nCC-MAIN-2020-29,que,28771,28721,0.0009\nCC-MAIN-2020-29,roh,41339,41215,0.0013\nCC-MAIN-2020-29,ron,18781663,18612044,0.5972\nCC-MAIN-2020-29,run,2321,2304,0.0001\nCC-MAIN-2020-29,rus,223863063,221798417,7.1187\nCC-MAIN-2020-29,sag,696,695,0.0000\nCC-MAIN-2020-29,san,98651,97598,0.0031\nCC-MAIN-2020-29,sco,16571,16499,0.0005\nCC-MAIN-2020-29,sin,232591,230938,0.0074\nCC-MAIN-2020-29,slk,10136876,10016565,0.3223\nCC-MAIN-2020-29,slv,5531327,5480255,0.1759\nCC-MAIN-2020-29,smo,12359,12313,0.0004\nCC-MAIN-2020-29,sna,7382,7345,0.0002\nCC-MAIN-2020-29,snd,33446,33118,0.0011\nCC-MAIN-2020-29,som,111889,111144,0.0036\nCC-MAIN-2020-29,sot,14102,13995,0.0004\nCC-MAIN-2020-29,spa,135814588,134532982,4.3188\nCC-MAIN-2020-29,sqi,1366116,1355384,0.0434\nCC-MAIN-2020-29,srp,7790074,7724436,0.2477\nCC-MAIN-2020-29,ssw,1177,1171,0.0000\nCC-MAIN-2020-29,sun,41855,41717,0.0013\nCC-MAIN-2020-29,sux,82,82,0.0000\nCC-MAIN-2020-29,swa,223639,221292,0.0071\nCC-MAIN-2020-29,swe,24533576,24272408,0.7801\nCC-MAIN-2020-29,syr,14853,14823,0.0005\nCC-MAIN-2020-29,tam,1384546,1374880
,0.0440\nCC-MAIN-2020-29,tat,207270,206118,0.0066\nCC-MAIN-2020-29,tel,515581,513547,0.0164\nCC-MAIN-2020-29,tgk,193445,192950,0.0062\nCC-MAIN-2020-29,tgl,186512,185672,0.0059\nCC-MAIN-2020-29,tha,10348539,10284251,0.3291\nCC-MAIN-2020-29,tir,16843,16609,0.0005\nCC-MAIN-2020-29,ton,1656,1652,0.0001\nCC-MAIN-2020-29,tsn,6958,6899,0.0002\nCC-MAIN-2020-29,tso,1720,1713,0.0001\nCC-MAIN-2020-29,tuk,53459,53074,0.0017\nCC-MAIN-2020-29,tur,28114010,27846770,0.8940\nCC-MAIN-2020-29,uig,51774,51530,0.0016\nCC-MAIN-2020-29,ukr,11781824,11688969,0.3747\nCC-MAIN-2020-29,urd,721064,717201,0.0229\nCC-MAIN-2020-29,uzb,549782,546055,0.0175\nCC-MAIN-2020-29,ven,883,881,0.0000\nCC-MAIN-2020-29,vie,25448589,25203589,0.8092\nCC-MAIN-2020-29,vol,44505,44474,0.0014\nCC-MAIN-2020-29,war,91954,91672,0.0029\nCC-MAIN-2020-29,wol,5335,5300,0.0002\nCC-MAIN-2020-29,xho,11284,11232,0.0004\nCC-MAIN-2020-29,yid,63918,63819,0.0020\nCC-MAIN-2020-29,yor,29245,29195,0.0009\nCC-MAIN-2020-29,zha,2087,2081,0.0001\nCC-MAIN-2020-29,zho,196909900,195902179,6.2616\nCC-MAIN-2020-29,zul,38069,37936,0.0012\nCC-MAIN-2020-34,<unknown>,57629154,57629154,2.3524\nCC-MAIN-2020-34,aar,6046,6022,0.0002\nCC-MAIN-2020-34,abk,9849,9832,0.0004\nCC-MAIN-2020-34,afr,316484,315612,0.0129\nCC-MAIN-2020-34,aka,1144,1143,0.0000\nCC-MAIN-2020-34,amh,50741,50378,0.0021\nCC-MAIN-2020-34,ara,14371255,14261994,0.5866\nCC-MAIN-2020-34,asm,24009,23779,0.0010\nCC-MAIN-2020-34,aym,2217,2205,0.0001\nCC-MAIN-2020-34,aze,1402486,1394069,0.0572\nCC-MAIN-2020-34,bak,59498,59379,0.0024\nCC-MAIN-2020-34,bel,543550,540216,0.0222\nCC-MAIN-2020-34,ben,2046419,2033000,0.0835\nCC-MAIN-2020-34,bih,13812,13787,0.0006\nCC-MAIN-2020-34,bis,3145,3101,0.0001\nCC-MAIN-2020-34,blu,8072,8060,0.0003\nCC-MAIN-2020-34,bod,30649,30461,0.0013\nCC-MAIN-2020-34,bos,1077246,1072227,0.0440\nCC-MAIN-2020-34,bre,127736,127597,0.0052\nCC-MAIN-2020-34,bul,7416328,7367345,0.3027\nCC-MAIN-2020-34,cat,6947313,6888023,0.2836\nCC-MAIN-2020-34,ceb,82653,82635,0.0034\nCC-MAIN-2
020-34,ces,24063225,23860846,0.9822\nCC-MAIN-2020-34,chr,1670,1670,0.0001\nCC-MAIN-2020-34,cos,60931,60728,0.0025\nCC-MAIN-2020-34,crs,1432,1424,0.0001\nCC-MAIN-2020-34,cym,362037,360264,0.0148\nCC-MAIN-2020-34,dan,10991610,10888172,0.4487\nCC-MAIN-2020-34,deu,135906725,134570815,5.5476\nCC-MAIN-2020-34,div,46568,46426,0.0019\nCC-MAIN-2020-34,dzo,2195,2195,0.0001\nCC-MAIN-2020-34,ell,13463070,13383959,0.5496\nCC-MAIN-2020-34,eng,1071880271,1061638128,43.7532\nCC-MAIN-2020-34,epo,282426,281855,0.0115\nCC-MAIN-2020-34,est,4137757,4097409,0.1689\nCC-MAIN-2020-34,eus,1023698,1012856,0.0418\nCC-MAIN-2020-34,fao,105319,104887,0.0043\nCC-MAIN-2020-34,fas,13295647,13189519,0.5427\nCC-MAIN-2020-34,fij,1949,1945,0.0001\nCC-MAIN-2020-34,fin,9973794,9889684,0.4071\nCC-MAIN-2020-34,fra,113214103,112180354,4.6213\nCC-MAIN-2020-34,fry,92703,92455,0.0038\nCC-MAIN-2020-34,gla,32973,32935,0.0013\nCC-MAIN-2020-34,gle,167723,166750,0.0068\nCC-MAIN-2020-34,glg,1191002,1185468,0.0486\nCC-MAIN-2020-34,glv,11507,11489,0.0005\nCC-MAIN-2020-34,got,678,678,0.0000\nCC-MAIN-2020-34,grn,16485,16428,0.0007\nCC-MAIN-2020-34,guj,218327,217110,0.0089\nCC-MAIN-2020-34,hat,42981,42822,0.0018\nCC-MAIN-2020-34,hau,38298,38034,0.0016\nCC-MAIN-2020-34,haw,8878,8859,0.0004\nCC-MAIN-2020-34,heb,7101278,7039869,0.2899\nCC-MAIN-2020-34,hin,2823809,2808456,0.1153\nCC-MAIN-2020-34,hrv,5585247,5540034,0.2280\nCC-MAIN-2020-34,hun,13043445,12940963,0.5324\nCC-MAIN-2020-34,hye,1137324,1130904,0.0464\nCC-MAIN-2020-34,ibo,8990,8971,0.0004\nCC-MAIN-2020-34,iku,4959,4859,0.0002\nCC-MAIN-2020-34,ile,11140,11120,0.0005\nCC-MAIN-2020-34,ina,15711,15648,0.0006\nCC-MAIN-2020-34,ind,17706809,17568457,0.7228\nCC-MAIN-2020-34,ipk,2857,2790,0.0001\nCC-MAIN-2020-34,isl,1063504,1055966,0.0434\nCC-MAIN-2020-34,ita,58842821,58350726,2.4019\nCC-MAIN-2020-34,jav,76500,76334,0.0031\nCC-MAIN-2020-34,jpn,118846038,118175846,4.8512\nCC-MAIN-2020-34,kal,32380,32258,0.0013\nCC-MAIN-2020-34,kan,234763,233876,0.0096\nCC-MAIN-2020-34,kas,27,2
6,0.0000\nCC-MAIN-2020-34,kat,1259183,1251290,0.0514\nCC-MAIN-2020-34,kaz,671037,665939,0.0274\nCC-MAIN-2020-34,kha,3817,3801,0.0002\nCC-MAIN-2020-34,khm,218123,216839,0.0089\nCC-MAIN-2020-34,kin,38497,38248,0.0016\nCC-MAIN-2020-34,kir,155633,155171,0.0064\nCC-MAIN-2020-34,kor,20408050,20315390,0.8330\nCC-MAIN-2020-34,kur,178949,178229,0.0073\nCC-MAIN-2020-34,lao,61926,61791,0.0025\nCC-MAIN-2020-34,lat,4284599,4279140,0.1749\nCC-MAIN-2020-34,lav,2904734,2880955,0.1186\nCC-MAIN-2020-34,lif,58,55,0.0000\nCC-MAIN-2020-34,lin,7869,7860,0.0003\nCC-MAIN-2020-34,lit,4894885,4854045,0.1998\nCC-MAIN-2020-34,ltz,111647,111205,0.0046\nCC-MAIN-2020-34,lug,5384,5346,0.0002\nCC-MAIN-2020-34,mal,562270,558937,0.0230\nCC-MAIN-2020-34,mar,403177,400466,0.0165\nCC-MAIN-2020-34,mfe,1504,1481,0.0001\nCC-MAIN-2020-34,mkd,691798,687269,0.0282\nCC-MAIN-2020-34,mlg,104025,103574,0.0042\nCC-MAIN-2020-34,mlt,97748,96987,0.0040\nCC-MAIN-2020-34,mon,462132,460189,0.0189\nCC-MAIN-2020-34,mri,36727,36504,0.0015\nCC-MAIN-2020-34,msa,3507934,3496841,0.1432\nCC-MAIN-2020-34,mya,312516,311505,0.0128\nCC-MAIN-2020-34,nau,831,822,0.0000\nCC-MAIN-2020-34,nep,491259,485918,0.0201\nCC-MAIN-2020-34,nld,42532300,42129464,1.7361\nCC-MAIN-2020-34,nno,530115,527069,0.0216\nCC-MAIN-2020-34,nor,8621078,8536743,0.3519\nCC-MAIN-2020-34,nso,2314,2314,0.0001\nCC-MAIN-2020-34,nya,7583,7550,0.0003\nCC-MAIN-2020-34,oci,119609,119419,0.0049\nCC-MAIN-2020-34,ori,63764,63555,0.0026\nCC-MAIN-2020-34,orm,6635,6617,0.0003\nCC-MAIN-2020-34,pan,131757,131295,0.0054\nCC-MAIN-2020-34,pol,41862929,41496169,1.7088\nCC-MAIN-2020-34,por,52691211,52301028,2.1508\nCC-MAIN-2020-34,pus,71793,71510,0.0029\nCC-MAIN-2020-34,que,27815,27795,0.0011\nCC-MAIN-2020-34,roh,34822,34727,0.0014\nCC-MAIN-2020-34,ron,14252687,14144650,0.5818\nCC-MAIN-2020-34,run,1835,1814,0.0001\nCC-MAIN-2020-34,rus,160940583,159722418,6.5694\nCC-MAIN-2020-34,sag,267,267,0.0000\nCC-MAIN-2020-34,san,82933,81590,0.0034\nCC-MAIN-2020-34,sco,15952,15739,0.0007\nCC-MAIN-
2020-34,sin,170193,169349,0.0069\nCC-MAIN-2020-34,slk,7370325,7304947,0.3008\nCC-MAIN-2020-34,slv,4255927,4219862,0.1737\nCC-MAIN-2020-34,smo,9571,9542,0.0004\nCC-MAIN-2020-34,sna,6298,6288,0.0003\nCC-MAIN-2020-34,snd,29849,29781,0.0012\nCC-MAIN-2020-34,som,83708,83214,0.0034\nCC-MAIN-2020-34,sot,7552,7477,0.0003\nCC-MAIN-2020-34,spa,104884818,104035905,4.2813\nCC-MAIN-2020-34,sqi,1129021,1122159,0.0461\nCC-MAIN-2020-34,srp,6134783,6089371,0.2504\nCC-MAIN-2020-34,ssw,709,704,0.0000\nCC-MAIN-2020-34,sun,28194,28154,0.0012\nCC-MAIN-2020-34,sux,59,59,0.0000\nCC-MAIN-2020-34,swa,196922,195689,0.0080\nCC-MAIN-2020-34,swe,18341879,18184768,0.7487\nCC-MAIN-2020-34,syr,14211,14168,0.0006\nCC-MAIN-2020-34,tam,1170234,1163079,0.0478\nCC-MAIN-2020-34,tat,191764,190820,0.0078\nCC-MAIN-2020-34,tel,486134,484438,0.0198\nCC-MAIN-2020-34,tgk,168064,167824,0.0069\nCC-MAIN-2020-34,tgl,183725,182895,0.0075\nCC-MAIN-2020-34,tha,8777308,8730602,0.3583\nCC-MAIN-2020-34,tir,12090,11796,0.0005\nCC-MAIN-2020-34,ton,1416,1412,0.0001\nCC-MAIN-2020-34,tsn,5885,5838,0.0002\nCC-MAIN-2020-34,tso,1006,997,0.0000\nCC-MAIN-2020-34,tuk,38129,37831,0.0016\nCC-MAIN-2020-34,tur,20937544,20769035,0.8547\nCC-MAIN-2020-34,uig,44472,44393,0.0018\nCC-MAIN-2020-34,ukr,9281521,9220269,0.3789\nCC-MAIN-2020-34,urd,628594,624440,0.0257\nCC-MAIN-2020-34,uzb,501338,498367,0.0205\nCC-MAIN-2020-34,ven,905,904,0.0000\nCC-MAIN-2020-34,vie,19861147,19701077,0.8107\nCC-MAIN-2020-34,vol,50911,50893,0.0021\nCC-MAIN-2020-34,war,110894,110539,0.0045\nCC-MAIN-2020-34,wol,4474,4457,0.0002\nCC-MAIN-2020-34,xho,8074,8041,0.0003\nCC-MAIN-2020-34,yid,57133,56972,0.0023\nCC-MAIN-2020-34,yor,26327,26303,0.0011\nCC-MAIN-2020-34,zha,953,951,0.0000\nCC-MAIN-2020-34,zho,161361769,160614355,6.5866\nCC-MAIN-2020-34,zul,40725,40635,0.0017\nCC-MAIN-2020-40,<unknown>,95987305,95987305,2.7634\nCC-MAIN-2020-40,aar,5247,5231,0.0002\nCC-MAIN-2020-40,abk,12503,12482,0.0004\nCC-MAIN-2020-40,afr,346477,344779,0.0100\nCC-MAIN-2020-40,aka,2680,2668,0
.0001\nCC-MAIN-2020-40,amh,91574,91322,0.0026\nCC-MAIN-2020-40,ara,18630929,18505951,0.5364\nCC-MAIN-2020-40,asm,41319,41034,0.0012\nCC-MAIN-2020-40,aym,2290,2244,0.0001\nCC-MAIN-2020-40,aze,1566811,1556390,0.0451\nCC-MAIN-2020-40,bak,45601,45549,0.0013\nCC-MAIN-2020-40,bel,560786,558590,0.0161\nCC-MAIN-2020-40,ben,2601951,2591397,0.0749\nCC-MAIN-2020-40,bih,20056,20032,0.0006\nCC-MAIN-2020-40,bis,3832,3795,0.0001\nCC-MAIN-2020-40,blu,9085,9059,0.0003\nCC-MAIN-2020-40,bod,37524,37356,0.0011\nCC-MAIN-2020-40,bos,1338763,1332784,0.0385\nCC-MAIN-2020-40,bre,106602,106247,0.0031\nCC-MAIN-2020-40,bul,9723648,9660247,0.2799\nCC-MAIN-2020-40,cat,7933920,7875983,0.2284\nCC-MAIN-2020-40,ceb,60673,60626,0.0017\nCC-MAIN-2020-40,ces,38769407,38422223,1.1161\nCC-MAIN-2020-40,chr,2146,2146,0.0001\nCC-MAIN-2020-40,cos,65381,65155,0.0019\nCC-MAIN-2020-40,crs,1877,1836,0.0001\nCC-MAIN-2020-40,cym,343518,341391,0.0099\nCC-MAIN-2020-40,dan,15126043,14991482,0.4355\nCC-MAIN-2020-40,deu,192395120,190458267,5.5388\nCC-MAIN-2020-40,div,57107,56834,0.0016\nCC-MAIN-2020-40,dzo,3080,3079,0.0001\nCC-MAIN-2020-40,ell,18001663,17904740,0.5182\nCC-MAIN-2020-40,eng,1475101941,1462537038,42.4664\nCC-MAIN-2020-40,epo,237955,237444,0.0069\nCC-MAIN-2020-40,est,4714574,4676035,0.1357\nCC-MAIN-2020-40,eus,1048796,1037812,0.0302\nCC-MAIN-2020-40,fao,134917,134085,0.0039\nCC-MAIN-2020-40,fas,21592072,21431380,0.6216\nCC-MAIN-2020-40,fij,2687,2676,0.0001\nCC-MAIN-2020-40,fin,13486690,13360105,0.3883\nCC-MAIN-2020-40,fra,155414919,154062789,4.4742\nCC-MAIN-2020-40,fry,86220,85965,0.0025\nCC-MAIN-2020-40,gla,45004,44958,0.0013\nCC-MAIN-2020-40,gle,171401,170666,0.0049\nCC-MAIN-2020-40,glg,1150028,1144556,0.0331\nCC-MAIN-2020-40,glv,11063,11052,0.0003\nCC-MAIN-2020-40,got,1296,1296,0.0000\nCC-MAIN-2020-40,grn,21691,21468,0.0006\nCC-MAIN-2020-40,guj,250020,249061,0.0072\nCC-MAIN-2020-40,hat,48335,48220,0.0014\nCC-MAIN-2020-40,hau,51470,51332,0.0015\nCC-MAIN-2020-40,haw,8745,8732,0.0003\nCC-MAIN-2020-40,heb,85
90521,8488248,0.2473\nCC-MAIN-2020-40,hin,3754213,3736904,0.1081\nCC-MAIN-2020-40,hrv,6657335,6617408,0.1917\nCC-MAIN-2020-40,hun,19242671,19104381,0.5540\nCC-MAIN-2020-40,hye,1138422,1130566,0.0328\nCC-MAIN-2020-40,ibo,9684,9668,0.0003\nCC-MAIN-2020-40,iku,6797,6684,0.0002\nCC-MAIN-2020-40,ile,9239,9222,0.0003\nCC-MAIN-2020-40,ina,20697,20634,0.0006\nCC-MAIN-2020-40,ind,28818911,28640428,0.8297\nCC-MAIN-2020-40,ipk,4444,4337,0.0001\nCC-MAIN-2020-40,isl,1293356,1283314,0.0372\nCC-MAIN-2020-40,ita,84279224,83641458,2.4263\nCC-MAIN-2020-40,jav,62283,62230,0.0018\nCC-MAIN-2020-40,jpn,174755947,173633748,5.0310\nCC-MAIN-2020-40,kal,31762,31618,0.0009\nCC-MAIN-2020-40,kan,300239,299529,0.0086\nCC-MAIN-2020-40,kas,228,228,0.0000\nCC-MAIN-2020-40,kat,1371936,1364038,0.0395\nCC-MAIN-2020-40,kaz,789548,779245,0.0227\nCC-MAIN-2020-40,kha,4856,4843,0.0001\nCC-MAIN-2020-40,khm,268747,267108,0.0077\nCC-MAIN-2020-40,kin,57869,57595,0.0017\nCC-MAIN-2020-40,kir,180581,179461,0.0052\nCC-MAIN-2020-40,kor,22491868,22395378,0.6475\nCC-MAIN-2020-40,kur,209703,208880,0.0060\nCC-MAIN-2020-40,lao,88589,88424,0.0026\nCC-MAIN-2020-40,lat,8020904,8012348,0.2309\nCC-MAIN-2020-40,lav,3334272,3307575,0.0960\nCC-MAIN-2020-40,lif,51,50,0.0000\nCC-MAIN-2020-40,lin,7775,7746,0.0002\nCC-MAIN-2020-40,lit,5436678,5390996,0.1565\nCC-MAIN-2020-40,ltz,109997,109281,0.0032\nCC-MAIN-2020-40,lug,7430,7410,0.0002\nCC-MAIN-2020-40,mal,618498,615894,0.0178\nCC-MAIN-2020-40,mar,479395,476203,0.0138\nCC-MAIN-2020-40,mfe,2095,2084,0.0001\nCC-MAIN-2020-40,mkd,873962,868971,0.0252\nCC-MAIN-2020-40,mlg,88145,87808,0.0025\nCC-MAIN-2020-40,mlt,103212,102705,0.0030\nCC-MAIN-2020-40,mon,480747,478607,0.0138\nCC-MAIN-2020-40,mri,31858,31495,0.0009\nCC-MAIN-2020-40,msa,3480285,3467733,0.1002\nCC-MAIN-2020-40,mya,369319,368156,0.0106\nCC-MAIN-2020-40,nau,863,858,0.0000\nCC-MAIN-2020-40,nep,719212,702488,0.0207\nCC-MAIN-2020-40,new,2,2,0.0000\nCC-MAIN-2020-40,nld,62401575,61856503,1.7965\nCC-MAIN-2020-40,nno,568700,564975,0.
0164\nCC-MAIN-2020-40,nor,12038922,11898810,0.3466\nCC-MAIN-2020-40,nso,3240,3240,0.0001\nCC-MAIN-2020-40,nya,7697,7583,0.0002\nCC-MAIN-2020-40,oci,117552,117282,0.0034\nCC-MAIN-2020-40,ori,130127,129923,0.0037\nCC-MAIN-2020-40,orm,11993,11889,0.0003\nCC-MAIN-2020-40,pan,158775,158395,0.0046\nCC-MAIN-2020-40,pol,55636920,55179717,1.6017\nCC-MAIN-2020-40,por,75676803,75140224,2.1786\nCC-MAIN-2020-40,pus,83454,83133,0.0024\nCC-MAIN-2020-40,que,27516,27498,0.0008\nCC-MAIN-2020-40,roh,35779,35097,0.0010\nCC-MAIN-2020-40,ron,20518619,20380943,0.5907\nCC-MAIN-2020-40,run,3001,2990,0.0001\nCC-MAIN-2020-40,rus,293129367,291059066,8.4388\nCC-MAIN-2020-40,sag,581,581,0.0000\nCC-MAIN-2020-40,san,80885,80627,0.0023\nCC-MAIN-2020-40,sco,13992,13785,0.0004\nCC-MAIN-2020-40,sin,222145,221365,0.0064\nCC-MAIN-2020-40,slk,11453880,11357806,0.3297\nCC-MAIN-2020-40,slv,4908275,4872132,0.1413\nCC-MAIN-2020-40,smo,7911,7884,0.0002\nCC-MAIN-2020-40,sna,7316,7294,0.0002\nCC-MAIN-2020-40,snd,29957,29836,0.0009\nCC-MAIN-2020-40,som,146143,145606,0.0042\nCC-MAIN-2020-40,sot,8964,8940,0.0003\nCC-MAIN-2020-40,spa,149518692,148303686,4.3045\nCC-MAIN-2020-40,sqi,1358808,1353643,0.0391\nCC-MAIN-2020-40,srp,7201237,7152217,0.2073\nCC-MAIN-2020-40,ssw,1019,1009,0.0000\nCC-MAIN-2020-40,sun,31588,31551,0.0009\nCC-MAIN-2020-40,sux,54,54,0.0000\nCC-MAIN-2020-40,swa,201621,200671,0.0058\nCC-MAIN-2020-40,swe,25324317,25104748,0.7291\nCC-MAIN-2020-40,syr,15015,14979,0.0004\nCC-MAIN-2020-40,tam,1381873,1372940,0.0398\nCC-MAIN-2020-40,tat,275340,274381,0.0079\nCC-MAIN-2020-40,tel,534577,533239,0.0154\nCC-MAIN-2020-40,tgk,158834,158583,0.0046\nCC-MAIN-2020-40,tgl,193299,192524,0.0056\nCC-MAIN-2020-40,tha,11126173,11065450,0.3203\nCC-MAIN-2020-40,tir,27630,27314,0.0008\nCC-MAIN-2020-40,ton,1782,1778,0.0001\nCC-MAIN-2020-40,tsn,7381,7328,0.0002\nCC-MAIN-2020-40,tso,1585,1584,0.0000\nCC-MAIN-2020-40,tuk,48745,48613,0.0014\nCC-MAIN-2020-40,tur,34591897,34356240,0.9959\nCC-MAIN-2020-40,uig,40788,40564,0.0012\nCC-M
AIN-2020-40,ukr,13519002,13433131,0.3892\nCC-MAIN-2020-40,urd,751868,747998,0.0216\nCC-MAIN-2020-40,uzb,535085,531680,0.0154\nCC-MAIN-2020-40,ven,794,790,0.0000\nCC-MAIN-2020-40,vie,30146892,29927237,0.8679\nCC-MAIN-2020-40,vol,31615,31605,0.0009\nCC-MAIN-2020-40,war,83272,82990,0.0024\nCC-MAIN-2020-40,wol,5364,5352,0.0002\nCC-MAIN-2020-40,xho,14542,14481,0.0004\nCC-MAIN-2020-40,yid,59738,59555,0.0017\nCC-MAIN-2020-40,yor,28208,28183,0.0008\nCC-MAIN-2020-40,zha,2257,2249,0.0001\nCC-MAIN-2020-40,zho,202805553,201863517,5.8385\nCC-MAIN-2020-40,zul,35560,35454,0.0010\nCC-MAIN-2020-45,<unknown>,75363030,75363030,2.7595\nCC-MAIN-2020-45,aar,5040,5022,0.0002\nCC-MAIN-2020-45,abk,9324,9311,0.0003\nCC-MAIN-2020-45,afr,320918,319487,0.0118\nCC-MAIN-2020-45,aka,2645,2627,0.0001\nCC-MAIN-2020-45,amh,74000,73591,0.0027\nCC-MAIN-2020-45,ara,15877432,15761427,0.5814\nCC-MAIN-2020-45,asm,49305,48284,0.0018\nCC-MAIN-2020-45,aym,1706,1668,0.0001\nCC-MAIN-2020-45,aze,1343458,1334390,0.0492\nCC-MAIN-2020-45,bak,41420,41364,0.0015\nCC-MAIN-2020-45,bel,517269,515896,0.0189\nCC-MAIN-2020-45,ben,2242003,2233610,0.0821\nCC-MAIN-2020-45,bih,18312,18290,0.0007\nCC-MAIN-2020-45,bis,2895,2868,0.0001\nCC-MAIN-2020-45,blu,7817,7794,0.0003\nCC-MAIN-2020-45,bod,34574,34464,0.0013\nCC-MAIN-2020-45,bos,1120682,1113985,0.0410\nCC-MAIN-2020-45,bre,93889,93780,0.0034\nCC-MAIN-2020-45,bul,7427905,7378567,0.2720\nCC-MAIN-2020-45,cat,6326501,6291540,0.2316\nCC-MAIN-2020-45,ceb,50339,50312,0.0018\nCC-MAIN-2020-45,ces,28755214,28499052,1.0529\nCC-MAIN-2020-45,chr,1631,1631,0.0001\nCC-MAIN-2020-45,cos,61251,61167,0.0022\nCC-MAIN-2020-45,crs,1492,1484,0.0001\nCC-MAIN-2020-45,cym,320579,318931,0.0117\nCC-MAIN-2020-45,dan,11976326,11876437,0.4385\nCC-MAIN-2020-45,deu,146322251,144975093,5.3577\nCC-MAIN-2020-45,div,44254,43976,0.0016\nCC-MAIN-2020-45,dzo,2036,2036,0.0001\nCC-MAIN-2020-45,ell,15102620,15015011,0.5530\nCC-MAIN-2020-45,eng,1191092734,1180501336,43.6128\nCC-MAIN-2020-45,epo,260197,259584,0.0095\nCC-
MAIN-2020-45,est,3747961,3713083,0.1372\nCC-MAIN-2020-45,eus,843167,835476,0.0309\nCC-MAIN-2020-45,fao,97369,96869,0.0036\nCC-MAIN-2020-45,fas,16016576,15895282,0.5865\nCC-MAIN-2020-45,fij,2141,2140,0.0001\nCC-MAIN-2020-45,fin,10828811,10748076,0.3965\nCC-MAIN-2020-45,fra,120769915,119744966,4.4221\nCC-MAIN-2020-45,fry,89715,89574,0.0033\nCC-MAIN-2020-45,gla,40184,40134,0.0015\nCC-MAIN-2020-45,gle,186854,186220,0.0068\nCC-MAIN-2020-45,glg,1006038,1001537,0.0368\nCC-MAIN-2020-45,glv,9563,9553,0.0004\nCC-MAIN-2020-45,got,529,529,0.0000\nCC-MAIN-2020-45,grn,14847,14758,0.0005\nCC-MAIN-2020-45,guj,232550,231484,0.0085\nCC-MAIN-2020-45,hat,41757,41670,0.0015\nCC-MAIN-2020-45,hau,45451,45285,0.0017\nCC-MAIN-2020-45,haw,7236,7219,0.0003\nCC-MAIN-2020-45,heb,6949705,6893685,0.2545\nCC-MAIN-2020-45,hin,3502098,3481719,0.1282\nCC-MAIN-2020-45,hrv,5218689,5187671,0.1911\nCC-MAIN-2020-45,hun,14683253,14566847,0.5376\nCC-MAIN-2020-45,hye,927417,921794,0.0340\nCC-MAIN-2020-45,ibo,10866,10658,0.0004\nCC-MAIN-2020-45,iku,5268,5175,0.0002\nCC-MAIN-2020-45,ile,9328,9309,0.0003\nCC-MAIN-2020-45,ina,16611,16569,0.0006\nCC-MAIN-2020-45,ind,22293229,22169356,0.8163\nCC-MAIN-2020-45,ipk,4402,4350,0.0002\nCC-MAIN-2020-45,isl,1062483,1053465,0.0389\nCC-MAIN-2020-45,ita,65373733,64885747,2.3937\nCC-MAIN-2020-45,jav,56250,56154,0.0021\nCC-MAIN-2020-45,jpn,124774244,124037368,4.5687\nCC-MAIN-2020-45,kal,22523,22291,0.0008\nCC-MAIN-2020-45,kan,259332,258407,0.0095\nCC-MAIN-2020-45,kas,50,50,0.0000\nCC-MAIN-2020-45,kat,1137503,1131501,0.0417\nCC-MAIN-2020-45,kaz,583718,580316,0.0214\nCC-MAIN-2020-45,kha,3124,3107,0.0001\nCC-MAIN-2020-45,khm,238778,238052,0.0087\nCC-MAIN-2020-45,kin,52308,52129,0.0019\nCC-MAIN-2020-45,kir,136211,135467,0.0050\nCC-MAIN-2020-45,kor,19445941,19349001,0.7120\nCC-MAIN-2020-45,kur,183129,182590,0.0067\nCC-MAIN-2020-45,lao,92412,92279,0.0034\nCC-MAIN-2020-45,lat,8660921,8654156,0.3171\nCC-MAIN-2020-45,lav,2547816,2522677,0.0933\nCC-MAIN-2020-45,lif,49,44,0.0000\nCC-MAIN
-2020-45,lin,6383,6261,0.0002\nCC-MAIN-2020-45,lit,4197244,4162793,0.1537\nCC-MAIN-2020-45,ltz,98462,97911,0.0036\nCC-MAIN-2020-45,lug,4909,4894,0.0002\nCC-MAIN-2020-45,mal,575407,572178,0.0211\nCC-MAIN-2020-45,mar,388898,386379,0.0142\nCC-MAIN-2020-45,mfe,1651,1645,0.0001\nCC-MAIN-2020-45,mkd,701179,696860,0.0257\nCC-MAIN-2020-45,mlg,81238,80957,0.0030\nCC-MAIN-2020-45,mlt,114042,113204,0.0042\nCC-MAIN-2020-45,mon,380498,377544,0.0139\nCC-MAIN-2020-45,mri,24704,24472,0.0009\nCC-MAIN-2020-45,msa,3262719,3250620,0.1195\nCC-MAIN-2020-45,mya,337957,337282,0.0124\nCC-MAIN-2020-45,nau,815,812,0.0000\nCC-MAIN-2020-45,nep,661150,656491,0.0242\nCC-MAIN-2020-45,new,3,3,0.0000\nCC-MAIN-2020-45,nld,48112979,47724087,1.7617\nCC-MAIN-2020-45,nno,499353,495225,0.0183\nCC-MAIN-2020-45,nor,10062831,9970204,0.3685\nCC-MAIN-2020-45,nso,2121,2120,0.0001\nCC-MAIN-2020-45,nya,5650,5630,0.0002\nCC-MAIN-2020-45,oci,101985,101710,0.0037\nCC-MAIN-2020-45,ori,120743,120249,0.0044\nCC-MAIN-2020-45,orm,9143,9103,0.0003\nCC-MAIN-2020-45,pan,161797,161232,0.0059\nCC-MAIN-2020-45,pol,43922909,43546573,1.6083\nCC-MAIN-2020-45,por,58811859,58423983,2.1534\nCC-MAIN-2020-45,pus,77379,77084,0.0028\nCC-MAIN-2020-45,que,23187,23177,0.0008\nCC-MAIN-2020-45,roh,43729,43497,0.0016\nCC-MAIN-2020-45,ron,16422666,16314064,0.6013\nCC-MAIN-2020-45,run,1817,1801,0.0001\nCC-MAIN-2020-45,rus,198959177,197475871,7.2850\nCC-MAIN-2020-45,sag,251,251,0.0000\nCC-MAIN-2020-45,san,67796,67380,0.0025\nCC-MAIN-2020-45,sco,11756,11536,0.0004\nCC-MAIN-2020-45,sin,181048,179912,0.0066\nCC-MAIN-2020-45,slk,9823609,9750035,0.3597\nCC-MAIN-2020-45,slv,3713068,3686535,0.1360\nCC-MAIN-2020-45,smo,5666,5641,0.0002\nCC-MAIN-2020-45,sna,8154,8139,0.0003\nCC-MAIN-2020-45,snd,26247,26096,0.0010\nCC-MAIN-2020-45,som,123267,122914,0.0045\nCC-MAIN-2020-45,sot,9982,9943,0.0004\nCC-MAIN-2020-45,spa,117328279,116420613,4.2961\nCC-MAIN-2020-45,sqi,1089234,1083953,0.0399\nCC-MAIN-2020-45,srp,5753748,5715595,0.2107\nCC-MAIN-2020-45,ssw,1227,122
2,0.0000\nCC-MAIN-2020-45,sun,24079,24065,0.0009\nCC-MAIN-2020-45,sux,51,51,0.0000\nCC-MAIN-2020-45,swa,209511,208375,0.0077\nCC-MAIN-2020-45,swe,19827436,19662754,0.7260\nCC-MAIN-2020-45,syr,14543,14537,0.0005\nCC-MAIN-2020-45,tam,1241283,1232551,0.0455\nCC-MAIN-2020-45,tat,211900,211290,0.0078\nCC-MAIN-2020-45,tel,541888,539547,0.0198\nCC-MAIN-2020-45,tgk,133851,133704,0.0049\nCC-MAIN-2020-45,tgl,165639,164702,0.0061\nCC-MAIN-2020-45,tha,9198003,9145340,0.3368\nCC-MAIN-2020-45,tir,19275,19114,0.0007\nCC-MAIN-2020-45,ton,1574,1571,0.0001\nCC-MAIN-2020-45,tsn,9569,9403,0.0004\nCC-MAIN-2020-45,tso,1507,1501,0.0001\nCC-MAIN-2020-45,tuk,56142,56068,0.0021\nCC-MAIN-2020-45,tur,27351930,27156333,1.0015\nCC-MAIN-2020-45,uig,37136,37020,0.0014\nCC-MAIN-2020-45,ukr,9630825,9572157,0.3526\nCC-MAIN-2020-45,urd,657553,653975,0.0241\nCC-MAIN-2020-45,uzb,517114,509981,0.0189\nCC-MAIN-2020-45,ven,734,732,0.0000\nCC-MAIN-2020-45,vie,23693300,23495250,0.8675\nCC-MAIN-2020-45,vol,32071,32060,0.0012\nCC-MAIN-2020-45,war,78656,78438,0.0029\nCC-MAIN-2020-45,wol,3667,3631,0.0001\nCC-MAIN-2020-45,xho,42956,42888,0.0016\nCC-MAIN-2020-45,yid,46578,46502,0.0017\nCC-MAIN-2020-45,yor,24469,24427,0.0009\nCC-MAIN-2020-45,zha,2001,1995,0.0001\nCC-MAIN-2020-45,zho,173832526,173183829,6.3650\nCC-MAIN-2020-45,zul,32456,32324,0.0012\nCC-MAIN-2020-50,<unknown>,66593642,66593642,2.5201\nCC-MAIN-2020-50,aar,3205,3190,0.0001\nCC-MAIN-2020-50,abk,9587,9578,0.0004\nCC-MAIN-2020-50,afr,280486,279309,0.0106\nCC-MAIN-2020-50,aka,1627,1612,0.0001\nCC-MAIN-2020-50,amh,66703,66381,0.0025\nCC-MAIN-2020-50,ara,15436185,15311790,0.5842\nCC-MAIN-2020-50,asm,36358,36264,0.0014\nCC-MAIN-2020-50,aym,2521,2501,0.0001\nCC-MAIN-2020-50,aze,1323339,1317176,0.0501\nCC-MAIN-2020-50,bak,38859,38827,0.0015\nCC-MAIN-2020-50,bel,485074,483177,0.0184\nCC-MAIN-2020-50,ben,2159822,2153400,0.0817\nCC-MAIN-2020-50,bih,16874,16855,0.0006\nCC-MAIN-2020-50,bis,3068,3063,0.0001\nCC-MAIN-2020-50,blu,6737,6666,0.0003\nCC-MAIN-2020-50,bod,
24286,24206,0.0009\nCC-MAIN-2020-50,bos,1054415,1050329,0.0399\nCC-MAIN-2020-50,bre,81472,81383,0.0031\nCC-MAIN-2020-50,bul,7144552,7100116,0.2704\nCC-MAIN-2020-50,cat,6056142,6015945,0.2292\nCC-MAIN-2020-50,ceb,68161,68106,0.0026\nCC-MAIN-2020-50,ces,28549830,28318609,1.0804\nCC-MAIN-2020-50,chr,1892,1892,0.0001\nCC-MAIN-2020-50,cos,53163,53041,0.0020\nCC-MAIN-2020-50,crs,1455,1423,0.0001\nCC-MAIN-2020-50,cym,304475,302741,0.0115\nCC-MAIN-2020-50,dan,11814558,11720998,0.4471\nCC-MAIN-2020-50,deu,143318720,142036361,5.4237\nCC-MAIN-2020-50,div,42644,42498,0.0016\nCC-MAIN-2020-50,dzo,1703,1701,0.0001\nCC-MAIN-2020-50,ell,14257809,14169786,0.5396\nCC-MAIN-2020-50,eng,1163898139,1154007384,44.0458\nCC-MAIN-2020-50,epo,253341,253038,0.0096\nCC-MAIN-2020-50,est,3592681,3560070,0.1360\nCC-MAIN-2020-50,eus,771437,766780,0.0292\nCC-MAIN-2020-50,fao,95032,94623,0.0036\nCC-MAIN-2020-50,fas,16170474,16025329,0.6119\nCC-MAIN-2020-50,fij,1628,1623,0.0001\nCC-MAIN-2020-50,fin,10291830,10208111,0.3895\nCC-MAIN-2020-50,fra,117889016,116949845,4.4613\nCC-MAIN-2020-50,fry,75614,75389,0.0029\nCC-MAIN-2020-50,gla,35344,35234,0.0013\nCC-MAIN-2020-50,gle,184643,183508,0.0070\nCC-MAIN-2020-50,glg,930529,925728,0.0352\nCC-MAIN-2020-50,glv,9824,9810,0.0004\nCC-MAIN-2020-50,got,1026,1024,0.0000\nCC-MAIN-2020-50,grn,15469,15393,0.0006\nCC-MAIN-2020-50,guj,235675,235137,0.0089\nCC-MAIN-2020-50,hat,41201,41094,0.0016\nCC-MAIN-2020-50,hau,39394,39135,0.0015\nCC-MAIN-2020-50,haw,9484,9451,0.0004\nCC-MAIN-2020-50,heb,6734424,6669558,0.2549\nCC-MAIN-2020-50,hin,3431907,3417467,0.1299\nCC-MAIN-2020-50,hrv,5103534,5073355,0.1931\nCC-MAIN-2020-50,hun,14261659,14153710,0.5397\nCC-MAIN-2020-50,hye,895902,890629,0.0339\nCC-MAIN-2020-50,ibo,6677,6632,0.0003\nCC-MAIN-2020-50,iku,5255,5190,0.0002\nCC-MAIN-2020-50,ile,6650,6625,0.0003\nCC-MAIN-2020-50,ina,14287,14257,0.0005\nCC-MAIN-2020-50,ind,21098352,20992169,0.7984\nCC-MAIN-2020-50,ipk,3565,3511,0.0001\nCC-MAIN-2020-50,isl,1018277,1011568,0.0385\nCC-MAIN
-2020-50,ita,62833782,62375218,2.3778\nCC-MAIN-2020-50,jav,62331,62244,0.0024\nCC-MAIN-2020-50,jpn,123727564,123110634,4.6823\nCC-MAIN-2020-50,kal,20450,20328,0.0008\nCC-MAIN-2020-50,kan,245987,245225,0.0093\nCC-MAIN-2020-50,kas,99,98,0.0000\nCC-MAIN-2020-50,kat,1066454,1052389,0.0404\nCC-MAIN-2020-50,kaz,594282,591514,0.0225\nCC-MAIN-2020-50,kha,3093,3081,0.0001\nCC-MAIN-2020-50,khm,225603,224784,0.0085\nCC-MAIN-2020-50,kin,56695,56358,0.0021\nCC-MAIN-2020-50,kir,127181,126610,0.0048\nCC-MAIN-2020-50,kor,18536004,18445977,0.7015\nCC-MAIN-2020-50,kur,162502,162100,0.0061\nCC-MAIN-2020-50,lao,84881,84462,0.0032\nCC-MAIN-2020-50,lat,7217904,7211451,0.2731\nCC-MAIN-2020-50,lav,2428367,2407924,0.0919\nCC-MAIN-2020-50,lif,93,92,0.0000\nCC-MAIN-2020-50,lin,6618,6583,0.0003\nCC-MAIN-2020-50,lit,4068469,4035154,0.1540\nCC-MAIN-2020-50,ltz,79933,79614,0.0030\nCC-MAIN-2020-50,lug,5099,5058,0.0002\nCC-MAIN-2020-50,mal,537634,533555,0.0203\nCC-MAIN-2020-50,mar,374468,372947,0.0142\nCC-MAIN-2020-50,mfe,1599,1585,0.0001\nCC-MAIN-2020-50,mkd,701910,696207,0.0266\nCC-MAIN-2020-50,mlg,66376,66180,0.0025\nCC-MAIN-2020-50,mlt,117588,116598,0.0044\nCC-MAIN-2020-50,mon,359292,357990,0.0136\nCC-MAIN-2020-50,mri,23904,23714,0.0009\nCC-MAIN-2020-50,msa,2984255,2975531,0.1129\nCC-MAIN-2020-50,mya,289154,288264,0.0109\nCC-MAIN-2020-50,nau,680,679,0.0000\nCC-MAIN-2020-50,nep,602389,598365,0.0228\nCC-MAIN-2020-50,nld,46506864,46157182,1.7600\nCC-MAIN-2020-50,nno,464077,458669,0.0176\nCC-MAIN-2020-50,nor,9443086,9363229,0.3574\nCC-MAIN-2020-50,nso,2361,2359,0.0001\nCC-MAIN-2020-50,nya,5627,5596,0.0002\nCC-MAIN-2020-50,oci,85406,85235,0.0032\nCC-MAIN-2020-50,ori,104444,104309,0.0040\nCC-MAIN-2020-50,orm,9049,8995,0.0003\nCC-MAIN-2020-50,pan,126483,126216,0.0048\nCC-MAIN-2020-50,pol,42341790,42016623,1.6024\nCC-MAIN-2020-50,por,56838480,56487800,2.1510\nCC-MAIN-2020-50,pus,71783,71629,0.0027\nCC-MAIN-2020-50,que,20912,20903,0.0008\nCC-MAIN-2020-50,roh,43935,43720,0.0017\nCC-MAIN-2020-50,ron,15559
280,15469646,0.5888\nCC-MAIN-2020-50,run,1816,1799,0.0001\nCC-MAIN-2020-50,rus,193116648,191965793,7.3082\nCC-MAIN-2020-50,sag,320,319,0.0000\nCC-MAIN-2020-50,san,55697,55204,0.0021\nCC-MAIN-2020-50,sco,12182,11973,0.0005\nCC-MAIN-2020-50,sin,174667,173976,0.0066\nCC-MAIN-2020-50,slk,9317436,9252474,0.3526\nCC-MAIN-2020-50,slv,3634701,3606367,0.1375\nCC-MAIN-2020-50,smo,6621,6602,0.0003\nCC-MAIN-2020-50,sna,8172,8100,0.0003\nCC-MAIN-2020-50,snd,23322,23271,0.0009\nCC-MAIN-2020-50,som,117387,116875,0.0044\nCC-MAIN-2020-50,sot,8142,8103,0.0003\nCC-MAIN-2020-50,spa,113239137,112407640,4.2853\nCC-MAIN-2020-50,sqi,1083242,1078269,0.0410\nCC-MAIN-2020-50,srp,5526916,5487878,0.2092\nCC-MAIN-2020-50,ssw,677,670,0.0000\nCC-MAIN-2020-50,sun,21898,21873,0.0008\nCC-MAIN-2020-50,sux,70,70,0.0000\nCC-MAIN-2020-50,swa,185811,184931,0.0070\nCC-MAIN-2020-50,swe,19130645,18980912,0.7240\nCC-MAIN-2020-50,syr,11242,11227,0.0004\nCC-MAIN-2020-50,tam,1165913,1160489,0.0441\nCC-MAIN-2020-50,tat,213507,213087,0.0081\nCC-MAIN-2020-50,tel,501520,500473,0.0190\nCC-MAIN-2020-50,tgk,117019,116817,0.0044\nCC-MAIN-2020-50,tgl,159749,158656,0.0060\nCC-MAIN-2020-50,tha,8805168,8757772,0.3332\nCC-MAIN-2020-50,tir,20334,20121,0.0008\nCC-MAIN-2020-50,ton,1612,1603,0.0001\nCC-MAIN-2020-50,tsn,10381,10210,0.0004\nCC-MAIN-2020-50,tso,1292,1288,0.0000\nCC-MAIN-2020-50,tuk,53658,53435,0.0020\nCC-MAIN-2020-50,tur,26022519,25835569,0.9848\nCC-MAIN-2020-50,uig,32252,32187,0.0012\nCC-MAIN-2020-50,ukr,9474105,9406736,0.3585\nCC-MAIN-2020-50,urd,625232,621372,0.0237\nCC-MAIN-2020-50,uzb,443294,439846,0.0168\nCC-MAIN-2020-50,ven,422,421,0.0000\nCC-MAIN-2020-50,vie,23981945,23797486,0.9076\nCC-MAIN-2020-50,vol,28608,28596,0.0011\nCC-MAIN-2020-50,war,81406,81206,0.0031\nCC-MAIN-2020-50,wol,4099,4056,0.0002\nCC-MAIN-2020-50,xho,42809,42676,0.0016\nCC-MAIN-2020-50,yid,37396,37354,0.0014\nCC-MAIN-2020-50,yor,19020,18970,0.0007\nCC-MAIN-2020-50,zha,2369,2369,0.0001\nCC-MAIN-2020-50,zho,159313381,158736114,6.0290\nCC-MA
IN-2020-50,zul,37891,37754,0.0014\nCC-MAIN-2021-04,<unknown>,78270928,78270928,2.3012\nCC-MAIN-2021-04,aar,6422,6408,0.0002\nCC-MAIN-2021-04,abk,9704,9693,0.0003\nCC-MAIN-2021-04,afr,353719,351925,0.0104\nCC-MAIN-2021-04,aka,2100,2092,0.0001\nCC-MAIN-2021-04,amh,95305,94812,0.0028\nCC-MAIN-2021-04,ara,19101195,18954234,0.5616\nCC-MAIN-2021-04,asm,50434,50312,0.0015\nCC-MAIN-2021-04,aym,2146,2117,0.0001\nCC-MAIN-2021-04,aze,1548046,1539599,0.0455\nCC-MAIN-2021-04,bak,49842,49756,0.0015\nCC-MAIN-2021-04,bel,546611,542911,0.0161\nCC-MAIN-2021-04,ben,2681993,2671241,0.0789\nCC-MAIN-2021-04,bih,17192,17156,0.0005\nCC-MAIN-2021-04,bis,4164,4148,0.0001\nCC-MAIN-2021-04,blu,10477,10395,0.0003\nCC-MAIN-2021-04,bod,32107,31957,0.0009\nCC-MAIN-2021-04,bos,1311659,1305466,0.0386\nCC-MAIN-2021-04,bre,90657,90544,0.0027\nCC-MAIN-2021-04,bul,9070911,9006191,0.2667\nCC-MAIN-2021-04,cat,7730326,7672657,0.2273\nCC-MAIN-2021-04,ceb,54594,54480,0.0016\nCC-MAIN-2021-04,ces,36586487,36264746,1.0757\nCC-MAIN-2021-04,chr,1971,1971,0.0001\nCC-MAIN-2021-04,cos,73445,73223,0.0022\nCC-MAIN-2021-04,crs,1609,1592,0.0000\nCC-MAIN-2021-04,cym,358792,357353,0.0105\nCC-MAIN-2021-04,dan,15273378,15133419,0.4490\nCC-MAIN-2021-04,deu,188397429,186570796,5.5390\nCC-MAIN-2021-04,div,53410,53287,0.0016\nCC-MAIN-2021-04,dzo,2477,2476,0.0001\nCC-MAIN-2021-04,ell,18299263,18177294,0.5380\nCC-MAIN-2021-04,eng,1503828706,1490655829,44.2135\nCC-MAIN-2021-04,epo,252818,252218,0.0074\nCC-MAIN-2021-04,est,4467923,4425067,0.1314\nCC-MAIN-2021-04,eus,1001881,993734,0.0295\nCC-MAIN-2021-04,fao,128990,128205,0.0038\nCC-MAIN-2021-04,fas,20893043,20712781,0.6143\nCC-MAIN-2021-04,fij,3569,3568,0.0001\nCC-MAIN-2021-04,fin,13200561,13087925,0.3881\nCC-MAIN-2021-04,fra,152889682,151481580,4.4951\nCC-MAIN-2021-04,fry,92654,92458,0.0027\nCC-MAIN-2021-04,gla,48315,48193,0.0014\nCC-MAIN-2021-04,gle,206623,205550,0.0061\nCC-MAIN-2021-04,glg,1172517,1166264,0.0345\nCC-MAIN-2021-04,glv,12754,12742,0.0004\nCC-MAIN-2021-04,got,616,6
16,0.0000\nCC-MAIN-2021-04,grn,20488,20370,0.0006\nCC-MAIN-2021-04,guj,294393,293434,0.0087\nCC-MAIN-2021-04,hat,46558,46286,0.0014\nCC-MAIN-2021-04,hau,54355,53985,0.0016\nCC-MAIN-2021-04,haw,10623,10594,0.0003\nCC-MAIN-2021-04,heb,8693180,8617709,0.2556\nCC-MAIN-2021-04,hin,4185074,4163013,0.1230\nCC-MAIN-2021-04,hrv,6542604,6501434,0.1924\nCC-MAIN-2021-04,hun,18592776,18445904,0.5466\nCC-MAIN-2021-04,hye,1050372,1044926,0.0309\nCC-MAIN-2021-04,ibo,9728,9666,0.0003\nCC-MAIN-2021-04,iku,5688,5608,0.0002\nCC-MAIN-2021-04,ile,8159,8104,0.0002\nCC-MAIN-2021-04,ina,17893,17845,0.0005\nCC-MAIN-2021-04,ind,27703335,27550613,0.8145\nCC-MAIN-2021-04,ipk,4481,4420,0.0001\nCC-MAIN-2021-04,isl,1310561,1300129,0.0385\nCC-MAIN-2021-04,ita,83423203,82764506,2.4527\nCC-MAIN-2021-04,jav,68549,68413,0.0020\nCC-MAIN-2021-04,jpn,162804862,161865491,4.7866\nCC-MAIN-2021-04,kal,30219,29982,0.0009\nCC-MAIN-2021-04,kan,309943,308697,0.0091\nCC-MAIN-2021-04,kas,175,175,0.0000\nCC-MAIN-2021-04,kat,1269380,1261553,0.0373\nCC-MAIN-2021-04,kaz,683318,677929,0.0201\nCC-MAIN-2021-04,kha,5248,5230,0.0002\nCC-MAIN-2021-04,khm,300772,299747,0.0088\nCC-MAIN-2021-04,kin,63709,63347,0.0019\nCC-MAIN-2021-04,kir,146342,144960,0.0043\nCC-MAIN-2021-04,kor,22840271,22728125,0.6715\nCC-MAIN-2021-04,kur,204372,203123,0.0060\nCC-MAIN-2021-04,lao,103238,102998,0.0030\nCC-MAIN-2021-04,lat,6675318,6652568,0.1963\nCC-MAIN-2021-04,lav,2970478,2944269,0.0873\nCC-MAIN-2021-04,lif,87,87,0.0000\nCC-MAIN-2021-04,lin,5224,5178,0.0002\nCC-MAIN-2021-04,lit,5362226,5316644,0.1577\nCC-MAIN-2021-04,ltz,106019,105367,0.0031\nCC-MAIN-2021-04,lug,5641,5614,0.0002\nCC-MAIN-2021-04,mal,676894,674490,0.0199\nCC-MAIN-2021-04,mar,496649,493346,0.0146\nCC-MAIN-2021-04,mfe,2259,2249,0.0001\nCC-MAIN-2021-04,mkd,889870,883560,0.0262\nCC-MAIN-2021-04,mlg,83060,82827,0.0024\nCC-MAIN-2021-04,mlt,125068,124160,0.0037\nCC-MAIN-2021-04,mon,461112,459209,0.0136\nCC-MAIN-2021-04,mri,29241,28781,0.0009\nCC-MAIN-2021-04,msa,3539460,3527199,0.104
1\nCC-MAIN-2021-04,mya,352615,351371,0.0104\nCC-MAIN-2021-04,nau,770,766,0.0000\nCC-MAIN-2021-04,nep,805140,799130,0.0237\nCC-MAIN-2021-04,new,37,37,0.0000\nCC-MAIN-2021-04,nld,62125816,61576970,1.8265\nCC-MAIN-2021-04,nno,540707,536299,0.0159\nCC-MAIN-2021-04,nor,12001727,11884278,0.3529\nCC-MAIN-2021-04,nso,2467,2463,0.0001\nCC-MAIN-2021-04,nya,8468,8424,0.0002\nCC-MAIN-2021-04,oci,94997,94760,0.0028\nCC-MAIN-2021-04,ori,122957,122800,0.0036\nCC-MAIN-2021-04,orm,15432,15370,0.0005\nCC-MAIN-2021-04,pan,168347,167966,0.0049\nCC-MAIN-2021-04,pol,55409808,54938872,1.6291\nCC-MAIN-2021-04,por,73474214,72966884,2.1602\nCC-MAIN-2021-04,pus,90702,90395,0.0027\nCC-MAIN-2021-04,que,26780,26762,0.0008\nCC-MAIN-2021-04,roh,47235,46790,0.0014\nCC-MAIN-2021-04,ron,20059269,19923430,0.5898\nCC-MAIN-2021-04,run,2882,2853,0.0001\nCC-MAIN-2021-04,rus,256280378,254444607,7.5348\nCC-MAIN-2021-04,sag,467,467,0.0000\nCC-MAIN-2021-04,san,76863,76423,0.0023\nCC-MAIN-2021-04,sco,14175,13954,0.0004\nCC-MAIN-2021-04,sin,215962,214934,0.0063\nCC-MAIN-2021-04,slk,12240989,12143954,0.3599\nCC-MAIN-2021-04,slv,4732019,4694648,0.1391\nCC-MAIN-2021-04,smo,7814,7776,0.0002\nCC-MAIN-2021-04,sna,11559,11400,0.0003\nCC-MAIN-2021-04,snd,24516,24453,0.0007\nCC-MAIN-2021-04,som,159270,158436,0.0047\nCC-MAIN-2021-04,sot,8502,8470,0.0002\nCC-MAIN-2021-04,spa,148409299,147220515,4.3633\nCC-MAIN-2021-04,sqi,1296319,1289767,0.0381\nCC-MAIN-2021-04,srp,7008413,6953413,0.2061\nCC-MAIN-2021-04,ssw,889,880,0.0000\nCC-MAIN-2021-04,sun,27380,27333,0.0008\nCC-MAIN-2021-04,sux,170,170,0.0000\nCC-MAIN-2021-04,swa,243070,242087,0.0071\nCC-MAIN-2021-04,swe,24708165,24481239,0.7264\nCC-MAIN-2021-04,syr,18170,18140,0.0005\nCC-MAIN-2021-04,tam,1444153,1438387,0.0425\nCC-MAIN-2021-04,tat,259351,258339,0.0076\nCC-MAIN-2021-04,tel,573248,572046,0.0169\nCC-MAIN-2021-04,tgk,146405,146105,0.0043\nCC-MAIN-2021-04,tgl,194407,193475,0.0057\nCC-MAIN-2021-04,tha,11108049,11037172,0.3266\nCC-MAIN-2021-04,tir,25369,24874,0.0007\nCC-MA
IN-2021-04,ton,1888,1885,0.0001\nCC-MAIN-2021-04,tsn,10953,10748,0.0003\nCC-MAIN-2021-04,tso,1428,1421,0.0000\nCC-MAIN-2021-04,tuk,63174,62984,0.0019\nCC-MAIN-2021-04,tur,33793964,33532247,0.9936\nCC-MAIN-2021-04,uig,40401,40270,0.0012\nCC-MAIN-2021-04,ukr,12688368,12602475,0.3730\nCC-MAIN-2021-04,urd,725101,720295,0.0213\nCC-MAIN-2021-04,uzb,547316,541817,0.0161\nCC-MAIN-2021-04,ven,1322,1318,0.0000\nCC-MAIN-2021-04,vie,29426539,29171132,0.8652\nCC-MAIN-2021-04,vol,34233,34216,0.0010\nCC-MAIN-2021-04,war,89290,89004,0.0026\nCC-MAIN-2021-04,wol,3025,3019,0.0001\nCC-MAIN-2021-04,xho,37430,37288,0.0011\nCC-MAIN-2021-04,yid,45284,45234,0.0013\nCC-MAIN-2021-04,yor,23851,23794,0.0007\nCC-MAIN-2021-04,zha,1489,1489,0.0000\nCC-MAIN-2021-04,zho,188608875,187784085,5.5452\nCC-MAIN-2021-04,zul,34815,34599,0.0010\nCC-MAIN-2021-10,<unknown>,61719539,61719539,2.2552\nCC-MAIN-2021-10,aar,3791,3783,0.0001\nCC-MAIN-2021-10,abk,9034,9016,0.0003\nCC-MAIN-2021-10,afr,307684,306284,0.0112\nCC-MAIN-2021-10,aka,1243,1235,0.0000\nCC-MAIN-2021-10,amh,78602,78217,0.0029\nCC-MAIN-2021-10,ara,16732765,16628456,0.6114\nCC-MAIN-2021-10,asm,25904,25847,0.0009\nCC-MAIN-2021-10,aym,3419,3356,0.0001\nCC-MAIN-2021-10,aze,1221371,1213968,0.0446\nCC-MAIN-2021-10,bak,33071,33054,0.0012\nCC-MAIN-2021-10,bel,497418,496321,0.0182\nCC-MAIN-2021-10,ben,2421809,2414845,0.0885\nCC-MAIN-2021-10,bih,19808,19792,0.0007\nCC-MAIN-2021-10,bis,2142,2131,0.0001\nCC-MAIN-2021-10,bod,36322,36089,0.0013\nCC-MAIN-2021-10,bos,1135462,1130524,0.0415\nCC-MAIN-2021-10,bre,71729,71402,0.0026\nCC-MAIN-2021-10,bul,7063545,7021740,0.2581\nCC-MAIN-2021-10,cat,6321411,6275544,0.2310\nCC-MAIN-2021-10,ceb,66493,66412,0.0024\nCC-MAIN-2021-10,ces,30286409,30079481,1.1067\nCC-MAIN-2021-10,chr,7791,7791,0.0003\nCC-MAIN-2021-10,cos,62481,62386,0.0023\nCC-MAIN-2021-10,crs,1386,1374,0.0001\nCC-MAIN-2021-10,cym,304919,303749,0.0111\nCC-MAIN-2021-10,dan,12106404,12015327,0.4424\nCC-MAIN-2021-10,deu,150119053,148846879,5.4853\nCC-MAIN-2021-10
,div,46827,46731,0.0017\nCC-MAIN-2021-10,dzo,2488,2488,0.0001\nCC-MAIN-2021-10,ell,14694900,14613532,0.5369\nCC-MAIN-2021-10,eng,1212156453,1202770768,44.2918\nCC-MAIN-2021-10,epo,261336,261039,0.0095\nCC-MAIN-2021-10,est,3389002,3362468,0.1238\nCC-MAIN-2021-10,eus,796288,773657,0.0291\nCC-MAIN-2021-10,fao,103973,103481,0.0038\nCC-MAIN-2021-10,fas,17789111,17589117,0.6500\nCC-MAIN-2021-10,fij,2942,2937,0.0001\nCC-MAIN-2021-10,fin,10417862,10343627,0.3807\nCC-MAIN-2021-10,fra,121483661,120537446,4.4390\nCC-MAIN-2021-10,fry,81387,81266,0.0030\nCC-MAIN-2021-10,gla,41524,41486,0.0015\nCC-MAIN-2021-10,gle,179370,178756,0.0066\nCC-MAIN-2021-10,glg,926466,921235,0.0339\nCC-MAIN-2021-10,glv,10876,10863,0.0004\nCC-MAIN-2021-10,got,899,899,0.0000\nCC-MAIN-2021-10,grn,18492,18338,0.0007\nCC-MAIN-2021-10,guj,294792,294277,0.0108\nCC-MAIN-2021-10,hat,44969,44870,0.0016\nCC-MAIN-2021-10,hau,52589,52073,0.0019\nCC-MAIN-2021-10,haw,10721,10700,0.0004\nCC-MAIN-2021-10,heb,6867483,6811031,0.2509\nCC-MAIN-2021-10,hin,3637302,3624796,0.1329\nCC-MAIN-2021-10,hmn,11045,11012,0.0004\nCC-MAIN-2021-10,hrv,4967425,4939905,0.1815\nCC-MAIN-2021-10,hun,15110855,15008575,0.5521\nCC-MAIN-2021-10,hye,851577,847458,0.0311\nCC-MAIN-2021-10,ibo,10768,10656,0.0004\nCC-MAIN-2021-10,iku,4882,4874,0.0002\nCC-MAIN-2021-10,ile,6355,6341,0.0002\nCC-MAIN-2021-10,ina,14140,14101,0.0005\nCC-MAIN-2021-10,ind,22656046,22546468,0.8278\nCC-MAIN-2021-10,ipk,4811,4807,0.0002\nCC-MAIN-2021-10,isl,990096,982434,0.0362\nCC-MAIN-2021-10,ita,64743966,64274959,2.3657\nCC-MAIN-2021-10,jav,51909,51835,0.0019\nCC-MAIN-2021-10,jpn,127774944,127184552,4.6689\nCC-MAIN-2021-10,kal,21882,21808,0.0008\nCC-MAIN-2021-10,kan,279650,279058,0.0102\nCC-MAIN-2021-10,kas,121,121,0.0000\nCC-MAIN-2021-10,kat,1092535,1086309,0.0399\nCC-MAIN-2021-10,kaz,590825,587187,0.0216\nCC-MAIN-2021-10,kha,3437,3432,0.0001\nCC-MAIN-2021-10,khm,223418,222848,0.0082\nCC-MAIN-2021-10,kin,46220,46005,0.0017\nCC-MAIN-2021-10,kir,154244,153795,0.0056\nCC-MAIN-
2021-10,kor,19329044,19246621,0.7063\nCC-MAIN-2021-10,kur,157001,156597,0.0057\nCC-MAIN-2021-10,lao,98205,97807,0.0036\nCC-MAIN-2021-10,lat,4572061,4558944,0.1671\nCC-MAIN-2021-10,lav,2447970,2430910,0.0894\nCC-MAIN-2021-10,lif,66,63,0.0000\nCC-MAIN-2021-10,lin,5091,5086,0.0002\nCC-MAIN-2021-10,lit,4311690,4276691,0.1575\nCC-MAIN-2021-10,ltz,90651,90183,0.0033\nCC-MAIN-2021-10,lug,4837,4830,0.0002\nCC-MAIN-2021-10,mal,576140,569008,0.0211\nCC-MAIN-2021-10,mar,497053,495859,0.0182\nCC-MAIN-2021-10,mfe,1880,1874,0.0001\nCC-MAIN-2021-10,mkd,784731,776245,0.0287\nCC-MAIN-2021-10,mlg,82599,82177,0.0030\nCC-MAIN-2021-10,mlt,115440,114729,0.0042\nCC-MAIN-2021-10,mon,399862,398222,0.0146\nCC-MAIN-2021-10,mri,26594,26410,0.0010\nCC-MAIN-2021-10,msa,2257027,2249529,0.0825\nCC-MAIN-2021-10,mya,287656,287014,0.0105\nCC-MAIN-2021-10,nau,771,768,0.0000\nCC-MAIN-2021-10,nep,735943,733133,0.0269\nCC-MAIN-2021-10,nld,48564638,48199512,1.7745\nCC-MAIN-2021-10,nno,491513,488572,0.0180\nCC-MAIN-2021-10,nor,9593906,9506409,0.3506\nCC-MAIN-2021-10,nso,2780,2774,0.0001\nCC-MAIN-2021-10,nya,10206,10197,0.0004\nCC-MAIN-2021-10,oci,85567,85263,0.0031\nCC-MAIN-2021-10,ori,118467,118254,0.0043\nCC-MAIN-2021-10,orm,12209,12069,0.0004\nCC-MAIN-2021-10,pan,148075,147838,0.0054\nCC-MAIN-2021-10,pol,43141329,42844498,1.5764\nCC-MAIN-2021-10,por,59399970,59066186,2.1705\nCC-MAIN-2021-10,pus,112952,112619,0.0041\nCC-MAIN-2021-10,que,19237,19225,0.0007\nCC-MAIN-2021-10,roh,24528,24404,0.0009\nCC-MAIN-2021-10,ron,16190261,16081782,0.5916\nCC-MAIN-2021-10,run,1482,1459,0.0001\nCC-MAIN-2021-10,rus,204887689,203671759,7.4865\nCC-MAIN-2021-10,sag,525,525,0.0000\nCC-MAIN-2021-10,san,50710,50584,0.0019\nCC-MAIN-2021-10,sco,13383,13335,0.0005\nCC-MAIN-2021-10,sin,175961,175243,0.0064\nCC-MAIN-2021-10,slk,9166523,9109261,0.3349\nCC-MAIN-2021-10,slv,3799343,3776147,0.1388\nCC-MAIN-2021-10,smo,8840,8826,0.0003\nCC-MAIN-2021-10,sna,11376,11347,0.0004\nCC-MAIN-2021-10,snd,23209,23184,0.0008\nCC-MAIN-2021-10,som,11
8156,117926,0.0043\nCC-MAIN-2021-10,sot,10894,10883,0.0004\nCC-MAIN-2021-10,spa,118487065,117646784,4.3295\nCC-MAIN-2021-10,sqi,1223473,1216607,0.0447\nCC-MAIN-2021-10,srp,5611237,5579075,0.2050\nCC-MAIN-2021-10,ssw,983,976,0.0000\nCC-MAIN-2021-10,sun,23876,23815,0.0009\nCC-MAIN-2021-10,sux,49,49,0.0000\nCC-MAIN-2021-10,swa,215454,214560,0.0079\nCC-MAIN-2021-10,swe,19858076,19710544,0.7256\nCC-MAIN-2021-10,syr,23894,23844,0.0009\nCC-MAIN-2021-10,tam,1112363,1108696,0.0406\nCC-MAIN-2021-10,tat,230614,230248,0.0084\nCC-MAIN-2021-10,tel,453066,451918,0.0166\nCC-MAIN-2021-10,tgk,135234,134844,0.0049\nCC-MAIN-2021-10,tgl,168373,167789,0.0062\nCC-MAIN-2021-10,tha,9419764,9372015,0.3442\nCC-MAIN-2021-10,tir,20106,19930,0.0007\nCC-MAIN-2021-10,ton,1780,1777,0.0001\nCC-MAIN-2021-10,tsn,6561,6507,0.0002\nCC-MAIN-2021-10,tso,1399,1397,0.0001\nCC-MAIN-2021-10,tuk,57148,57045,0.0021\nCC-MAIN-2021-10,tur,27939419,27757418,1.0209\nCC-MAIN-2021-10,uig,35798,35770,0.0013\nCC-MAIN-2021-10,ukr,11265613,11189289,0.4116\nCC-MAIN-2021-10,urd,704916,701605,0.0258\nCC-MAIN-2021-10,uzb,492285,488624,0.0180\nCC-MAIN-2021-10,ven,1030,1027,0.0000\nCC-MAIN-2021-10,vie,22953013,22769175,0.8387\nCC-MAIN-2021-10,vol,22681,22665,0.0008\nCC-MAIN-2021-10,war,80117,79929,0.0029\nCC-MAIN-2021-10,wol,6411,6394,0.0002\nCC-MAIN-2021-10,xho,38340,38251,0.0014\nCC-MAIN-2021-10,yid,38756,38723,0.0014\nCC-MAIN-2021-10,yor,24518,24485,0.0009\nCC-MAIN-2021-10,zha,2263,2259,0.0001\nCC-MAIN-2021-10,zho,159500737,158714134,5.8281\nCC-MAIN-2021-10,zul,43561,43470,0.0016\nCC-MAIN-2021-17,<unknown>,65772500,65772500,2.0984\nCC-MAIN-2021-17,aar,4664,4651,0.0001\nCC-MAIN-2021-17,abk,9284,9278,0.0003\nCC-MAIN-2021-17,afr,336544,335216,0.0107\nCC-MAIN-2021-17,aka,1422,1419,0.0000\nCC-MAIN-2021-17,amh,86622,86264,0.0028\nCC-MAIN-2021-17,ara,18160085,18066860,0.5794\nCC-MAIN-2021-17,asm,34562,34500,0.0011\nCC-MAIN-2021-17,aym,2209,2169,0.0001\nCC-MAIN-2021-17,aze,1318930,1310056,0.0421\nCC-MAIN-2021-17,bak,42456,42358,0.00
14\nCC-MAIN-2021-17,bel,536994,536050,0.0171\nCC-MAIN-2021-17,ben,2639614,2632716,0.0842\nCC-MAIN-2021-17,bih,19573,19541,0.0006\nCC-MAIN-2021-17,bis,2976,2971,0.0001\nCC-MAIN-2021-17,bod,34038,33988,0.0011\nCC-MAIN-2021-17,bos,1320845,1316619,0.0421\nCC-MAIN-2021-17,bre,72982,72904,0.0023\nCC-MAIN-2021-17,bul,8118472,8083984,0.2590\nCC-MAIN-2021-17,cat,6993991,6947680,0.2231\nCC-MAIN-2021-17,ceb,60311,60292,0.0019\nCC-MAIN-2021-17,ces,36031883,35819868,1.1496\nCC-MAIN-2021-17,chr,889,889,0.0000\nCC-MAIN-2021-17,cos,75944,75855,0.0024\nCC-MAIN-2021-17,crs,1625,1610,0.0001\nCC-MAIN-2021-17,cym,341463,340577,0.0109\nCC-MAIN-2021-17,dan,14000243,13912576,0.4467\nCC-MAIN-2021-17,deu,179441609,178227113,5.7249\nCC-MAIN-2021-17,div,51855,51777,0.0017\nCC-MAIN-2021-17,dzo,2751,2751,0.0001\nCC-MAIN-2021-17,ell,16610515,16545737,0.5299\nCC-MAIN-2021-17,eng,1376021766,1366771034,43.9003\nCC-MAIN-2021-17,epo,303500,303148,0.0097\nCC-MAIN-2021-17,est,4088378,4064632,0.1304\nCC-MAIN-2021-17,eus,909769,889087,0.0290\nCC-MAIN-2021-17,fao,111985,111230,0.0036\nCC-MAIN-2021-17,fas,19670459,19533264,0.6276\nCC-MAIN-2021-17,fij,2990,2988,0.0001\nCC-MAIN-2021-17,fin,12461594,12395464,0.3976\nCC-MAIN-2021-17,fra,141921997,141014638,4.5278\nCC-MAIN-2021-17,fry,86231,86124,0.0028\nCC-MAIN-2021-17,gla,41974,41894,0.0013\nCC-MAIN-2021-17,gle,190000,189442,0.0061\nCC-MAIN-2021-17,glg,1085156,1080751,0.0346\nCC-MAIN-2021-17,glv,11588,11572,0.0004\nCC-MAIN-2021-17,got,557,557,0.0000\nCC-MAIN-2021-17,grn,18253,18169,0.0006\nCC-MAIN-2021-17,guj,322101,321291,0.0103\nCC-MAIN-2021-17,hat,47107,47005,0.0015\nCC-MAIN-2021-17,hau,57581,57269,0.0018\nCC-MAIN-2021-17,haw,12551,12535,0.0004\nCC-MAIN-2021-17,heb,7919924,7873112,0.2527\nCC-MAIN-2021-17,hin,3919102,3908370,0.1250\nCC-MAIN-2021-17,hmn,12555,12541,0.0004\nCC-MAIN-2021-17,hrv,5801290,5779221,0.1851\nCC-MAIN-2021-17,hun,17405035,17318952,0.5553\nCC-MAIN-2021-17,hye,959540,956125,0.0306\nCC-MAIN-2021-17,ibo,9917,9907,0.0003\nCC-MAIN-2021-17,iku
,5352,5344,0.0002\nCC-MAIN-2021-17,ile,8171,8151,0.0003\nCC-MAIN-2021-17,ina,16424,16399,0.0005\nCC-MAIN-2021-17,ind,26987375,26895811,0.8610\nCC-MAIN-2021-17,ipk,4821,4813,0.0002\nCC-MAIN-2021-17,isl,1198913,1191831,0.0382\nCC-MAIN-2021-17,ita,76560697,76129896,2.4426\nCC-MAIN-2021-17,jav,55998,55967,0.0018\nCC-MAIN-2021-17,jpn,154007258,153425537,4.9134\nCC-MAIN-2021-17,kal,38107,37589,0.0012\nCC-MAIN-2021-17,kan,277367,276664,0.0088\nCC-MAIN-2021-17,kas,182,182,0.0000\nCC-MAIN-2021-17,kat,1214177,1209008,0.0387\nCC-MAIN-2021-17,kaz,662375,660159,0.0211\nCC-MAIN-2021-17,kha,4879,4841,0.0002\nCC-MAIN-2021-17,khm,257465,257043,0.0082\nCC-MAIN-2021-17,kin,48826,48713,0.0016\nCC-MAIN-2021-17,kir,145920,145576,0.0047\nCC-MAIN-2021-17,kor,20773298,20702935,0.6627\nCC-MAIN-2021-17,kur,182025,181419,0.0058\nCC-MAIN-2021-17,lao,123198,122867,0.0039\nCC-MAIN-2021-17,lat,4445487,4440391,0.1418\nCC-MAIN-2021-17,lav,2838202,2823502,0.0905\nCC-MAIN-2021-17,lif,84,84,0.0000\nCC-MAIN-2021-17,lin,8483,8463,0.0003\nCC-MAIN-2021-17,lit,5170680,5140700,0.1650\nCC-MAIN-2021-17,ltz,105510,104930,0.0034\nCC-MAIN-2021-17,lug,4321,4317,0.0001\nCC-MAIN-2021-17,mal,602984,600844,0.0192\nCC-MAIN-2021-17,mar,520262,518937,0.0166\nCC-MAIN-2021-17,mfe,3070,3058,0.0001\nCC-MAIN-2021-17,mkd,849055,845733,0.0271\nCC-MAIN-2021-17,mlg,83919,83661,0.0027\nCC-MAIN-2021-17,mlt,108955,107286,0.0035\nCC-MAIN-2021-17,mon,461263,459859,0.0147\nCC-MAIN-2021-17,mri,37215,37097,0.0012\nCC-MAIN-2021-17,msa,2453863,2446257,0.0783\nCC-MAIN-2021-17,mya,323408,322698,0.0103\nCC-MAIN-2021-17,nau,1095,1092,0.0000\nCC-MAIN-2021-17,nep,809973,807945,0.0258\nCC-MAIN-2021-17,nld,58348940,58005495,1.8616\nCC-MAIN-2021-17,nno,568834,563924,0.0181\nCC-MAIN-2021-17,nor,11367645,11298359,0.3627\nCC-MAIN-2021-17,nso,2139,2138,0.0001\nCC-MAIN-2021-17,nya,11844,11818,0.0004\nCC-MAIN-2021-17,oci,91564,91383,0.0029\nCC-MAIN-2021-17,ori,127315,127120,0.0041\nCC-MAIN-2021-17,orm,14285,14225,0.0005\nCC-MAIN-2021-17,pan,152633,152259
,0.0049\nCC-MAIN-2021-17,pol,50450890,50175474,1.6096\nCC-MAIN-2021-17,por,68141893,67836828,2.1740\nCC-MAIN-2021-17,pus,102676,102535,0.0033\nCC-MAIN-2021-17,que,19406,19397,0.0006\nCC-MAIN-2021-17,roh,29041,28701,0.0009\nCC-MAIN-2021-17,ron,19124643,19023326,0.6101\nCC-MAIN-2021-17,run,2669,2620,0.0001\nCC-MAIN-2021-17,rus,241097213,240019436,7.6919\nCC-MAIN-2021-17,sag,530,529,0.0000\nCC-MAIN-2021-17,san,62774,62644,0.0020\nCC-MAIN-2021-17,sco,12338,12304,0.0004\nCC-MAIN-2021-17,sin,217709,216815,0.0069\nCC-MAIN-2021-17,slk,10817467,10758705,0.3451\nCC-MAIN-2021-17,slv,4508464,4486407,0.1438\nCC-MAIN-2021-17,smo,11956,11928,0.0004\nCC-MAIN-2021-17,sna,14273,14227,0.0005\nCC-MAIN-2021-17,snd,24330,24315,0.0008\nCC-MAIN-2021-17,som,136564,136253,0.0044\nCC-MAIN-2021-17,sot,10370,10357,0.0003\nCC-MAIN-2021-17,spa,136619959,135862106,4.3587\nCC-MAIN-2021-17,sqi,1255464,1246677,0.0401\nCC-MAIN-2021-17,srp,6413568,6382743,0.2046\nCC-MAIN-2021-17,ssw,964,957,0.0000\nCC-MAIN-2021-17,sun,26563,26544,0.0008\nCC-MAIN-2021-17,sux,94,94,0.0000\nCC-MAIN-2021-17,swa,207804,207072,0.0066\nCC-MAIN-2021-17,swe,23387063,23244509,0.7461\nCC-MAIN-2021-17,syr,21010,20998,0.0007\nCC-MAIN-2021-17,tam,1196178,1190187,0.0382\nCC-MAIN-2021-17,tat,257151,256728,0.0082\nCC-MAIN-2021-17,tel,467367,464675,0.0149\nCC-MAIN-2021-17,tgk,149813,149067,0.0048\nCC-MAIN-2021-17,tgl,188812,188449,0.0060\nCC-MAIN-2021-17,tha,10846712,10795668,0.3461\nCC-MAIN-2021-17,tir,21091,20917,0.0007\nCC-MAIN-2021-17,ton,1640,1636,0.0001\nCC-MAIN-2021-17,tsn,5992,5935,0.0002\nCC-MAIN-2021-17,tso,1340,1338,0.0000\nCC-MAIN-2021-17,tuk,59744,59622,0.0019\nCC-MAIN-2021-17,tur,32475013,32317792,1.0361\nCC-MAIN-2021-17,uig,41030,40988,0.0013\nCC-MAIN-2021-17,ukr,12932058,12865605,0.4126\nCC-MAIN-2021-17,urd,743102,738899,0.0237\nCC-MAIN-2021-17,uzb,526826,522023,0.0168\nCC-MAIN-2021-17,ven,867,864,0.0000\nCC-MAIN-2021-17,vie,27050780,26873056,0.8630\nCC-MAIN-2021-17,vol,28428,28409,0.0009\nCC-MAIN-2021-17,war,80421,80253
,0.0026\nCC-MAIN-2021-17,wol,4097,4071,0.0001\nCC-MAIN-2021-17,xho,41662,41549,0.0013\nCC-MAIN-2021-17,yid,40071,39997,0.0013\nCC-MAIN-2021-17,yor,26153,26140,0.0008\nCC-MAIN-2021-17,zha,1541,1539,0.0000\nCC-MAIN-2021-17,zho,166872699,166295898,5.3239\nCC-MAIN-2021-17,zul,39916,39772,0.0013\nCC-MAIN-2021-21,<unknown>,75912178,75912178,2.8840\nCC-MAIN-2021-21,aar,3178,3165,0.0001\nCC-MAIN-2021-21,abk,8807,8805,0.0003\nCC-MAIN-2021-21,afr,326041,325205,0.0124\nCC-MAIN-2021-21,aka,1139,1137,0.0000\nCC-MAIN-2021-21,amh,77430,77003,0.0029\nCC-MAIN-2021-21,ara,16234770,16143014,0.6168\nCC-MAIN-2021-21,asm,28495,28446,0.0011\nCC-MAIN-2021-21,aym,2087,2071,0.0001\nCC-MAIN-2021-21,aze,1200246,1195301,0.0456\nCC-MAIN-2021-21,bak,38378,38322,0.0015\nCC-MAIN-2021-21,bel,466442,465652,0.0177\nCC-MAIN-2021-21,ben,2322916,2313938,0.0883\nCC-MAIN-2021-21,bih,15840,15822,0.0006\nCC-MAIN-2021-21,bis,3623,3616,0.0001\nCC-MAIN-2021-21,bod,25549,25480,0.0010\nCC-MAIN-2021-21,bos,1133514,1130098,0.0431\nCC-MAIN-2021-21,bre,73546,73371,0.0028\nCC-MAIN-2021-21,bul,7314843,7284400,0.2779\nCC-MAIN-2021-21,cat,6101395,6062794,0.2318\nCC-MAIN-2021-21,ceb,69453,69434,0.0026\nCC-MAIN-2021-21,ces,29278892,29096077,1.1124\nCC-MAIN-2021-21,chr,977,976,0.0000\nCC-MAIN-2021-21,cos,64146,64039,0.0024\nCC-MAIN-2021-21,crs,2085,2081,0.0001\nCC-MAIN-2021-21,cym,303314,302431,0.0115\nCC-MAIN-2021-21,dan,11260225,11186233,0.4278\nCC-MAIN-2021-21,deu,149784332,148699101,5.6906\nCC-MAIN-2021-21,div,43441,43389,0.0017\nCC-MAIN-2021-21,dzo,953,950,0.0000\nCC-MAIN-2021-21,ell,14268073,14208221,0.5421\nCC-MAIN-2021-21,eng,1180315707,1171997136,44.8424\nCC-MAIN-2021-21,epo,257138,256172,0.0098\nCC-MAIN-2021-21,est,3365189,3346292,0.1278\nCC-MAIN-2021-21,eus,805506,781501,0.0306\nCC-MAIN-2021-21,fao,94316,94022,0.0036\nCC-MAIN-2021-21,fas,16911834,16792408,0.6425\nCC-MAIN-2021-21,fij,1939,1939,0.0001\nCC-MAIN-2021-21,fin,10372577,10309390,0.3941\nCC-MAIN-2021-21,fra,117781024,116985318,4.4747\nCC-MAIN-2021-21,fry,
89589,89440,0.0034\nCC-MAIN-2021-21,gla,43200,43097,0.0016\nCC-MAIN-2021-21,gle,165445,164771,0.0063\nCC-MAIN-2021-21,glg,953330,946985,0.0362\nCC-MAIN-2021-21,glv,12225,12212,0.0005\nCC-MAIN-2021-21,got,926,926,0.0000\nCC-MAIN-2021-21,grn,18091,18036,0.0007\nCC-MAIN-2021-21,guj,296655,296033,0.0113\nCC-MAIN-2021-21,hat,44942,44843,0.0017\nCC-MAIN-2021-21,hau,47671,47503,0.0018\nCC-MAIN-2021-21,haw,11734,11725,0.0004\nCC-MAIN-2021-21,heb,6633214,6581836,0.2520\nCC-MAIN-2021-21,hin,3396796,3387870,0.1291\nCC-MAIN-2021-21,hmn,9556,9535,0.0004\nCC-MAIN-2021-21,hrv,4984710,4963189,0.1894\nCC-MAIN-2021-21,hun,14885214,14809167,0.5655\nCC-MAIN-2021-21,hye,810799,808285,0.0308\nCC-MAIN-2021-21,ibo,11265,11230,0.0004\nCC-MAIN-2021-21,iku,5015,5010,0.0002\nCC-MAIN-2021-21,ile,9569,9545,0.0004\nCC-MAIN-2021-21,ina,16892,16859,0.0006\nCC-MAIN-2021-21,ind,21874945,21791235,0.8311\nCC-MAIN-2021-21,ipk,4477,4474,0.0002\nCC-MAIN-2021-21,isl,1081505,1074318,0.0411\nCC-MAIN-2021-21,ita,63899833,63519263,2.4277\nCC-MAIN-2021-21,jav,48543,48521,0.0018\nCC-MAIN-2021-21,jpn,120684744,120188449,4.5850\nCC-MAIN-2021-21,kal,40803,40735,0.0016\nCC-MAIN-2021-21,kan,263130,262716,0.0100\nCC-MAIN-2021-21,kas,100,100,0.0000\nCC-MAIN-2021-21,kat,1045717,1042207,0.0397\nCC-MAIN-2021-21,kaz,571266,569639,0.0217\nCC-MAIN-2021-21,kha,3733,3720,0.0001\nCC-MAIN-2021-21,khm,212321,212098,0.0081\nCC-MAIN-2021-21,kin,45784,45570,0.0017\nCC-MAIN-2021-21,kir,129662,129404,0.0049\nCC-MAIN-2021-21,kor,16788786,16718814,0.6378\nCC-MAIN-2021-21,kur,163109,162501,0.0062\nCC-MAIN-2021-21,lao,108451,108155,0.0041\nCC-MAIN-2021-21,lat,2788778,2784642,0.1060\nCC-MAIN-2021-21,lav,2482610,2470217,0.0943\nCC-MAIN-2021-21,lif,7,7,0.0000\nCC-MAIN-2021-21,lin,5230,5221,0.0002\nCC-MAIN-2021-21,lit,4369074,4343340,0.1660\nCC-MAIN-2021-21,ltz,95622,95304,0.0036\nCC-MAIN-2021-21,lug,3620,3617,0.0001\nCC-MAIN-2021-21,mal,556395,554775,0.0211\nCC-MAIN-2021-21,mar,480338,478179,0.0182\nCC-MAIN-2021-21,mfe,2671,2659,0.0001\nCC-M
AIN-2021-21,mkd,765254,761929,0.0291\nCC-MAIN-2021-21,mlg,81266,80939,0.0031\nCC-MAIN-2021-21,mlt,104154,103572,0.0040\nCC-MAIN-2021-21,mon,391631,390340,0.0149\nCC-MAIN-2021-21,mri,31780,31690,0.0012\nCC-MAIN-2021-21,msa,2091449,2085907,0.0795\nCC-MAIN-2021-21,mya,268593,267971,0.0102\nCC-MAIN-2021-21,nau,1336,1333,0.0001\nCC-MAIN-2021-21,nep,716181,713739,0.0272\nCC-MAIN-2021-21,nld,47595390,47297920,1.8082\nCC-MAIN-2021-21,nno,533809,530685,0.0203\nCC-MAIN-2021-21,nor,9344547,9284578,0.3550\nCC-MAIN-2021-21,nso,2498,2497,0.0001\nCC-MAIN-2021-21,nya,11006,10990,0.0004\nCC-MAIN-2021-21,oci,88422,88165,0.0034\nCC-MAIN-2021-21,ori,122249,122073,0.0046\nCC-MAIN-2021-21,orm,13068,13033,0.0005\nCC-MAIN-2021-21,pan,134281,134089,0.0051\nCC-MAIN-2021-21,pol,42245931,42004421,1.6050\nCC-MAIN-2021-21,por,56256203,55977615,2.1373\nCC-MAIN-2021-21,pus,105805,105700,0.0040\nCC-MAIN-2021-21,que,20999,20992,0.0008\nCC-MAIN-2021-21,roh,29202,28604,0.0011\nCC-MAIN-2021-21,ron,16245908,16171600,0.6172\nCC-MAIN-2021-21,run,2955,2909,0.0001\nCC-MAIN-2021-21,rus,191246667,190425854,7.2658\nCC-MAIN-2021-21,sag,425,425,0.0000\nCC-MAIN-2021-21,san,54961,54837,0.0021\nCC-MAIN-2021-21,sco,12956,12929,0.0005\nCC-MAIN-2021-21,sin,184294,183679,0.0070\nCC-MAIN-2021-21,slk,9143580,9095756,0.3474\nCC-MAIN-2021-21,slv,3823448,3799284,0.1453\nCC-MAIN-2021-21,smo,11089,11074,0.0004\nCC-MAIN-2021-21,sna,14239,14209,0.0005\nCC-MAIN-2021-21,snd,25985,25948,0.0010\nCC-MAIN-2021-21,som,115216,115020,0.0044\nCC-MAIN-2021-21,sot,11300,11290,0.0004\nCC-MAIN-2021-21,spa,114011616,113349238,4.3315\nCC-MAIN-2021-21,sqi,1157794,1151410,0.0440\nCC-MAIN-2021-21,srp,5624924,5598258,0.2137\nCC-MAIN-2021-21,ssw,1074,1066,0.0000\nCC-MAIN-2021-21,sun,23039,23015,0.0009\nCC-MAIN-2021-21,sux,136,136,0.0000\nCC-MAIN-2021-21,swa,186029,185448,0.0071\nCC-MAIN-2021-21,swe,19471891,19343569,0.7398\nCC-MAIN-2021-21,syr,18608,18590,0.0007\nCC-MAIN-2021-21,tam,1032549,1028644,0.0392\nCC-MAIN-2021-21,tat,205394,205209,0.0078\n
CC-MAIN-2021-21,tel,417368,416502,0.0159\nCC-MAIN-2021-21,tgk,136535,136051,0.0052\nCC-MAIN-2021-21,tgl,188047,187307,0.0071\nCC-MAIN-2021-21,tha,9063588,9030492,0.3443\nCC-MAIN-2021-21,tir,18916,18784,0.0007\nCC-MAIN-2021-21,ton,1491,1488,0.0001\nCC-MAIN-2021-21,tsn,7888,7636,0.0003\nCC-MAIN-2021-21,tso,1631,1630,0.0001\nCC-MAIN-2021-21,tuk,57725,57548,0.0022\nCC-MAIN-2021-21,tur,26581530,26438656,1.0099\nCC-MAIN-2021-21,uig,28579,28548,0.0011\nCC-MAIN-2021-21,ukr,10608787,10552061,0.4030\nCC-MAIN-2021-21,urd,674028,670973,0.0256\nCC-MAIN-2021-21,uzb,468456,466788,0.0178\nCC-MAIN-2021-21,ven,791,786,0.0000\nCC-MAIN-2021-21,vie,21152281,21023608,0.8036\nCC-MAIN-2021-21,vol,30511,30489,0.0012\nCC-MAIN-2021-21,war,85011,84618,0.0032\nCC-MAIN-2021-21,wol,4414,4403,0.0002\nCC-MAIN-2021-21,xho,37919,37879,0.0014\nCC-MAIN-2021-21,yid,38798,38746,0.0015\nCC-MAIN-2021-21,yor,25508,25492,0.0010\nCC-MAIN-2021-21,zha,2210,2208,0.0001\nCC-MAIN-2021-21,zho,122416405,122031097,4.6508\nCC-MAIN-2021-21,zul,43287,43230,0.0016\nCC-MAIN-2021-25,<unknown>,57849416,57849416,2.3539\nCC-MAIN-2021-25,aar,3141,3125,0.0001\nCC-MAIN-2021-25,abk,7084,7079,0.0003\nCC-MAIN-2021-25,afr,320370,319224,0.0130\nCC-MAIN-2021-25,aka,1704,1702,0.0001\nCC-MAIN-2021-25,amh,74818,74383,0.0030\nCC-MAIN-2021-25,ara,15750800,15674677,0.6409\nCC-MAIN-2021-25,asm,45102,44993,0.0018\nCC-MAIN-2021-25,aym,1307,1298,0.0001\nCC-MAIN-2021-25,aze,1126535,1122425,0.0458\nCC-MAIN-2021-25,bak,27923,27898,0.0011\nCC-MAIN-2021-25,bel,428059,427269,0.0174\nCC-MAIN-2021-25,ben,2261081,2256377,0.0920\nCC-MAIN-2021-25,bih,13490,13481,0.0005\nCC-MAIN-2021-25,bis,2499,2488,0.0001\nCC-MAIN-2021-25,bod,21216,21067,0.0009\nCC-MAIN-2021-25,bos,992577,990020,0.0404\nCC-MAIN-2021-25,bre,53239,53173,0.0022\nCC-MAIN-2021-25,bul,6471109,6440847,0.2633\nCC-MAIN-2021-25,cat,5561397,5530210,0.2263\nCC-MAIN-2021-25,ceb,69083,69051,0.0028\nCC-MAIN-2021-25,ces,24586961,24425237,1.0004\nCC-MAIN-2021-25,chr,630,630,0.0000\nCC-MAIN-2021-25,cos,56
104,55957,0.0023\nCC-MAIN-2021-25,crs,1652,1646,0.0001\nCC-MAIN-2021-25,cym,251961,251349,0.0103\nCC-MAIN-2021-25,dan,10281668,10219718,0.4184\nCC-MAIN-2021-25,deu,137272897,136321152,5.5856\nCC-MAIN-2021-25,div,50695,50644,0.0021\nCC-MAIN-2021-25,dzo,1780,1778,0.0001\nCC-MAIN-2021-25,ell,13524724,13471831,0.5503\nCC-MAIN-2021-25,eng,1110498198,1103016342,45.1857\nCC-MAIN-2021-25,epo,239741,239418,0.0098\nCC-MAIN-2021-25,est,3225730,3200631,0.1313\nCC-MAIN-2021-25,eus,689282,663956,0.0280\nCC-MAIN-2021-25,fao,75535,75260,0.0031\nCC-MAIN-2021-25,fas,16446253,16332749,0.6692\nCC-MAIN-2021-25,fij,1630,1627,0.0001\nCC-MAIN-2021-25,fin,9478006,9412487,0.3857\nCC-MAIN-2021-25,fra,107460102,106764099,4.3725\nCC-MAIN-2021-25,fry,86509,86311,0.0035\nCC-MAIN-2021-25,gla,48925,48779,0.0020\nCC-MAIN-2021-25,gle,142609,142183,0.0058\nCC-MAIN-2021-25,glg,875498,872427,0.0356\nCC-MAIN-2021-25,glv,8454,8436,0.0003\nCC-MAIN-2021-25,got,707,705,0.0000\nCC-MAIN-2021-25,grn,15455,15386,0.0006\nCC-MAIN-2021-25,guj,310407,309720,0.0126\nCC-MAIN-2021-25,hat,42465,42394,0.0017\nCC-MAIN-2021-25,hau,49479,49327,0.0020\nCC-MAIN-2021-25,haw,20351,20319,0.0008\nCC-MAIN-2021-25,heb,5837289,5794459,0.2375\nCC-MAIN-2021-25,hin,3576299,3566433,0.1455\nCC-MAIN-2021-25,hmn,18627,18491,0.0008\nCC-MAIN-2021-25,hrv,4550178,4532049,0.1851\nCC-MAIN-2021-25,hun,13080707,13010052,0.5322\nCC-MAIN-2021-25,hye,807099,804527,0.0328\nCC-MAIN-2021-25,ibo,15979,15947,0.0007\nCC-MAIN-2021-25,iku,3982,3981,0.0002\nCC-MAIN-2021-25,ile,7116,7105,0.0003\nCC-MAIN-2021-25,ina,14575,14550,0.0006\nCC-MAIN-2021-25,ind,20766086,20695329,0.8450\nCC-MAIN-2021-25,ipk,3911,3909,0.0002\nCC-MAIN-2021-25,isl,991562,987696,0.0403\nCC-MAIN-2021-25,ita,59258504,58944258,2.4112\nCC-MAIN-2021-25,jav,48362,48272,0.0020\nCC-MAIN-2021-25,jpn,107788318,107333357,4.3859\nCC-MAIN-2021-25,kal,40943,40860,0.0017\nCC-MAIN-2021-25,kan,283840,283406,0.0115\nCC-MAIN-2021-25,kas,84,84,0.0000\nCC-MAIN-2021-25,kat,897252,894900,0.0365\nCC-MAIN-2021-25
,kaz,615330,613667,0.0250\nCC-MAIN-2021-25,kha,4788,4779,0.0002\nCC-MAIN-2021-25,khm,193963,193415,0.0079\nCC-MAIN-2021-25,kin,47483,47371,0.0019\nCC-MAIN-2021-25,kir,120536,120281,0.0049\nCC-MAIN-2021-25,kor,16457897,16400846,0.6697\nCC-MAIN-2021-25,kur,113759,113465,0.0046\nCC-MAIN-2021-25,lao,76614,76362,0.0031\nCC-MAIN-2021-25,lat,2744004,2739326,0.1117\nCC-MAIN-2021-25,lav,2246777,2234956,0.0914\nCC-MAIN-2021-25,lif,39,36,0.0000\nCC-MAIN-2021-25,lin,7010,6992,0.0003\nCC-MAIN-2021-25,lit,4022343,4001569,0.1637\nCC-MAIN-2021-25,ltz,81334,81059,0.0033\nCC-MAIN-2021-25,lug,3155,3152,0.0001\nCC-MAIN-2021-25,mal,519094,514784,0.0211\nCC-MAIN-2021-25,mar,482478,481148,0.0196\nCC-MAIN-2021-25,mfe,1883,1878,0.0001\nCC-MAIN-2021-25,mkd,721697,718103,0.0294\nCC-MAIN-2021-25,mlg,74260,74011,0.0030\nCC-MAIN-2021-25,mlt,97053,96812,0.0039\nCC-MAIN-2021-25,mon,339347,338472,0.0138\nCC-MAIN-2021-25,mri,29914,29820,0.0012\nCC-MAIN-2021-25,msa,2023322,2017036,0.0823\nCC-MAIN-2021-25,mya,268053,267582,0.0109\nCC-MAIN-2021-25,nau,1183,1181,0.0000\nCC-MAIN-2021-25,nep,727065,725353,0.0296\nCC-MAIN-2021-25,nld,43642320,43347338,1.7758\nCC-MAIN-2021-25,nno,437473,434003,0.0178\nCC-MAIN-2021-25,nor,8553119,8496705,0.3480\nCC-MAIN-2021-25,nso,1668,1668,0.0001\nCC-MAIN-2021-25,nya,11395,11354,0.0005\nCC-MAIN-2021-25,oci,68193,68056,0.0028\nCC-MAIN-2021-25,ori,94889,94778,0.0039\nCC-MAIN-2021-25,orm,13634,13577,0.0006\nCC-MAIN-2021-25,pan,117600,117403,0.0048\nCC-MAIN-2021-25,pol,39040630,38816427,1.5885\nCC-MAIN-2021-25,por,52102297,51834267,2.1200\nCC-MAIN-2021-25,pus,87440,87179,0.0036\nCC-MAIN-2021-25,que,12173,12166,0.0005\nCC-MAIN-2021-25,roh,26021,25515,0.0011\nCC-MAIN-2021-25,ron,15075174,15022823,0.6134\nCC-MAIN-2021-25,run,1997,1974,0.0001\nCC-MAIN-2021-25,rus,166295368,165472699,6.7665\nCC-MAIN-2021-25,sag,548,547,0.0000\nCC-MAIN-2021-25,san,47214,47099,0.0019\nCC-MAIN-2021-25,sco,10452,10421,0.0004\nCC-MAIN-2021-25,sin,183096,182309,0.0075\nCC-MAIN-2021-25,slk,8520665,8476319
,0.3467\nCC-MAIN-2021-25,slv,3601316,3578025,0.1465\nCC-MAIN-2021-25,smo,12103,12079,0.0005\nCC-MAIN-2021-25,sna,14671,14615,0.0006\nCC-MAIN-2021-25,snd,31835,31785,0.0013\nCC-MAIN-2021-25,som,128719,128498,0.0052\nCC-MAIN-2021-25,sot,11847,11820,0.0005\nCC-MAIN-2021-25,spa,105941455,105349944,4.3107\nCC-MAIN-2021-25,sqi,1050382,1047806,0.0427\nCC-MAIN-2021-25,srp,4954137,4925020,0.2016\nCC-MAIN-2021-25,ssw,1058,1050,0.0000\nCC-MAIN-2021-25,sun,23689,23656,0.0010\nCC-MAIN-2021-25,sux,77,76,0.0000\nCC-MAIN-2021-25,swa,164273,163691,0.0067\nCC-MAIN-2021-25,swe,17783504,17669306,0.7236\nCC-MAIN-2021-25,syr,11496,11479,0.0005\nCC-MAIN-2021-25,tam,1007355,1004118,0.0410\nCC-MAIN-2021-25,tat,170130,169953,0.0069\nCC-MAIN-2021-25,tel,450363,449637,0.0183\nCC-MAIN-2021-25,tgk,123116,122658,0.0050\nCC-MAIN-2021-25,tgl,173295,172915,0.0071\nCC-MAIN-2021-25,tha,11657354,11623961,0.4743\nCC-MAIN-2021-25,tir,16052,15952,0.0007\nCC-MAIN-2021-25,ton,1096,1089,0.0000\nCC-MAIN-2021-25,tsn,8421,8207,0.0003\nCC-MAIN-2021-25,tso,1149,1148,0.0000\nCC-MAIN-2021-25,tuk,60197,60066,0.0024\nCC-MAIN-2021-25,tur,25576817,25455643,1.0407\nCC-MAIN-2021-25,uig,24288,24221,0.0010\nCC-MAIN-2021-25,ukr,10147902,10099183,0.4129\nCC-MAIN-2021-25,urd,655462,653501,0.0267\nCC-MAIN-2021-25,uzb,397403,395761,0.0162\nCC-MAIN-2021-25,ven,1071,1069,0.0000\nCC-MAIN-2021-25,vie,37417228,37263879,1.5225\nCC-MAIN-2021-25,vol,26111,26103,0.0011\nCC-MAIN-2021-25,war,74588,74320,0.0030\nCC-MAIN-2021-25,wol,3341,3335,0.0001\nCC-MAIN-2021-25,xho,40698,40640,0.0017\nCC-MAIN-2021-25,yid,36532,36425,0.0015\nCC-MAIN-2021-25,yor,23128,23091,0.0009\nCC-MAIN-2021-25,zha,1001,999,0.0000\nCC-MAIN-2021-25,zho,124579683,124114474,5.0691\nCC-MAIN-2021-25,zul,46595,46540,0.0019\nCC-MAIN-2021-31,<unknown>,55152192,55152192,1.7425\nCC-MAIN-2021-31,aar,2338,2327,0.0001\nCC-MAIN-2021-31,abk,11703,11700,0.0004\nCC-MAIN-2021-31,afr,375588,374574,0.0119\nCC-MAIN-2021-31,aka,3062,3049,0.0001\nCC-MAIN-2021-31,amh,113846,112873,0.0036\nCC
-MAIN-2021-31,ara,17865281,17778741,0.5644\nCC-MAIN-2021-31,asm,53779,53609,0.0017\nCC-MAIN-2021-31,aym,1932,1886,0.0001\nCC-MAIN-2021-31,aze,1232516,1228884,0.0389\nCC-MAIN-2021-31,bak,38187,38175,0.0012\nCC-MAIN-2021-31,bel,497646,493198,0.0157\nCC-MAIN-2021-31,ben,2640212,2634457,0.0834\nCC-MAIN-2021-31,bih,19383,19370,0.0006\nCC-MAIN-2021-31,bis,3328,3315,0.0001\nCC-MAIN-2021-31,bod,28084,27896,0.0009\nCC-MAIN-2021-31,bos,1277668,1274183,0.0404\nCC-MAIN-2021-31,bre,77833,77656,0.0025\nCC-MAIN-2021-31,bul,8418194,8376078,0.2660\nCC-MAIN-2021-31,cat,7201196,7166106,0.2275\nCC-MAIN-2021-31,ceb,47548,47510,0.0015\nCC-MAIN-2021-31,ces,35554783,35362940,1.1233\nCC-MAIN-2021-31,chr,1294,1291,0.0000\nCC-MAIN-2021-31,cos,76974,76745,0.0024\nCC-MAIN-2021-31,crs,1379,1375,0.0000\nCC-MAIN-2021-31,cym,316697,315528,0.0100\nCC-MAIN-2021-31,dan,13264653,13191056,0.4191\nCC-MAIN-2021-31,deu,186833537,185607191,5.9029\nCC-MAIN-2021-31,div,57259,57173,0.0018\nCC-MAIN-2021-31,dzo,2170,2170,0.0001\nCC-MAIN-2021-31,ell,17257444,17186945,0.5452\nCC-MAIN-2021-31,eng,1442029616,1433409824,45.5605\nCC-MAIN-2021-31,epo,211892,211433,0.0067\nCC-MAIN-2021-31,est,4212803,4188956,0.1331\nCC-MAIN-2021-31,eus,845252,819419,0.0267\nCC-MAIN-2021-31,fao,104088,103554,0.0033\nCC-MAIN-2021-31,fas,20794102,20595225,0.6570\nCC-MAIN-2021-31,fij,2379,2376,0.0001\nCC-MAIN-2021-31,fin,12457144,12389941,0.3936\nCC-MAIN-2021-31,fra,142712898,141884064,4.5090\nCC-MAIN-2021-31,fry,102329,102146,0.0032\nCC-MAIN-2021-31,gla,53779,53694,0.0017\nCC-MAIN-2021-31,gle,178887,178291,0.0057\nCC-MAIN-2021-31,glg,1089129,1085560,0.0344\nCC-MAIN-2021-31,glv,14751,14741,0.0005\nCC-MAIN-2021-31,got,1136,1135,0.0000\nCC-MAIN-2021-31,grn,21003,20941,0.0007\nCC-MAIN-2021-31,guj,352742,351773,0.0111\nCC-MAIN-2021-31,hat,47910,47823,0.0015\nCC-MAIN-2021-31,hau,75498,75312,0.0024\nCC-MAIN-2021-31,haw,17584,17548,0.0006\nCC-MAIN-2021-31,heb,7808734,7763728,0.2467\nCC-MAIN-2021-31,hin,4172426,4160011,0.1318\nCC-MAIN-2021-31,hmn,2
2252,18274,0.0007\nCC-MAIN-2021-31,hrv,5886172,5859501,0.1860\nCC-MAIN-2021-31,hun,16912426,16834432,0.5343\nCC-MAIN-2021-31,hye,872481,869469,0.0276\nCC-MAIN-2021-31,ibo,16545,16496,0.0005\nCC-MAIN-2021-31,iku,6157,6149,0.0002\nCC-MAIN-2021-31,ile,8429,8399,0.0003\nCC-MAIN-2021-31,ina,18575,18554,0.0006\nCC-MAIN-2021-31,ind,26903931,26815563,0.8500\nCC-MAIN-2021-31,ipk,5132,5120,0.0002\nCC-MAIN-2021-31,isl,1287077,1281402,0.0407\nCC-MAIN-2021-31,ita,77083323,76701902,2.4354\nCC-MAIN-2021-31,jav,71685,71560,0.0023\nCC-MAIN-2021-31,jpn,155954879,155432969,4.9273\nCC-MAIN-2021-31,kal,54599,54509,0.0017\nCC-MAIN-2021-31,kan,326927,326343,0.0103\nCC-MAIN-2021-31,kas,203,203,0.0000\nCC-MAIN-2021-31,kat,1037007,1033371,0.0328\nCC-MAIN-2021-31,kaz,681772,679821,0.0215\nCC-MAIN-2021-31,kha,5347,5239,0.0002\nCC-MAIN-2021-31,khm,281646,281149,0.0089\nCC-MAIN-2021-31,kin,58440,58228,0.0018\nCC-MAIN-2021-31,kir,153435,153188,0.0048\nCC-MAIN-2021-31,kor,18036214,17973907,0.5698\nCC-MAIN-2021-31,kur,159379,159005,0.0050\nCC-MAIN-2021-31,lao,116072,115570,0.0037\nCC-MAIN-2021-31,lat,3988538,3980647,0.1260\nCC-MAIN-2021-31,lav,2804613,2789589,0.0886\nCC-MAIN-2021-31,lif,18,18,0.0000\nCC-MAIN-2021-31,lin,6606,6592,0.0002\nCC-MAIN-2021-31,lit,5183948,5158606,0.1638\nCC-MAIN-2021-31,ltz,115753,115421,0.0037\nCC-MAIN-2021-31,lug,3661,3638,0.0001\nCC-MAIN-2021-31,mal,597752,595191,0.0189\nCC-MAIN-2021-31,mar,549317,547694,0.0174\nCC-MAIN-2021-31,mfe,2603,2578,0.0001\nCC-MAIN-2021-31,mkd,909667,906323,0.0287\nCC-MAIN-2021-31,mlg,89533,89193,0.0028\nCC-MAIN-2021-31,mlt,108309,107826,0.0034\nCC-MAIN-2021-31,mon,413846,412543,0.0131\nCC-MAIN-2021-31,mri,41925,41762,0.0013\nCC-MAIN-2021-31,msa,2682597,2675675,0.0848\nCC-MAIN-2021-31,mya,336444,335825,0.0106\nCC-MAIN-2021-31,nau,749,744,0.0000\nCC-MAIN-2021-31,nep,864248,861930,0.0273\nCC-MAIN-2021-31,nld,60694360,60318512,1.9176\nCC-MAIN-2021-31,nno,534678,531397,0.0169\nCC-MAIN-2021-31,nor,10918739,10847255,0.3450\nCC-MAIN-2021-31,nso,3228,
3228,0.0001\nCC-MAIN-2021-31,nya,15011,14980,0.0005\nCC-MAIN-2021-31,oci,88565,88328,0.0028\nCC-MAIN-2021-31,ori,100034,99936,0.0032\nCC-MAIN-2021-31,orm,18921,18544,0.0006\nCC-MAIN-2021-31,pan,158173,157639,0.0050\nCC-MAIN-2021-31,pol,52132272,51844129,1.6471\nCC-MAIN-2021-31,por,69847083,69526983,2.2068\nCC-MAIN-2021-31,pus,92508,92047,0.0029\nCC-MAIN-2021-31,que,22598,22584,0.0007\nCC-MAIN-2021-31,roh,29741,29280,0.0009\nCC-MAIN-2021-31,ron,19121129,19043840,0.6041\nCC-MAIN-2021-31,run,1799,1772,0.0001\nCC-MAIN-2021-31,rus,230727698,229811731,7.2898\nCC-MAIN-2021-31,sag,479,479,0.0000\nCC-MAIN-2021-31,san,62499,62360,0.0020\nCC-MAIN-2021-31,sco,12708,12597,0.0004\nCC-MAIN-2021-31,sin,227135,226385,0.0072\nCC-MAIN-2021-31,slk,11579341,11522429,0.3658\nCC-MAIN-2021-31,slv,4759036,4731517,0.1504\nCC-MAIN-2021-31,smo,17917,17894,0.0006\nCC-MAIN-2021-31,sna,18000,17981,0.0006\nCC-MAIN-2021-31,snd,37378,37329,0.0012\nCC-MAIN-2021-31,som,152495,152318,0.0048\nCC-MAIN-2021-31,sot,15748,15732,0.0005\nCC-MAIN-2021-31,spa,139594921,138911086,4.4105\nCC-MAIN-2021-31,sqi,1176770,1173932,0.0372\nCC-MAIN-2021-31,srp,6488801,6445083,0.2050\nCC-MAIN-2021-31,ssw,1073,1060,0.0000\nCC-MAIN-2021-31,sun,33018,32990,0.0010\nCC-MAIN-2021-31,sux,83,83,0.0000\nCC-MAIN-2021-31,swa,218700,217010,0.0069\nCC-MAIN-2021-31,swe,23079384,22943036,0.7292\nCC-MAIN-2021-31,syr,11599,11586,0.0004\nCC-MAIN-2021-31,tam,1249314,1245512,0.0395\nCC-MAIN-2021-31,tat,207822,207680,0.0066\nCC-MAIN-2021-31,tel,532797,531552,0.0168\nCC-MAIN-2021-31,tgk,156330,156135,0.0049\nCC-MAIN-2021-31,tgl,228412,227856,0.0072\nCC-MAIN-2021-31,tha,13083761,13037034,0.4134\nCC-MAIN-2021-31,tir,31395,31236,0.0010\nCC-MAIN-2021-31,ton,1729,1721,0.0001\nCC-MAIN-2021-31,tsn,7880,7840,0.0002\nCC-MAIN-2021-31,tso,1730,1730,0.0001\nCC-MAIN-2021-31,tuk,66442,66294,0.0021\nCC-MAIN-2021-31,tur,32314997,32177054,1.0210\nCC-MAIN-2021-31,uig,35173,35130,0.0011\nCC-MAIN-2021-31,ukr,12714957,12661970,0.4017\nCC-MAIN-2021-31,urd,753982,751
222,0.0238\nCC-MAIN-2021-31,uzb,478478,477059,0.0151\nCC-MAIN-2021-31,ven,809,808,0.0000\nCC-MAIN-2021-31,vie,29999571,29852213,0.9478\nCC-MAIN-2021-31,vol,31379,31359,0.0010\nCC-MAIN-2021-31,war,66153,65846,0.0021\nCC-MAIN-2021-31,wol,4627,4618,0.0001\nCC-MAIN-2021-31,xho,40787,40726,0.0013\nCC-MAIN-2021-31,yid,44706,44656,0.0014\nCC-MAIN-2021-31,yor,31646,31567,0.0010\nCC-MAIN-2021-31,zha,2165,2163,0.0001\nCC-MAIN-2021-31,zho,130563035,130195445,4.1251\nCC-MAIN-2021-31,zul,52136,52055,0.0016\nCC-MAIN-2021-39,<unknown>,84000284,84000284,2.8379\nCC-MAIN-2021-39,aar,5272,5255,0.0002\nCC-MAIN-2021-39,abk,10366,10348,0.0004\nCC-MAIN-2021-39,afr,392282,391142,0.0133\nCC-MAIN-2021-39,aka,2436,2412,0.0001\nCC-MAIN-2021-39,amh,101499,100819,0.0034\nCC-MAIN-2021-39,ara,17703653,17622867,0.5981\nCC-MAIN-2021-39,asm,50564,50429,0.0017\nCC-MAIN-2021-39,aym,1898,1850,0.0001\nCC-MAIN-2021-39,aze,1317681,1310686,0.0445\nCC-MAIN-2021-39,bak,32321,32302,0.0011\nCC-MAIN-2021-39,bel,529748,528715,0.0179\nCC-MAIN-2021-39,ben,2635524,2630851,0.0890\nCC-MAIN-2021-39,bih,16497,16459,0.0006\nCC-MAIN-2021-39,bis,3909,3894,0.0001\nCC-MAIN-2021-39,bod,31104,31021,0.0011\nCC-MAIN-2021-39,bos,1265916,1262510,0.0428\nCC-MAIN-2021-39,bre,70080,70021,0.0024\nCC-MAIN-2021-39,bul,8033591,7995762,0.2714\nCC-MAIN-2021-39,cat,6985385,6951551,0.2360\nCC-MAIN-2021-39,ceb,67082,67055,0.0023\nCC-MAIN-2021-39,ces,30145576,29981425,1.0185\nCC-MAIN-2021-39,chr,775,775,0.0000\nCC-MAIN-2021-39,cos,76668,76458,0.0026\nCC-MAIN-2021-39,crs,2102,2093,0.0001\nCC-MAIN-2021-39,cym,303455,302214,0.0103\nCC-MAIN-2021-39,dan,11985154,11904758,0.4049\nCC-MAIN-2021-39,deu,165970137,164845645,5.6073\nCC-MAIN-2021-39,div,60243,60193,0.0020\nCC-MAIN-2021-39,dzo,3072,3070,0.0001\nCC-MAIN-2021-39,ell,16102905,16034280,0.5440\nCC-MAIN-2021-39,eng,1344556676,1334957345,45.4257\nCC-MAIN-2021-39,epo,265860,265435,0.0090\nCC-MAIN-2021-39,est,3952964,3925728,0.1336\nCC-MAIN-2021-39,eus,823984,801659,0.0278\nCC-MAIN-2021-39,fao,99739
,99306,0.0034\nCC-MAIN-2021-39,fas,18858908,18703877,0.6371\nCC-MAIN-2021-39,fij,1812,1811,0.0001\nCC-MAIN-2021-39,fin,11555516,11487992,0.3904\nCC-MAIN-2021-39,fra,131526242,130731042,4.4436\nCC-MAIN-2021-39,fry,108942,108705,0.0037\nCC-MAIN-2021-39,gla,61172,60962,0.0021\nCC-MAIN-2021-39,gle,175478,174002,0.0059\nCC-MAIN-2021-39,glg,1122078,1118598,0.0379\nCC-MAIN-2021-39,glv,13693,13678,0.0005\nCC-MAIN-2021-39,got,807,807,0.0000\nCC-MAIN-2021-39,grn,20400,20366,0.0007\nCC-MAIN-2021-39,guj,350347,349426,0.0118\nCC-MAIN-2021-39,hat,45684,45525,0.0015\nCC-MAIN-2021-39,hau,58869,58604,0.0020\nCC-MAIN-2021-39,haw,20383,20337,0.0007\nCC-MAIN-2021-39,heb,7195050,7152013,0.2431\nCC-MAIN-2021-39,hin,3965681,3951650,0.1340\nCC-MAIN-2021-39,hmn,21760,18515,0.0007\nCC-MAIN-2021-39,hrv,5739947,5717604,0.1939\nCC-MAIN-2021-39,hun,15934993,15866060,0.5384\nCC-MAIN-2021-39,hye,931790,929143,0.0315\nCC-MAIN-2021-39,ibo,18355,18287,0.0006\nCC-MAIN-2021-39,iku,6132,6116,0.0002\nCC-MAIN-2021-39,ile,9557,9540,0.0003\nCC-MAIN-2021-39,ina,15270,15250,0.0005\nCC-MAIN-2021-39,ind,25482245,25385971,0.8609\nCC-MAIN-2021-39,ipk,2508,2492,0.0001\nCC-MAIN-2021-39,isl,1220447,1215083,0.0412\nCC-MAIN-2021-39,ita,70643308,70284564,2.3867\nCC-MAIN-2021-39,jav,65337,65241,0.0022\nCC-MAIN-2021-39,jpn,133228651,132712635,4.5011\nCC-MAIN-2021-39,kal,51649,51597,0.0017\nCC-MAIN-2021-39,kan,325891,325361,0.0110\nCC-MAIN-2021-39,kas,89,88,0.0000\nCC-MAIN-2021-39,kat,1049816,1046099,0.0355\nCC-MAIN-2021-39,kaz,727750,725699,0.0246\nCC-MAIN-2021-39,kha,4559,4547,0.0002\nCC-MAIN-2021-39,khm,229360,228793,0.0077\nCC-MAIN-2021-39,kin,59698,59580,0.0020\nCC-MAIN-2021-39,kir,144141,143761,0.0049\nCC-MAIN-2021-39,kor,20279008,20205115,0.6851\nCC-MAIN-2021-39,kur,145144,144415,0.0049\nCC-MAIN-2021-39,lao,111705,110920,0.0038\nCC-MAIN-2021-39,lat,3242162,3235836,0.1095\nCC-MAIN-2021-39,lav,2724134,2703816,0.0920\nCC-MAIN-2021-39,lif,41,34,0.0000\nCC-MAIN-2021-39,lin,8253,8195,0.0003\nCC-MAIN-2021-39,lit,5072665,5
049341,0.1714\nCC-MAIN-2021-39,ltz,107915,107543,0.0036\nCC-MAIN-2021-39,lug,4273,4253,0.0001\nCC-MAIN-2021-39,mal,629668,627689,0.0213\nCC-MAIN-2021-39,mar,544735,542859,0.0184\nCC-MAIN-2021-39,mfe,3108,3077,0.0001\nCC-MAIN-2021-39,mkd,925082,921530,0.0313\nCC-MAIN-2021-39,mlg,78789,78247,0.0027\nCC-MAIN-2021-39,mlt,127099,125995,0.0043\nCC-MAIN-2021-39,mon,461484,460878,0.0156\nCC-MAIN-2021-39,mri,46061,45883,0.0016\nCC-MAIN-2021-39,msa,2460981,2454104,0.0831\nCC-MAIN-2021-39,mya,325585,324679,0.0110\nCC-MAIN-2021-39,nau,1222,1218,0.0000\nCC-MAIN-2021-39,nep,945450,944073,0.0319\nCC-MAIN-2021-39,nld,52443909,52081884,1.7718\nCC-MAIN-2021-39,nno,549075,542601,0.0186\nCC-MAIN-2021-39,nor,10008678,9937023,0.3381\nCC-MAIN-2021-39,nso,2235,2235,0.0001\nCC-MAIN-2021-39,nya,16720,16671,0.0006\nCC-MAIN-2021-39,oci,92970,92665,0.0031\nCC-MAIN-2021-39,ori,99474,99378,0.0034\nCC-MAIN-2021-39,orm,15796,15704,0.0005\nCC-MAIN-2021-39,pan,168206,167945,0.0057\nCC-MAIN-2021-39,pol,49252311,48992865,1.6640\nCC-MAIN-2021-39,por,62025631,61701704,2.0955\nCC-MAIN-2021-39,pus,91160,90875,0.0031\nCC-MAIN-2021-39,que,16907,16891,0.0006\nCC-MAIN-2021-39,roh,30190,29244,0.0010\nCC-MAIN-2021-39,ron,18119057,18048184,0.6122\nCC-MAIN-2021-39,run,2489,2442,0.0001\nCC-MAIN-2021-39,rus,193331098,192517009,6.5317\nCC-MAIN-2021-39,sag,446,446,0.0000\nCC-MAIN-2021-39,san,63573,63439,0.0021\nCC-MAIN-2021-39,sco,12471,12405,0.0004\nCC-MAIN-2021-39,sin,222155,221314,0.0075\nCC-MAIN-2021-39,slk,10558282,10509543,0.3567\nCC-MAIN-2021-39,slv,4540437,4512967,0.1534\nCC-MAIN-2021-39,smo,15649,15607,0.0005\nCC-MAIN-2021-39,sna,20189,20153,0.0007\nCC-MAIN-2021-39,snd,34250,34215,0.0012\nCC-MAIN-2021-39,som,144718,144523,0.0049\nCC-MAIN-2021-39,sot,15737,15718,0.0005\nCC-MAIN-2021-39,spa,128796294,128086615,4.3514\nCC-MAIN-2021-39,sqi,1172998,1170229,0.0396\nCC-MAIN-2021-39,srp,6275570,6230466,0.2120\nCC-MAIN-2021-39,ssw,807,791,0.0000\nCC-MAIN-2021-39,sun,30702,30657,0.0010\nCC-MAIN-2021-39,sux,168,168,0.00
00\nCC-MAIN-2021-39,swa,225643,225020,0.0076\nCC-MAIN-2021-39,swe,20675969,20534691,0.6985\nCC-MAIN-2021-39,syr,13348,13315,0.0005\nCC-MAIN-2021-39,tam,1262534,1259598,0.0427\nCC-MAIN-2021-39,tat,245711,245560,0.0083\nCC-MAIN-2021-39,tel,558463,557451,0.0189\nCC-MAIN-2021-39,tgk,155455,155253,0.0053\nCC-MAIN-2021-39,tgl,225799,224645,0.0076\nCC-MAIN-2021-39,tha,14219366,14166494,0.4804\nCC-MAIN-2021-39,tir,19350,19017,0.0007\nCC-MAIN-2021-39,ton,1231,1224,0.0000\nCC-MAIN-2021-39,tsn,3961,3939,0.0001\nCC-MAIN-2021-39,tso,1115,1114,0.0000\nCC-MAIN-2021-39,tuk,70608,70482,0.0024\nCC-MAIN-2021-39,tur,29573875,29447150,0.9991\nCC-MAIN-2021-39,uig,27942,27889,0.0009\nCC-MAIN-2021-39,ukr,12215021,12162147,0.4127\nCC-MAIN-2021-39,urd,827311,821926,0.0280\nCC-MAIN-2021-39,uzb,477001,474844,0.0161\nCC-MAIN-2021-39,ven,1404,1397,0.0000\nCC-MAIN-2021-39,vie,26123743,25950182,0.8826\nCC-MAIN-2021-39,vol,22316,22296,0.0008\nCC-MAIN-2021-39,war,85291,85097,0.0029\nCC-MAIN-2021-39,wol,4612,4580,0.0002\nCC-MAIN-2021-39,xho,59485,59391,0.0020\nCC-MAIN-2021-39,yid,44473,44422,0.0015\nCC-MAIN-2021-39,yor,30355,30284,0.0010\nCC-MAIN-2021-39,zha,1218,1216,0.0000\nCC-MAIN-2021-39,zho,147655310,147248053,4.9885\nCC-MAIN-2021-39,zul,60236,60112,0.0020\nCC-MAIN-2021-43,<unknown>,93142998,93142998,2.7811\nCC-MAIN-2021-43,aar,4126,4116,0.0001\nCC-MAIN-2021-43,abk,12179,11986,0.0004\nCC-MAIN-2021-43,afr,389955,389097,0.0116\nCC-MAIN-2021-43,aka,2522,2494,0.0001\nCC-MAIN-2021-43,amh,110884,110600,0.0033\nCC-MAIN-2021-43,ara,19412267,19334599,0.5796\nCC-MAIN-2021-43,asm,52003,51789,0.0016\nCC-MAIN-2021-43,aym,2416,2363,0.0001\nCC-MAIN-2021-43,aze,1337256,1331928,0.0399\nCC-MAIN-2021-43,bak,38536,38519,0.0012\nCC-MAIN-2021-43,bel,505804,504518,0.0151\nCC-MAIN-2021-43,ben,2824993,2818347,0.0843\nCC-MAIN-2021-43,bih,19580,19556,0.0006\nCC-MAIN-2021-43,bis,4291,4278,0.0001\nCC-MAIN-2021-43,bod,30930,30816,0.0009\nCC-MAIN-2021-43,bos,1375168,1372311,0.0411\nCC-MAIN-2021-43,bre,80958,80908,0.0024\nCC-M
AIN-2021-43,bul,8687306,8661632,0.2594\nCC-MAIN-2021-43,cat,7812200,7773424,0.2333\nCC-MAIN-2021-43,ceb,71591,71561,0.0021\nCC-MAIN-2021-43,ces,33813900,33668785,1.0096\nCC-MAIN-2021-43,chr,1237,1237,0.0000\nCC-MAIN-2021-43,cos,83678,83403,0.0025\nCC-MAIN-2021-43,crs,1889,1882,0.0001\nCC-MAIN-2021-43,cym,374708,373622,0.0112\nCC-MAIN-2021-43,dan,13849487,13772318,0.4135\nCC-MAIN-2021-43,deu,190277957,189155184,5.6813\nCC-MAIN-2021-43,div,60394,60345,0.0018\nCC-MAIN-2021-43,dzo,3617,3617,0.0001\nCC-MAIN-2021-43,ell,18179289,18121369,0.5428\nCC-MAIN-2021-43,eng,1520274370,1511434684,45.3925\nCC-MAIN-2021-43,epo,293783,292992,0.0088\nCC-MAIN-2021-43,est,4555645,4527138,0.1360\nCC-MAIN-2021-43,eus,972507,964201,0.0290\nCC-MAIN-2021-43,fao,116921,116529,0.0035\nCC-MAIN-2021-43,fas,21077413,20912105,0.6293\nCC-MAIN-2021-43,fij,3806,3767,0.0001\nCC-MAIN-2021-43,fin,13267600,13199824,0.3961\nCC-MAIN-2021-43,fra,147941614,147165708,4.4173\nCC-MAIN-2021-43,fry,103313,103031,0.0031\nCC-MAIN-2021-43,gla,65853,65663,0.0020\nCC-MAIN-2021-43,gle,183645,182747,0.0055\nCC-MAIN-2021-43,glg,1259498,1255030,0.0376\nCC-MAIN-2021-43,glv,12974,12957,0.0004\nCC-MAIN-2021-43,got,1395,1394,0.0000\nCC-MAIN-2021-43,grn,21238,21160,0.0006\nCC-MAIN-2021-43,guj,344967,344373,0.0103\nCC-MAIN-2021-43,hat,47493,47381,0.0014\nCC-MAIN-2021-43,hau,109131,108476,0.0033\nCC-MAIN-2021-43,haw,17476,17459,0.0005\nCC-MAIN-2021-43,heb,7996327,7960445,0.2388\nCC-MAIN-2021-43,hin,4245452,4234544,0.1268\nCC-MAIN-2021-43,hmn,16246,16214,0.0005\nCC-MAIN-2021-43,hrv,6397941,6375376,0.1910\nCC-MAIN-2021-43,hun,18238851,18172627,0.5446\nCC-MAIN-2021-43,hye,1012463,1009812,0.0302\nCC-MAIN-2021-43,ibo,17841,17800,0.0005\nCC-MAIN-2021-43,iku,6501,6483,0.0002\nCC-MAIN-2021-43,ile,9314,9286,0.0003\nCC-MAIN-2021-43,ina,18237,18217,0.0005\nCC-MAIN-2021-43,ind,27902794,27810589,0.8331\nCC-MAIN-2021-43,ipk,2552,2548,0.0001\nCC-MAIN-2021-43,isl,1263380,1258742,0.0377\nCC-MAIN-2021-43,ita,80712457,80349384,2.4099\nCC-MAIN-2021-
43,jav,65738,65703,0.0020\nCC-MAIN-2021-43,jpn,159199562,158696026,4.7534\nCC-MAIN-2021-43,kal,38615,38486,0.0012\nCC-MAIN-2021-43,kan,319644,319225,0.0095\nCC-MAIN-2021-43,kas,216,216,0.0000\nCC-MAIN-2021-43,kat,1194112,1190652,0.0357\nCC-MAIN-2021-43,kaz,747873,746732,0.0223\nCC-MAIN-2021-43,kha,5882,5878,0.0002\nCC-MAIN-2021-43,khm,303974,303657,0.0091\nCC-MAIN-2021-43,kin,65460,65220,0.0020\nCC-MAIN-2021-43,kir,170220,169761,0.0051\nCC-MAIN-2021-43,kor,21553744,21433208,0.6436\nCC-MAIN-2021-43,kur,171092,170228,0.0051\nCC-MAIN-2021-43,lao,129270,128171,0.0039\nCC-MAIN-2021-43,lat,3864966,3859731,0.1154\nCC-MAIN-2021-43,lav,2973049,2956188,0.0888\nCC-MAIN-2021-43,lif,162,152,0.0000\nCC-MAIN-2021-43,lin,6403,6375,0.0002\nCC-MAIN-2021-43,lit,5679670,5656641,0.1696\nCC-MAIN-2021-43,ltz,124041,123689,0.0037\nCC-MAIN-2021-43,lug,3700,3663,0.0001\nCC-MAIN-2021-43,mal,621034,618019,0.0185\nCC-MAIN-2021-43,mar,592738,590543,0.0177\nCC-MAIN-2021-43,mfe,2537,2520,0.0001\nCC-MAIN-2021-43,mkd,997757,994653,0.0298\nCC-MAIN-2021-43,mlg,83375,83095,0.0025\nCC-MAIN-2021-43,mlt,141224,138128,0.0042\nCC-MAIN-2021-43,mon,495828,495170,0.0148\nCC-MAIN-2021-43,mri,47610,47508,0.0014\nCC-MAIN-2021-43,msa,2683546,2675957,0.0801\nCC-MAIN-2021-43,mya,375686,374787,0.0112\nCC-MAIN-2021-43,nau,852,849,0.0000\nCC-MAIN-2021-43,nep,960924,959920,0.0287\nCC-MAIN-2021-43,nld,60556279,60216916,1.8081\nCC-MAIN-2021-43,nno,565374,561548,0.0169\nCC-MAIN-2021-43,nor,11316875,11242692,0.3379\nCC-MAIN-2021-43,nso,3331,3331,0.0001\nCC-MAIN-2021-43,nya,14744,14718,0.0004\nCC-MAIN-2021-43,oci,90146,89929,0.0027\nCC-MAIN-2021-43,ori,131089,130952,0.0039\nCC-MAIN-2021-43,orm,14910,14855,0.0004\nCC-MAIN-2021-43,pan,156739,156457,0.0047\nCC-MAIN-2021-43,pol,54308987,54043690,1.6216\nCC-MAIN-2021-43,por,73063314,72740460,2.1815\nCC-MAIN-2021-43,pus,98806,98557,0.0030\nCC-MAIN-2021-43,que,23361,23345,0.0007\nCC-MAIN-2021-43,roh,44438,43164,0.0013\nCC-MAIN-2021-43,ron,20223721,20146867,0.6038\nCC-MAIN-2021-43,r
un,2345,2294,0.0001\nCC-MAIN-2021-43,rus,227642136,226651106,6.7970\nCC-MAIN-2021-43,sag,390,390,0.0000\nCC-MAIN-2021-43,san,91350,91120,0.0027\nCC-MAIN-2021-43,sco,18002,17974,0.0005\nCC-MAIN-2021-43,sin,267041,266190,0.0080\nCC-MAIN-2021-43,slk,11599469,11550163,0.3463\nCC-MAIN-2021-43,slv,4946344,4923233,0.1477\nCC-MAIN-2021-43,smo,14592,14570,0.0004\nCC-MAIN-2021-43,sna,19274,19222,0.0006\nCC-MAIN-2021-43,snd,32091,32068,0.0010\nCC-MAIN-2021-43,som,157189,157039,0.0047\nCC-MAIN-2021-43,sot,14589,14542,0.0004\nCC-MAIN-2021-43,spa,144509768,143771991,4.3148\nCC-MAIN-2021-43,sqi,1250185,1245607,0.0373\nCC-MAIN-2021-43,srp,6950333,6919893,0.2075\nCC-MAIN-2021-43,ssw,1171,1160,0.0000\nCC-MAIN-2021-43,sun,34878,34832,0.0010\nCC-MAIN-2021-43,sux,81,81,0.0000\nCC-MAIN-2021-43,swa,242022,241570,0.0072\nCC-MAIN-2021-43,swe,23607101,23472889,0.7049\nCC-MAIN-2021-43,syr,18671,18653,0.0006\nCC-MAIN-2021-43,tam,1336627,1332283,0.0399\nCC-MAIN-2021-43,tat,249531,249192,0.0075\nCC-MAIN-2021-43,tel,517401,515655,0.0154\nCC-MAIN-2021-43,tgk,138541,138411,0.0041\nCC-MAIN-2021-43,tgl,258358,257184,0.0077\nCC-MAIN-2021-43,tha,12375695,12325611,0.3695\nCC-MAIN-2021-43,tir,28753,28581,0.0009\nCC-MAIN-2021-43,ton,1771,1760,0.0001\nCC-MAIN-2021-43,tsn,3332,3299,0.0001\nCC-MAIN-2021-43,tso,2540,2538,0.0001\nCC-MAIN-2021-43,tuk,74999,74927,0.0022\nCC-MAIN-2021-43,tur,32259542,32136886,0.9632\nCC-MAIN-2021-43,uig,38002,37955,0.0011\nCC-MAIN-2021-43,ukr,13496052,13429025,0.4030\nCC-MAIN-2021-43,urd,868468,864123,0.0259\nCC-MAIN-2021-43,uzb,515752,513975,0.0154\nCC-MAIN-2021-43,ven,1661,1659,0.0000\nCC-MAIN-2021-43,vie,28225816,28075820,0.8428\nCC-MAIN-2021-43,vol,26133,26109,0.0008\nCC-MAIN-2021-43,war,84197,84019,0.0025\nCC-MAIN-2021-43,wol,5551,5520,0.0002\nCC-MAIN-2021-43,xho,70212,70144,0.0021\nCC-MAIN-2021-43,yid,51122,51083,0.0015\nCC-MAIN-2021-43,yor,34554,34477,0.0010\nCC-MAIN-2021-43,zha,1894,1892,0.0001\nCC-MAIN-2021-43,zho,161716903,161283879,4.8286\nCC-MAIN-2021-43,zul,67851,677
42,0.0020\nCC-MAIN-2021-49,<unknown>,94003828,94003828,3.7199\nCC-MAIN-2021-49,aar,4557,4544,0.0002\nCC-MAIN-2021-49,abk,11223,11161,0.0004\nCC-MAIN-2021-49,afr,320822,320176,0.0127\nCC-MAIN-2021-49,aka,1745,1705,0.0001\nCC-MAIN-2021-49,amh,68844,68532,0.0027\nCC-MAIN-2021-49,ara,16347478,16269557,0.6469\nCC-MAIN-2021-49,asm,39572,39507,0.0016\nCC-MAIN-2021-49,aym,973,962,0.0000\nCC-MAIN-2021-49,aze,1139930,1136153,0.0451\nCC-MAIN-2021-49,bak,24900,24864,0.0010\nCC-MAIN-2021-49,bel,399247,398160,0.0158\nCC-MAIN-2021-49,ben,2166543,2160379,0.0857\nCC-MAIN-2021-49,bih,10884,10865,0.0004\nCC-MAIN-2021-49,bis,2205,2196,0.0001\nCC-MAIN-2021-49,bod,24899,24789,0.0010\nCC-MAIN-2021-49,bos,1108938,1106381,0.0439\nCC-MAIN-2021-49,bre,64835,64788,0.0026\nCC-MAIN-2021-49,bul,6460279,6432289,0.2556\nCC-MAIN-2021-49,cat,5892859,5857994,0.2332\nCC-MAIN-2021-49,ceb,58334,58238,0.0023\nCC-MAIN-2021-49,ces,23161720,23001718,0.9165\nCC-MAIN-2021-49,chr,733,732,0.0000\nCC-MAIN-2021-49,cos,60143,59888,0.0024\nCC-MAIN-2021-49,crs,2229,2217,0.0001\nCC-MAIN-2021-49,cym,340179,338974,0.0135\nCC-MAIN-2021-49,dan,10122813,10052372,0.4006\nCC-MAIN-2021-49,deu,136673952,135618923,5.4084\nCC-MAIN-2021-49,div,49320,49252,0.0020\nCC-MAIN-2021-49,dzo,3689,3688,0.0001\nCC-MAIN-2021-49,ell,13811330,13758817,0.5465\nCC-MAIN-2021-49,eng,1168824626,1160086034,46.2521\nCC-MAIN-2021-49,epo,253874,251725,0.0100\nCC-MAIN-2021-49,est,3421845,3393267,0.1354\nCC-MAIN-2021-49,eus,824831,817156,0.0326\nCC-MAIN-2021-49,fao,83668,83301,0.0033\nCC-MAIN-2021-49,fas,14860547,14705131,0.5881\nCC-MAIN-2021-49,fij,3538,3524,0.0001\nCC-MAIN-2021-49,fin,9666634,9604676,0.3825\nCC-MAIN-2021-49,fra,111043269,110321731,4.3941\nCC-MAIN-2021-49,fry,84160,83774,0.0033\nCC-MAIN-2021-49,gla,70907,70833,0.0028\nCC-MAIN-2021-49,gle,145869,145197,0.0058\nCC-MAIN-2021-49,glg,1032224,1026969,0.0408\nCC-MAIN-2021-49,glv,6800,6780,0.0003\nCC-MAIN-2021-49,got,550,549,0.0000\nCC-MAIN-2021-49,grn,13550,13499,0.0005\nCC-MAIN-2021-49,guj,28
7542,286972,0.0114\nCC-MAIN-2021-49,hat,40212,40063,0.0016\nCC-MAIN-2021-49,hau,80351,79346,0.0032\nCC-MAIN-2021-49,haw,15661,15615,0.0006\nCC-MAIN-2021-49,heb,6062463,6032552,0.2399\nCC-MAIN-2021-49,hin,3348259,3335448,0.1325\nCC-MAIN-2021-49,hmn,18017,17939,0.0007\nCC-MAIN-2021-49,hrv,4978946,4951876,0.1970\nCC-MAIN-2021-49,hun,13718200,13649415,0.5428\nCC-MAIN-2021-49,hye,828167,825718,0.0328\nCC-MAIN-2021-49,ibo,15972,15935,0.0006\nCC-MAIN-2021-49,iku,5236,5230,0.0002\nCC-MAIN-2021-49,ile,7613,7591,0.0003\nCC-MAIN-2021-49,ina,15507,15486,0.0006\nCC-MAIN-2021-49,ind,19281673,19173586,0.7630\nCC-MAIN-2021-49,ipk,1970,1956,0.0001\nCC-MAIN-2021-49,isl,922259,917575,0.0365\nCC-MAIN-2021-49,ita,60471297,60132920,2.3929\nCC-MAIN-2021-49,jav,48605,48454,0.0019\nCC-MAIN-2021-49,jpn,108311654,107814521,4.2860\nCC-MAIN-2021-49,kal,27163,27042,0.0011\nCC-MAIN-2021-49,kan,272861,272352,0.0108\nCC-MAIN-2021-49,kas,129,129,0.0000\nCC-MAIN-2021-49,kat,992973,989716,0.0393\nCC-MAIN-2021-49,kaz,555626,554201,0.0220\nCC-MAIN-2021-49,kha,4851,4768,0.0002\nCC-MAIN-2021-49,khm,215425,214859,0.0085\nCC-MAIN-2021-49,kin,49908,49818,0.0020\nCC-MAIN-2021-49,kir,136596,136354,0.0054\nCC-MAIN-2021-49,kor,18604370,18402163,0.7362\nCC-MAIN-2021-49,kur,144914,143823,0.0057\nCC-MAIN-2021-49,lao,93007,92261,0.0037\nCC-MAIN-2021-49,lat,1833865,1827739,0.0726\nCC-MAIN-2021-49,lav,2303398,2291205,0.0911\nCC-MAIN-2021-49,lif,113,113,0.0000\nCC-MAIN-2021-49,lin,5257,5213,0.0002\nCC-MAIN-2021-49,lit,4421902,4402659,0.1750\nCC-MAIN-2021-49,ltz,83693,83398,0.0033\nCC-MAIN-2021-49,lug,3198,3169,0.0001\nCC-MAIN-2021-49,mal,488809,487609,0.0193\nCC-MAIN-2021-49,mar,483980,482991,0.0192\nCC-MAIN-2021-49,mfe,1970,1965,0.0001\nCC-MAIN-2021-49,mkd,811759,809024,0.0321\nCC-MAIN-2021-49,mlg,58250,57991,0.0023\nCC-MAIN-2021-49,mlt,136165,134569,0.0054\nCC-MAIN-2021-49,mon,435278,433913,0.0172\nCC-MAIN-2021-49,mri,38098,37971,0.0015\nCC-MAIN-2021-49,msa,1848097,1842096,0.0731\nCC-MAIN-2021-49,mya,274586,273729,0.
0109\nCC-MAIN-2021-49,nau,897,896,0.0000\nCC-MAIN-2021-49,nep,683816,682858,0.0271\nCC-MAIN-2021-49,nld,41843364,41508122,1.6558\nCC-MAIN-2021-49,nno,403536,399628,0.0160\nCC-MAIN-2021-49,nor,8173983,8111060,0.3235\nCC-MAIN-2021-49,nso,1280,1278,0.0001\nCC-MAIN-2021-49,nya,17140,17078,0.0007\nCC-MAIN-2021-49,oci,69114,68919,0.0027\nCC-MAIN-2021-49,ori,120695,120586,0.0048\nCC-MAIN-2021-49,orm,10525,10488,0.0004\nCC-MAIN-2021-49,pan,126256,125450,0.0050\nCC-MAIN-2021-49,pol,39876582,39621338,1.5780\nCC-MAIN-2021-49,por,53292112,52994983,2.1088\nCC-MAIN-2021-49,pus,88650,88425,0.0035\nCC-MAIN-2021-49,que,13441,13433,0.0005\nCC-MAIN-2021-49,roh,29381,28395,0.0012\nCC-MAIN-2021-49,ron,15132705,15063189,0.5988\nCC-MAIN-2021-49,run,1382,1379,0.0001\nCC-MAIN-2021-49,rus,151492137,150615427,5.9948\nCC-MAIN-2021-49,sag,558,558,0.0000\nCC-MAIN-2021-49,san,63773,63523,0.0025\nCC-MAIN-2021-49,sco,11749,11717,0.0005\nCC-MAIN-2021-49,sin,209037,208318,0.0083\nCC-MAIN-2021-49,slk,8390690,8344964,0.3320\nCC-MAIN-2021-49,slv,3754303,3734207,0.1486\nCC-MAIN-2021-49,smo,15362,15340,0.0006\nCC-MAIN-2021-49,sna,15089,15057,0.0006\nCC-MAIN-2021-49,snd,30065,30046,0.0012\nCC-MAIN-2021-49,som,104964,104776,0.0042\nCC-MAIN-2021-49,sot,14332,14251,0.0006\nCC-MAIN-2021-49,spa,105100430,104429291,4.1590\nCC-MAIN-2021-49,sqi,1017679,1014674,0.0403\nCC-MAIN-2021-49,srp,5186480,5157855,0.2052\nCC-MAIN-2021-49,ssw,648,645,0.0000\nCC-MAIN-2021-49,sun,28841,28792,0.0011\nCC-MAIN-2021-49,sux,95,95,0.0000\nCC-MAIN-2021-49,swa,204325,203838,0.0081\nCC-MAIN-2021-49,swe,16793002,16660052,0.6645\nCC-MAIN-2021-49,syr,20263,20249,0.0008\nCC-MAIN-2021-49,tam,1068325,1065490,0.0423\nCC-MAIN-2021-49,tat,185169,184617,0.0073\nCC-MAIN-2021-49,tel,426256,425263,0.0169\nCC-MAIN-2021-49,tgk,101690,101499,0.0040\nCC-MAIN-2021-49,tgl,219958,219197,0.0087\nCC-MAIN-2021-49,tha,9815851,9764283,0.3884\nCC-MAIN-2021-49,tir,11996,11885,0.0005\nCC-MAIN-2021-49,ton,1637,1631,0.0001\nCC-MAIN-2021-49,tsn,3723,3707,0.0001\nCC-M
AIN-2021-49,tso,1286,1281,0.0001\nCC-MAIN-2021-49,tuk,64484,64417,0.0026\nCC-MAIN-2021-49,tur,22351327,22240149,0.8845\nCC-MAIN-2021-49,uig,27192,27139,0.0011\nCC-MAIN-2021-49,ukr,9766849,9711382,0.3865\nCC-MAIN-2021-49,urd,687734,684226,0.0272\nCC-MAIN-2021-49,uzb,394696,393074,0.0156\nCC-MAIN-2021-49,ven,1184,1181,0.0000\nCC-MAIN-2021-49,vie,19885107,19748878,0.7869\nCC-MAIN-2021-49,vol,23471,23450,0.0009\nCC-MAIN-2021-49,war,73298,73104,0.0029\nCC-MAIN-2021-49,wol,3656,3613,0.0001\nCC-MAIN-2021-49,xho,72442,72368,0.0029\nCC-MAIN-2021-49,yid,45856,45828,0.0018\nCC-MAIN-2021-49,yor,27734,27666,0.0011\nCC-MAIN-2021-49,zha,1217,1214,0.0000\nCC-MAIN-2021-49,zho,133898761,133469265,5.2986\nCC-MAIN-2021-49,zul,74479,74392,0.0029\nCC-MAIN-2022-05,<unknown>,82498768,82498768,2.7625\nCC-MAIN-2022-05,aar,5021,5006,0.0002\nCC-MAIN-2022-05,abk,12807,12728,0.0004\nCC-MAIN-2022-05,afr,427429,426868,0.0143\nCC-MAIN-2022-05,aka,2637,2589,0.0001\nCC-MAIN-2022-05,amh,91098,90866,0.0031\nCC-MAIN-2022-05,ara,18163911,18071920,0.6082\nCC-MAIN-2022-05,asm,48560,48500,0.0016\nCC-MAIN-2022-05,aym,1256,1229,0.0000\nCC-MAIN-2022-05,aze,1208944,1204992,0.0405\nCC-MAIN-2022-05,bak,59597,59573,0.0020\nCC-MAIN-2022-05,bel,456987,456222,0.0153\nCC-MAIN-2022-05,ben,2405776,2398481,0.0806\nCC-MAIN-2022-05,bih,17529,17515,0.0006\nCC-MAIN-2022-05,bis,3331,3323,0.0001\nCC-MAIN-2022-05,bod,28697,28585,0.0010\nCC-MAIN-2022-05,bos,1239636,1236910,0.0415\nCC-MAIN-2022-05,bre,70696,70623,0.0024\nCC-MAIN-2022-05,bul,7856701,7831332,0.2631\nCC-MAIN-2022-05,cat,6992440,6953796,0.2341\nCC-MAIN-2022-05,ceb,60469,60296,0.0020\nCC-MAIN-2022-05,ces,29979668,29802367,1.0039\nCC-MAIN-2022-05,chr,1176,1176,0.0000\nCC-MAIN-2022-05,cos,71699,71503,0.0024\nCC-MAIN-2022-05,crs,2044,2039,0.0001\nCC-MAIN-2022-05,cym,358449,357470,0.0120\nCC-MAIN-2022-05,dan,12482629,12413621,0.4180\nCC-MAIN-2022-05,deu,167333379,166247626,5.6032\nCC-MAIN-2022-05,div,63860,63792,0.0021\nCC-MAIN-2022-05,dzo,3239,3239,0.0001\nCC-MAIN-2022-0
5,ell,16115830,16054599,0.5396\nCC-MAIN-2022-05,eng,1387357238,1379336982,46.4560\nCC-MAIN-2022-05,epo,256861,255643,0.0086\nCC-MAIN-2022-05,est,4041128,4012124,0.1353\nCC-MAIN-2022-05,eus,935103,927004,0.0313\nCC-MAIN-2022-05,fao,110865,110531,0.0037\nCC-MAIN-2022-05,fas,18307684,18194352,0.6130\nCC-MAIN-2022-05,fij,4687,4686,0.0002\nCC-MAIN-2022-05,fin,11787069,11724587,0.3947\nCC-MAIN-2022-05,fra,133048407,132347917,4.4552\nCC-MAIN-2022-05,fry,102273,101987,0.0034\nCC-MAIN-2022-05,gla,52279,52141,0.0018\nCC-MAIN-2022-05,gle,170328,169740,0.0057\nCC-MAIN-2022-05,glg,1200584,1196480,0.0402\nCC-MAIN-2022-05,glv,10471,10438,0.0004\nCC-MAIN-2022-05,got,901,899,0.0000\nCC-MAIN-2022-05,grn,20772,20727,0.0007\nCC-MAIN-2022-05,guj,330541,326511,0.0111\nCC-MAIN-2022-05,hat,39640,39504,0.0013\nCC-MAIN-2022-05,hau,80407,79518,0.0027\nCC-MAIN-2022-05,haw,19968,19929,0.0007\nCC-MAIN-2022-05,heb,7008768,6976965,0.2347\nCC-MAIN-2022-05,hin,3818424,3805788,0.1279\nCC-MAIN-2022-05,hmn,16486,16384,0.0006\nCC-MAIN-2022-05,hrv,5822146,5799379,0.1950\nCC-MAIN-2022-05,hun,16365842,16292205,0.5480\nCC-MAIN-2022-05,hye,896285,893433,0.0300\nCC-MAIN-2022-05,ibo,17503,17480,0.0006\nCC-MAIN-2022-05,iku,6038,6033,0.0002\nCC-MAIN-2022-05,ile,10615,10579,0.0004\nCC-MAIN-2022-05,ina,19374,19338,0.0006\nCC-MAIN-2022-05,ind,22711640,22565938,0.7605\nCC-MAIN-2022-05,ipk,2524,2520,0.0001\nCC-MAIN-2022-05,isl,1127976,1123017,0.0378\nCC-MAIN-2022-05,ita,71306214,70966098,2.3877\nCC-MAIN-2022-05,jav,55991,55911,0.0019\nCC-MAIN-2022-05,jpn,142564442,142089605,4.7738\nCC-MAIN-2022-05,kal,31003,30797,0.0010\nCC-MAIN-2022-05,kan,307019,305613,0.0103\nCC-MAIN-2022-05,kas,194,194,0.0000\nCC-MAIN-2022-05,kat,1081365,1077965,0.0362\nCC-MAIN-2022-05,kaz,631938,630272,0.0212\nCC-MAIN-2022-05,kha,4587,4573,0.0002\nCC-MAIN-2022-05,khm,247436,246735,0.0083\nCC-MAIN-2022-05,kin,50298,49981,0.0017\nCC-MAIN-2022-05,kir,145305,144980,0.0049\nCC-MAIN-2022-05,kor,20076437,19990873,0.6723\nCC-MAIN-2022-05,kur,165794,1647
03,0.0056\nCC-MAIN-2022-05,lao,109084,108696,0.0037\nCC-MAIN-2022-05,lat,2974541,2967060,0.0996\nCC-MAIN-2022-05,lav,2462813,2446013,0.0825\nCC-MAIN-2022-05,lif,94,87,0.0000\nCC-MAIN-2022-05,lin,6583,6541,0.0002\nCC-MAIN-2022-05,lit,4682654,4661205,0.1568\nCC-MAIN-2022-05,ltz,98463,98145,0.0033\nCC-MAIN-2022-05,lug,3311,3280,0.0001\nCC-MAIN-2022-05,mal,572520,570514,0.0192\nCC-MAIN-2022-05,mar,553167,552523,0.0185\nCC-MAIN-2022-05,mfe,2186,2184,0.0001\nCC-MAIN-2022-05,mkd,911033,908572,0.0305\nCC-MAIN-2022-05,mlg,69129,68906,0.0023\nCC-MAIN-2022-05,mlt,126584,122286,0.0042\nCC-MAIN-2022-05,mon,476543,475676,0.0160\nCC-MAIN-2022-05,mri,36046,35905,0.0012\nCC-MAIN-2022-05,msa,2293449,2285273,0.0768\nCC-MAIN-2022-05,mya,324510,322964,0.0109\nCC-MAIN-2022-05,nau,1070,1069,0.0000\nCC-MAIN-2022-05,nep,816721,815714,0.0273\nCC-MAIN-2022-05,nld,52963777,52655258,1.7735\nCC-MAIN-2022-05,nno,479737,477012,0.0161\nCC-MAIN-2022-05,nor,9520368,9460271,0.3188\nCC-MAIN-2022-05,nso,2502,2499,0.0001\nCC-MAIN-2022-05,nya,15587,15545,0.0005\nCC-MAIN-2022-05,oci,94105,90252,0.0032\nCC-MAIN-2022-05,ori,104392,104312,0.0035\nCC-MAIN-2022-05,orm,12288,12252,0.0004\nCC-MAIN-2022-05,pan,153000,152616,0.0051\nCC-MAIN-2022-05,pol,48024355,47791067,1.6081\nCC-MAIN-2022-05,por,61798069,61534375,2.0693\nCC-MAIN-2022-05,pus,85069,84899,0.0028\nCC-MAIN-2022-05,que,17806,17802,0.0006\nCC-MAIN-2022-05,roh,26891,26096,0.0009\nCC-MAIN-2022-05,ron,17424456,17352931,0.5835\nCC-MAIN-2022-05,run,1910,1907,0.0001\nCC-MAIN-2022-05,rus,186390406,185683668,6.2413\nCC-MAIN-2022-05,sag,425,425,0.0000\nCC-MAIN-2022-05,san,63975,63710,0.0021\nCC-MAIN-2022-05,sco,16334,16293,0.0005\nCC-MAIN-2022-05,sin,230318,229681,0.0077\nCC-MAIN-2022-05,slk,10150523,10104580,0.3399\nCC-MAIN-2022-05,slv,4735513,4714969,0.1586\nCC-MAIN-2022-05,smo,14613,14585,0.0005\nCC-MAIN-2022-05,sna,16375,16327,0.0005\nCC-MAIN-2022-05,snd,30187,29967,0.0010\nCC-MAIN-2022-05,som,125650,125447,0.0042\nCC-MAIN-2022-05,sot,12846,12781,0.0004\nCC-
MAIN-2022-05,spa,127039018,126370201,4.2539\nCC-MAIN-2022-05,sqi,1098424,1095531,0.0368\nCC-MAIN-2022-05,srp,6119453,6093269,0.2049\nCC-MAIN-2022-05,ssw,941,934,0.0000\nCC-MAIN-2022-05,sun,30978,30911,0.0010\nCC-MAIN-2022-05,sux,130,130,0.0000\nCC-MAIN-2022-05,swa,222504,222111,0.0075\nCC-MAIN-2022-05,swe,20373346,20248061,0.6822\nCC-MAIN-2022-05,syr,19324,19308,0.0006\nCC-MAIN-2022-05,tam,1202017,1198996,0.0402\nCC-MAIN-2022-05,tat,238301,237896,0.0080\nCC-MAIN-2022-05,tel,492080,487437,0.0165\nCC-MAIN-2022-05,tgk,126688,126444,0.0042\nCC-MAIN-2022-05,tgl,246381,243209,0.0083\nCC-MAIN-2022-05,tha,11291658,11239632,0.3781\nCC-MAIN-2022-05,tir,20243,20151,0.0007\nCC-MAIN-2022-05,ton,1648,1644,0.0001\nCC-MAIN-2022-05,tsn,2873,2863,0.0001\nCC-MAIN-2022-05,tso,2327,2326,0.0001\nCC-MAIN-2022-05,tuk,61349,61218,0.0021\nCC-MAIN-2022-05,tur,25532435,25425996,0.8550\nCC-MAIN-2022-05,uig,31140,31105,0.0010\nCC-MAIN-2022-05,ukr,12015620,11952625,0.4023\nCC-MAIN-2022-05,urd,768471,763306,0.0257\nCC-MAIN-2022-05,uzb,442926,441511,0.0148\nCC-MAIN-2022-05,ven,685,679,0.0000\nCC-MAIN-2022-05,vie,25024426,24912070,0.8379\nCC-MAIN-2022-05,vol,26191,26178,0.0009\nCC-MAIN-2022-05,war,81277,81054,0.0027\nCC-MAIN-2022-05,wol,4527,4511,0.0002\nCC-MAIN-2022-05,xho,64460,64357,0.0022\nCC-MAIN-2022-05,yid,48045,48019,0.0016\nCC-MAIN-2022-05,yor,34302,34238,0.0011\nCC-MAIN-2022-05,zha,2037,2036,0.0001\nCC-MAIN-2022-05,zho,144190313,143776927,4.8282\nCC-MAIN-2022-05,zul,70401,70259,0.0024\nCC-MAIN-2022-21,<unknown>,89279358,89279358,2.5879\nCC-MAIN-2022-21,aar,5486,5469,0.0002\nCC-MAIN-2022-21,abk,16086,15958,0.0005\nCC-MAIN-2022-21,afr,372487,369332,0.0108\nCC-MAIN-2022-21,aka,2061,2028,0.0001\nCC-MAIN-2022-21,amh,112813,112382,0.0033\nCC-MAIN-2022-21,ara,19454430,19368286,0.5639\nCC-MAIN-2022-21,asm,68521,68035,0.0020\nCC-MAIN-2022-21,aym,1532,1502,0.0000\nCC-MAIN-2022-21,aze,1334263,1328031,0.0387\nCC-MAIN-2022-21,bak,41044,41034,0.0012\nCC-MAIN-2022-21,bel,462891,462038,0.0134\nCC-MAIN-202
2-21,ben,2756029,2746871,0.0799\nCC-MAIN-2022-21,bih,21141,21112,0.0006\nCC-MAIN-2022-21,bis,4972,4837,0.0001\nCC-MAIN-2022-21,bod,29694,29515,0.0009\nCC-MAIN-2022-21,bos,1335430,1329556,0.0387\nCC-MAIN-2022-21,bre,81824,81768,0.0024\nCC-MAIN-2022-21,bul,8782407,8747130,0.2546\nCC-MAIN-2022-21,cat,7708136,7644778,0.2234\nCC-MAIN-2022-21,ceb,69580,69534,0.0020\nCC-MAIN-2022-21,ces,33967256,33722840,0.9846\nCC-MAIN-2022-21,chr,1391,1390,0.0000\nCC-MAIN-2022-21,cos,82890,82683,0.0024\nCC-MAIN-2022-21,crs,2454,2437,0.0001\nCC-MAIN-2022-21,cym,367443,365487,0.0107\nCC-MAIN-2022-21,dan,14061258,13947699,0.4076\nCC-MAIN-2022-21,deu,188695624,187212561,5.4697\nCC-MAIN-2022-21,div,65445,65417,0.0019\nCC-MAIN-2022-21,dzo,4642,4641,0.0001\nCC-MAIN-2022-21,ell,17758841,17686492,0.5148\nCC-MAIN-2022-21,eng,1649444572,1637364487,47.8124\nCC-MAIN-2022-21,epo,277407,275075,0.0080\nCC-MAIN-2022-21,est,4140465,4119751,0.1200\nCC-MAIN-2022-21,eus,1031283,1021220,0.0299\nCC-MAIN-2022-21,fao,126005,125581,0.0037\nCC-MAIN-2022-21,fas,20131308,20022940,0.5835\nCC-MAIN-2022-21,fij,2926,2919,0.0001\nCC-MAIN-2022-21,fin,13274649,13176626,0.3848\nCC-MAIN-2022-21,fra,148023310,146997497,4.2907\nCC-MAIN-2022-21,fry,94449,94094,0.0027\nCC-MAIN-2022-21,gla,55377,55269,0.0016\nCC-MAIN-2022-21,gle,202377,201248,0.0059\nCC-MAIN-2022-21,glg,1271752,1264961,0.0369\nCC-MAIN-2022-21,glv,12797,12757,0.0004\nCC-MAIN-2022-21,got,738,737,0.0000\nCC-MAIN-2022-21,grn,21512,21420,0.0006\nCC-MAIN-2022-21,guj,387403,369082,0.0112\nCC-MAIN-2022-21,hat,48990,48895,0.0014\nCC-MAIN-2022-21,hau,82360,82134,0.0024\nCC-MAIN-2022-21,haw,20755,20735,0.0006\nCC-MAIN-2022-21,heb,7959664,7919696,0.2307\nCC-MAIN-2022-21,hin,4566598,4551627,0.1324\nCC-MAIN-2022-21,hmn,18884,18831,0.0005\nCC-MAIN-2022-21,hrv,6453544,6422192,0.1871\nCC-MAIN-2022-21,hun,18853729,18760337,0.5465\nCC-MAIN-2022-21,hye,978825,974425,0.0284\nCC-MAIN-2022-21,ibo,17818,17782,0.0005\nCC-MAIN-2022-21,iku,5433,5414,0.0002\nCC-MAIN-2022-21,ile,9251,9233,0.
0003\nCC-MAIN-2022-21,ina,18106,18064,0.0005\nCC-MAIN-2022-21,ind,24272793,24140389,0.7036\nCC-MAIN-2022-21,ipk,1853,1846,0.0001\nCC-MAIN-2022-21,isl,1272934,1263601,0.0369\nCC-MAIN-2022-21,ita,80476893,79996163,2.3328\nCC-MAIN-2022-21,jav,67086,67041,0.0019\nCC-MAIN-2022-21,jpn,167972833,167286988,4.8690\nCC-MAIN-2022-21,kal,25881,25760,0.0008\nCC-MAIN-2022-21,kan,352409,351422,0.0102\nCC-MAIN-2022-21,kas,145,145,0.0000\nCC-MAIN-2022-21,kat,1104838,1100509,0.0320\nCC-MAIN-2022-21,kaz,682227,680427,0.0198\nCC-MAIN-2022-21,kha,6488,6467,0.0002\nCC-MAIN-2022-21,khm,306429,304952,0.0089\nCC-MAIN-2022-21,kin,57896,57646,0.0017\nCC-MAIN-2022-21,kir,153888,153442,0.0045\nCC-MAIN-2022-21,kor,20130447,20051534,0.5835\nCC-MAIN-2022-21,kur,187001,186476,0.0054\nCC-MAIN-2022-21,lao,115726,114896,0.0034\nCC-MAIN-2022-21,lat,3717257,3705531,0.1078\nCC-MAIN-2022-21,lav,2669221,2654501,0.0774\nCC-MAIN-2022-21,lif,58,58,0.0000\nCC-MAIN-2022-21,lin,7013,6981,0.0002\nCC-MAIN-2022-21,lit,5395529,5365322,0.1564\nCC-MAIN-2022-21,ltz,115675,115316,0.0034\nCC-MAIN-2022-21,lug,4793,4748,0.0001\nCC-MAIN-2022-21,mal,691943,689936,0.0201\nCC-MAIN-2022-21,mar,648697,647081,0.0188\nCC-MAIN-2022-21,mfe,2730,2717,0.0001\nCC-MAIN-2022-21,mkd,1004598,1001529,0.0291\nCC-MAIN-2022-21,mlg,70014,69722,0.0020\nCC-MAIN-2022-21,mlt,119892,118307,0.0035\nCC-MAIN-2022-21,mon,573389,571923,0.0166\nCC-MAIN-2022-21,mri,44275,44106,0.0013\nCC-MAIN-2022-21,msa,2479172,2471607,0.0719\nCC-MAIN-2022-21,mya,331390,330667,0.0096\nCC-MAIN-2022-21,nau,1144,1139,0.0000\nCC-MAIN-2022-21,nep,902827,901296,0.0262\nCC-MAIN-2022-21,nld,62323240,61853434,1.8066\nCC-MAIN-2022-21,nno,550538,548058,0.0160\nCC-MAIN-2022-21,nor,11015304,10928805,0.3193\nCC-MAIN-2022-21,nso,2231,2231,0.0001\nCC-MAIN-2022-21,nya,18593,18511,0.0005\nCC-MAIN-2022-21,oci,98907,98086,0.0029\nCC-MAIN-2022-21,ori,119739,119595,0.0035\nCC-MAIN-2022-21,orm,14628,14566,0.0004\nCC-MAIN-2022-21,pan,171894,171486,0.0050\nCC-MAIN-2022-21,pol,53393071,53071801,1.
5477\nCC-MAIN-2022-21,por,73520057,73159037,2.1311\nCC-MAIN-2022-21,pus,81583,81406,0.0024\nCC-MAIN-2022-21,que,21006,20995,0.0006\nCC-MAIN-2022-21,roh,31550,30667,0.0009\nCC-MAIN-2022-21,ron,18208902,18110266,0.5278\nCC-MAIN-2022-21,run,2117,2111,0.0001\nCC-MAIN-2022-21,rus,209101914,207979642,6.0612\nCC-MAIN-2022-21,sag,1766,1764,0.0001\nCC-MAIN-2022-21,san,94218,93987,0.0027\nCC-MAIN-2022-21,sco,16268,16222,0.0005\nCC-MAIN-2022-21,sin,231949,231669,0.0067\nCC-MAIN-2022-21,slk,11564407,11481340,0.3352\nCC-MAIN-2022-21,slv,5287816,5262989,0.1533\nCC-MAIN-2022-21,smo,14904,14895,0.0004\nCC-MAIN-2022-21,sna,19070,19010,0.0006\nCC-MAIN-2022-21,snd,36371,35824,0.0011\nCC-MAIN-2022-21,som,137337,137136,0.0040\nCC-MAIN-2022-21,sot,17781,17755,0.0005\nCC-MAIN-2022-21,spa,146251566,145350187,4.2394\nCC-MAIN-2022-21,sqi,1239081,1234372,0.0359\nCC-MAIN-2022-21,srp,6589980,6553114,0.1910\nCC-MAIN-2022-21,ssw,1096,1084,0.0000\nCC-MAIN-2022-21,sun,34465,34420,0.0010\nCC-MAIN-2022-21,sux,327,327,0.0000\nCC-MAIN-2022-21,swa,239268,238655,0.0069\nCC-MAIN-2022-21,swe,23106441,22932160,0.6698\nCC-MAIN-2022-21,syr,16254,16240,0.0005\nCC-MAIN-2022-21,tam,1404953,1401055,0.0407\nCC-MAIN-2022-21,tat,248976,248604,0.0072\nCC-MAIN-2022-21,tel,614819,604755,0.0178\nCC-MAIN-2022-21,tgk,155278,154990,0.0045\nCC-MAIN-2022-21,tgl,229776,228979,0.0067\nCC-MAIN-2022-21,tha,12363080,12294036,0.3584\nCC-MAIN-2022-21,tir,29678,29478,0.0009\nCC-MAIN-2022-21,ton,1539,1534,0.0000\nCC-MAIN-2022-21,tsn,4593,4567,0.0001\nCC-MAIN-2022-21,tso,1242,1237,0.0000\nCC-MAIN-2022-21,tuk,73803,73695,0.0021\nCC-MAIN-2022-21,tur,31130360,30971513,0.9024\nCC-MAIN-2022-21,uig,39887,39817,0.0012\nCC-MAIN-2022-21,ukr,13083660,13011811,0.3793\nCC-MAIN-2022-21,urd,900259,895497,0.0261\nCC-MAIN-2022-21,uzb,492508,490525,0.0143\nCC-MAIN-2022-21,ven,929,915,0.0000\nCC-MAIN-2022-21,vie,30408908,30261131,0.8815\nCC-MAIN-2022-21,vol,26975,26953,0.0008\nCC-MAIN-2022-21,war,86684,86251,0.0025\nCC-MAIN-2022-21,wol,4242,4229,0.0001
\nCC-MAIN-2022-21,xho,48606,48572,0.0014\nCC-MAIN-2022-21,yid,46638,46600,0.0014\nCC-MAIN-2022-21,yor,36555,36497,0.0011\nCC-MAIN-2022-21,zha,1808,1803,0.0001\nCC-MAIN-2022-21,zho,154323429,153908101,4.4734\nCC-MAIN-2022-21,zul,42291,42203,0.0012\nCC-MAIN-2022-27,<unknown>,90293544,90293544,2.9037\nCC-MAIN-2022-27,aar,4523,4494,0.0001\nCC-MAIN-2022-27,abk,16689,16660,0.0005\nCC-MAIN-2022-27,afr,370766,369902,0.0119\nCC-MAIN-2022-27,aka,2392,2364,0.0001\nCC-MAIN-2022-27,amh,94693,94186,0.0030\nCC-MAIN-2022-27,ara,18654406,18583091,0.5999\nCC-MAIN-2022-27,asm,60865,60724,0.0020\nCC-MAIN-2022-27,aym,1411,1400,0.0000\nCC-MAIN-2022-27,aze,1287850,1283604,0.0414\nCC-MAIN-2022-27,bak,40731,40698,0.0013\nCC-MAIN-2022-27,bel,469540,468383,0.0151\nCC-MAIN-2022-27,ben,2653829,2646252,0.0853\nCC-MAIN-2022-27,bih,18663,18653,0.0006\nCC-MAIN-2022-27,bis,4070,4019,0.0001\nCC-MAIN-2022-27,bod,34049,33952,0.0011\nCC-MAIN-2022-27,bos,1313836,1310292,0.0423\nCC-MAIN-2022-27,bre,79457,79361,0.0026\nCC-MAIN-2022-27,bul,8461024,8431909,0.2721\nCC-MAIN-2022-27,cat,7195465,7147750,0.2314\nCC-MAIN-2022-27,ceb,69199,69163,0.0022\nCC-MAIN-2022-27,ces,32075252,31880314,1.0315\nCC-MAIN-2022-27,chr,1427,1426,0.0000\nCC-MAIN-2022-27,cos,80730,80554,0.0026\nCC-MAIN-2022-27,crs,3171,3133,0.0001\nCC-MAIN-2022-27,cym,353980,352527,0.0114\nCC-MAIN-2022-27,dan,13385332,13299508,0.4305\nCC-MAIN-2022-27,deu,170479687,169425221,5.4824\nCC-MAIN-2022-27,div,52767,52734,0.0017\nCC-MAIN-2022-27,dzo,4825,4821,0.0002\nCC-MAIN-2022-27,ell,17381247,17320497,0.5590\nCC-MAIN-2022-27,eng,1447163236,1437323702,46.5384\nCC-MAIN-2022-27,epo,262302,261134,0.0084\nCC-MAIN-2022-27,est,4013648,3988381,0.1291\nCC-MAIN-2022-27,eus,1034372,1028027,0.0333\nCC-MAIN-2022-27,fao,146271,145814,0.0047\nCC-MAIN-2022-27,fas,18857919,18762718,0.6064\nCC-MAIN-2022-27,fij,3146,3141,0.0001\nCC-MAIN-2022-27,fin,12619710,12534144,0.4058\nCC-MAIN-2022-27,fra,136828705,136024269,4.4002\nCC-MAIN-2022-27,fry,99713,99426,0.0032\nCC-MAIN-2022-27
,gla,59014,58945,0.0019\nCC-MAIN-2022-27,gle,198826,197380,0.0064\nCC-MAIN-2022-27,glg,1241707,1236437,0.0399\nCC-MAIN-2022-27,glv,14467,14448,0.0005\nCC-MAIN-2022-27,got,885,883,0.0000\nCC-MAIN-2022-27,grn,19325,19266,0.0006\nCC-MAIN-2022-27,guj,381582,372143,0.0123\nCC-MAIN-2022-27,hat,47595,47468,0.0015\nCC-MAIN-2022-27,hau,70951,70417,0.0023\nCC-MAIN-2022-27,haw,18870,18848,0.0006\nCC-MAIN-2022-27,heb,7450598,7415765,0.2396\nCC-MAIN-2022-27,hin,4235908,4218525,0.1362\nCC-MAIN-2022-27,hmn,17645,17615,0.0006\nCC-MAIN-2022-27,hrv,6281347,6256540,0.2020\nCC-MAIN-2022-27,hun,17765132,17686759,0.5713\nCC-MAIN-2022-27,hye,965131,961416,0.0310\nCC-MAIN-2022-27,ibo,19121,19086,0.0006\nCC-MAIN-2022-27,iku,6561,6550,0.0002\nCC-MAIN-2022-27,ile,8613,8597,0.0003\nCC-MAIN-2022-27,ina,19339,19280,0.0006\nCC-MAIN-2022-27,ind,21556146,21421227,0.6932\nCC-MAIN-2022-27,ipk,2177,2175,0.0001\nCC-MAIN-2022-27,isl,1239237,1232978,0.0399\nCC-MAIN-2022-27,ita,75832861,75444908,2.4387\nCC-MAIN-2022-27,jav,67389,67321,0.0022\nCC-MAIN-2022-27,jpn,149679948,149121175,4.8135\nCC-MAIN-2022-27,kal,28471,28383,0.0009\nCC-MAIN-2022-27,kan,363019,362339,0.0117\nCC-MAIN-2022-27,kas,115,115,0.0000\nCC-MAIN-2022-27,kat,1110618,1106334,0.0357\nCC-MAIN-2022-27,kaz,692518,689741,0.0223\nCC-MAIN-2022-27,kha,5099,5092,0.0002\nCC-MAIN-2022-27,khm,298974,297359,0.0096\nCC-MAIN-2022-27,kin,52616,52489,0.0017\nCC-MAIN-2022-27,kir,138111,137802,0.0044\nCC-MAIN-2022-27,kor,20256170,20194653,0.6514\nCC-MAIN-2022-27,kur,180331,179503,0.0058\nCC-MAIN-2022-27,lao,117022,116734,0.0038\nCC-MAIN-2022-27,lat,3309637,3276791,0.1064\nCC-MAIN-2022-27,lav,2545552,2531392,0.0819\nCC-MAIN-2022-27,lif,23,23,0.0000\nCC-MAIN-2022-27,lin,7183,7174,0.0002\nCC-MAIN-2022-27,lit,5069008,5043738,0.1630\nCC-MAIN-2022-27,ltz,114378,113921,0.0037\nCC-MAIN-2022-27,lug,4192,4182,0.0001\nCC-MAIN-2022-27,mal,678418,677379,0.0218\nCC-MAIN-2022-27,mar,615234,614037,0.0198\nCC-MAIN-2022-27,mfe,2329,2320,0.0001\nCC-MAIN-2022-27,mkd,999157,9958
31,0.0321\nCC-MAIN-2022-27,mlg,67566,67366,0.0022\nCC-MAIN-2022-27,mlt,137544,135500,0.0044\nCC-MAIN-2022-27,mon,620731,619536,0.0200\nCC-MAIN-2022-27,mri,40809,40644,0.0013\nCC-MAIN-2022-27,msa,2370365,2364176,0.0762\nCC-MAIN-2022-27,mya,316872,316344,0.0102\nCC-MAIN-2022-27,nau,1186,1182,0.0000\nCC-MAIN-2022-27,nep,880929,879830,0.0283\nCC-MAIN-2022-27,nld,59159190,58788367,1.9025\nCC-MAIN-2022-27,nno,523022,520933,0.0168\nCC-MAIN-2022-27,nor,10239308,10175331,0.3293\nCC-MAIN-2022-27,nso,2665,2663,0.0001\nCC-MAIN-2022-27,nya,17762,17705,0.0006\nCC-MAIN-2022-27,oci,97991,97605,0.0032\nCC-MAIN-2022-27,ori,110664,110376,0.0036\nCC-MAIN-2022-27,orm,13673,13640,0.0004\nCC-MAIN-2022-27,pan,185503,185218,0.0060\nCC-MAIN-2022-27,pol,50262780,50008137,1.6164\nCC-MAIN-2022-27,por,65936924,65635075,2.1204\nCC-MAIN-2022-27,pus,83574,83134,0.0027\nCC-MAIN-2022-27,que,21978,21945,0.0007\nCC-MAIN-2022-27,roh,31097,30544,0.0010\nCC-MAIN-2022-27,ron,17001550,16937577,0.5467\nCC-MAIN-2022-27,run,1352,1346,0.0000\nCC-MAIN-2022-27,rus,182778927,181990656,5.8779\nCC-MAIN-2022-27,sag,1670,1669,0.0001\nCC-MAIN-2022-27,san,105880,105755,0.0034\nCC-MAIN-2022-27,sco,17393,17353,0.0006\nCC-MAIN-2022-27,sin,221344,220994,0.0071\nCC-MAIN-2022-27,slk,11088107,11039810,0.3566\nCC-MAIN-2022-27,slv,4950620,4927957,0.1592\nCC-MAIN-2022-27,smo,18174,18041,0.0006\nCC-MAIN-2022-27,sna,17401,17348,0.0006\nCC-MAIN-2022-27,snd,43523,42522,0.0014\nCC-MAIN-2022-27,som,131576,131411,0.0042\nCC-MAIN-2022-27,sot,21235,21123,0.0007\nCC-MAIN-2022-27,spa,134266684,133466877,4.3178\nCC-MAIN-2022-27,sqi,1227343,1222793,0.0395\nCC-MAIN-2022-27,srp,6546658,6518760,0.2105\nCC-MAIN-2022-27,ssw,2350,2342,0.0001\nCC-MAIN-2022-27,sun,32120,32084,0.0010\nCC-MAIN-2022-27,sux,286,286,0.0000\nCC-MAIN-2022-27,swa,212840,212069,0.0068\nCC-MAIN-2022-27,swe,21204822,21069603,0.6819\nCC-MAIN-2022-27,syr,18569,18554,0.0006\nCC-MAIN-2022-27,tam,1339001,1336351,0.0431\nCC-MAIN-2022-27,tat,234704,234587,0.0075\nCC-MAIN-2022-27,tel,5
46631,544405,0.0176\nCC-MAIN-2022-27,tgk,147153,146780,0.0047\nCC-MAIN-2022-27,tgl,239873,238069,0.0077\nCC-MAIN-2022-27,tha,12307849,12243433,0.3958\nCC-MAIN-2022-27,tir,23294,23004,0.0007\nCC-MAIN-2022-27,ton,1784,1780,0.0001\nCC-MAIN-2022-27,tsn,3611,3601,0.0001\nCC-MAIN-2022-27,tso,2160,2152,0.0001\nCC-MAIN-2022-27,tuk,61482,61373,0.0020\nCC-MAIN-2022-27,tur,27001733,26874189,0.8683\nCC-MAIN-2022-27,uig,40669,40631,0.0013\nCC-MAIN-2022-27,ukr,12549813,12467923,0.4036\nCC-MAIN-2022-27,urd,796945,789690,0.0256\nCC-MAIN-2022-27,uzb,475318,473291,0.0153\nCC-MAIN-2022-27,ven,1032,1026,0.0000\nCC-MAIN-2022-27,vie,27265511,27141314,0.8768\nCC-MAIN-2022-27,vol,25182,25162,0.0008\nCC-MAIN-2022-27,war,94700,94307,0.0030\nCC-MAIN-2022-27,wol,4069,4061,0.0001\nCC-MAIN-2022-27,xho,54640,54599,0.0018\nCC-MAIN-2022-27,yid,46318,46268,0.0015\nCC-MAIN-2022-27,yor,35193,35165,0.0011\nCC-MAIN-2022-27,zha,2080,2075,0.0001\nCC-MAIN-2022-27,zho,145458289,145115495,4.6777\nCC-MAIN-2022-27,zul,55089,55059,0.0018\nCC-MAIN-2022-33,<unknown>,88880293,88880293,3.4334\nCC-MAIN-2022-33,aar,2915,2879,0.0001\nCC-MAIN-2022-33,abk,11231,11192,0.0004\nCC-MAIN-2022-33,afr,309776,308511,0.0120\nCC-MAIN-2022-33,aka,1916,1910,0.0001\nCC-MAIN-2022-33,amh,72473,72279,0.0028\nCC-MAIN-2022-33,ara,17006105,16930710,0.6569\nCC-MAIN-2022-33,asm,44679,44171,0.0017\nCC-MAIN-2022-33,aym,1816,1784,0.0001\nCC-MAIN-2022-33,aze,1146246,1142337,0.0443\nCC-MAIN-2022-33,bak,29711,29701,0.0011\nCC-MAIN-2022-33,bel,414183,412701,0.0160\nCC-MAIN-2022-33,ben,2413619,2407539,0.0932\nCC-MAIN-2022-33,bih,14728,14712,0.0006\nCC-MAIN-2022-33,bis,3193,3183,0.0001\nCC-MAIN-2022-33,bod,34873,34370,0.0013\nCC-MAIN-2022-33,bos,1111871,1104754,0.0430\nCC-MAIN-2022-33,bre,65176,65090,0.0025\nCC-MAIN-2022-33,bul,6831808,6801616,0.2639\nCC-MAIN-2022-33,cat,5742610,5691175,0.2218\nCC-MAIN-2022-33,ceb,60973,60948,0.0024\nCC-MAIN-2022-33,ces,24459488,24260458,0.9449\nCC-MAIN-2022-33,chr,838,838,0.0000\nCC-MAIN-2022-33,cos,62526,62404,0.0
024\nCC-MAIN-2022-33,crs,1592,1580,0.0001\nCC-MAIN-2022-33,cym,304753,303536,0.0118\nCC-MAIN-2022-33,dan,10958052,10866382,0.4233\nCC-MAIN-2022-33,deu,135647238,134502162,5.2400\nCC-MAIN-2022-33,div,50328,50282,0.0019\nCC-MAIN-2022-33,dzo,2840,2840,0.0001\nCC-MAIN-2022-33,ell,15475694,15412613,0.5978\nCC-MAIN-2022-33,eng,1210921891,1200615375,46.7774\nCC-MAIN-2022-33,epo,257640,256336,0.0100\nCC-MAIN-2022-33,est,3088149,3066601,0.1193\nCC-MAIN-2022-33,eus,902482,894366,0.0349\nCC-MAIN-2022-33,fao,90136,89697,0.0035\nCC-MAIN-2022-33,fas,16501324,16399382,0.6374\nCC-MAIN-2022-33,fij,2565,2557,0.0001\nCC-MAIN-2022-33,fin,9568458,9496471,0.3696\nCC-MAIN-2022-33,fra,111604616,110791415,4.3112\nCC-MAIN-2022-33,fry,73577,73250,0.0028\nCC-MAIN-2022-33,gla,43382,43314,0.0017\nCC-MAIN-2022-33,gle,164777,163363,0.0064\nCC-MAIN-2022-33,glg,1032061,1027187,0.0399\nCC-MAIN-2022-33,glv,8902,8875,0.0003\nCC-MAIN-2022-33,got,367,367,0.0000\nCC-MAIN-2022-33,grn,13840,13797,0.0005\nCC-MAIN-2022-33,guj,337010,336073,0.0130\nCC-MAIN-2022-33,hat,41338,41264,0.0016\nCC-MAIN-2022-33,hau,71486,71163,0.0028\nCC-MAIN-2022-33,haw,17087,17074,0.0007\nCC-MAIN-2022-33,heb,6081479,6043647,0.2349\nCC-MAIN-2022-33,hin,3801292,3788573,0.1468\nCC-MAIN-2022-33,hmn,16846,16812,0.0007\nCC-MAIN-2022-33,hrv,4967526,4943256,0.1919\nCC-MAIN-2022-33,hun,14697231,14610953,0.5677\nCC-MAIN-2022-33,hye,877406,872910,0.0339\nCC-MAIN-2022-33,ibo,14989,14918,0.0006\nCC-MAIN-2022-33,iku,6397,6388,0.0002\nCC-MAIN-2022-33,ile,7330,7302,0.0003\nCC-MAIN-2022-33,ina,14358,14299,0.0006\nCC-MAIN-2022-33,ind,19315087,19193381,0.7461\nCC-MAIN-2022-33,ipk,2111,2110,0.0001\nCC-MAIN-2022-33,isl,890306,884749,0.0344\nCC-MAIN-2022-33,ita,64008140,63592211,2.4726\nCC-MAIN-2022-33,jav,51950,51907,0.0020\nCC-MAIN-2022-33,jpn,112580757,112059816,4.3489\nCC-MAIN-2022-33,kal,21741,21644,0.0008\nCC-MAIN-2022-33,kan,327044,326351,0.0126\nCC-MAIN-2022-33,kas,41,40,0.0000\nCC-MAIN-2022-33,kat,972998,969906,0.0376\nCC-MAIN-2022-33,kaz,608034
,599389,0.0235\nCC-MAIN-2022-33,kha,4369,4360,0.0002\nCC-MAIN-2022-33,khm,260976,259543,0.0101\nCC-MAIN-2022-33,kin,53310,53185,0.0021\nCC-MAIN-2022-33,kir,119258,118921,0.0046\nCC-MAIN-2022-33,kor,19004178,18932272,0.7341\nCC-MAIN-2022-33,kur,150863,150233,0.0058\nCC-MAIN-2022-33,lao,90682,90336,0.0035\nCC-MAIN-2022-33,lat,1912081,1904638,0.0739\nCC-MAIN-2022-33,lav,2049455,2030363,0.0792\nCC-MAIN-2022-33,lif,28,28,0.0000\nCC-MAIN-2022-33,lin,4990,4978,0.0002\nCC-MAIN-2022-33,lit,3915506,3889756,0.1513\nCC-MAIN-2022-33,ltz,88020,87683,0.0034\nCC-MAIN-2022-33,lug,4462,4456,0.0002\nCC-MAIN-2022-33,mal,614233,612200,0.0237\nCC-MAIN-2022-33,mar,516232,514925,0.0199\nCC-MAIN-2022-33,mfe,4650,4641,0.0002\nCC-MAIN-2022-33,mkd,858178,855150,0.0332\nCC-MAIN-2022-33,mlg,61758,61492,0.0024\nCC-MAIN-2022-33,mlt,112762,111851,0.0044\nCC-MAIN-2022-33,mon,546479,545343,0.0211\nCC-MAIN-2022-33,mri,36719,36586,0.0014\nCC-MAIN-2022-33,msa,1886960,1879218,0.0729\nCC-MAIN-2022-33,mya,265640,264832,0.0103\nCC-MAIN-2022-33,nau,981,977,0.0000\nCC-MAIN-2022-33,nep,824697,822832,0.0319\nCC-MAIN-2022-33,nld,47807851,47409352,1.8468\nCC-MAIN-2022-33,nno,373510,371764,0.0144\nCC-MAIN-2022-33,nor,8083278,8017850,0.3123\nCC-MAIN-2022-33,nso,1130,1130,0.0000\nCC-MAIN-2022-33,nya,15569,15547,0.0006\nCC-MAIN-2022-33,oci,62213,61425,0.0024\nCC-MAIN-2022-33,ori,121813,121669,0.0047\nCC-MAIN-2022-33,orm,11234,11215,0.0004\nCC-MAIN-2022-33,pan,190480,190059,0.0074\nCC-MAIN-2022-33,pol,41676010,41387193,1.6099\nCC-MAIN-2022-33,por,55467611,55152463,2.1427\nCC-MAIN-2022-33,pus,80786,80325,0.0031\nCC-MAIN-2022-33,que,13483,13477,0.0005\nCC-MAIN-2022-33,roh,24538,23973,0.0009\nCC-MAIN-2022-33,ron,14995106,14922773,0.5793\nCC-MAIN-2022-33,run,3042,3035,0.0001\nCC-MAIN-2022-33,rus,142782540,141987145,5.5156\nCC-MAIN-2022-33,sag,1411,1410,0.0001\nCC-MAIN-2022-33,san,61991,61895,0.0024\nCC-MAIN-2022-33,sco,13973,13929,0.0005\nCC-MAIN-2022-33,sin,198670,198032,0.0077\nCC-MAIN-2022-33,slk,8264246,8209208,0.3192
\nCC-MAIN-2022-33,slv,3681131,3658126,0.1422\nCC-MAIN-2022-33,smo,16086,16020,0.0006\nCC-MAIN-2022-33,sna,17777,17707,0.0007\nCC-MAIN-2022-33,snd,34581,34172,0.0013\nCC-MAIN-2022-33,som,108405,108139,0.0042\nCC-MAIN-2022-33,sot,21122,21085,0.0008\nCC-MAIN-2022-33,spa,111093975,110317996,4.2915\nCC-MAIN-2022-33,sqi,1125223,1121320,0.0435\nCC-MAIN-2022-33,srp,5411504,5384104,0.2090\nCC-MAIN-2022-33,ssw,846,843,0.0000\nCC-MAIN-2022-33,sun,22443,22427,0.0009\nCC-MAIN-2022-33,sux,221,220,0.0000\nCC-MAIN-2022-33,swa,189671,188792,0.0073\nCC-MAIN-2022-33,swe,16802380,16654330,0.6491\nCC-MAIN-2022-33,syr,14975,14956,0.0006\nCC-MAIN-2022-33,tam,1171021,1167633,0.0452\nCC-MAIN-2022-33,tat,195832,195654,0.0076\nCC-MAIN-2022-33,tel,516764,512979,0.0200\nCC-MAIN-2022-33,tgk,123725,123589,0.0048\nCC-MAIN-2022-33,tgl,208654,207699,0.0081\nCC-MAIN-2022-33,tha,10888547,10820106,0.4206\nCC-MAIN-2022-33,tir,12000,11852,0.0005\nCC-MAIN-2022-33,ton,1129,1120,0.0000\nCC-MAIN-2022-33,tsn,2418,2408,0.0001\nCC-MAIN-2022-33,tso,1057,1056,0.0000\nCC-MAIN-2022-33,tuk,61071,61027,0.0024\nCC-MAIN-2022-33,tur,23073928,22926353,0.8913\nCC-MAIN-2022-33,uig,34791,34626,0.0013\nCC-MAIN-2022-33,ukr,10928470,10839257,0.4222\nCC-MAIN-2022-33,urd,727746,721592,0.0281\nCC-MAIN-2022-33,uzb,404170,401139,0.0156\nCC-MAIN-2022-33,ven,684,678,0.0000\nCC-MAIN-2022-33,vie,22324661,22201110,0.8624\nCC-MAIN-2022-33,vol,13924,13899,0.0005\nCC-MAIN-2022-33,war,64206,63916,0.0025\nCC-MAIN-2022-33,wol,4555,4518,0.0002\nCC-MAIN-2022-33,xho,43971,43939,0.0017\nCC-MAIN-2022-33,yid,38973,38930,0.0015\nCC-MAIN-2022-33,yor,26081,26055,0.0010\nCC-MAIN-2022-33,zha,1176,1174,0.0000\nCC-MAIN-2022-33,zho,130426952,130060633,5.0383\nCC-MAIN-2022-33,zul,47757,47719,0.0018\nCC-MAIN-2022-40,<unknown>,81556058,81556058,2.5673\nCC-MAIN-2022-40,aar,3620,3597,0.0001\nCC-MAIN-2022-40,abk,24355,24240,0.0008\nCC-MAIN-2022-40,afr,268370,267717,0.0084\nCC-MAIN-2022-40,aka,2078,2074,0.0001\nCC-MAIN-2022-40,amh,118039,117862,0.0037\nCC-MAIN-20
22-40,ara,21149346,21066109,0.6658\nCC-MAIN-2022-40,asm,78020,77845,0.0025\nCC-MAIN-2022-40,aym,2133,2100,0.0001\nCC-MAIN-2022-40,aze,1316564,1312736,0.0414\nCC-MAIN-2022-40,bak,42661,42650,0.0013\nCC-MAIN-2022-40,bel,513069,511902,0.0162\nCC-MAIN-2022-40,ben,2955076,2948179,0.0930\nCC-MAIN-2022-40,bih,20232,20222,0.0006\nCC-MAIN-2022-40,bis,4195,4163,0.0001\nCC-MAIN-2022-40,bod,54492,54453,0.0017\nCC-MAIN-2022-40,bos,1503494,1499555,0.0473\nCC-MAIN-2022-40,bre,92313,92199,0.0029\nCC-MAIN-2022-40,bul,9211828,9183300,0.2900\nCC-MAIN-2022-40,cat,7350182,7299380,0.2314\nCC-MAIN-2022-40,ceb,77463,77430,0.0024\nCC-MAIN-2022-40,ces,35163533,34983169,1.1069\nCC-MAIN-2022-40,chr,2335,2335,0.0001\nCC-MAIN-2022-40,cos,83563,83453,0.0026\nCC-MAIN-2022-40,crs,2298,2288,0.0001\nCC-MAIN-2022-40,cym,300823,299624,0.0095\nCC-MAIN-2022-40,dan,13662425,13581598,0.4301\nCC-MAIN-2022-40,deu,186829478,185742847,5.8811\nCC-MAIN-2022-40,div,68095,68045,0.0021\nCC-MAIN-2022-40,dzo,4783,4781,0.0002\nCC-MAIN-2022-40,ell,18649125,18587747,0.5870\nCC-MAIN-2022-40,eng,1457454193,1448381690,45.8786\nCC-MAIN-2022-40,epo,287816,286272,0.0091\nCC-MAIN-2022-40,est,4300315,4276042,0.1354\nCC-MAIN-2022-40,eus,1024671,1018049,0.0323\nCC-MAIN-2022-40,fao,127497,127222,0.0040\nCC-MAIN-2022-40,fas,20907887,20811965,0.6582\nCC-MAIN-2022-40,fij,5016,5012,0.0002\nCC-MAIN-2022-40,fin,12961453,12887458,0.4080\nCC-MAIN-2022-40,fra,150113951,149335182,4.7254\nCC-MAIN-2022-40,fry,100215,99850,0.0032\nCC-MAIN-2022-40,gla,49162,49068,0.0015\nCC-MAIN-2022-40,gle,199757,198833,0.0063\nCC-MAIN-2022-40,glg,1270851,1265434,0.0400\nCC-MAIN-2022-40,glv,16043,16030,0.0005\nCC-MAIN-2022-40,got,988,988,0.0000\nCC-MAIN-2022-40,grn,20443,20375,0.0006\nCC-MAIN-2022-40,guj,399594,398656,0.0126\nCC-MAIN-2022-40,hat,57653,57533,0.0018\nCC-MAIN-2022-40,hau,89866,89606,0.0028\nCC-MAIN-2022-40,haw,22738,22724,0.0007\nCC-MAIN-2022-40,heb,3658867,3643652,0.1152\nCC-MAIN-2022-40,hin,5043521,5029497,0.1588\nCC-MAIN-2022-40,hmn,20558,2054
5,0.0006\nCC-MAIN-2022-40,hrv,6286031,6264594,0.1979\nCC-MAIN-2022-40,hun,19357344,19279673,0.6093\nCC-MAIN-2022-40,hye,999051,995173,0.0314\nCC-MAIN-2022-40,ibo,19919,19895,0.0006\nCC-MAIN-2022-40,iku,6877,6862,0.0002\nCC-MAIN-2022-40,ile,9604,9579,0.0003\nCC-MAIN-2022-40,ina,22853,22802,0.0007\nCC-MAIN-2022-40,ind,25385245,25273804,0.7991\nCC-MAIN-2022-40,ipk,2527,2521,0.0001\nCC-MAIN-2022-40,isl,1261200,1254859,0.0397\nCC-MAIN-2022-40,ita,81680848,81300960,2.5712\nCC-MAIN-2022-40,jav,72924,72842,0.0023\nCC-MAIN-2022-40,jpn,152116124,151676484,4.7884\nCC-MAIN-2022-40,kal,32967,32900,0.0010\nCC-MAIN-2022-40,kan,388490,387817,0.0122\nCC-MAIN-2022-40,kas,218,218,0.0000\nCC-MAIN-2022-40,kat,1118929,1115973,0.0352\nCC-MAIN-2022-40,kaz,670389,666999,0.0211\nCC-MAIN-2022-40,kha,5497,5484,0.0002\nCC-MAIN-2022-40,khm,343092,342032,0.0108\nCC-MAIN-2022-40,kin,64886,64801,0.0020\nCC-MAIN-2022-40,kir,154294,153605,0.0049\nCC-MAIN-2022-40,kor,20642069,20581631,0.6498\nCC-MAIN-2022-40,kur,173614,172656,0.0055\nCC-MAIN-2022-40,lao,141940,141520,0.0045\nCC-MAIN-2022-40,lat,3913862,3908671,0.1232\nCC-MAIN-2022-40,lav,2639219,2623857,0.0831\nCC-MAIN-2022-40,lif,14,14,0.0000\nCC-MAIN-2022-40,lin,7269,7262,0.0002\nCC-MAIN-2022-40,lit,5136938,5111955,0.1617\nCC-MAIN-2022-40,ltz,118881,118569,0.0037\nCC-MAIN-2022-40,lug,6023,6021,0.0002\nCC-MAIN-2022-40,mal,704562,703194,0.0222\nCC-MAIN-2022-40,mar,676791,675444,0.0213\nCC-MAIN-2022-40,mfe,4792,4776,0.0002\nCC-MAIN-2022-40,mkd,1101605,1098562,0.0347\nCC-MAIN-2022-40,mlg,97960,97402,0.0031\nCC-MAIN-2022-40,mlt,134965,133348,0.0042\nCC-MAIN-2022-40,mon,685400,684332,0.0216\nCC-MAIN-2022-40,mri,42164,41993,0.0013\nCC-MAIN-2022-40,msa,2623861,2616369,0.0826\nCC-MAIN-2022-40,mya,400730,399192,0.0126\nCC-MAIN-2022-40,nau,1601,1601,0.0001\nCC-MAIN-2022-40,nep,967048,965410,0.0304\nCC-MAIN-2022-40,nld,65394910,65030555,2.0585\nCC-MAIN-2022-40,nno,514840,513115,0.0162\nCC-MAIN-2022-40,nor,10867364,10802684,0.3421\nCC-MAIN-2022-40,nso,2760,2759,
0.0001\nCC-MAIN-2022-40,nya,19927,19906,0.0006\nCC-MAIN-2022-40,oci,102702,102472,0.0032\nCC-MAIN-2022-40,ori,140393,140047,0.0044\nCC-MAIN-2022-40,orm,16633,16578,0.0005\nCC-MAIN-2022-40,pan,192483,192041,0.0061\nCC-MAIN-2022-40,pol,52849259,52586688,1.6636\nCC-MAIN-2022-40,por,36547124,36385253,1.1505\nCC-MAIN-2022-40,pus,89711,89543,0.0028\nCC-MAIN-2022-40,que,22121,22115,0.0007\nCC-MAIN-2022-40,roh,39709,39203,0.0012\nCC-MAIN-2022-40,ron,17907530,17834841,0.5637\nCC-MAIN-2022-40,run,3251,3250,0.0001\nCC-MAIN-2022-40,rus,189626979,188694580,5.9692\nCC-MAIN-2022-40,sag,6103,6099,0.0002\nCC-MAIN-2022-40,san,90926,90727,0.0029\nCC-MAIN-2022-40,sco,21194,21154,0.0007\nCC-MAIN-2022-40,sin,269996,269249,0.0085\nCC-MAIN-2022-40,slk,12000190,11938806,0.3777\nCC-MAIN-2022-40,slv,5024682,5004229,0.1582\nCC-MAIN-2022-40,smo,18822,18790,0.0006\nCC-MAIN-2022-40,sna,20921,20895,0.0007\nCC-MAIN-2022-40,snd,47010,46059,0.0015\nCC-MAIN-2022-40,som,126274,126002,0.0040\nCC-MAIN-2022-40,sot,22626,22561,0.0007\nCC-MAIN-2022-40,spa,141968166,141245640,4.4690\nCC-MAIN-2022-40,sqi,1389826,1385459,0.0437\nCC-MAIN-2022-40,srp,7005277,6978733,0.2205\nCC-MAIN-2022-40,ssw,1183,1175,0.0000\nCC-MAIN-2022-40,sun,36951,36929,0.0012\nCC-MAIN-2022-40,sux,272,270,0.0000\nCC-MAIN-2022-40,swa,244910,244409,0.0077\nCC-MAIN-2022-40,swe,22138217,22010850,0.6969\nCC-MAIN-2022-40,syr,15580,15567,0.0005\nCC-MAIN-2022-40,tam,1416763,1412804,0.0446\nCC-MAIN-2022-40,tat,199123,199051,0.0063\nCC-MAIN-2022-40,tel,580842,579449,0.0183\nCC-MAIN-2022-40,tgk,149308,149153,0.0047\nCC-MAIN-2022-40,tgl,279172,278469,0.0088\nCC-MAIN-2022-40,tha,13160226,13111602,0.4143\nCC-MAIN-2022-40,tir,28296,28229,0.0009\nCC-MAIN-2022-40,ton,1664,1656,0.0001\nCC-MAIN-2022-40,tsn,2905,2861,0.0001\nCC-MAIN-2022-40,tso,1301,1297,0.0000\nCC-MAIN-2022-40,tuk,84992,84891,0.0027\nCC-MAIN-2022-40,tur,26808055,26701272,0.8439\nCC-MAIN-2022-40,uig,46231,46144,0.0015\nCC-MAIN-2022-40,ukr,10496531,10416588,0.3304\nCC-MAIN-2022-40,urd,869195,8
65099,0.0274\nCC-MAIN-2022-40,uzb,514038,511819,0.0162\nCC-MAIN-2022-40,ven,893,892,0.0000\nCC-MAIN-2022-40,vie,32717366,32570273,1.0299\nCC-MAIN-2022-40,vol,18025,18008,0.0006\nCC-MAIN-2022-40,war,85928,85621,0.0027\nCC-MAIN-2022-40,wol,4698,4681,0.0001\nCC-MAIN-2022-40,xho,46386,46315,0.0015\nCC-MAIN-2022-40,yid,54006,53953,0.0017\nCC-MAIN-2022-40,yor,31169,31135,0.0010\nCC-MAIN-2022-40,zha,2485,2478,0.0001\nCC-MAIN-2022-40,zho,154858502,154566437,4.8747\nCC-MAIN-2022-40,zul,54408,54310,0.0017\nCC-MAIN-2022-49,<unknown>,91429620,91429620,2.7037\nCC-MAIN-2022-49,aar,5136,5115,0.0002\nCC-MAIN-2022-49,abk,22348,22182,0.0007\nCC-MAIN-2022-49,afr,266836,266259,0.0079\nCC-MAIN-2022-49,aka,2435,2413,0.0001\nCC-MAIN-2022-49,amh,105653,105100,0.0031\nCC-MAIN-2022-49,ara,22683855,22585457,0.6708\nCC-MAIN-2022-49,asm,86142,85853,0.0025\nCC-MAIN-2022-49,aym,2484,2372,0.0001\nCC-MAIN-2022-49,aze,1360635,1355001,0.0402\nCC-MAIN-2022-49,bak,98576,98568,0.0029\nCC-MAIN-2022-49,bel,529012,527885,0.0156\nCC-MAIN-2022-49,ben,3186992,3175562,0.0942\nCC-MAIN-2022-49,bih,23770,23755,0.0007\nCC-MAIN-2022-49,bis,4868,4854,0.0001\nCC-MAIN-2022-49,bod,51861,51567,0.0015\nCC-MAIN-2022-49,bos,1563599,1558968,0.0462\nCC-MAIN-2022-49,bre,92080,91965,0.0027\nCC-MAIN-2022-49,bul,9881343,9843146,0.2922\nCC-MAIN-2022-49,cat,8012489,7949904,0.2369\nCC-MAIN-2022-49,ceb,74302,74229,0.0022\nCC-MAIN-2022-49,ces,37161326,36938683,1.0989\nCC-MAIN-2022-49,chr,1917,1915,0.0001\nCC-MAIN-2022-49,cos,80649,80378,0.0024\nCC-MAIN-2022-49,crs,2702,2684,0.0001\nCC-MAIN-2022-49,cym,345059,343784,0.0102\nCC-MAIN-2022-49,dan,15127579,15020431,0.4473\nCC-MAIN-2022-49,deu,198296288,196886582,5.8640\nCC-MAIN-2022-49,div,77169,77146,0.0023\nCC-MAIN-2022-49,dzo,5168,5167,0.0002\nCC-MAIN-2022-49,ell,20518332,20435734,0.6068\nCC-MAIN-2022-49,eng,1565833888,1554207978,46.3044\nCC-MAIN-2022-49,epo,308245,306938,0.0091\nCC-MAIN-2022-49,est,4624726,4594722,0.1368\nCC-MAIN-2022-49,eus,1151164,1141941,0.0340\nCC-MAIN-2022-49,fao
,143339,142755,0.0042\nCC-MAIN-2022-49,fas,22558926,22464006,0.6671\nCC-MAIN-2022-49,fij,3398,3393,0.0001\nCC-MAIN-2022-49,fin,14083477,13977793,0.4165\nCC-MAIN-2022-49,fra,161532974,160493400,4.7768\nCC-MAIN-2022-49,fry,106144,105593,0.0031\nCC-MAIN-2022-49,gla,53903,53792,0.0016\nCC-MAIN-2022-49,gle,220064,218837,0.0065\nCC-MAIN-2022-49,glg,1380228,1374255,0.0408\nCC-MAIN-2022-49,glv,11953,11931,0.0004\nCC-MAIN-2022-49,got,894,893,0.0000\nCC-MAIN-2022-49,grn,20346,20252,0.0006\nCC-MAIN-2022-49,guj,423590,422940,0.0125\nCC-MAIN-2022-49,hat,59759,59616,0.0018\nCC-MAIN-2022-49,hau,88055,87363,0.0026\nCC-MAIN-2022-49,haw,23990,23959,0.0007\nCC-MAIN-2022-49,heb,3955045,3938324,0.1170\nCC-MAIN-2022-49,hin,5382599,5363022,0.1592\nCC-MAIN-2022-49,hmn,24047,24022,0.0007\nCC-MAIN-2022-49,hrv,6729370,6700566,0.1990\nCC-MAIN-2022-49,hun,20976678,20877230,0.6203\nCC-MAIN-2022-49,hye,1064167,1060216,0.0315\nCC-MAIN-2022-49,ibo,21515,21474,0.0006\nCC-MAIN-2022-49,iku,6612,6574,0.0002\nCC-MAIN-2022-49,ile,11345,11329,0.0003\nCC-MAIN-2022-49,ina,22863,22799,0.0007\nCC-MAIN-2022-49,ind,27026770,26868164,0.7992\nCC-MAIN-2022-49,ipk,2096,2084,0.0001\nCC-MAIN-2022-49,isl,1365880,1359305,0.0404\nCC-MAIN-2022-49,ita,90744833,90237807,2.6835\nCC-MAIN-2022-49,jav,77587,77498,0.0023\nCC-MAIN-2022-49,jpn,150771095,150279468,4.4586\nCC-MAIN-2022-49,kal,34751,34552,0.0010\nCC-MAIN-2022-49,kan,410685,409806,0.0121\nCC-MAIN-2022-49,kas,65,65,0.0000\nCC-MAIN-2022-49,kat,1249187,1245650,0.0369\nCC-MAIN-2022-49,kaz,718000,714952,0.0212\nCC-MAIN-2022-49,kha,5469,5457,0.0002\nCC-MAIN-2022-49,khm,358702,356773,0.0106\nCC-MAIN-2022-49,kin,65862,65637,0.0019\nCC-MAIN-2022-49,kir,174708,174044,0.0052\nCC-MAIN-2022-49,kor,22068256,21999019,0.6526\nCC-MAIN-2022-49,kur,188886,188424,0.0056\nCC-MAIN-2022-49,lao,139680,139188,0.0041\nCC-MAIN-2022-49,lat,3582723,3575812,0.1059\nCC-MAIN-2022-49,lav,2813683,2795716,0.0832\nCC-MAIN-2022-49,lif,34,34,0.0000\nCC-MAIN-2022-49,lin,7840,7829,0.0002\nCC-MAIN-2022-49,l
it,5440194,5411367,0.1609\nCC-MAIN-2022-49,ltz,127233,126872,0.0038\nCC-MAIN-2022-49,lug,5965,5961,0.0002\nCC-MAIN-2022-49,mal,740801,738877,0.0219\nCC-MAIN-2022-49,mar,717441,716112,0.0212\nCC-MAIN-2022-49,mfe,5770,5762,0.0002\nCC-MAIN-2022-49,mkd,1230063,1225935,0.0364\nCC-MAIN-2022-49,mlg,89702,89202,0.0027\nCC-MAIN-2022-49,mlt,146486,144450,0.0043\nCC-MAIN-2022-49,mon,805680,804518,0.0238\nCC-MAIN-2022-49,mri,42851,42669,0.0013\nCC-MAIN-2022-49,msa,2746448,2735745,0.0812\nCC-MAIN-2022-49,mya,400142,398619,0.0118\nCC-MAIN-2022-49,nau,1201,1199,0.0000\nCC-MAIN-2022-49,nep,1035005,1033609,0.0306\nCC-MAIN-2022-49,nld,72717229,72231155,2.1504\nCC-MAIN-2022-49,nno,537114,534891,0.0159\nCC-MAIN-2022-49,nor,11681345,11593542,0.3454\nCC-MAIN-2022-49,nso,1899,1899,0.0001\nCC-MAIN-2022-49,nya,19420,19383,0.0006\nCC-MAIN-2022-49,oci,112007,111798,0.0033\nCC-MAIN-2022-49,ori,142329,142205,0.0042\nCC-MAIN-2022-49,orm,14828,14807,0.0004\nCC-MAIN-2022-49,pan,211159,210671,0.0062\nCC-MAIN-2022-49,pol,57083805,56756835,1.6881\nCC-MAIN-2022-49,por,39007296,38819469,1.1535\nCC-MAIN-2022-49,pus,97777,97251,0.0029\nCC-MAIN-2022-49,que,22691,22684,0.0007\nCC-MAIN-2022-49,roh,39250,38608,0.0012\nCC-MAIN-2022-49,ron,19518484,19431250,0.5772\nCC-MAIN-2022-49,run,2599,2599,0.0001\nCC-MAIN-2022-49,rus,191558850,190705798,5.6647\nCC-MAIN-2022-49,sag,4524,4523,0.0001\nCC-MAIN-2022-49,san,95520,95387,0.0028\nCC-MAIN-2022-49,sco,21627,21562,0.0006\nCC-MAIN-2022-49,sin,286128,285220,0.0085\nCC-MAIN-2022-49,slk,13153012,13084688,0.3890\nCC-MAIN-2022-49,slv,5493461,5469076,0.1625\nCC-MAIN-2022-49,smo,17763,17741,0.0005\nCC-MAIN-2022-49,sna,19322,19295,0.0006\nCC-MAIN-2022-49,snd,47813,46514,0.0014\nCC-MAIN-2022-49,som,132869,132702,0.0039\nCC-MAIN-2022-49,sot,19423,19398,0.0006\nCC-MAIN-2022-49,spa,153644387,152720822,4.5435\nCC-MAIN-2022-49,sqi,1522628,1516401,0.0450\nCC-MAIN-2022-49,srp,7534743,7495705,0.2228\nCC-MAIN-2022-49,ssw,1804,1105,0.0001\nCC-MAIN-2022-49,sun,37777,37747,0.0011\nCC-MAIN
-2022-49,sux,488,488,0.0000\nCC-MAIN-2022-49,swa,252153,251174,0.0075\nCC-MAIN-2022-49,swe,23331279,23157229,0.6899\nCC-MAIN-2022-49,syr,11752,11739,0.0003\nCC-MAIN-2022-49,tam,1522411,1518560,0.0450\nCC-MAIN-2022-49,tat,264399,264313,0.0078\nCC-MAIN-2022-49,tel,610417,606497,0.0181\nCC-MAIN-2022-49,tgk,166597,166396,0.0049\nCC-MAIN-2022-49,tgl,291544,290139,0.0086\nCC-MAIN-2022-49,tha,13618453,13551803,0.4027\nCC-MAIN-2022-49,tir,26151,25773,0.0008\nCC-MAIN-2022-49,ton,1837,1831,0.0001\nCC-MAIN-2022-49,tsn,2518,2488,0.0001\nCC-MAIN-2022-49,tso,1370,1369,0.0000\nCC-MAIN-2022-49,tuk,87665,87477,0.0026\nCC-MAIN-2022-49,tur,27187396,27037010,0.8040\nCC-MAIN-2022-49,uig,44142,44104,0.0013\nCC-MAIN-2022-49,ukr,11328002,11230528,0.3350\nCC-MAIN-2022-49,urd,936482,932318,0.0277\nCC-MAIN-2022-49,uzb,506530,501823,0.0150\nCC-MAIN-2022-49,ven,608,601,0.0000\nCC-MAIN-2022-49,vie,33603032,33397147,0.9937\nCC-MAIN-2022-49,vol,17294,17271,0.0005\nCC-MAIN-2022-49,war,87727,87375,0.0026\nCC-MAIN-2022-49,wol,3768,3763,0.0001\nCC-MAIN-2022-49,xho,50006,49908,0.0015\nCC-MAIN-2022-49,yid,51729,51671,0.0015\nCC-MAIN-2022-49,yor,34113,34079,0.0010\nCC-MAIN-2022-49,zha,1986,1980,0.0001\nCC-MAIN-2022-49,zho,155448839,155086341,4.5969\nCC-MAIN-2022-49,zul,56014,55892,0.0017\nCC-MAIN-2023-06,<unknown>,80339375,80339375,2.5188\nCC-MAIN-2023-06,aar,4071,4060,0.0001\nCC-MAIN-2023-06,abk,19674,19626,0.0006\nCC-MAIN-2023-06,afr,243824,243138,0.0076\nCC-MAIN-2023-06,aka,2104,2103,0.0001\nCC-MAIN-2023-06,amh,118928,118449,0.0037\nCC-MAIN-2023-06,ara,21550117,21472432,0.6756\nCC-MAIN-2023-06,asm,99513,99438,0.0031\nCC-MAIN-2023-06,aym,3397,3376,0.0001\nCC-MAIN-2023-06,aze,1316289,1311988,0.0413\nCC-MAIN-2023-06,bak,87346,87264,0.0027\nCC-MAIN-2023-06,bel,535323,534623,0.0168\nCC-MAIN-2023-06,ben,3071295,3065677,0.0963\nCC-MAIN-2023-06,bih,22279,22264,0.0007\nCC-MAIN-2023-06,bis,3736,3729,0.0001\nCC-MAIN-2023-06,bod,44752,44467,0.0014\nCC-MAIN-2023-06,bos,1521973,1518742,0.0477\nCC-MAIN-2023-06,bre,8
8065,87906,0.0028\nCC-MAIN-2023-06,bul,9473445,9439127,0.2970\nCC-MAIN-2023-06,cat,7448207,7401712,0.2335\nCC-MAIN-2023-06,ceb,76378,76352,0.0024\nCC-MAIN-2023-06,ces,35066026,34897182,1.0994\nCC-MAIN-2023-06,chr,2594,2577,0.0001\nCC-MAIN-2023-06,cos,78795,78646,0.0025\nCC-MAIN-2023-06,crs,2565,2553,0.0001\nCC-MAIN-2023-06,cym,318468,317406,0.0100\nCC-MAIN-2023-06,dan,14356456,14273532,0.4501\nCC-MAIN-2023-06,deu,188215727,187058230,5.9010\nCC-MAIN-2023-06,div,74478,74439,0.0023\nCC-MAIN-2023-06,dzo,5463,5463,0.0002\nCC-MAIN-2023-06,ell,19452908,19384766,0.6099\nCC-MAIN-2023-06,eng,1475921881,1465675034,46.2733\nCC-MAIN-2023-06,epo,304862,303445,0.0096\nCC-MAIN-2023-06,est,4387542,4364975,0.1376\nCC-MAIN-2023-06,eus,1060079,1050635,0.0332\nCC-MAIN-2023-06,fao,134278,133344,0.0042\nCC-MAIN-2023-06,fas,21016356,20919348,0.6589\nCC-MAIN-2023-06,fij,2521,2514,0.0001\nCC-MAIN-2023-06,fin,13254768,13182097,0.4156\nCC-MAIN-2023-06,fra,151463821,150639618,4.7487\nCC-MAIN-2023-06,fry,92847,92409,0.0029\nCC-MAIN-2023-06,gla,45544,45478,0.0014\nCC-MAIN-2023-06,gle,209358,207961,0.0066\nCC-MAIN-2023-06,glg,1354785,1349640,0.0425\nCC-MAIN-2023-06,glv,11520,11510,0.0004\nCC-MAIN-2023-06,got,887,885,0.0000\nCC-MAIN-2023-06,grn,22318,22255,0.0007\nCC-MAIN-2023-06,guj,408942,408432,0.0128\nCC-MAIN-2023-06,hat,57005,56925,0.0018\nCC-MAIN-2023-06,hau,99438,99029,0.0031\nCC-MAIN-2023-06,haw,20684,20676,0.0006\nCC-MAIN-2023-06,heb,3667273,3649821,0.1150\nCC-MAIN-2023-06,hin,5570847,5554946,0.1747\nCC-MAIN-2023-06,hmn,23368,23350,0.0007\nCC-MAIN-2023-06,hrv,6490924,6468345,0.2035\nCC-MAIN-2023-06,hun,19195271,19112196,0.6018\nCC-MAIN-2023-06,hye,1034003,1030962,0.0324\nCC-MAIN-2023-06,ibo,22053,22033,0.0007\nCC-MAIN-2023-06,iku,6496,6467,0.0002\nCC-MAIN-2023-06,ile,9733,9486,0.0003\nCC-MAIN-2023-06,ina,20885,20854,0.0007\nCC-MAIN-2023-06,ind,25937086,25803550,0.8132\nCC-MAIN-2023-06,ipk,2570,2562,0.0001\nCC-MAIN-2023-06,isl,1332973,1327788,0.0418\nCC-MAIN-2023-06,ita,85618547,85220369,2.
6843\nCC-MAIN-2023-06,jav,80779,80714,0.0025\nCC-MAIN-2023-06,jpn,151978476,151560035,4.7648\nCC-MAIN-2023-06,kal,30664,30421,0.0010\nCC-MAIN-2023-06,kan,430279,429800,0.0135\nCC-MAIN-2023-06,kas,306,306,0.0000\nCC-MAIN-2023-06,kat,1141884,1137554,0.0358\nCC-MAIN-2023-06,kaz,653148,650806,0.0205\nCC-MAIN-2023-06,kha,5540,5529,0.0002\nCC-MAIN-2023-06,khm,416779,416003,0.0131\nCC-MAIN-2023-06,kin,63204,63130,0.0020\nCC-MAIN-2023-06,kir,168087,167844,0.0053\nCC-MAIN-2023-06,kor,20790147,20735253,0.6518\nCC-MAIN-2023-06,kur,171573,171254,0.0054\nCC-MAIN-2023-06,lao,139396,138920,0.0044\nCC-MAIN-2023-06,lat,3693918,3689010,0.1158\nCC-MAIN-2023-06,lav,2703770,2686089,0.0848\nCC-MAIN-2023-06,lif,55,54,0.0000\nCC-MAIN-2023-06,lin,7302,7289,0.0002\nCC-MAIN-2023-06,lit,5187360,5162510,0.1626\nCC-MAIN-2023-06,ltz,127981,127580,0.0040\nCC-MAIN-2023-06,lug,6401,6393,0.0002\nCC-MAIN-2023-06,mal,724406,723100,0.0227\nCC-MAIN-2023-06,mar,711949,710182,0.0223\nCC-MAIN-2023-06,mfe,5653,5649,0.0002\nCC-MAIN-2023-06,mkd,1146916,1144132,0.0360\nCC-MAIN-2023-06,mlg,97221,96499,0.0030\nCC-MAIN-2023-06,mlt,129660,129024,0.0041\nCC-MAIN-2023-06,mon,539714,538833,0.0169\nCC-MAIN-2023-06,mri,37955,37850,0.0012\nCC-MAIN-2023-06,msa,2590611,2582795,0.0812\nCC-MAIN-2023-06,mya,399604,398675,0.0125\nCC-MAIN-2023-06,nau,1290,1286,0.0000\nCC-MAIN-2023-06,nep,1042832,1040405,0.0327\nCC-MAIN-2023-06,nld,66003489,65627574,2.0693\nCC-MAIN-2023-06,nno,492584,490569,0.0154\nCC-MAIN-2023-06,nor,10849102,10785148,0.3401\nCC-MAIN-2023-06,nso,2557,2557,0.0001\nCC-MAIN-2023-06,nya,19552,19502,0.0006\nCC-MAIN-2023-06,oci,99546,99400,0.0031\nCC-MAIN-2023-06,ori,155623,155549,0.0049\nCC-MAIN-2023-06,orm,18364,18331,0.0006\nCC-MAIN-2023-06,pan,202472,202166,0.0063\nCC-MAIN-2023-06,pol,54149163,53875484,1.6977\nCC-MAIN-2023-06,por,37189014,37024690,1.1660\nCC-MAIN-2023-06,pus,95296,94857,0.0030\nCC-MAIN-2023-06,que,21952,21948,0.0007\nCC-MAIN-2023-06,roh,37328,36635,0.0012\nCC-MAIN-2023-06,ron,18265494,18192313,0.
5727\nCC-MAIN-2023-06,run,2657,2655,0.0001\nCC-MAIN-2023-06,rus,184707324,184024978,5.7910\nCC-MAIN-2023-06,sag,7807,7807,0.0002\nCC-MAIN-2023-06,san,101002,100740,0.0032\nCC-MAIN-2023-06,sco,20907,20872,0.0007\nCC-MAIN-2023-06,sin,250357,249386,0.0078\nCC-MAIN-2023-06,slk,12664763,12612565,0.3971\nCC-MAIN-2023-06,slv,5103744,5079923,0.1600\nCC-MAIN-2023-06,smo,17719,17684,0.0006\nCC-MAIN-2023-06,sna,18652,18625,0.0006\nCC-MAIN-2023-06,snd,51398,50531,0.0016\nCC-MAIN-2023-06,som,130032,129865,0.0041\nCC-MAIN-2023-06,sot,20048,20028,0.0006\nCC-MAIN-2023-06,spa,146647587,145919660,4.5977\nCC-MAIN-2023-06,sqi,1475188,1470622,0.0463\nCC-MAIN-2023-06,srp,7131555,7099819,0.2236\nCC-MAIN-2023-06,ssw,770,766,0.0000\nCC-MAIN-2023-06,sun,43257,43238,0.0014\nCC-MAIN-2023-06,sux,367,367,0.0000\nCC-MAIN-2023-06,swa,245703,245167,0.0077\nCC-MAIN-2023-06,swe,22379047,22248187,0.7016\nCC-MAIN-2023-06,syr,10534,10526,0.0003\nCC-MAIN-2023-06,tam,1478223,1475188,0.0463\nCC-MAIN-2023-06,tat,247406,247089,0.0078\nCC-MAIN-2023-06,tel,603017,601532,0.0189\nCC-MAIN-2023-06,tgk,160933,160755,0.0050\nCC-MAIN-2023-06,tgl,233311,232309,0.0073\nCC-MAIN-2023-06,tha,12921960,12864816,0.4051\nCC-MAIN-2023-06,tir,30396,30149,0.0010\nCC-MAIN-2023-06,ton,1770,1753,0.0001\nCC-MAIN-2023-06,tsn,3476,3383,0.0001\nCC-MAIN-2023-06,tso,1005,1003,0.0000\nCC-MAIN-2023-06,tuk,85119,84894,0.0027\nCC-MAIN-2023-06,tur,26220348,26121458,0.8221\nCC-MAIN-2023-06,uig,45912,45898,0.0014\nCC-MAIN-2023-06,ukr,10709061,10654725,0.3358\nCC-MAIN-2023-06,urd,949824,946764,0.0298\nCC-MAIN-2023-06,uzb,509489,506977,0.0160\nCC-MAIN-2023-06,ven,589,585,0.0000\nCC-MAIN-2023-06,vie,32275734,32083089,1.0119\nCC-MAIN-2023-06,vol,17435,17412,0.0005\nCC-MAIN-2023-06,war,76557,76360,0.0024\nCC-MAIN-2023-06,wol,4142,4138,0.0001\nCC-MAIN-2023-06,xho,34660,34590,0.0011\nCC-MAIN-2023-06,yid,49694,49650,0.0016\nCC-MAIN-2023-06,yor,31217,31166,0.0010\nCC-MAIN-2023-06,zha,2296,2295,0.0001\nCC-MAIN-2023-06,zho,136537357,135870912,4.2807\nCC-M
AIN-2023-06,zul,45426,45337,0.0014\nCC-MAIN-2023-14,<unknown>,88925960,88925960,2.8514\nCC-MAIN-2023-14,aar,4605,4582,0.0001\nCC-MAIN-2023-14,abk,15228,15216,0.0005\nCC-MAIN-2023-14,afr,226858,226279,0.0073\nCC-MAIN-2023-14,aka,1984,1973,0.0001\nCC-MAIN-2023-14,amh,111936,111409,0.0036\nCC-MAIN-2023-14,ara,21174932,21094355,0.6790\nCC-MAIN-2023-14,asm,82565,82505,0.0026\nCC-MAIN-2023-14,aym,3496,3444,0.0001\nCC-MAIN-2023-14,aze,1389447,1386405,0.0446\nCC-MAIN-2023-14,bak,82354,82317,0.0026\nCC-MAIN-2023-14,bel,517286,516513,0.0166\nCC-MAIN-2023-14,ben,3230586,3225942,0.1036\nCC-MAIN-2023-14,bih,24501,24490,0.0008\nCC-MAIN-2023-14,bis,4536,4533,0.0001\nCC-MAIN-2023-14,bod,45061,44904,0.0014\nCC-MAIN-2023-14,bos,1442101,1436495,0.0462\nCC-MAIN-2023-14,bre,78946,78882,0.0025\nCC-MAIN-2023-14,bul,9234416,9203409,0.2961\nCC-MAIN-2023-14,cat,7368138,7316446,0.2363\nCC-MAIN-2023-14,ceb,71994,71955,0.0023\nCC-MAIN-2023-14,ces,34518923,34321020,1.1069\nCC-MAIN-2023-14,chr,1468,1455,0.0000\nCC-MAIN-2023-14,cos,76944,76815,0.0025\nCC-MAIN-2023-14,crs,4202,4194,0.0001\nCC-MAIN-2023-14,cym,315386,313815,0.0101\nCC-MAIN-2023-14,dan,13670967,13590756,0.4384\nCC-MAIN-2023-14,deu,179793878,178657560,5.7651\nCC-MAIN-2023-14,div,73300,73277,0.0024\nCC-MAIN-2023-14,dzo,4459,4459,0.0001\nCC-MAIN-2023-14,ell,18985716,18919835,0.6088\nCC-MAIN-2023-14,eng,1440028177,1429750403,46.1750\nCC-MAIN-2023-14,epo,299238,298065,0.0096\nCC-MAIN-2023-14,est,4325628,4303968,0.1387\nCC-MAIN-2023-14,eus,1091847,1081798,0.0350\nCC-MAIN-2023-14,fao,132009,131584,0.0042\nCC-MAIN-2023-14,fas,18716830,18647697,0.6002\nCC-MAIN-2023-14,fij,3343,3099,0.0001\nCC-MAIN-2023-14,fin,12366132,12298762,0.3965\nCC-MAIN-2023-14,fra,145859895,145045621,4.6770\nCC-MAIN-2023-14,fry,88294,88137,0.0028\nCC-MAIN-2023-14,gla,49631,49532,0.0016\nCC-MAIN-2023-14,gle,218289,217470,0.0070\nCC-MAIN-2023-14,glg,1304127,1299110,0.0418\nCC-MAIN-2023-14,glv,10196,10184,0.0003\nCC-MAIN-2023-14,got,798,798,0.0000\nCC-MAIN-2023-14,grn,186
94,18561,0.0006\nCC-MAIN-2023-14,guj,441835,441002,0.0142\nCC-MAIN-2023-14,hat,61095,60966,0.0020\nCC-MAIN-2023-14,hau,111319,110884,0.0036\nCC-MAIN-2023-14,haw,23782,23712,0.0008\nCC-MAIN-2023-14,heb,3554767,3537090,0.1140\nCC-MAIN-2023-14,hin,5582918,5568466,0.1790\nCC-MAIN-2023-14,hmn,25771,25727,0.0008\nCC-MAIN-2023-14,hrv,5870244,5846915,0.1882\nCC-MAIN-2023-14,hun,19085046,19005347,0.6120\nCC-MAIN-2023-14,hye,1049428,1045865,0.0337\nCC-MAIN-2023-14,ibo,23538,23417,0.0008\nCC-MAIN-2023-14,iku,6867,6860,0.0002\nCC-MAIN-2023-14,ile,10007,9983,0.0003\nCC-MAIN-2023-14,ina,18440,18418,0.0006\nCC-MAIN-2023-14,ind,24629820,24512597,0.7898\nCC-MAIN-2023-14,ipk,1800,1794,0.0001\nCC-MAIN-2023-14,isl,1247530,1242294,0.0400\nCC-MAIN-2023-14,ita,85018088,84619163,2.7261\nCC-MAIN-2023-14,jav,142556,142489,0.0046\nCC-MAIN-2023-14,jpn,138367872,137956827,4.4368\nCC-MAIN-2023-14,kal,22783,22655,0.0007\nCC-MAIN-2023-14,kan,418669,418011,0.0134\nCC-MAIN-2023-14,kas,54,54,0.0000\nCC-MAIN-2023-14,kat,1195385,1186129,0.0383\nCC-MAIN-2023-14,kaz,697398,694720,0.0224\nCC-MAIN-2023-14,kha,9496,9486,0.0003\nCC-MAIN-2023-14,khm,764344,763335,0.0245\nCC-MAIN-2023-14,kin,65624,65548,0.0021\nCC-MAIN-2023-14,kir,159797,159537,0.0051\nCC-MAIN-2023-14,kor,20508520,20431616,0.6576\nCC-MAIN-2023-14,kur,193649,193274,0.0062\nCC-MAIN-2023-14,lao,134506,134041,0.0043\nCC-MAIN-2023-14,lat,3428510,3424227,0.1099\nCC-MAIN-2023-14,lav,2665485,2652269,0.0855\nCC-MAIN-2023-14,lif,27,27,0.0000\nCC-MAIN-2023-14,lin,7107,7101,0.0002\nCC-MAIN-2023-14,lit,5202601,5177588,0.1668\nCC-MAIN-2023-14,ltz,126829,126347,0.0041\nCC-MAIN-2023-14,lug,6327,6312,0.0002\nCC-MAIN-2023-14,mal,721275,719954,0.0231\nCC-MAIN-2023-14,mar,777758,776407,0.0249\nCC-MAIN-2023-14,mfe,4055,4048,0.0001\nCC-MAIN-2023-14,mkd,1109081,1104724,0.0356\nCC-MAIN-2023-14,mlg,81773,81331,0.0026\nCC-MAIN-2023-14,mlt,132066,129191,0.0042\nCC-MAIN-2023-14,mon,515365,514396,0.0165\nCC-MAIN-2023-14,mri,39141,39065,0.0013\nCC-MAIN-2023-14,msa,2414043,
2406999,0.0774\nCC-MAIN-2023-14,mya,397191,396256,0.0127\nCC-MAIN-2023-14,nau,1291,1289,0.0000\nCC-MAIN-2023-14,nep,1019578,1017801,0.0327\nCC-MAIN-2023-14,nld,66139301,65753817,2.1208\nCC-MAIN-2023-14,nno,514070,512485,0.0165\nCC-MAIN-2023-14,nor,10796016,10732943,0.3462\nCC-MAIN-2023-14,nso,1543,1543,0.0000\nCC-MAIN-2023-14,nya,24868,24836,0.0008\nCC-MAIN-2023-14,oci,102022,101853,0.0033\nCC-MAIN-2023-14,ori,164117,163866,0.0053\nCC-MAIN-2023-14,orm,16350,16322,0.0005\nCC-MAIN-2023-14,pan,216408,216162,0.0069\nCC-MAIN-2023-14,pol,51235922,50972462,1.6429\nCC-MAIN-2023-14,por,35261859,35104760,1.1307\nCC-MAIN-2023-14,pus,103288,103053,0.0033\nCC-MAIN-2023-14,que,21632,21616,0.0007\nCC-MAIN-2023-14,roh,40889,40742,0.0013\nCC-MAIN-2023-14,ron,16441273,16374427,0.5272\nCC-MAIN-2023-14,run,2190,2189,0.0001\nCC-MAIN-2023-14,rus,181588655,180830756,5.8227\nCC-MAIN-2023-14,sag,2981,2981,0.0001\nCC-MAIN-2023-14,san,100757,100471,0.0032\nCC-MAIN-2023-14,sco,19324,19277,0.0006\nCC-MAIN-2023-14,sin,252611,251835,0.0081\nCC-MAIN-2023-14,slk,12424095,12368965,0.3984\nCC-MAIN-2023-14,slv,5074186,5053157,0.1627\nCC-MAIN-2023-14,smo,19205,19183,0.0006\nCC-MAIN-2023-14,sna,20867,20824,0.0007\nCC-MAIN-2023-14,snd,54023,54001,0.0017\nCC-MAIN-2023-14,som,129920,129777,0.0042\nCC-MAIN-2023-14,sot,22800,22725,0.0007\nCC-MAIN-2023-14,spa,141834578,141103412,4.5480\nCC-MAIN-2023-14,sqi,1482532,1478560,0.0475\nCC-MAIN-2023-14,srp,6736756,6716034,0.2160\nCC-MAIN-2023-14,ssw,961,959,0.0000\nCC-MAIN-2023-14,sun,35354,35335,0.0011\nCC-MAIN-2023-14,sux,550,550,0.0000\nCC-MAIN-2023-14,swa,248090,247718,0.0080\nCC-MAIN-2023-14,swe,21834317,21707372,0.7001\nCC-MAIN-2023-14,syr,10103,10094,0.0003\nCC-MAIN-2023-14,tam,1409576,1406243,0.0452\nCC-MAIN-2023-14,tat,258069,257623,0.0083\nCC-MAIN-2023-14,tel,605698,604182,0.0194\nCC-MAIN-2023-14,tgk,158394,157943,0.0051\nCC-MAIN-2023-14,tgl,225117,224605,0.0072\nCC-MAIN-2023-14,tha,13728674,13678027,0.4402\nCC-MAIN-2023-14,tir,24779,24529,0.0008\nCC-MAIN-
2023-14,ton,3056,3052,0.0001\nCC-MAIN-2023-14,tsn,2389,2380,0.0001\nCC-MAIN-2023-14,tso,1370,1368,0.0000\nCC-MAIN-2023-14,tuk,68876,68771,0.0022\nCC-MAIN-2023-14,tur,24626729,24536423,0.7897\nCC-MAIN-2023-14,uig,46166,46106,0.0015\nCC-MAIN-2023-14,ukr,11331460,11266429,0.3633\nCC-MAIN-2023-14,urd,906878,904760,0.0291\nCC-MAIN-2023-14,uzb,540037,537612,0.0173\nCC-MAIN-2023-14,ven,729,727,0.0000\nCC-MAIN-2023-14,vie,32916196,32629909,1.0555\nCC-MAIN-2023-14,vol,16632,16606,0.0005\nCC-MAIN-2023-14,war,79766,79511,0.0026\nCC-MAIN-2023-14,wol,3563,3559,0.0001\nCC-MAIN-2023-14,xho,33471,33420,0.0011\nCC-MAIN-2023-14,yid,55010,54983,0.0018\nCC-MAIN-2023-14,yor,35267,35229,0.0011\nCC-MAIN-2023-14,zha,1572,1571,0.0001\nCC-MAIN-2023-14,zho,144441597,143862479,4.6316\nCC-MAIN-2023-14,zul,50177,50088,0.0016\nCC-MAIN-2023-23,<unknown>,90329526,90329526,2.8762\nCC-MAIN-2023-23,aar,4916,4818,0.0002\nCC-MAIN-2023-23,abk,15297,15282,0.0005\nCC-MAIN-2023-23,afr,221063,220244,0.0070\nCC-MAIN-2023-23,aka,1917,1910,0.0001\nCC-MAIN-2023-23,amh,117191,116752,0.0037\nCC-MAIN-2023-23,ara,20038578,19942411,0.6381\nCC-MAIN-2023-23,asm,78203,78067,0.0025\nCC-MAIN-2023-23,aym,2553,2518,0.0001\nCC-MAIN-2023-23,aze,1381167,1376987,0.0440\nCC-MAIN-2023-23,bak,83936,83912,0.0027\nCC-MAIN-2023-23,bel,474509,473133,0.0151\nCC-MAIN-2023-23,ben,3031440,3021716,0.0965\nCC-MAIN-2023-23,bih,21455,21447,0.0007\nCC-MAIN-2023-23,bis,3875,3756,0.0001\nCC-MAIN-2023-23,bod,42182,42076,0.0013\nCC-MAIN-2023-23,bos,1448619,1443138,0.0461\nCC-MAIN-2023-23,bre,88344,88253,0.0028\nCC-MAIN-2023-23,bul,9615101,9580953,0.3062\nCC-MAIN-2023-23,cat,7640411,7584774,0.2433\nCC-MAIN-2023-23,ceb,51428,51404,0.0016\nCC-MAIN-2023-23,ces,36059842,35836455,1.1482\nCC-MAIN-2023-23,chr,1672,1648,0.0001\nCC-MAIN-2023-23,cos,74433,74275,0.0024\nCC-MAIN-2023-23,crs,3048,3036,0.0001\nCC-MAIN-2023-23,cym,295521,293789,0.0094\nCC-MAIN-2023-23,dan,13464957,13374596,0.4287\nCC-MAIN-2023-23,deu,189436880,188146552,6.0319\nCC-MAIN-2023-23,di
v,73033,72928,0.0023\nCC-MAIN-2023-23,dzo,4453,4453,0.0001\nCC-MAIN-2023-23,ell,18647565,18579737,0.5938\nCC-MAIN-2023-23,eng,1420072670,1410144975,45.2170\nCC-MAIN-2023-23,epo,283617,282854,0.0090\nCC-MAIN-2023-23,est,4427564,4393808,0.1410\nCC-MAIN-2023-23,eus,1086293,1076865,0.0346\nCC-MAIN-2023-23,fao,128518,128171,0.0041\nCC-MAIN-2023-23,fas,22314494,22194494,0.7105\nCC-MAIN-2023-23,fij,2307,2304,0.0001\nCC-MAIN-2023-23,fin,12584981,12507703,0.4007\nCC-MAIN-2023-23,fra,149776489,148894676,4.7691\nCC-MAIN-2023-23,fry,90660,90562,0.0029\nCC-MAIN-2023-23,gla,48565,48487,0.0015\nCC-MAIN-2023-23,gle,205233,204487,0.0065\nCC-MAIN-2023-23,glg,1308475,1303146,0.0417\nCC-MAIN-2023-23,glv,12046,12037,0.0004\nCC-MAIN-2023-23,got,900,900,0.0000\nCC-MAIN-2023-23,grn,18913,18867,0.0006\nCC-MAIN-2023-23,guj,444806,443938,0.0142\nCC-MAIN-2023-23,hat,60726,60601,0.0019\nCC-MAIN-2023-23,hau,110528,110102,0.0035\nCC-MAIN-2023-23,haw,19814,19786,0.0006\nCC-MAIN-2023-23,heb,3486958,3470160,0.1110\nCC-MAIN-2023-23,hin,5560111,5544581,0.1770\nCC-MAIN-2023-23,hmn,22538,22300,0.0007\nCC-MAIN-2023-23,hrv,5832483,5806530,0.1857\nCC-MAIN-2023-23,hun,19348581,19265347,0.6161\nCC-MAIN-2023-23,hye,964351,961345,0.0307\nCC-MAIN-2023-23,ibo,19845,19824,0.0006\nCC-MAIN-2023-23,iku,6381,6368,0.0002\nCC-MAIN-2023-23,ile,9807,9767,0.0003\nCC-MAIN-2023-23,ina,15657,15621,0.0005\nCC-MAIN-2023-23,ind,24105965,23971941,0.7676\nCC-MAIN-2023-23,ipk,1883,1877,0.0001\nCC-MAIN-2023-23,isl,1294915,1288545,0.0412\nCC-MAIN-2023-23,ita,86442503,85988235,2.7524\nCC-MAIN-2023-23,jav,73434,73372,0.0023\nCC-MAIN-2023-23,jpn,158081970,157600680,5.0335\nCC-MAIN-2023-23,kal,27068,26828,0.0009\nCC-MAIN-2023-23,kan,414918,414291,0.0132\nCC-MAIN-2023-23,kas,216,215,0.0000\nCC-MAIN-2023-23,kat,1159038,1155614,0.0369\nCC-MAIN-2023-23,kaz,670798,668304,0.0214\nCC-MAIN-2023-23,kha,8854,8846,0.0003\nCC-MAIN-2023-23,khm,346617,345166,0.0110\nCC-MAIN-2023-23,kin,56897,56835,0.0018\nCC-MAIN-2023-23,kir,158970,158730,0.0051\nCC-
MAIN-2023-23,kor,21229929,21151898,0.6760\nCC-MAIN-2023-23,kur,185601,184717,0.0059\nCC-MAIN-2023-23,lao,123291,122670,0.0039\nCC-MAIN-2023-23,lat,3701987,3695898,0.1179\nCC-MAIN-2023-23,lav,2712157,2696519,0.0864\nCC-MAIN-2023-23,lif,22,22,0.0000\nCC-MAIN-2023-23,lin,7801,7794,0.0002\nCC-MAIN-2023-23,lit,5284519,5253732,0.1683\nCC-MAIN-2023-23,ltz,134036,133582,0.0043\nCC-MAIN-2023-23,lug,5059,5046,0.0002\nCC-MAIN-2023-23,mal,717877,716643,0.0229\nCC-MAIN-2023-23,mar,743377,742111,0.0237\nCC-MAIN-2023-23,mfe,4057,4053,0.0001\nCC-MAIN-2023-23,mkd,1070136,1066629,0.0341\nCC-MAIN-2023-23,mlg,91712,91023,0.0029\nCC-MAIN-2023-23,mlt,135660,132898,0.0043\nCC-MAIN-2023-23,mon,504112,502606,0.0161\nCC-MAIN-2023-23,mri,34805,34622,0.0011\nCC-MAIN-2023-23,msa,2466720,2456215,0.0785\nCC-MAIN-2023-23,mya,365016,363720,0.0116\nCC-MAIN-2023-23,nau,1233,1223,0.0000\nCC-MAIN-2023-23,nep,1026347,1024472,0.0327\nCC-MAIN-2023-23,nld,67009562,66562830,2.1337\nCC-MAIN-2023-23,nno,487913,485975,0.0155\nCC-MAIN-2023-23,nor,10689018,10619029,0.3404\nCC-MAIN-2023-23,nso,2126,2119,0.0001\nCC-MAIN-2023-23,nya,18834,18791,0.0006\nCC-MAIN-2023-23,oci,103758,103456,0.0033\nCC-MAIN-2023-23,ori,163672,163404,0.0052\nCC-MAIN-2023-23,orm,15980,15963,0.0005\nCC-MAIN-2023-23,pan,193179,192787,0.0062\nCC-MAIN-2023-23,pol,52887114,52601731,1.6840\nCC-MAIN-2023-23,por,35798970,35625875,1.1399\nCC-MAIN-2023-23,pus,99214,99052,0.0032\nCC-MAIN-2023-23,que,21660,21653,0.0007\nCC-MAIN-2023-23,roh,42990,42791,0.0014\nCC-MAIN-2023-23,ron,15698365,15629173,0.4999\nCC-MAIN-2023-23,run,2171,2170,0.0001\nCC-MAIN-2023-23,rus,188113412,187275747,5.9898\nCC-MAIN-2023-23,sag,4286,4286,0.0001\nCC-MAIN-2023-23,san,99691,99509,0.0032\nCC-MAIN-2023-23,sco,21217,21176,0.0007\nCC-MAIN-2023-23,sin,251256,250419,0.0080\nCC-MAIN-2023-23,slk,12661916,12586359,0.4032\nCC-MAIN-2023-23,slv,5201895,5177393,0.1656\nCC-MAIN-2023-23,smo,15443,15422,0.0005\nCC-MAIN-2023-23,sna,18982,18955,0.0006\nCC-MAIN-2023-23,snd,44740,44713,0.0014\
nCC-MAIN-2023-23,som,121949,121754,0.0039\nCC-MAIN-2023-23,sot,19436,19417,0.0006\nCC-MAIN-2023-23,spa,144508401,143744399,4.6013\nCC-MAIN-2023-23,sqi,1365974,1361394,0.0435\nCC-MAIN-2023-23,srp,6852343,6828310,0.2182\nCC-MAIN-2023-23,ssw,787,785,0.0000\nCC-MAIN-2023-23,sun,32985,32868,0.0011\nCC-MAIN-2023-23,sux,408,408,0.0000\nCC-MAIN-2023-23,swa,263339,262805,0.0084\nCC-MAIN-2023-23,swe,22657867,22503629,0.7215\nCC-MAIN-2023-23,syr,9891,9870,0.0003\nCC-MAIN-2023-23,tam,1445203,1440663,0.0460\nCC-MAIN-2023-23,tat,202232,201842,0.0064\nCC-MAIN-2023-23,tel,577344,575925,0.0184\nCC-MAIN-2023-23,tgk,168786,168400,0.0054\nCC-MAIN-2023-23,tgl,226027,225436,0.0072\nCC-MAIN-2023-23,tha,12753729,12689214,0.4061\nCC-MAIN-2023-23,tir,27629,27426,0.0009\nCC-MAIN-2023-23,ton,2377,2357,0.0001\nCC-MAIN-2023-23,tsn,2531,2523,0.0001\nCC-MAIN-2023-23,tso,1069,1069,0.0000\nCC-MAIN-2023-23,tuk,63198,63089,0.0020\nCC-MAIN-2023-23,tur,24077559,23973419,0.7667\nCC-MAIN-2023-23,uig,41527,41393,0.0013\nCC-MAIN-2023-23,ukr,11973681,11807131,0.3813\nCC-MAIN-2023-23,urd,858328,854618,0.0273\nCC-MAIN-2023-23,uzb,527582,525424,0.0168\nCC-MAIN-2023-23,ven,768,767,0.0000\nCC-MAIN-2023-23,vie,32268657,31958582,1.0275\nCC-MAIN-2023-23,vol,18113,18085,0.0006\nCC-MAIN-2023-23,war,59071,58899,0.0019\nCC-MAIN-2023-23,wol,3979,3961,0.0001\nCC-MAIN-2023-23,xho,58656,58567,0.0019\nCC-MAIN-2023-23,yid,51123,51091,0.0016\nCC-MAIN-2023-23,yor,31660,31642,0.0010\nCC-MAIN-2023-23,zha,1677,1673,0.0001\nCC-MAIN-2023-23,zho,135159547,134711695,4.3037\nCC-MAIN-2023-23,zul,64245,64175,0.0020\nCC-MAIN-2023-40,<unknown>,93325787,93325787,2.7090\nCC-MAIN-2023-40,aar,4118,4062,0.0001\nCC-MAIN-2023-40,abk,17439,17408,0.0005\nCC-MAIN-2023-40,afr,188997,188243,0.0055\nCC-MAIN-2023-40,aka,2080,2072,0.0001\nCC-MAIN-2023-40,amh,129602,128248,0.0038\nCC-MAIN-2023-40,ara,20775066,20641210,0.6030\nCC-MAIN-2023-40,asm,82722,82678,0.0024\nCC-MAIN-2023-40,aym,4339,4025,0.0001\nCC-MAIN-2023-40,aze,1743493,1737932,0.0506\nCC-MAIN-2
023-40,bak,89256,89185,0.0026\nCC-MAIN-2023-40,bel,528254,526436,0.0153\nCC-MAIN-2023-40,ben,3574928,3564529,0.1038\nCC-MAIN-2023-40,bih,22728,22645,0.0007\nCC-MAIN-2023-40,bis,4475,4458,0.0001\nCC-MAIN-2023-40,bod,51964,51849,0.0015\nCC-MAIN-2023-40,bos,1772162,1763655,0.0514\nCC-MAIN-2023-40,bre,67099,66953,0.0019\nCC-MAIN-2023-40,bul,11324157,11267870,0.3287\nCC-MAIN-2023-40,cat,8172439,8102055,0.2372\nCC-MAIN-2023-40,ceb,50295,50259,0.0015\nCC-MAIN-2023-40,ces,36556552,36292295,1.0611\nCC-MAIN-2023-40,chr,1335,1334,0.0000\nCC-MAIN-2023-40,cos,71487,71307,0.0021\nCC-MAIN-2023-40,crs,2758,2744,0.0001\nCC-MAIN-2023-40,cym,334735,332895,0.0097\nCC-MAIN-2023-40,dan,15415957,15282334,0.4475\nCC-MAIN-2023-40,deu,201035267,199402622,5.8355\nCC-MAIN-2023-40,div,84794,84671,0.0025\nCC-MAIN-2023-40,dzo,4478,4474,0.0001\nCC-MAIN-2023-40,ell,20190814,20093428,0.5861\nCC-MAIN-2023-40,eng,1599618192,1585126436,46.4328\nCC-MAIN-2023-40,epo,284100,283246,0.0082\nCC-MAIN-2023-40,est,5245711,5203692,0.1523\nCC-MAIN-2023-40,eus,1151260,1141107,0.0334\nCC-MAIN-2023-40,fao,175368,174463,0.0051\nCC-MAIN-2023-40,fas,23504433,23355216,0.6823\nCC-MAIN-2023-40,fij,3300,3219,0.0001\nCC-MAIN-2023-40,fin,14645794,14531103,0.4251\nCC-MAIN-2023-40,fra,159679989,158471884,4.6351\nCC-MAIN-2023-40,fry,81236,80937,0.0024\nCC-MAIN-2023-40,gla,55657,55564,0.0016\nCC-MAIN-2023-40,gle,232178,230164,0.0067\nCC-MAIN-2023-40,glg,1386534,1379648,0.0402\nCC-MAIN-2023-40,glv,11197,11174,0.0003\nCC-MAIN-2023-40,got,931,928,0.0000\nCC-MAIN-2023-40,grn,22224,22081,0.0006\nCC-MAIN-2023-40,guj,410338,408612,0.0119\nCC-MAIN-2023-40,hat,67250,67134,0.0020\nCC-MAIN-2023-40,hau,109065,108853,0.0032\nCC-MAIN-2023-40,haw,26550,26506,0.0008\nCC-MAIN-2023-40,heb,4217977,4191335,0.1224\nCC-MAIN-2023-40,hin,6045819,6023174,0.1755\nCC-MAIN-2023-40,hmn,28970,28126,0.0008\nCC-MAIN-2023-40,hrv,7746724,7705919,0.2249\nCC-MAIN-2023-40,hun,21522681,21408222,0.6247\nCC-MAIN-2023-40,hye,1106261,1100812,0.0321\nCC-MAIN-2023-40,ibo,
25196,25087,0.0007\nCC-MAIN-2023-40,iku,7278,7223,0.0002\nCC-MAIN-2023-40,ile,11328,11233,0.0003\nCC-MAIN-2023-40,ina,19528,19442,0.0006\nCC-MAIN-2023-40,ind,30118440,29931211,0.8743\nCC-MAIN-2023-40,ipk,1894,1890,0.0001\nCC-MAIN-2023-40,isl,1586932,1576830,0.0461\nCC-MAIN-2023-40,ita,93851834,93264514,2.7243\nCC-MAIN-2023-40,jav,73509,73414,0.0021\nCC-MAIN-2023-40,jpn,163550952,162909495,4.7475\nCC-MAIN-2023-40,kal,28535,28370,0.0008\nCC-MAIN-2023-40,kan,477304,474921,0.0139\nCC-MAIN-2023-40,kas,41,41,0.0000\nCC-MAIN-2023-40,kat,1407941,1403163,0.0409\nCC-MAIN-2023-40,kaz,770725,767324,0.0224\nCC-MAIN-2023-40,kha,8849,8800,0.0003\nCC-MAIN-2023-40,khm,408610,405477,0.0119\nCC-MAIN-2023-40,kin,67244,67029,0.0020\nCC-MAIN-2023-40,kir,178026,177350,0.0052\nCC-MAIN-2023-40,kor,22413639,22326467,0.6506\nCC-MAIN-2023-40,kur,214816,213951,0.0062\nCC-MAIN-2023-40,lao,130594,130112,0.0038\nCC-MAIN-2023-40,lat,4032682,4023379,0.1171\nCC-MAIN-2023-40,lav,3503232,3478593,0.1017\nCC-MAIN-2023-40,lif,10,10,0.0000\nCC-MAIN-2023-40,lin,6601,6589,0.0002\nCC-MAIN-2023-40,lit,6991508,6940790,0.2029\nCC-MAIN-2023-40,ltz,130445,129837,0.0038\nCC-MAIN-2023-40,lug,5453,5443,0.0002\nCC-MAIN-2023-40,mal,761573,760190,0.0221\nCC-MAIN-2023-40,mar,803369,801515,0.0233\nCC-MAIN-2023-40,mfe,2852,2846,0.0001\nCC-MAIN-2023-40,mkd,1238508,1234446,0.0360\nCC-MAIN-2023-40,mlg,111292,110343,0.0032\nCC-MAIN-2023-40,mlt,166321,163031,0.0048\nCC-MAIN-2023-40,mon,591841,589862,0.0172\nCC-MAIN-2023-40,mri,46526,46396,0.0014\nCC-MAIN-2023-40,msa,2822681,2807995,0.0819\nCC-MAIN-2023-40,mya,390752,389528,0.0113\nCC-MAIN-2023-40,nau,1141,1133,0.0000\nCC-MAIN-2023-40,nep,1371532,1367947,0.0398\nCC-MAIN-2023-40,nld,74295966,73675675,2.1566\nCC-MAIN-2023-40,nno,532208,529456,0.0154\nCC-MAIN-2023-40,nor,12866650,12754474,0.3735\nCC-MAIN-2023-40,nso,1906,1891,0.0001\nCC-MAIN-2023-40,nya,24027,23992,0.0007\nCC-MAIN-2023-40,oci,91703,91489,0.0027\nCC-MAIN-2023-40,ori,168307,167835,0.0049\nCC-MAIN-2023-40,orm,18188,18
181,0.0005\nCC-MAIN-2023-40,pan,210196,209413,0.0061\nCC-MAIN-2023-40,pol,59987966,59594505,1.7413\nCC-MAIN-2023-40,por,38478739,38248469,1.1169\nCC-MAIN-2023-40,pus,108768,108553,0.0032\nCC-MAIN-2023-40,que,22393,22383,0.0007\nCC-MAIN-2023-40,roh,47302,46989,0.0014\nCC-MAIN-2023-40,ron,19786769,19690824,0.5744\nCC-MAIN-2023-40,run,2459,2456,0.0001\nCC-MAIN-2023-40,rus,191917020,190848390,5.5709\nCC-MAIN-2023-40,sag,4797,4794,0.0001\nCC-MAIN-2023-40,san,112835,112307,0.0033\nCC-MAIN-2023-40,sco,20606,20537,0.0006\nCC-MAIN-2023-40,sin,277423,276248,0.0081\nCC-MAIN-2023-40,slk,15734686,15624606,0.4567\nCC-MAIN-2023-40,slv,6661448,6623472,0.1934\nCC-MAIN-2023-40,smo,22828,22772,0.0007\nCC-MAIN-2023-40,sna,21751,21728,0.0006\nCC-MAIN-2023-40,snd,60139,60074,0.0017\nCC-MAIN-2023-40,som,146711,146365,0.0043\nCC-MAIN-2023-40,sot,22245,22212,0.0006\nCC-MAIN-2023-40,spa,159155001,158029217,4.6199\nCC-MAIN-2023-40,sqi,1606526,1599288,0.0466\nCC-MAIN-2023-40,srp,8703162,8662640,0.2526\nCC-MAIN-2023-40,ssw,730,728,0.0000\nCC-MAIN-2023-40,sun,74081,71986,0.0022\nCC-MAIN-2023-40,sux,386,386,0.0000\nCC-MAIN-2023-40,swa,288723,288068,0.0084\nCC-MAIN-2023-40,swe,24158793,23951506,0.7013\nCC-MAIN-2023-40,syr,11268,11251,0.0003\nCC-MAIN-2023-40,tam,1488635,1482818,0.0432\nCC-MAIN-2023-40,tat,200771,200394,0.0058\nCC-MAIN-2023-40,tel,627316,625353,0.0182\nCC-MAIN-2023-40,tgk,183419,182967,0.0053\nCC-MAIN-2023-40,tgl,261715,260756,0.0076\nCC-MAIN-2023-40,tha,15537593,15435020,0.4510\nCC-MAIN-2023-40,tir,28608,28168,0.0008\nCC-MAIN-2023-40,ton,2594,2581,0.0001\nCC-MAIN-2023-40,tsn,2737,2723,0.0001\nCC-MAIN-2023-40,tso,1502,1498,0.0000\nCC-MAIN-2023-40,tuk,78205,78085,0.0023\nCC-MAIN-2023-40,tur,28670749,28518972,0.8322\nCC-MAIN-2023-40,uig,53065,52908,0.0015\nCC-MAIN-2023-40,ukr,11825186,11716205,0.3433\nCC-MAIN-2023-40,urd,944730,940519,0.0274\nCC-MAIN-2023-40,uzb,582179,578315,0.0169\nCC-MAIN-2023-40,ven,541,540,0.0000\nCC-MAIN-2023-40,vie,36414996,36122270,1.0570\nCC-MAIN-2023-40,vol,
18001,17970,0.0005\nCC-MAIN-2023-40,war,54498,54236,0.0016\nCC-MAIN-2023-40,wol,3997,3949,0.0001\nCC-MAIN-2023-40,xho,59413,59259,0.0017\nCC-MAIN-2023-40,yid,70164,70063,0.0020\nCC-MAIN-2023-40,yor,39520,39472,0.0011\nCC-MAIN-2023-40,zha,1730,1725,0.0001\nCC-MAIN-2023-40,zho,130812318,130312299,3.7971\nCC-MAIN-2023-40,zul,65299,65150,0.0019\nCC-MAIN-2023-50,<unknown>,108462778,108462778,3.2338\nCC-MAIN-2023-50,aar,4930,4886,0.0001\nCC-MAIN-2023-50,abk,16530,16454,0.0005\nCC-MAIN-2023-50,afr,303548,302365,0.0091\nCC-MAIN-2023-50,aka,2487,2482,0.0001\nCC-MAIN-2023-50,amh,109151,108632,0.0033\nCC-MAIN-2023-50,ara,19677400,19569451,0.5867\nCC-MAIN-2023-50,asm,67797,66927,0.0020\nCC-MAIN-2023-50,aym,1435,1415,0.0000\nCC-MAIN-2023-50,aze,1771280,1764967,0.0528\nCC-MAIN-2023-50,bak,92404,92372,0.0028\nCC-MAIN-2023-50,bel,498765,496222,0.0149\nCC-MAIN-2023-50,ben,3289097,3279881,0.0981\nCC-MAIN-2023-50,bih,22057,22001,0.0007\nCC-MAIN-2023-50,bis,2916,2907,0.0001\nCC-MAIN-2023-50,bod,51582,51501,0.0015\nCC-MAIN-2023-50,bos,1593062,1587914,0.0475\nCC-MAIN-2023-50,bre,86207,86125,0.0026\nCC-MAIN-2023-50,bul,9948791,9903910,0.2966\nCC-MAIN-2023-50,cat,7028474,6960219,0.2096\nCC-MAIN-2023-50,ceb,50278,50240,0.0015\nCC-MAIN-2023-50,ces,34231421,33985466,1.0206\nCC-MAIN-2023-50,chr,1465,1462,0.0000\nCC-MAIN-2023-50,cos,75525,75401,0.0023\nCC-MAIN-2023-50,crs,2697,2674,0.0001\nCC-MAIN-2023-50,cym,336232,333109,0.0100\nCC-MAIN-2023-50,dan,14443483,14321702,0.4306\nCC-MAIN-2023-50,deu,182791342,181278583,5.4499\nCC-MAIN-2023-50,div,83779,83694,0.0025\nCC-MAIN-2023-50,dzo,3982,3980,0.0001\nCC-MAIN-2023-50,ell,19473183,19386236,0.5806\nCC-MAIN-2023-50,eng,1490149909,1475497113,44.4285\nCC-MAIN-2023-50,epo,303023,302151,0.0090\nCC-MAIN-2023-50,est,4492177,4452342,0.1339\nCC-MAIN-2023-50,eus,1100311,1089922,0.0328\nCC-MAIN-2023-50,fao,144533,143863,0.0043\nCC-MAIN-2023-50,fas,22790281,22655068,0.6795\nCC-MAIN-2023-50,fij,3541,3508,0.0001\nCC-MAIN-2023-50,fin,12343987,12238847,0.3680\nCC-
MAIN-2023-50,fra,147351767,146218582,4.3933\nCC-MAIN-2023-50,fry,103419,103213,0.0031\nCC-MAIN-2023-50,gla,42929,42801,0.0013\nCC-MAIN-2023-50,gle,199318,197310,0.0059\nCC-MAIN-2023-50,glg,1176579,1170183,0.0351\nCC-MAIN-2023-50,glv,10988,10958,0.0003\nCC-MAIN-2023-50,got,681,681,0.0000\nCC-MAIN-2023-50,grn,21159,20999,0.0006\nCC-MAIN-2023-50,guj,382729,379111,0.0114\nCC-MAIN-2023-50,hat,56442,56311,0.0017\nCC-MAIN-2023-50,hau,70248,70100,0.0021\nCC-MAIN-2023-50,haw,18742,18717,0.0006\nCC-MAIN-2023-50,heb,7014429,6960564,0.2091\nCC-MAIN-2023-50,hin,5865451,5844045,0.1749\nCC-MAIN-2023-50,hmn,21738,21700,0.0006\nCC-MAIN-2023-50,hrv,6756367,6723907,0.2014\nCC-MAIN-2023-50,hun,22455276,22337934,0.6695\nCC-MAIN-2023-50,hye,1005216,1000971,0.0300\nCC-MAIN-2023-50,ibo,16932,16888,0.0005\nCC-MAIN-2023-50,iku,5785,5763,0.0002\nCC-MAIN-2023-50,ile,10303,10225,0.0003\nCC-MAIN-2023-50,ina,16060,16020,0.0005\nCC-MAIN-2023-50,ind,28831219,28650875,0.8596\nCC-MAIN-2023-50,ipk,2144,2136,0.0001\nCC-MAIN-2023-50,isl,1315315,1306857,0.0392\nCC-MAIN-2023-50,ita,86648936,86086759,2.5834\nCC-MAIN-2023-50,jav,75945,75879,0.0023\nCC-MAIN-2023-50,jpn,172759155,171925721,5.1508\nCC-MAIN-2023-50,kal,25444,25273,0.0008\nCC-MAIN-2023-50,kan,411769,410982,0.0123\nCC-MAIN-2023-50,kas,17,17,0.0000\nCC-MAIN-2023-50,kat,1206129,1202238,0.0360\nCC-MAIN-2023-50,kaz,740840,737349,0.0221\nCC-MAIN-2023-50,kha,10470,10427,0.0003\nCC-MAIN-2023-50,khm,325249,323200,0.0097\nCC-MAIN-2023-50,kin,62113,62021,0.0019\nCC-MAIN-2023-50,kir,187056,186413,0.0056\nCC-MAIN-2023-50,kor,24445162,24330107,0.7288\nCC-MAIN-2023-50,kur,188535,188107,0.0056\nCC-MAIN-2023-50,lao,120052,119281,0.0036\nCC-MAIN-2023-50,lat,3920498,3911203,0.1169\nCC-MAIN-2023-50,lav,2848030,2828544,0.0849\nCC-MAIN-2023-50,lif,44,44,0.0000\nCC-MAIN-2023-50,lin,6408,6398,0.0002\nCC-MAIN-2023-50,lit,5208333,5169529,0.1553\nCC-MAIN-2023-50,ltz,130012,129335,0.0039\nCC-MAIN-2023-50,lug,6531,6523,0.0002\nCC-MAIN-2023-50,mal,730196,728159,0.0218\nCC-MA
IN-2023-50,mar,710794,708377,0.0212\nCC-MAIN-2023-50,mfe,5647,5639,0.0002\nCC-MAIN-2023-50,mkd,1119125,1115174,0.0334\nCC-MAIN-2023-50,mlg,106540,105335,0.0032\nCC-MAIN-2023-50,mlt,140463,138448,0.0042\nCC-MAIN-2023-50,mon,477266,476254,0.0142\nCC-MAIN-2023-50,mri,34188,33994,0.0010\nCC-MAIN-2023-50,msa,2490129,2478868,0.0742\nCC-MAIN-2023-50,mya,394764,393807,0.0118\nCC-MAIN-2023-50,nau,1310,1305,0.0000\nCC-MAIN-2023-50,nep,1323863,1321155,0.0395\nCC-MAIN-2023-50,nld,66229509,65678419,1.9746\nCC-MAIN-2023-50,nno,458632,455969,0.0137\nCC-MAIN-2023-50,nor,10704200,10614470,0.3191\nCC-MAIN-2023-50,nso,1937,1933,0.0001\nCC-MAIN-2023-50,nya,18135,18106,0.0005\nCC-MAIN-2023-50,oci,105032,104818,0.0031\nCC-MAIN-2023-50,ori,146605,146341,0.0044\nCC-MAIN-2023-50,orm,19583,19566,0.0006\nCC-MAIN-2023-50,pan,183396,182844,0.0055\nCC-MAIN-2023-50,pol,58662332,58258688,1.7490\nCC-MAIN-2023-50,por,59134511,58761376,1.7631\nCC-MAIN-2023-50,pus,94991,94863,0.0028\nCC-MAIN-2023-50,que,19454,19439,0.0006\nCC-MAIN-2023-50,roh,44335,43973,0.0013\nCC-MAIN-2023-50,ron,19083314,18985303,0.5690\nCC-MAIN-2023-50,run,3341,3336,0.0001\nCC-MAIN-2023-50,rus,202259054,201155871,6.0303\nCC-MAIN-2023-50,sag,11977,11974,0.0004\nCC-MAIN-2023-50,san,104975,104809,0.0031\nCC-MAIN-2023-50,sco,23020,22942,0.0007\nCC-MAIN-2023-50,sin,259672,258849,0.0077\nCC-MAIN-2023-50,slk,12041848,11963193,0.3590\nCC-MAIN-2023-50,slv,5469009,5439375,0.1631\nCC-MAIN-2023-50,smo,16271,16229,0.0005\nCC-MAIN-2023-50,sna,17014,16949,0.0005\nCC-MAIN-2023-50,snd,49088,49012,0.0015\nCC-MAIN-2023-50,som,138735,138011,0.0041\nCC-MAIN-2023-50,sot,15861,15807,0.0005\nCC-MAIN-2023-50,spa,152243704,151166099,4.5391\nCC-MAIN-2023-50,sqi,1472798,1466432,0.0439\nCC-MAIN-2023-50,srp,7399787,7364003,0.2206\nCC-MAIN-2023-50,ssw,886,884,0.0000\nCC-MAIN-2023-50,sun,53551,52342,0.0016\nCC-MAIN-2023-50,sux,298,298,0.0000\nCC-MAIN-2023-50,swa,246190,245606,0.0073\nCC-MAIN-2023-50,swe,22260121,22062149,0.6637\nCC-MAIN-2023-50,syr,11403,11378,0
.0003\nCC-MAIN-2023-50,tam,1419478,1414607,0.0423\nCC-MAIN-2023-50,tat,206583,206289,0.0062\nCC-MAIN-2023-50,tel,540437,539195,0.0161\nCC-MAIN-2023-50,tgk,172790,172356,0.0052\nCC-MAIN-2023-50,tgl,313126,310536,0.0093\nCC-MAIN-2023-50,tha,14257471,14170455,0.4251\nCC-MAIN-2023-50,tir,27238,26873,0.0008\nCC-MAIN-2023-50,ton,2150,2131,0.0001\nCC-MAIN-2023-50,tsn,3295,3282,0.0001\nCC-MAIN-2023-50,tso,1429,1425,0.0000\nCC-MAIN-2023-50,tuk,82371,82195,0.0025\nCC-MAIN-2023-50,tur,32881965,32700320,0.9804\nCC-MAIN-2023-50,uig,42783,42443,0.0013\nCC-MAIN-2023-50,ukr,12897819,12801699,0.3845\nCC-MAIN-2023-50,urd,890447,886957,0.0265\nCC-MAIN-2023-50,uzb,665517,662862,0.0198\nCC-MAIN-2023-50,ven,795,790,0.0000\nCC-MAIN-2023-50,vie,34514828,34216729,1.0291\nCC-MAIN-2023-50,vol,17471,17442,0.0005\nCC-MAIN-2023-50,war,51692,51433,0.0015\nCC-MAIN-2023-50,wol,6127,6077,0.0002\nCC-MAIN-2023-50,xho,56147,56047,0.0017\nCC-MAIN-2023-50,yid,54774,54654,0.0016\nCC-MAIN-2023-50,yor,25930,25887,0.0008\nCC-MAIN-2023-50,zha,1675,1671,0.0000\nCC-MAIN-2023-50,zho,170377731,169831708,5.0798\nCC-MAIN-2023-50,zul,61397,61286,0.0018\nCC-MAIN-2024-10,<unknown>,85800296,85800296,2.7619\nCC-MAIN-2024-10,aar,3062,3050,0.0001\nCC-MAIN-2024-10,abk,13765,13669,0.0004\nCC-MAIN-2024-10,afr,252801,251822,0.0081\nCC-MAIN-2024-10,aka,2503,2502,0.0001\nCC-MAIN-2024-10,amh,95995,95520,0.0031\nCC-MAIN-2024-10,ara,18251912,18154180,0.5875\nCC-MAIN-2024-10,asm,61843,61659,0.0020\nCC-MAIN-2024-10,aym,1693,1661,0.0001\nCC-MAIN-2024-10,aze,1872199,1865219,0.0603\nCC-MAIN-2024-10,bak,79002,78975,0.0025\nCC-MAIN-2024-10,bel,490955,489282,0.0158\nCC-MAIN-2024-10,ben,3183953,3174268,0.1025\nCC-MAIN-2024-10,bih,19778,19760,0.0006\nCC-MAIN-2024-10,bis,1921,1915,0.0001\nCC-MAIN-2024-10,bod,54561,54498,0.0018\nCC-MAIN-2024-10,bos,1491784,1484720,0.0480\nCC-MAIN-2024-10,bre,53334,53273,0.0017\nCC-MAIN-2024-10,bul,8938049,8902221,0.2877\nCC-MAIN-2024-10,cat,6376519,6315430,0.2053\nCC-MAIN-2024-10,ceb,51512,51490,0.0017\nCC-MA
IN-2024-10,ces,30750232,30505254,0.9899\nCC-MAIN-2024-10,chr,1378,1376,0.0000\nCC-MAIN-2024-10,cos,60504,60369,0.0019\nCC-MAIN-2024-10,crs,2565,2550,0.0001\nCC-MAIN-2024-10,cym,320036,317344,0.0103\nCC-MAIN-2024-10,dan,12716772,12602901,0.4094\nCC-MAIN-2024-10,deu,167591310,166202767,5.3948\nCC-MAIN-2024-10,div,81462,81334,0.0026\nCC-MAIN-2024-10,dzo,4040,4039,0.0001\nCC-MAIN-2024-10,ell,16772598,16694655,0.5399\nCC-MAIN-2024-10,eng,1443093126,1428499460,46.4536\nCC-MAIN-2024-10,epo,249738,248994,0.0080\nCC-MAIN-2024-10,est,4006577,3981272,0.1290\nCC-MAIN-2024-10,eus,1020713,1009464,0.0329\nCC-MAIN-2024-10,fao,127823,127226,0.0041\nCC-MAIN-2024-10,fas,20708641,20610261,0.6666\nCC-MAIN-2024-10,fij,3903,3849,0.0001\nCC-MAIN-2024-10,fin,11111827,11018231,0.3577\nCC-MAIN-2024-10,fra,134398716,133334446,4.3263\nCC-MAIN-2024-10,fry,74386,74036,0.0024\nCC-MAIN-2024-10,gla,40531,40378,0.0013\nCC-MAIN-2024-10,gle,190618,187423,0.0061\nCC-MAIN-2024-10,glg,1040186,1033865,0.0335\nCC-MAIN-2024-10,glv,9734,9713,0.0003\nCC-MAIN-2024-10,got,608,607,0.0000\nCC-MAIN-2024-10,grn,17917,17827,0.0006\nCC-MAIN-2024-10,guj,351526,346110,0.0113\nCC-MAIN-2024-10,hat,48583,48286,0.0016\nCC-MAIN-2024-10,hau,64521,64422,0.0021\nCC-MAIN-2024-10,haw,15219,15200,0.0005\nCC-MAIN-2024-10,heb,6849775,6790698,0.2205\nCC-MAIN-2024-10,hin,5542752,5523006,0.1784\nCC-MAIN-2024-10,hmn,15226,15197,0.0005\nCC-MAIN-2024-10,hrv,6091979,6061658,0.1961\nCC-MAIN-2024-10,hun,17538706,17437593,0.5646\nCC-MAIN-2024-10,hye,926524,921940,0.0298\nCC-MAIN-2024-10,ibo,17402,17350,0.0006\nCC-MAIN-2024-10,iku,5762,5741,0.0002\nCC-MAIN-2024-10,ile,9486,9432,0.0003\nCC-MAIN-2024-10,ina,15273,15219,0.0005\nCC-MAIN-2024-10,ind,26856832,26685797,0.8645\nCC-MAIN-2024-10,ipk,1452,1452,0.0000\nCC-MAIN-2024-10,isl,1239564,1232793,0.0399\nCC-MAIN-2024-10,ita,79953116,79438998,2.5737\nCC-MAIN-2024-10,jav,62529,62495,0.0020\nCC-MAIN-2024-10,jpn,158227264,157529103,5.0934\nCC-MAIN-2024-10,kal,27283,27061,0.0009\nCC-MAIN-2024-10,kan,39
7299,396433,0.0128\nCC-MAIN-2024-10,kas,22,22,0.0000\nCC-MAIN-2024-10,kat,1124367,1120147,0.0362\nCC-MAIN-2024-10,kaz,684286,680024,0.0220\nCC-MAIN-2024-10,kha,8393,8331,0.0003\nCC-MAIN-2024-10,khm,312850,311577,0.0101\nCC-MAIN-2024-10,kin,62878,62708,0.0020\nCC-MAIN-2024-10,kir,239904,238997,0.0077\nCC-MAIN-2024-10,kor,20203715,20117601,0.6504\nCC-MAIN-2024-10,kur,195951,195456,0.0063\nCC-MAIN-2024-10,lao,104352,103731,0.0034\nCC-MAIN-2024-10,lat,3500164,3493148,0.1127\nCC-MAIN-2024-10,lav,2595656,2573259,0.0836\nCC-MAIN-2024-10,lif,19,19,0.0000\nCC-MAIN-2024-10,lin,5304,5295,0.0002\nCC-MAIN-2024-10,lit,4754781,4718575,0.1531\nCC-MAIN-2024-10,ltz,104455,104135,0.0034\nCC-MAIN-2024-10,lug,5872,5865,0.0002\nCC-MAIN-2024-10,mal,666990,665020,0.0215\nCC-MAIN-2024-10,mar,725711,723069,0.0234\nCC-MAIN-2024-10,mfe,6161,6151,0.0002\nCC-MAIN-2024-10,mkd,1110535,1107253,0.0357\nCC-MAIN-2024-10,mlg,88468,88197,0.0028\nCC-MAIN-2024-10,mlt,120070,119363,0.0039\nCC-MAIN-2024-10,mon,436825,435760,0.0141\nCC-MAIN-2024-10,mri,26952,26817,0.0009\nCC-MAIN-2024-10,msa,2325678,2313970,0.0749\nCC-MAIN-2024-10,mya,349823,348910,0.0113\nCC-MAIN-2024-10,nau,1026,1018,0.0000\nCC-MAIN-2024-10,nep,1329517,1325465,0.0428\nCC-MAIN-2024-10,nld,60913977,60401506,1.9608\nCC-MAIN-2024-10,nno,427659,425290,0.0138\nCC-MAIN-2024-10,nor,9930519,9838244,0.3197\nCC-MAIN-2024-10,nso,1595,1595,0.0001\nCC-MAIN-2024-10,nya,15470,15458,0.0005\nCC-MAIN-2024-10,oci,85077,84852,0.0027\nCC-MAIN-2024-10,ori,147836,147633,0.0048\nCC-MAIN-2024-10,orm,14829,14822,0.0005\nCC-MAIN-2024-10,pan,174775,174331,0.0056\nCC-MAIN-2024-10,pol,53573565,53222150,1.7245\nCC-MAIN-2024-10,por,59886888,59535061,1.9278\nCC-MAIN-2024-10,pus,88739,88586,0.0029\nCC-MAIN-2024-10,que,18654,18652,0.0006\nCC-MAIN-2024-10,roh,40066,39786,0.0013\nCC-MAIN-2024-10,ron,16396114,16313282,0.5278\nCC-MAIN-2024-10,run,3455,3451,0.0001\nCC-MAIN-2024-10,rus,180473311,179559017,5.8095\nCC-MAIN-2024-10,sag,3704,3703,0.0001\nCC-MAIN-2024-10,san,92983,9256
2,0.0030\nCC-MAIN-2024-10,sco,19090,19014,0.0006\nCC-MAIN-2024-10,sin,248885,248133,0.0080\nCC-MAIN-2024-10,slk,11208782,11127803,0.3608\nCC-MAIN-2024-10,slv,4690873,4663240,0.1510\nCC-MAIN-2024-10,smo,16564,16499,0.0005\nCC-MAIN-2024-10,sna,15527,15492,0.0005\nCC-MAIN-2024-10,snd,48203,48141,0.0016\nCC-MAIN-2024-10,som,134478,133943,0.0043\nCC-MAIN-2024-10,sot,15708,15662,0.0005\nCC-MAIN-2024-10,spa,141228455,140200989,4.5462\nCC-MAIN-2024-10,sqi,1398427,1392990,0.0450\nCC-MAIN-2024-10,srp,6677508,6644658,0.2150\nCC-MAIN-2024-10,ssw,869,861,0.0000\nCC-MAIN-2024-10,sun,34227,34091,0.0011\nCC-MAIN-2024-10,sux,390,390,0.0000\nCC-MAIN-2024-10,swa,233908,233008,0.0075\nCC-MAIN-2024-10,swe,20173509,20012048,0.6494\nCC-MAIN-2024-10,syr,10590,10573,0.0003\nCC-MAIN-2024-10,tam,1319921,1314429,0.0425\nCC-MAIN-2024-10,tat,197275,196755,0.0064\nCC-MAIN-2024-10,tel,524152,522538,0.0169\nCC-MAIN-2024-10,tgk,158824,158488,0.0051\nCC-MAIN-2024-10,tgl,259855,259033,0.0084\nCC-MAIN-2024-10,tha,12739349,12671457,0.4101\nCC-MAIN-2024-10,tir,24611,24391,0.0008\nCC-MAIN-2024-10,ton,2539,2528,0.0001\nCC-MAIN-2024-10,tsn,3299,3171,0.0001\nCC-MAIN-2024-10,tso,1282,1280,0.0000\nCC-MAIN-2024-10,tuk,56579,56458,0.0018\nCC-MAIN-2024-10,tur,30643899,30491346,0.9864\nCC-MAIN-2024-10,uig,36569,36495,0.0012\nCC-MAIN-2024-10,ukr,13342135,13230096,0.4295\nCC-MAIN-2024-10,urd,882141,878954,0.0284\nCC-MAIN-2024-10,uzb,682364,679544,0.0220\nCC-MAIN-2024-10,ven,639,638,0.0000\nCC-MAIN-2024-10,vie,30669340,30464174,0.9873\nCC-MAIN-2024-10,vol,13568,13552,0.0004\nCC-MAIN-2024-10,war,58366,57832,0.0019\nCC-MAIN-2024-10,wol,3580,3575,0.0001\nCC-MAIN-2024-10,xho,52932,52887,0.0017\nCC-MAIN-2024-10,yid,47610,47526,0.0015\nCC-MAIN-2024-10,yor,24682,24624,0.0008\nCC-MAIN-2024-10,zha,1502,1498,0.0000\nCC-MAIN-2024-10,zho,129436236,128551170,4.1666\nCC-MAIN-2024-10,zul,54932,54873,0.0018\nCC-MAIN-2024-18,<unknown>,80114263,80114263,2.8748\nCC-MAIN-2024-18,aar,2481,2470,0.0001\nCC-MAIN-2024-18,abk,13012,12908,0.00
05\nCC-MAIN-2024-18,afr,250103,249341,0.0090\nCC-MAIN-2024-18,aka,1845,1843,0.0001\nCC-MAIN-2024-18,amh,88665,88168,0.0032\nCC-MAIN-2024-18,ara,17217672,17136665,0.6178\nCC-MAIN-2024-18,asm,61776,61712,0.0022\nCC-MAIN-2024-18,aym,2296,2237,0.0001\nCC-MAIN-2024-18,aze,1720367,1713862,0.0617\nCC-MAIN-2024-18,bak,77281,77254,0.0028\nCC-MAIN-2024-18,bel,516156,514375,0.0185\nCC-MAIN-2024-18,ben,2962532,2955252,0.1063\nCC-MAIN-2024-18,bih,19899,19844,0.0007\nCC-MAIN-2024-18,bis,2372,2355,0.0001\nCC-MAIN-2024-18,bod,47448,47181,0.0017\nCC-MAIN-2024-18,bos,1421756,1409822,0.0510\nCC-MAIN-2024-18,bre,76565,76450,0.0027\nCC-MAIN-2024-18,bul,8157439,8127446,0.2927\nCC-MAIN-2024-18,cat,5674434,5623064,0.2036\nCC-MAIN-2024-18,ceb,57405,57343,0.0021\nCC-MAIN-2024-18,ces,28220519,28011031,1.0126\nCC-MAIN-2024-18,chr,1374,1373,0.0000\nCC-MAIN-2024-18,cos,58251,58125,0.0021\nCC-MAIN-2024-18,crs,3013,2958,0.0001\nCC-MAIN-2024-18,cym,298376,296632,0.0107\nCC-MAIN-2024-18,dan,11957753,11870413,0.4291\nCC-MAIN-2024-18,deu,146671133,145600511,5.2631\nCC-MAIN-2024-18,div,67700,67626,0.0024\nCC-MAIN-2024-18,dzo,3572,3571,0.0001\nCC-MAIN-2024-18,ell,15548949,15489885,0.5579\nCC-MAIN-2024-18,eng,1268287767,1258271680,45.5105\nCC-MAIN-2024-18,epo,257756,257287,0.0092\nCC-MAIN-2024-18,est,3616180,3591868,0.1298\nCC-MAIN-2024-18,eus,923614,918373,0.0331\nCC-MAIN-2024-18,fao,111717,111387,0.0040\nCC-MAIN-2024-18,fas,19160480,19091543,0.6875\nCC-MAIN-2024-18,fij,3638,3620,0.0001\nCC-MAIN-2024-18,fin,10092341,10011678,0.3621\nCC-MAIN-2024-18,fra,120050726,119238541,4.3078\nCC-MAIN-2024-18,fry,86995,86817,0.0031\nCC-MAIN-2024-18,gla,37539,37461,0.0013\nCC-MAIN-2024-18,gle,189101,185213,0.0068\nCC-MAIN-2024-18,glg,1005535,1000442,0.0361\nCC-MAIN-2024-18,glv,9831,9822,0.0004\nCC-MAIN-2024-18,got,571,571,0.0000\nCC-MAIN-2024-18,grn,18200,18155,0.0007\nCC-MAIN-2024-18,guj,334983,331457,0.0120\nCC-MAIN-2024-18,hat,49695,49403,0.0018\nCC-MAIN-2024-18,hau,68993,68824,0.0025\nCC-MAIN-2024-18,haw,14241,142
18,0.0005\nCC-MAIN-2024-18,heb,6037880,6003347,0.2167\nCC-MAIN-2024-18,hin,5181082,5164532,0.1859\nCC-MAIN-2024-18,hmn,15295,15272,0.0005\nCC-MAIN-2024-18,hrv,5713721,5687153,0.2050\nCC-MAIN-2024-18,hun,16234757,16151717,0.5826\nCC-MAIN-2024-18,hye,906831,900710,0.0325\nCC-MAIN-2024-18,ibo,13996,13941,0.0005\nCC-MAIN-2024-18,iku,4886,4872,0.0002\nCC-MAIN-2024-18,ile,8080,8029,0.0003\nCC-MAIN-2024-18,ina,13840,13768,0.0005\nCC-MAIN-2024-18,ind,25611435,25458049,0.9190\nCC-MAIN-2024-18,ipk,1313,1310,0.0000\nCC-MAIN-2024-18,isl,1084945,1079499,0.0389\nCC-MAIN-2024-18,ita,72790793,72372667,2.6120\nCC-MAIN-2024-18,jav,57577,57533,0.0021\nCC-MAIN-2024-18,jpn,143727584,143161141,5.1574\nCC-MAIN-2024-18,kal,21340,21100,0.0008\nCC-MAIN-2024-18,kan,366103,365196,0.0131\nCC-MAIN-2024-18,kas,21,21,0.0000\nCC-MAIN-2024-18,kat,1043776,1040034,0.0375\nCC-MAIN-2024-18,kaz,669980,666514,0.0240\nCC-MAIN-2024-18,kha,6759,6722,0.0002\nCC-MAIN-2024-18,khm,307653,306688,0.0110\nCC-MAIN-2024-18,kin,58757,58565,0.0021\nCC-MAIN-2024-18,kir,238026,237208,0.0085\nCC-MAIN-2024-18,kor,19265949,19158635,0.6913\nCC-MAIN-2024-18,kur,169879,169633,0.0061\nCC-MAIN-2024-18,lao,106510,105805,0.0038\nCC-MAIN-2024-18,lat,3179308,3173283,0.1141\nCC-MAIN-2024-18,lav,2402864,2381340,0.0862\nCC-MAIN-2024-18,lif,20,20,0.0000\nCC-MAIN-2024-18,lin,5798,5793,0.0002\nCC-MAIN-2024-18,lit,4349315,4320407,0.1561\nCC-MAIN-2024-18,ltz,106218,105931,0.0038\nCC-MAIN-2024-18,lug,5366,5345,0.0002\nCC-MAIN-2024-18,mal,615725,614111,0.0221\nCC-MAIN-2024-18,mar,689125,687199,0.0247\nCC-MAIN-2024-18,mfe,4161,4158,0.0001\nCC-MAIN-2024-18,mkd,1059056,1056239,0.0380\nCC-MAIN-2024-18,mlg,86629,86242,0.0031\nCC-MAIN-2024-18,mlt,123914,121119,0.0044\nCC-MAIN-2024-18,mon,391151,389762,0.0140\nCC-MAIN-2024-18,mri,30241,30059,0.0011\nCC-MAIN-2024-18,msa,2078918,2069430,0.0746\nCC-MAIN-2024-18,mya,349744,349015,0.0126\nCC-MAIN-2024-18,nau,1027,1023,0.0000\nCC-MAIN-2024-18,nep,1239864,1237105,0.0445\nCC-MAIN-2024-18,nld,53231684,528471
38,1.9101\nCC-MAIN-2024-18,nno,395332,393172,0.0142\nCC-MAIN-2024-18,nor,8802737,8732458,0.3159\nCC-MAIN-2024-18,nso,1561,1560,0.0001\nCC-MAIN-2024-18,nya,14276,14224,0.0005\nCC-MAIN-2024-18,oci,91862,91709,0.0033\nCC-MAIN-2024-18,ori,141413,141115,0.0051\nCC-MAIN-2024-18,orm,16237,16221,0.0006\nCC-MAIN-2024-18,pan,164277,163932,0.0059\nCC-MAIN-2024-18,pol,48996624,48717619,1.7582\nCC-MAIN-2024-18,por,54356538,54087240,1.9505\nCC-MAIN-2024-18,pus,94327,94172,0.0034\nCC-MAIN-2024-18,que,17290,17283,0.0006\nCC-MAIN-2024-18,roh,27861,27553,0.0010\nCC-MAIN-2024-18,ron,15215050,15145828,0.5460\nCC-MAIN-2024-18,run,2021,2008,0.0001\nCC-MAIN-2024-18,rus,165751779,165007924,5.9477\nCC-MAIN-2024-18,sag,12757,12756,0.0005\nCC-MAIN-2024-18,san,98326,97918,0.0035\nCC-MAIN-2024-18,sco,16954,16915,0.0006\nCC-MAIN-2024-18,sin,232381,231398,0.0083\nCC-MAIN-2024-18,slk,10235494,10163139,0.3673\nCC-MAIN-2024-18,slv,4388621,4362921,0.1575\nCC-MAIN-2024-18,smo,15904,15855,0.0006\nCC-MAIN-2024-18,sna,15762,15686,0.0006\nCC-MAIN-2024-18,snd,44181,44158,0.0016\nCC-MAIN-2024-18,som,132012,131695,0.0047\nCC-MAIN-2024-18,sot,16186,16108,0.0006\nCC-MAIN-2024-18,spa,128029443,127236557,4.5941\nCC-MAIN-2024-18,sqi,1309379,1304026,0.0470\nCC-MAIN-2024-18,srp,6148120,6123065,0.2206\nCC-MAIN-2024-18,ssw,704,703,0.0000\nCC-MAIN-2024-18,sun,25297,25280,0.0009\nCC-MAIN-2024-18,sux,288,288,0.0000\nCC-MAIN-2024-18,swa,222427,221909,0.0080\nCC-MAIN-2024-18,swe,18107263,17976360,0.6498\nCC-MAIN-2024-18,syr,8725,8711,0.0003\nCC-MAIN-2024-18,tam,1182549,1179012,0.0424\nCC-MAIN-2024-18,tat,190035,189587,0.0068\nCC-MAIN-2024-18,tel,538662,537011,0.0193\nCC-MAIN-2024-18,tgk,177800,177505,0.0064\nCC-MAIN-2024-18,tgl,246536,245803,0.0088\nCC-MAIN-2024-18,tha,11551587,11498877,0.4145\nCC-MAIN-2024-18,tir,22470,22266,0.0008\nCC-MAIN-2024-18,ton,3417,3404,0.0001\nCC-MAIN-2024-18,tsn,2367,2365,0.0001\nCC-MAIN-2024-18,tso,1288,1284,0.0000\nCC-MAIN-2024-18,tuk,50233,50078,0.0018\nCC-MAIN-2024-18,tur,29605530,29476341
,1.0623\nCC-MAIN-2024-18,uig,35648,35616,0.0013\nCC-MAIN-2024-18,ukr,12544639,12450456,0.4501\nCC-MAIN-2024-18,urd,870653,867942,0.0312\nCC-MAIN-2024-18,uzb,583642,581105,0.0209\nCC-MAIN-2024-18,ven,620,620,0.0000\nCC-MAIN-2024-18,vie,27264946,27084080,0.9784\nCC-MAIN-2024-18,vol,13875,13858,0.0005\nCC-MAIN-2024-18,war,61208,61019,0.0022\nCC-MAIN-2024-18,wol,3771,3763,0.0001\nCC-MAIN-2024-18,xho,47720,47653,0.0017\nCC-MAIN-2024-18,yid,46218,46157,0.0017\nCC-MAIN-2024-18,yor,21437,21398,0.0008\nCC-MAIN-2024-18,zha,1485,1484,0.0001\nCC-MAIN-2024-18,zho,123282101,122895570,4.4238\nCC-MAIN-2024-18,zul,55005,54914,0.0020\nCC-MAIN-2024-22,<unknown>,77479807,77479807,2.8592\nCC-MAIN-2024-22,aar,2477,2466,0.0001\nCC-MAIN-2024-22,abk,12913,12808,0.0005\nCC-MAIN-2024-22,afr,248627,248014,0.0092\nCC-MAIN-2024-22,aka,2883,2879,0.0001\nCC-MAIN-2024-22,amh,88184,87855,0.0033\nCC-MAIN-2024-22,ara,17214553,17134138,0.6353\nCC-MAIN-2024-22,asm,57044,56968,0.0021\nCC-MAIN-2024-22,aym,2549,2464,0.0001\nCC-MAIN-2024-22,aze,1601226,1595560,0.0591\nCC-MAIN-2024-22,bak,73752,73733,0.0027\nCC-MAIN-2024-22,bel,533545,531284,0.0197\nCC-MAIN-2024-22,ben,2922020,2915490,0.1078\nCC-MAIN-2024-22,bih,17481,17405,0.0006\nCC-MAIN-2024-22,bis,2212,2186,0.0001\nCC-MAIN-2024-22,bod,44689,44495,0.0016\nCC-MAIN-2024-22,bos,1370214,1361445,0.0506\nCC-MAIN-2024-22,bre,54336,54239,0.0020\nCC-MAIN-2024-22,bul,7813219,7781964,0.2883\nCC-MAIN-2024-22,cat,5544163,5493743,0.2046\nCC-MAIN-2024-22,ceb,56196,56150,0.0021\nCC-MAIN-2024-22,ces,30413178,30176434,1.1223\nCC-MAIN-2024-22,chr,1153,1152,0.0000\nCC-MAIN-2024-22,cos,53881,53735,0.0020\nCC-MAIN-2024-22,crs,2351,2319,0.0001\nCC-MAIN-2024-22,cym,307131,305610,0.0113\nCC-MAIN-2024-22,dan,12714581,12600611,0.4692\nCC-MAIN-2024-22,deu,150967674,149736820,5.5710\nCC-MAIN-2024-22,div,53026,52929,0.0020\nCC-MAIN-2024-22,dzo,4091,4088,0.0002\nCC-MAIN-2024-22,ell,14938432,14885935,0.5513\nCC-MAIN-2024-22,eng,1245710985,1236923080,45.9693\nCC-MAIN-2024-22,epo,227863,2
27486,0.0084\nCC-MAIN-2024-22,est,3812148,3786724,0.1407\nCC-MAIN-2024-22,eus,945611,939821,0.0349\nCC-MAIN-2024-22,fao,113002,112531,0.0042\nCC-MAIN-2024-22,fas,18445012,18379246,0.6807\nCC-MAIN-2024-22,fij,2507,2502,0.0001\nCC-MAIN-2024-22,fin,9520341,9449012,0.3513\nCC-MAIN-2024-22,fra,114239906,113470693,4.2157\nCC-MAIN-2024-22,fry,59304,59183,0.0022\nCC-MAIN-2024-22,gla,36861,36822,0.0014\nCC-MAIN-2024-22,gle,179931,176371,0.0066\nCC-MAIN-2024-22,glg,1038895,1033611,0.0383\nCC-MAIN-2024-22,glv,8468,8458,0.0003\nCC-MAIN-2024-22,got,551,550,0.0000\nCC-MAIN-2024-22,grn,18285,18229,0.0007\nCC-MAIN-2024-22,guj,316592,315625,0.0117\nCC-MAIN-2024-22,hat,49377,49255,0.0018\nCC-MAIN-2024-22,hau,68032,67688,0.0025\nCC-MAIN-2024-22,haw,15049,15029,0.0006\nCC-MAIN-2024-22,heb,6108146,6080169,0.2254\nCC-MAIN-2024-22,hin,5028546,5013365,0.1856\nCC-MAIN-2024-22,hmn,14776,14762,0.0005\nCC-MAIN-2024-22,hrv,5306813,5279805,0.1958\nCC-MAIN-2024-22,hun,15674449,15591987,0.5784\nCC-MAIN-2024-22,hye,863376,857645,0.0319\nCC-MAIN-2024-22,ibo,15134,15119,0.0006\nCC-MAIN-2024-22,iku,4556,4549,0.0002\nCC-MAIN-2024-22,ile,8402,8351,0.0003\nCC-MAIN-2024-22,ina,14620,14535,0.0005\nCC-MAIN-2024-22,ind,24132199,23939276,0.8905\nCC-MAIN-2024-22,ipk,1345,1340,0.0000\nCC-MAIN-2024-22,isl,1006074,1000320,0.0371\nCC-MAIN-2024-22,ita,65592255,65218869,2.4205\nCC-MAIN-2024-22,jav,55116,54776,0.0020\nCC-MAIN-2024-22,jpn,135042653,134541391,4.9833\nCC-MAIN-2024-22,kal,23787,23355,0.0009\nCC-MAIN-2024-22,kan,393836,392947,0.0145\nCC-MAIN-2024-22,kas,16,16,0.0000\nCC-MAIN-2024-22,kat,1003767,1001100,0.0370\nCC-MAIN-2024-22,kaz,676444,671870,0.0250\nCC-MAIN-2024-22,kha,7208,7194,0.0003\nCC-MAIN-2024-22,khm,289879,288959,0.0107\nCC-MAIN-2024-22,kin,61265,61100,0.0023\nCC-MAIN-2024-22,kir,253191,252580,0.0093\nCC-MAIN-2024-22,kor,18990638,18890568,0.7008\nCC-MAIN-2024-22,kur,168333,168144,0.0062\nCC-MAIN-2024-22,lao,103032,102302,0.0038\nCC-MAIN-2024-22,lat,3167310,3159506,0.1169\nCC-MAIN-2024-22,lav,2293
263,2272008,0.0846\nCC-MAIN-2024-22,lif,40,40,0.0000\nCC-MAIN-2024-22,lin,6082,6075,0.0002\nCC-MAIN-2024-22,lit,4138878,4112349,0.1527\nCC-MAIN-2024-22,ltz,99760,99448,0.0037\nCC-MAIN-2024-22,lug,5724,5712,0.0002\nCC-MAIN-2024-22,mal,612560,610541,0.0226\nCC-MAIN-2024-22,mar,746736,743424,0.0276\nCC-MAIN-2024-22,mfe,4416,4411,0.0002\nCC-MAIN-2024-22,mkd,1009552,1006646,0.0373\nCC-MAIN-2024-22,mlg,93878,93299,0.0035\nCC-MAIN-2024-22,mlt,126626,125640,0.0047\nCC-MAIN-2024-22,mon,391503,390176,0.0144\nCC-MAIN-2024-22,mri,24822,24702,0.0009\nCC-MAIN-2024-22,msa,2004541,1995878,0.0740\nCC-MAIN-2024-22,mya,345447,344711,0.0127\nCC-MAIN-2024-22,nau,1267,1262,0.0000\nCC-MAIN-2024-22,nep,1182915,1180383,0.0437\nCC-MAIN-2024-22,nld,49727141,49376582,1.8350\nCC-MAIN-2024-22,nno,397074,395288,0.0147\nCC-MAIN-2024-22,nor,8309369,8246437,0.3066\nCC-MAIN-2024-22,nso,1422,1419,0.0001\nCC-MAIN-2024-22,nya,13894,13858,0.0005\nCC-MAIN-2024-22,oci,97096,96996,0.0036\nCC-MAIN-2024-22,ori,146939,146439,0.0054\nCC-MAIN-2024-22,orm,16889,16818,0.0006\nCC-MAIN-2024-22,pan,158365,157966,0.0058\nCC-MAIN-2024-22,pol,46852510,46607867,1.7290\nCC-MAIN-2024-22,por,55300657,55029844,2.0407\nCC-MAIN-2024-22,pus,100627,100492,0.0037\nCC-MAIN-2024-22,que,14193,14188,0.0005\nCC-MAIN-2024-22,roh,28863,28413,0.0011\nCC-MAIN-2024-22,ron,14113555,14055023,0.5208\nCC-MAIN-2024-22,run,1394,1390,0.0001\nCC-MAIN-2024-22,rus,160299726,159538186,5.9154\nCC-MAIN-2024-22,sag,12805,12803,0.0005\nCC-MAIN-2024-22,san,93837,93532,0.0035\nCC-MAIN-2024-22,sco,16122,16081,0.0006\nCC-MAIN-2024-22,sin,263746,263114,0.0097\nCC-MAIN-2024-22,slk,9960732,9902236,0.3676\nCC-MAIN-2024-22,slv,3981793,3960388,0.1469\nCC-MAIN-2024-22,smo,15984,15927,0.0006\nCC-MAIN-2024-22,sna,15207,15163,0.0006\nCC-MAIN-2024-22,snd,41600,41558,0.0015\nCC-MAIN-2024-22,som,125994,125609,0.0046\nCC-MAIN-2024-22,sot,16346,16301,0.0006\nCC-MAIN-2024-22,spa,125134634,124381802,4.6177\nCC-MAIN-2024-22,sqi,1298778,1294352,0.0479\nCC-MAIN-2024-22,srp,5901
668,5875487,0.2178\nCC-MAIN-2024-22,ssw,702,697,0.0000\nCC-MAIN-2024-22,sun,26174,26147,0.0010\nCC-MAIN-2024-22,sux,264,263,0.0000\nCC-MAIN-2024-22,swa,244245,243616,0.0090\nCC-MAIN-2024-22,swe,17172888,17043416,0.6337\nCC-MAIN-2024-22,syr,6787,6766,0.0003\nCC-MAIN-2024-22,tam,1112051,1108483,0.0410\nCC-MAIN-2024-22,tat,195493,195159,0.0072\nCC-MAIN-2024-22,tel,562799,559038,0.0208\nCC-MAIN-2024-22,tgk,170561,170360,0.0063\nCC-MAIN-2024-22,tgl,391045,390505,0.0144\nCC-MAIN-2024-22,tha,10807176,10749036,0.3988\nCC-MAIN-2024-22,tir,20931,20798,0.0008\nCC-MAIN-2024-22,ton,2850,2842,0.0001\nCC-MAIN-2024-22,tsn,2518,2515,0.0001\nCC-MAIN-2024-22,tso,1166,1165,0.0000\nCC-MAIN-2024-22,tuk,50188,50081,0.0019\nCC-MAIN-2024-22,tur,30193345,30066799,1.1142\nCC-MAIN-2024-22,uig,28918,28889,0.0011\nCC-MAIN-2024-22,ukr,12088657,12015490,0.4461\nCC-MAIN-2024-22,urd,832965,830250,0.0307\nCC-MAIN-2024-22,uzb,549130,547190,0.0203\nCC-MAIN-2024-22,ven,606,602,0.0000\nCC-MAIN-2024-22,vie,26037948,25850486,0.9609\nCC-MAIN-2024-22,vol,15408,15385,0.0006\nCC-MAIN-2024-22,war,57455,57309,0.0021\nCC-MAIN-2024-22,wol,3805,3800,0.0001\nCC-MAIN-2024-22,xho,52476,52451,0.0019\nCC-MAIN-2024-22,yid,47964,47868,0.0018\nCC-MAIN-2024-22,yor,21049,21026,0.0008\nCC-MAIN-2024-22,zha,1804,1800,0.0001\nCC-MAIN-2024-22,zho,110159487,109770683,4.0651\nCC-MAIN-2024-22,zul,58676,58618,0.0022\nCC-MAIN-2024-26,<unknown>,87747258,87747258,3.1360\nCC-MAIN-2024-26,aar,2413,2401,0.0001\nCC-MAIN-2024-26,abk,12995,12898,0.0005\nCC-MAIN-2024-26,afr,237126,236639,0.0085\nCC-MAIN-2024-26,aka,2939,2938,0.0001\nCC-MAIN-2024-26,amh,89041,88742,0.0032\nCC-MAIN-2024-26,ara,18377345,18267394,0.6568\nCC-MAIN-2024-26,asm,58874,58815,0.0021\nCC-MAIN-2024-26,aym,2569,2536,0.0001\nCC-MAIN-2024-26,aze,1744047,1739033,0.0623\nCC-MAIN-2024-26,bak,75005,74975,0.0027\nCC-MAIN-2024-26,bel,421869,420776,0.0151\nCC-MAIN-2024-26,ben,3227310,3218011,0.1153\nCC-MAIN-2024-26,bih,19671,19634,0.0007\nCC-MAIN-2024-26,bis,2595,2581,0.0001\nCC-MAI
N-2024-26,bod,37515,37427,0.0013\nCC-MAIN-2024-26,bos,1416798,1411668,0.0506\nCC-MAIN-2024-26,bre,83129,82983,0.0030\nCC-MAIN-2024-26,bul,8116545,8085306,0.2901\nCC-MAIN-2024-26,cat,5628251,5583198,0.2011\nCC-MAIN-2024-26,ceb,53119,53071,0.0019\nCC-MAIN-2024-26,ces,30508793,30278502,1.0904\nCC-MAIN-2024-26,chr,903,903,0.0000\nCC-MAIN-2024-26,cos,54727,54625,0.0020\nCC-MAIN-2024-26,crs,3654,3628,0.0001\nCC-MAIN-2024-26,cym,305607,304436,0.0109\nCC-MAIN-2024-26,dan,12673385,12562115,0.4529\nCC-MAIN-2024-26,deu,153056149,151870610,5.4701\nCC-MAIN-2024-26,div,61344,61287,0.0022\nCC-MAIN-2024-26,dzo,5144,5140,0.0002\nCC-MAIN-2024-26,ell,15319986,15257765,0.5475\nCC-MAIN-2024-26,eng,1260650171,1251937249,45.0546\nCC-MAIN-2024-26,epo,236008,235580,0.0084\nCC-MAIN-2024-26,est,3862971,3837692,0.1381\nCC-MAIN-2024-26,eus,977997,971220,0.0350\nCC-MAIN-2024-26,fao,112136,111768,0.0040\nCC-MAIN-2024-26,fas,17991330,17932064,0.6430\nCC-MAIN-2024-26,fij,3663,3649,0.0001\nCC-MAIN-2024-26,fin,9787151,9721075,0.3498\nCC-MAIN-2024-26,fra,118008546,117240681,4.2175\nCC-MAIN-2024-26,fry,80689,80503,0.0029\nCC-MAIN-2024-26,gla,37097,37047,0.0013\nCC-MAIN-2024-26,gle,188809,186435,0.0067\nCC-MAIN-2024-26,glg,1096420,1090592,0.0392\nCC-MAIN-2024-26,glv,12363,12353,0.0004\nCC-MAIN-2024-26,got,533,533,0.0000\nCC-MAIN-2024-26,grn,20416,20352,0.0007\nCC-MAIN-2024-26,guj,332907,331400,0.0119\nCC-MAIN-2024-26,hat,53182,53034,0.0019\nCC-MAIN-2024-26,hau,83196,82843,0.0030\nCC-MAIN-2024-26,haw,16628,16595,0.0006\nCC-MAIN-2024-26,heb,6269539,6238119,0.2241\nCC-MAIN-2024-26,hin,5272881,5255113,0.1884\nCC-MAIN-2024-26,hmn,20056,20024,0.0007\nCC-MAIN-2024-26,hrv,5487297,5461168,0.1961\nCC-MAIN-2024-26,hun,15628284,15548553,0.5585\nCC-MAIN-2024-26,hye,920051,914035,0.0329\nCC-MAIN-2024-26,ibo,16032,16005,0.0006\nCC-MAIN-2024-26,iku,5357,5341,0.0002\nCC-MAIN-2024-26,ile,10470,10445,0.0004\nCC-MAIN-2024-26,ina,14102,14033,0.0005\nCC-MAIN-2024-26,ind,27070770,26882191,0.9675\nCC-MAIN-2024-26,ipk,2273,2268
,0.0001\nCC-MAIN-2024-26,isl,1076166,1070856,0.0385\nCC-MAIN-2024-26,ita,73810221,73384469,2.6379\nCC-MAIN-2024-26,jav,58566,58523,0.0021\nCC-MAIN-2024-26,jpn,133667653,133174249,4.7772\nCC-MAIN-2024-26,kal,22526,22307,0.0008\nCC-MAIN-2024-26,kan,426492,425494,0.0152\nCC-MAIN-2024-26,kas,20,20,0.0000\nCC-MAIN-2024-26,kat,1095215,1091747,0.0391\nCC-MAIN-2024-26,kaz,745986,740753,0.0267\nCC-MAIN-2024-26,kha,10607,10591,0.0004\nCC-MAIN-2024-26,khm,306608,305858,0.0110\nCC-MAIN-2024-26,kin,62558,62169,0.0022\nCC-MAIN-2024-26,kir,230441,229591,0.0082\nCC-MAIN-2024-26,kor,22361472,22259567,0.7992\nCC-MAIN-2024-26,kur,163340,162810,0.0058\nCC-MAIN-2024-26,lao,95796,95249,0.0034\nCC-MAIN-2024-26,lat,3250533,3243153,0.1162\nCC-MAIN-2024-26,lav,2461657,2440492,0.0880\nCC-MAIN-2024-26,lif,27,27,0.0000\nCC-MAIN-2024-26,lin,7468,7456,0.0003\nCC-MAIN-2024-26,lit,4411233,4379647,0.1577\nCC-MAIN-2024-26,ltz,103093,102785,0.0037\nCC-MAIN-2024-26,lug,5867,5858,0.0002\nCC-MAIN-2024-26,mal,646684,644836,0.0231\nCC-MAIN-2024-26,mar,737184,733740,0.0263\nCC-MAIN-2024-26,mfe,5265,5260,0.0002\nCC-MAIN-2024-26,mkd,1103126,1100016,0.0394\nCC-MAIN-2024-26,mlg,98038,97624,0.0035\nCC-MAIN-2024-26,mlt,120361,117756,0.0043\nCC-MAIN-2024-26,mon,426012,424588,0.0152\nCC-MAIN-2024-26,mri,31360,31245,0.0011\nCC-MAIN-2024-26,msa,2159135,2150657,0.0772\nCC-MAIN-2024-26,mya,370805,369661,0.0133\nCC-MAIN-2024-26,nau,1533,1530,0.0001\nCC-MAIN-2024-26,nep,1370601,1367727,0.0490\nCC-MAIN-2024-26,nld,51171827,50777534,1.8288\nCC-MAIN-2024-26,nno,366837,364909,0.0131\nCC-MAIN-2024-26,nor,8460796,8396694,0.3024\nCC-MAIN-2024-26,nso,1587,1586,0.0001\nCC-MAIN-2024-26,nya,15636,15600,0.0006\nCC-MAIN-2024-26,oci,87855,87733,0.0031\nCC-MAIN-2024-26,ori,164201,163822,0.0059\nCC-MAIN-2024-26,orm,15923,15895,0.0006\nCC-MAIN-2024-26,pan,167379,166710,0.0060\nCC-MAIN-2024-26,pol,46924882,46676006,1.6771\nCC-MAIN-2024-26,por,56608924,56342748,2.0232\nCC-MAIN-2024-26,pus,101567,101421,0.0036\nCC-MAIN-2024-26,que,14835,148
31,0.0005\nCC-MAIN-2024-26,roh,29979,29746,0.0011\nCC-MAIN-2024-26,ron,14448255,14385272,0.5164\nCC-MAIN-2024-26,run,2348,2345,0.0001\nCC-MAIN-2024-26,rus,159142632,158391215,5.6876\nCC-MAIN-2024-26,sag,8488,8488,0.0003\nCC-MAIN-2024-26,san,77852,77704,0.0028\nCC-MAIN-2024-26,sco,27689,27626,0.0010\nCC-MAIN-2024-26,sin,237567,236845,0.0085\nCC-MAIN-2024-26,slk,10366651,10301497,0.3705\nCC-MAIN-2024-26,slv,4267408,4243326,0.1525\nCC-MAIN-2024-26,smo,16119,16079,0.0006\nCC-MAIN-2024-26,sna,16833,16780,0.0006\nCC-MAIN-2024-26,snd,46180,46140,0.0017\nCC-MAIN-2024-26,som,126167,125664,0.0045\nCC-MAIN-2024-26,sot,15508,15452,0.0006\nCC-MAIN-2024-26,spa,125981038,125199497,4.5025\nCC-MAIN-2024-26,sqi,1352361,1347616,0.0483\nCC-MAIN-2024-26,srp,6109779,6084818,0.2184\nCC-MAIN-2024-26,ssw,1879,1877,0.0001\nCC-MAIN-2024-26,sun,26685,26660,0.0010\nCC-MAIN-2024-26,sux,259,259,0.0000\nCC-MAIN-2024-26,swa,265975,264987,0.0095\nCC-MAIN-2024-26,swe,17570300,17428652,0.6279\nCC-MAIN-2024-26,syr,7380,7374,0.0003\nCC-MAIN-2024-26,tam,1214534,1210639,0.0434\nCC-MAIN-2024-26,tat,198563,198145,0.0071\nCC-MAIN-2024-26,tel,586811,584409,0.0210\nCC-MAIN-2024-26,tgk,178986,178663,0.0064\nCC-MAIN-2024-26,tgl,341505,340759,0.0122\nCC-MAIN-2024-26,tha,11720226,11662670,0.4189\nCC-MAIN-2024-26,tir,21295,21192,0.0008\nCC-MAIN-2024-26,ton,2256,2243,0.0001\nCC-MAIN-2024-26,tsn,3209,3201,0.0001\nCC-MAIN-2024-26,tso,2256,2253,0.0001\nCC-MAIN-2024-26,tuk,53690,53574,0.0019\nCC-MAIN-2024-26,tur,33424119,33285398,1.1946\nCC-MAIN-2024-26,uig,32221,32162,0.0012\nCC-MAIN-2024-26,ukr,15009560,14469464,0.5364\nCC-MAIN-2024-26,urd,834144,831409,0.0298\nCC-MAIN-2024-26,uzb,583162,581316,0.0208\nCC-MAIN-2024-26,ven,556,554,0.0000\nCC-MAIN-2024-26,vie,27586303,27403140,0.9859\nCC-MAIN-2024-26,vol,14769,14742,0.0005\nCC-MAIN-2024-26,war,58875,58733,0.0021\nCC-MAIN-2024-26,wol,3659,3652,0.0001\nCC-MAIN-2024-26,xho,56986,56941,0.0020\nCC-MAIN-2024-26,yid,49268,49187,0.0018\nCC-MAIN-2024-26,yor,22396,22355,0.0008\nC
C-MAIN-2024-26,zha,2143,2135,0.0001\nCC-MAIN-2024-26,zho,136678773,136221271,4.8848\nCC-MAIN-2024-26,zul,60100,60030,0.0021\nCC-MAIN-2024-30,<unknown>,81516162,81516162,3.2009\nCC-MAIN-2024-30,aar,2113,2105,0.0001\nCC-MAIN-2024-30,abk,10396,10310,0.0004\nCC-MAIN-2024-30,afr,227178,226610,0.0089\nCC-MAIN-2024-30,aka,2615,2613,0.0001\nCC-MAIN-2024-30,amh,81917,81725,0.0032\nCC-MAIN-2024-30,ara,17522617,17427628,0.6881\nCC-MAIN-2024-30,asm,59989,59949,0.0024\nCC-MAIN-2024-30,aym,1712,1709,0.0001\nCC-MAIN-2024-30,aze,1733419,1728722,0.0681\nCC-MAIN-2024-30,bak,61530,61417,0.0024\nCC-MAIN-2024-30,bel,385074,383442,0.0151\nCC-MAIN-2024-30,ben,2744825,2739380,0.1078\nCC-MAIN-2024-30,bih,15449,15387,0.0006\nCC-MAIN-2024-30,bis,2814,2807,0.0001\nCC-MAIN-2024-30,bod,30641,30563,0.0012\nCC-MAIN-2024-30,bos,1318534,1312575,0.0518\nCC-MAIN-2024-30,bre,66346,66250,0.0026\nCC-MAIN-2024-30,bul,7634485,7609802,0.2998\nCC-MAIN-2024-30,cat,5110684,5069815,0.2007\nCC-MAIN-2024-30,ceb,47127,47101,0.0019\nCC-MAIN-2024-30,ces,26117446,25936259,1.0256\nCC-MAIN-2024-30,chr,640,638,0.0000\nCC-MAIN-2024-30,cos,48582,48515,0.0019\nCC-MAIN-2024-30,crs,3497,3466,0.0001\nCC-MAIN-2024-30,cym,266328,265516,0.0105\nCC-MAIN-2024-30,dan,11425650,11343265,0.4487\nCC-MAIN-2024-30,deu,134691398,133759760,5.2890\nCC-MAIN-2024-30,div,53641,53587,0.0021\nCC-MAIN-2024-30,dzo,4172,4166,0.0002\nCC-MAIN-2024-30,ell,14345300,14293277,0.5633\nCC-MAIN-2024-30,eng,1115192280,1108347171,43.7909\nCC-MAIN-2024-30,epo,249064,248595,0.0098\nCC-MAIN-2024-30,est,3271893,3254152,0.1285\nCC-MAIN-2024-30,eus,842903,837654,0.0331\nCC-MAIN-2024-30,fao,108929,108338,0.0043\nCC-MAIN-2024-30,fas,19520798,19458444,0.7665\nCC-MAIN-2024-30,fij,2304,2300,0.0001\nCC-MAIN-2024-30,fin,8842983,8789653,0.3472\nCC-MAIN-2024-30,fra,107495441,106881980,4.2211\nCC-MAIN-2024-30,fry,58919,58676,0.0023\nCC-MAIN-2024-30,gla,35831,35766,0.0014\nCC-MAIN-2024-30,gle,176453,175211,0.0069\nCC-MAIN-2024-30,glg,893010,889163,0.0351\nCC-MAIN-2024-30,glv,
9384,9369,0.0004\nCC-MAIN-2024-30,got,392,392,0.0000\nCC-MAIN-2024-30,grn,20987,20937,0.0008\nCC-MAIN-2024-30,guj,319631,318711,0.0126\nCC-MAIN-2024-30,hat,47699,47592,0.0019\nCC-MAIN-2024-30,hau,73139,72983,0.0029\nCC-MAIN-2024-30,haw,16473,16449,0.0006\nCC-MAIN-2024-30,heb,5968721,5940608,0.2344\nCC-MAIN-2024-30,hin,4940433,4925596,0.1940\nCC-MAIN-2024-30,hmn,14857,14816,0.0006\nCC-MAIN-2024-30,hrv,5392515,5370915,0.2118\nCC-MAIN-2024-30,hun,14377748,14317090,0.5646\nCC-MAIN-2024-30,hye,903134,897873,0.0355\nCC-MAIN-2024-30,ibo,15331,15310,0.0006\nCC-MAIN-2024-30,iku,5038,5018,0.0002\nCC-MAIN-2024-30,ile,11386,11342,0.0004\nCC-MAIN-2024-30,ina,12581,12553,0.0005\nCC-MAIN-2024-30,ind,26551458,26359445,1.0426\nCC-MAIN-2024-30,ipk,1472,1465,0.0001\nCC-MAIN-2024-30,isl,985663,981598,0.0387\nCC-MAIN-2024-30,ita,66407383,66066835,2.6077\nCC-MAIN-2024-30,jav,52041,51993,0.0020\nCC-MAIN-2024-30,jpn,122186890,121792676,4.7980\nCC-MAIN-2024-30,kal,20627,20400,0.0008\nCC-MAIN-2024-30,kan,404951,404091,0.0159\nCC-MAIN-2024-30,kas,17,17,0.0000\nCC-MAIN-2024-30,kat,1026124,1023373,0.0403\nCC-MAIN-2024-30,kaz,712174,709767,0.0280\nCC-MAIN-2024-30,kha,7646,7636,0.0003\nCC-MAIN-2024-30,khm,285103,284487,0.0112\nCC-MAIN-2024-30,kin,57832,57655,0.0023\nCC-MAIN-2024-30,kir,214132,213658,0.0084\nCC-MAIN-2024-30,kor,17908861,17838752,0.7032\nCC-MAIN-2024-30,kur,155957,155601,0.0061\nCC-MAIN-2024-30,lao,94054,93677,0.0037\nCC-MAIN-2024-30,lat,2773134,2767423,0.1089\nCC-MAIN-2024-30,lav,2246832,2235966,0.0882\nCC-MAIN-2024-30,lif,13,13,0.0000\nCC-MAIN-2024-30,lin,6597,6586,0.0003\nCC-MAIN-2024-30,lit,3946406,3922896,0.1550\nCC-MAIN-2024-30,ltz,88811,88604,0.0035\nCC-MAIN-2024-30,lug,4560,4556,0.0002\nCC-MAIN-2024-30,mal,626274,624827,0.0246\nCC-MAIN-2024-30,mar,721924,719268,0.0283\nCC-MAIN-2024-30,mfe,4835,4831,0.0002\nCC-MAIN-2024-30,mkd,999999,997084,0.0393\nCC-MAIN-2024-30,mlg,82463,82344,0.0032\nCC-MAIN-2024-30,mlt,112377,110384,0.0044\nCC-MAIN-2024-30,mon,399939,398639,0.0157\nCC-M
AIN-2024-30,mri,30552,30464,0.0012\nCC-MAIN-2024-30,msa,1871624,1865962,0.0735\nCC-MAIN-2024-30,mya,329741,328840,0.0129\nCC-MAIN-2024-30,nau,1278,1273,0.0001\nCC-MAIN-2024-30,nep,1283457,1281054,0.0504\nCC-MAIN-2024-30,nld,46389138,46111863,1.8216\nCC-MAIN-2024-30,nno,324712,323266,0.0128\nCC-MAIN-2024-30,nor,7730568,7684183,0.3036\nCC-MAIN-2024-30,nso,1249,1249,0.0000\nCC-MAIN-2024-30,nya,14527,14509,0.0006\nCC-MAIN-2024-30,oci,76853,76770,0.0030\nCC-MAIN-2024-30,ori,153911,153670,0.0060\nCC-MAIN-2024-30,orm,14750,14742,0.0006\nCC-MAIN-2024-30,pan,165205,164813,0.0065\nCC-MAIN-2024-30,pol,45745610,45535837,1.7963\nCC-MAIN-2024-30,por,54082208,53849556,2.1237\nCC-MAIN-2024-30,pus,89213,89076,0.0035\nCC-MAIN-2024-30,que,12024,12009,0.0005\nCC-MAIN-2024-30,roh,24196,23989,0.0010\nCC-MAIN-2024-30,ron,14721752,14669268,0.5781\nCC-MAIN-2024-30,run,1779,1777,0.0001\nCC-MAIN-2024-30,rus,155434524,154774924,6.1035\nCC-MAIN-2024-30,sag,8987,8987,0.0004\nCC-MAIN-2024-30,san,72683,72584,0.0029\nCC-MAIN-2024-30,sco,15636,15598,0.0006\nCC-MAIN-2024-30,sin,220892,220494,0.0087\nCC-MAIN-2024-30,slk,10243065,10183288,0.4022\nCC-MAIN-2024-30,slv,4106751,4086381,0.1613\nCC-MAIN-2024-30,smo,17479,17403,0.0007\nCC-MAIN-2024-30,sna,15557,15536,0.0006\nCC-MAIN-2024-30,snd,47388,47300,0.0019\nCC-MAIN-2024-30,som,116936,116462,0.0046\nCC-MAIN-2024-30,sot,15969,15949,0.0006\nCC-MAIN-2024-30,spa,116107570,115447818,4.5593\nCC-MAIN-2024-30,sqi,1283097,1278621,0.0504\nCC-MAIN-2024-30,srp,5839770,5818129,0.2293\nCC-MAIN-2024-30,ssw,885,885,0.0000\nCC-MAIN-2024-30,sun,26069,26045,0.0010\nCC-MAIN-2024-30,sux,221,221,0.0000\nCC-MAIN-2024-30,swa,256685,256061,0.0101\nCC-MAIN-2024-30,swe,17324871,17209929,0.6803\nCC-MAIN-2024-30,syr,8048,8036,0.0003\nCC-MAIN-2024-30,tam,1160666,1157859,0.0456\nCC-MAIN-2024-30,tat,176687,176434,0.0069\nCC-MAIN-2024-30,tel,529157,527315,0.0208\nCC-MAIN-2024-30,tgk,177665,177460,0.0070\nCC-MAIN-2024-30,tgl,244380,243279,0.0096\nCC-MAIN-2024-30,tha,10885937,10837417,0.
4275\nCC-MAIN-2024-30,tir,18943,18817,0.0007\nCC-MAIN-2024-30,ton,2448,2422,0.0001\nCC-MAIN-2024-30,tsn,2260,2257,0.0001\nCC-MAIN-2024-30,tso,1487,1484,0.0001\nCC-MAIN-2024-30,tuk,58879,58618,0.0023\nCC-MAIN-2024-30,tur,32597356,32489401,1.2800\nCC-MAIN-2024-30,uig,30318,30266,0.0012\nCC-MAIN-2024-30,ukr,14852506,14278852,0.5832\nCC-MAIN-2024-30,urd,771731,769824,0.0303\nCC-MAIN-2024-30,uzb,610081,608534,0.0240\nCC-MAIN-2024-30,ven,575,575,0.0000\nCC-MAIN-2024-30,vie,25804044,25635022,1.0133\nCC-MAIN-2024-30,vol,11701,11682,0.0005\nCC-MAIN-2024-30,war,53216,53070,0.0021\nCC-MAIN-2024-30,wol,5461,5458,0.0002\nCC-MAIN-2024-30,xho,48414,48389,0.0019\nCC-MAIN-2024-30,yid,48078,47994,0.0019\nCC-MAIN-2024-30,yor,21747,21721,0.0009\nCC-MAIN-2024-30,zha,1405,1401,0.0001\nCC-MAIN-2024-30,zho,130788958,130312411,5.1358\nCC-MAIN-2024-30,zul,59778,59723,0.0023\nCC-MAIN-2024-33,<unknown>,76264540,76264540,3.2930\nCC-MAIN-2024-33,aar,1834,1826,0.0001\nCC-MAIN-2024-33,abk,9780,9678,0.0004\nCC-MAIN-2024-33,afr,241667,240923,0.0104\nCC-MAIN-2024-33,aka,1720,1718,0.0001\nCC-MAIN-2024-33,amh,67580,67347,0.0029\nCC-MAIN-2024-33,ara,16469946,16395665,0.7112\nCC-MAIN-2024-33,asm,53006,52985,0.0023\nCC-MAIN-2024-33,aym,1930,1917,0.0001\nCC-MAIN-2024-33,aze,1713319,1707310,0.0740\nCC-MAIN-2024-33,bak,56742,56676,0.0025\nCC-MAIN-2024-33,bel,369306,368123,0.0159\nCC-MAIN-2024-33,ben,2799504,2794230,0.1209\nCC-MAIN-2024-33,bih,16827,16792,0.0007\nCC-MAIN-2024-33,bis,2769,2766,0.0001\nCC-MAIN-2024-33,bod,30273,30210,0.0013\nCC-MAIN-2024-33,bos,1234694,1228708,0.0533\nCC-MAIN-2024-33,bre,73393,73356,0.0032\nCC-MAIN-2024-33,bul,6956349,6934568,0.3004\nCC-MAIN-2024-33,cat,4736181,4702244,0.2045\nCC-MAIN-2024-33,ceb,46370,46238,0.0020\nCC-MAIN-2024-33,ces,23524700,23349578,1.0158\nCC-MAIN-2024-33,chr,798,798,0.0000\nCC-MAIN-2024-33,cos,47964,47868,0.0021\nCC-MAIN-2024-33,crs,3628,3616,0.0002\nCC-MAIN-2024-33,cym,250058,249263,0.0108\nCC-MAIN-2024-33,dan,10552960,10478840,0.4557\nCC-MAIN-2024-33,de
u,117868335,117104616,5.0895\nCC-MAIN-2024-33,div,51733,51687,0.0022\nCC-MAIN-2024-33,dzo,3363,3363,0.0001\nCC-MAIN-2024-33,ell,13438800,13389688,0.5803\nCC-MAIN-2024-33,eng,999987209,993844365,43.1787\nCC-MAIN-2024-33,epo,221315,220581,0.0096\nCC-MAIN-2024-33,est,3016139,3000861,0.1302\nCC-MAIN-2024-33,eus,798878,793866,0.0345\nCC-MAIN-2024-33,fao,104063,103759,0.0045\nCC-MAIN-2024-33,fas,17009451,16961738,0.7345\nCC-MAIN-2024-33,fij,2277,2274,0.0001\nCC-MAIN-2024-33,fin,7879950,7836103,0.3403\nCC-MAIN-2024-33,fra,98284699,97777352,4.2439\nCC-MAIN-2024-33,fry,62582,62393,0.0027\nCC-MAIN-2024-33,gla,34188,34025,0.0015\nCC-MAIN-2024-33,gle,171058,170021,0.0074\nCC-MAIN-2024-33,glg,832385,828770,0.0359\nCC-MAIN-2024-33,glv,7926,7916,0.0003\nCC-MAIN-2024-33,got,443,442,0.0000\nCC-MAIN-2024-33,grn,17903,17820,0.0008\nCC-MAIN-2024-33,guj,281414,280634,0.0122\nCC-MAIN-2024-33,hat,44363,44219,0.0019\nCC-MAIN-2024-33,hau,64214,63977,0.0028\nCC-MAIN-2024-33,haw,15578,15489,0.0007\nCC-MAIN-2024-33,heb,5494936,5474023,0.2373\nCC-MAIN-2024-33,hin,4674682,4659815,0.2018\nCC-MAIN-2024-33,hmn,13922,13846,0.0006\nCC-MAIN-2024-33,hrv,5149854,5132495,0.2224\nCC-MAIN-2024-33,hun,13483143,13428648,0.5822\nCC-MAIN-2024-33,hye,848278,843213,0.0366\nCC-MAIN-2024-33,ibo,14967,14900,0.0006\nCC-MAIN-2024-33,iku,4396,4386,0.0002\nCC-MAIN-2024-33,ile,12572,12537,0.0005\nCC-MAIN-2024-33,ina,11313,11285,0.0005\nCC-MAIN-2024-33,ind,25797142,25621054,1.1139\nCC-MAIN-2024-33,ipk,1271,1269,0.0001\nCC-MAIN-2024-33,isl,869750,866224,0.0376\nCC-MAIN-2024-33,ita,57714385,57445415,2.4921\nCC-MAIN-2024-33,jav,48364,48294,0.0021\nCC-MAIN-2024-33,jpn,112994242,112646383,4.8790\nCC-MAIN-2024-33,kal,18331,18124,0.0008\nCC-MAIN-2024-33,kan,389509,389033,0.0168\nCC-MAIN-2024-33,kas,18,18,0.0000\nCC-MAIN-2024-33,kat,950184,947307,0.0410\nCC-MAIN-2024-33,kaz,666394,663207,0.0288\nCC-MAIN-2024-33,kha,7176,7161,0.0003\nCC-MAIN-2024-33,khm,250203,249462,0.0108\nCC-MAIN-2024-33,kin,51704,51537,0.0022\nCC-MAIN-2024-33
,kir,214263,213751,0.0093\nCC-MAIN-2024-33,kor,16729791,16668127,0.7224\nCC-MAIN-2024-33,kur,164283,163832,0.0071\nCC-MAIN-2024-33,lao,81831,81508,0.0035\nCC-MAIN-2024-33,lat,2351948,2347294,0.1016\nCC-MAIN-2024-33,lav,2111082,2100985,0.0912\nCC-MAIN-2024-33,lif,25,25,0.0000\nCC-MAIN-2024-33,lin,8635,8624,0.0004\nCC-MAIN-2024-33,lit,3528625,3510083,0.1524\nCC-MAIN-2024-33,ltz,85250,84991,0.0037\nCC-MAIN-2024-33,lug,4318,4311,0.0002\nCC-MAIN-2024-33,mal,621966,620845,0.0269\nCC-MAIN-2024-33,mar,644499,642914,0.0278\nCC-MAIN-2024-33,mfe,5127,5122,0.0002\nCC-MAIN-2024-33,mkd,976963,973555,0.0422\nCC-MAIN-2024-33,mlg,77813,77533,0.0034\nCC-MAIN-2024-33,mlt,109519,108152,0.0047\nCC-MAIN-2024-33,mon,387245,386206,0.0167\nCC-MAIN-2024-33,mri,30782,30644,0.0013\nCC-MAIN-2024-33,msa,1811404,1806500,0.0782\nCC-MAIN-2024-33,mya,322602,321786,0.0139\nCC-MAIN-2024-33,nau,1237,1234,0.0001\nCC-MAIN-2024-33,nep,1233250,1231207,0.0533\nCC-MAIN-2024-33,nld,41272192,41039604,1.7821\nCC-MAIN-2024-33,nno,291517,290522,0.0126\nCC-MAIN-2024-33,nor,6852663,6816304,0.2959\nCC-MAIN-2024-33,nso,1141,1140,0.0000\nCC-MAIN-2024-33,nya,14152,14075,0.0006\nCC-MAIN-2024-33,oci,75588,75506,0.0033\nCC-MAIN-2024-33,ori,149192,148821,0.0064\nCC-MAIN-2024-33,orm,13571,13550,0.0006\nCC-MAIN-2024-33,pan,171055,170500,0.0074\nCC-MAIN-2024-33,pol,44795062,44598249,1.9342\nCC-MAIN-2024-33,por,51365206,51142942,2.2179\nCC-MAIN-2024-33,pus,74593,74409,0.0032\nCC-MAIN-2024-33,que,11541,11511,0.0005\nCC-MAIN-2024-33,roh,21856,21663,0.0009\nCC-MAIN-2024-33,ron,15146004,15094960,0.6540\nCC-MAIN-2024-33,run,1850,1847,0.0001\nCC-MAIN-2024-33,rus,144147625,143628805,6.2242\nCC-MAIN-2024-33,sag,9572,9572,0.0004\nCC-MAIN-2024-33,san,73215,73041,0.0032\nCC-MAIN-2024-33,sco,16810,16774,0.0007\nCC-MAIN-2024-33,sin,204247,203822,0.0088\nCC-MAIN-2024-33,slk,9392761,9340156,0.4056\nCC-MAIN-2024-33,slv,3705868,3682059,0.1600\nCC-MAIN-2024-33,smo,15118,15023,0.0007\nCC-MAIN-2024-33,sna,14992,14909,0.0006\nCC-MAIN-2024-33,snd,4
5255,45140,0.0020\nCC-MAIN-2024-33,som,115547,114578,0.0050\nCC-MAIN-2024-33,sot,14180,14118,0.0006\nCC-MAIN-2024-33,spa,106114426,105565131,4.5819\nCC-MAIN-2024-33,sqi,1175579,1173050,0.0508\nCC-MAIN-2024-33,srp,5639235,5620700,0.2435\nCC-MAIN-2024-33,ssw,779,777,0.0000\nCC-MAIN-2024-33,sun,23282,23220,0.0010\nCC-MAIN-2024-33,sux,222,221,0.0000\nCC-MAIN-2024-33,swa,232625,232212,0.0100\nCC-MAIN-2024-33,swe,16040948,15947300,0.6926\nCC-MAIN-2024-33,syr,7763,7756,0.0003\nCC-MAIN-2024-33,tam,1134375,1132159,0.0490\nCC-MAIN-2024-33,tat,165850,165638,0.0072\nCC-MAIN-2024-33,tel,504029,503112,0.0218\nCC-MAIN-2024-33,tgk,160080,159863,0.0069\nCC-MAIN-2024-33,tgl,217757,216466,0.0094\nCC-MAIN-2024-33,tha,9978185,9939421,0.4309\nCC-MAIN-2024-33,tir,17900,17815,0.0008\nCC-MAIN-2024-33,ton,2130,2121,0.0001\nCC-MAIN-2024-33,tsn,2112,2109,0.0001\nCC-MAIN-2024-33,tso,1199,1188,0.0001\nCC-MAIN-2024-33,tuk,56911,56530,0.0025\nCC-MAIN-2024-33,tur,29514788,29417870,1.2744\nCC-MAIN-2024-33,uig,27758,27682,0.0012\nCC-MAIN-2024-33,ukr,14043883,13613634,0.6064\nCC-MAIN-2024-33,urd,757623,756222,0.0327\nCC-MAIN-2024-33,uzb,573662,571749,0.0248\nCC-MAIN-2024-33,ven,589,589,0.0000\nCC-MAIN-2024-33,vie,24350515,24198846,1.0514\nCC-MAIN-2024-33,vol,10981,10959,0.0005\nCC-MAIN-2024-33,war,47123,46467,0.0020\nCC-MAIN-2024-33,wol,3873,3868,0.0002\nCC-MAIN-2024-33,xho,50976,50899,0.0022\nCC-MAIN-2024-33,yid,42535,42408,0.0018\nCC-MAIN-2024-33,yor,17392,17324,0.0008\nCC-MAIN-2024-33,zha,2233,2231,0.0001\nCC-MAIN-2024-33,zho,120234924,119764554,5.1917\nCC-MAIN-2024-33,zul,64503,64386,0.0028\nCC-MAIN-2024-38,<unknown>,74801525,74801525,2.6706\nCC-MAIN-2024-38,aar,2260,2246,0.0001\nCC-MAIN-2024-38,abk,14472,14408,0.0005\nCC-MAIN-2024-38,afr,236116,235508,0.0084\nCC-MAIN-2024-38,aka,3020,3016,0.0001\nCC-MAIN-2024-38,amh,77787,77529,0.0028\nCC-MAIN-2024-38,ara,18397435,18323295,0.6568\nCC-MAIN-2024-38,asm,63910,63792,0.0023\nCC-MAIN-2024-38,aym,2805,2779,0.0001\nCC-MAIN-2024-38,aze,1851131,1845347,0.0
661\nCC-MAIN-2024-38,bak,79593,79578,0.0028\nCC-MAIN-2024-38,bel,446314,445016,0.0159\nCC-MAIN-2024-38,ben,3009817,3003179,0.1075\nCC-MAIN-2024-38,bih,18653,18616,0.0007\nCC-MAIN-2024-38,bis,2536,2534,0.0001\nCC-MAIN-2024-38,bod,31465,31400,0.0011\nCC-MAIN-2024-38,bos,1357013,1349577,0.0484\nCC-MAIN-2024-38,bre,52168,52112,0.0019\nCC-MAIN-2024-38,bul,8237050,8214460,0.2941\nCC-MAIN-2024-38,cat,5610590,5581194,0.2003\nCC-MAIN-2024-38,ceb,46707,46617,0.0017\nCC-MAIN-2024-38,ces,30863804,30653393,1.1019\nCC-MAIN-2024-38,chr,1223,1222,0.0000\nCC-MAIN-2024-38,cos,52991,52864,0.0019\nCC-MAIN-2024-38,crs,3090,3074,0.0001\nCC-MAIN-2024-38,cym,279447,278348,0.0100\nCC-MAIN-2024-38,dan,12574235,12490333,0.4489\nCC-MAIN-2024-38,deu,152568820,151684117,5.4471\nCC-MAIN-2024-38,div,58797,58762,0.0021\nCC-MAIN-2024-38,dzo,4042,4041,0.0001\nCC-MAIN-2024-38,ell,15087526,15036556,0.5387\nCC-MAIN-2024-38,eng,1235782634,1228825491,44.1210\nCC-MAIN-2024-38,epo,228644,228127,0.0082\nCC-MAIN-2024-38,est,3847905,3826620,0.1374\nCC-MAIN-2024-38,eus,932793,928328,0.0333\nCC-MAIN-2024-38,fao,125884,125577,0.0045\nCC-MAIN-2024-38,fas,20137841,20078911,0.7190\nCC-MAIN-2024-38,fij,2734,2733,0.0001\nCC-MAIN-2024-38,fin,9910508,9856983,0.3538\nCC-MAIN-2024-38,fra,124058085,123425115,4.4292\nCC-MAIN-2024-38,fry,55416,55094,0.0020\nCC-MAIN-2024-38,gla,36921,36783,0.0013\nCC-MAIN-2024-38,gle,196501,194987,0.0070\nCC-MAIN-2024-38,glg,964890,959503,0.0344\nCC-MAIN-2024-38,glv,11357,11344,0.0004\nCC-MAIN-2024-38,got,672,672,0.0000\nCC-MAIN-2024-38,grn,22851,22771,0.0008\nCC-MAIN-2024-38,guj,315552,314886,0.0113\nCC-MAIN-2024-38,hat,48560,48425,0.0017\nCC-MAIN-2024-38,hau,65065,64679,0.0023\nCC-MAIN-2024-38,haw,15274,15092,0.0005\nCC-MAIN-2024-38,heb,6663633,6641558,0.2379\nCC-MAIN-2024-38,hin,5510008,5491805,0.1967\nCC-MAIN-2024-38,hmn,12918,12837,0.0005\nCC-MAIN-2024-38,hrv,5615423,5596547,0.2005\nCC-MAIN-2024-38,hun,16036462,15969620,0.5725\nCC-MAIN-2024-38,hye,922299,918226,0.0329\nCC-MAIN-2024-38,ib
o,15568,15475,0.0006\nCC-MAIN-2024-38,iku,5112,5103,0.0002\nCC-MAIN-2024-38,ile,13654,13630,0.0005\nCC-MAIN-2024-38,ina,14052,14027,0.0005\nCC-MAIN-2024-38,ind,29499767,29310365,1.0532\nCC-MAIN-2024-38,ipk,1417,1413,0.0001\nCC-MAIN-2024-38,isl,1093301,1089172,0.0390\nCC-MAIN-2024-38,ita,70650626,70337437,2.5224\nCC-MAIN-2024-38,jav,57019,56918,0.0020\nCC-MAIN-2024-38,jpn,143177579,142763948,5.1119\nCC-MAIN-2024-38,kal,23544,23298,0.0008\nCC-MAIN-2024-38,kan,405411,404815,0.0145\nCC-MAIN-2024-38,kas,18,18,0.0000\nCC-MAIN-2024-38,kat,1093958,1088245,0.0391\nCC-MAIN-2024-38,kaz,708398,706033,0.0253\nCC-MAIN-2024-38,kha,8615,8607,0.0003\nCC-MAIN-2024-38,khm,288613,287571,0.0103\nCC-MAIN-2024-38,kin,55161,55021,0.0020\nCC-MAIN-2024-38,kir,240460,239720,0.0086\nCC-MAIN-2024-38,kor,18798905,18726478,0.6712\nCC-MAIN-2024-38,kur,192612,192074,0.0069\nCC-MAIN-2024-38,lao,107661,107142,0.0038\nCC-MAIN-2024-38,lat,3203014,3197825,0.1144\nCC-MAIN-2024-38,lav,2535120,2521069,0.0905\nCC-MAIN-2024-38,lif,95,95,0.0000\nCC-MAIN-2024-38,lin,7243,7223,0.0003\nCC-MAIN-2024-38,lit,4531252,4508754,0.1618\nCC-MAIN-2024-38,ltz,103581,103282,0.0037\nCC-MAIN-2024-38,lug,5204,5177,0.0002\nCC-MAIN-2024-38,mal,684190,682509,0.0244\nCC-MAIN-2024-38,mar,675600,673884,0.0241\nCC-MAIN-2024-38,mfe,3918,3917,0.0001\nCC-MAIN-2024-38,mkd,1053058,1046991,0.0376\nCC-MAIN-2024-38,mlg,85640,85202,0.0031\nCC-MAIN-2024-38,mlt,120509,119268,0.0043\nCC-MAIN-2024-38,mon,417134,415743,0.0149\nCC-MAIN-2024-38,mri,26291,26153,0.0009\nCC-MAIN-2024-38,msa,2070260,2064662,0.0739\nCC-MAIN-2024-38,mya,368088,367151,0.0131\nCC-MAIN-2024-38,nau,1253,1248,0.0000\nCC-MAIN-2024-38,nep,1239589,1236721,0.0443\nCC-MAIN-2024-38,nld,53633402,53318308,1.9149\nCC-MAIN-2024-38,nno,379027,377554,0.0135\nCC-MAIN-2024-38,nor,8658377,8611833,0.3091\nCC-MAIN-2024-38,nso,1904,1898,0.0001\nCC-MAIN-2024-38,nya,14294,14198,0.0005\nCC-MAIN-2024-38,oci,97308,97187,0.0035\nCC-MAIN-2024-38,ori,149125,148833,0.0053\nCC-MAIN-2024-38,orm,14920,1490
0,0.0005\nCC-MAIN-2024-38,pan,190318,189541,0.0068\nCC-MAIN-2024-38,pol,52846066,52597750,1.8868\nCC-MAIN-2024-38,por,62013785,61757563,2.2141\nCC-MAIN-2024-38,pus,88591,88287,0.0032\nCC-MAIN-2024-38,que,16981,16960,0.0006\nCC-MAIN-2024-38,roh,28198,28025,0.0010\nCC-MAIN-2024-38,ron,15562592,15508538,0.5556\nCC-MAIN-2024-38,run,2094,2094,0.0001\nCC-MAIN-2024-38,rus,172412683,171790278,6.1556\nCC-MAIN-2024-38,sag,12501,12501,0.0004\nCC-MAIN-2024-38,san,84667,84482,0.0030\nCC-MAIN-2024-38,sco,17215,17169,0.0006\nCC-MAIN-2024-38,sin,236815,236366,0.0085\nCC-MAIN-2024-38,slk,11675388,11614539,0.4168\nCC-MAIN-2024-38,slv,4357902,4337137,0.1556\nCC-MAIN-2024-38,smo,16518,16404,0.0006\nCC-MAIN-2024-38,sna,15993,15911,0.0006\nCC-MAIN-2024-38,snd,43562,43385,0.0016\nCC-MAIN-2024-38,som,127266,126269,0.0045\nCC-MAIN-2024-38,sot,14066,13975,0.0005\nCC-MAIN-2024-38,spa,125394495,124797940,4.4769\nCC-MAIN-2024-38,sqi,1340356,1337088,0.0479\nCC-MAIN-2024-38,srp,6288275,6267190,0.2245\nCC-MAIN-2024-38,ssw,702,701,0.0000\nCC-MAIN-2024-38,sun,29272,29177,0.0010\nCC-MAIN-2024-38,sux,289,289,0.0000\nCC-MAIN-2024-38,swa,259161,258535,0.0093\nCC-MAIN-2024-38,swe,19209951,19102134,0.6859\nCC-MAIN-2024-38,syr,8309,8301,0.0003\nCC-MAIN-2024-38,tam,1229924,1227462,0.0439\nCC-MAIN-2024-38,tat,204843,204436,0.0073\nCC-MAIN-2024-38,tel,507009,506153,0.0181\nCC-MAIN-2024-38,tgk,169197,168852,0.0060\nCC-MAIN-2024-38,tgl,253394,251507,0.0090\nCC-MAIN-2024-38,tha,11592325,11543412,0.4139\nCC-MAIN-2024-38,tir,22736,22597,0.0008\nCC-MAIN-2024-38,ton,2581,2574,0.0001\nCC-MAIN-2024-38,tsn,2966,2963,0.0001\nCC-MAIN-2024-38,tso,1286,1278,0.0000\nCC-MAIN-2024-38,tuk,54454,54316,0.0019\nCC-MAIN-2024-38,tur,34528339,34413393,1.2328\nCC-MAIN-2024-38,uig,27546,27470,0.0010\nCC-MAIN-2024-38,ukr,15764922,15379441,0.5629\nCC-MAIN-2024-38,urd,835728,832560,0.0298\nCC-MAIN-2024-38,uzb,738616,736371,0.0264\nCC-MAIN-2024-38,ven,645,645,0.0000\nCC-MAIN-2024-38,vie,28939816,28780418,1.0332\nCC-MAIN-2024-38,vol,14135,
14114,0.0005\nCC-MAIN-2024-38,war,54423,54306,0.0019\nCC-MAIN-2024-38,wol,3970,3963,0.0001\nCC-MAIN-2024-38,xho,50285,50175,0.0018\nCC-MAIN-2024-38,yid,42158,42026,0.0015\nCC-MAIN-2024-38,yor,23222,23085,0.0008\nCC-MAIN-2024-38,zha,1779,1774,0.0001\nCC-MAIN-2024-38,zho,129584966,129089371,4.6266\nCC-MAIN-2024-38,zul,60168,59960,0.0021\nCC-MAIN-2024-42,<unknown>,81791281,81791281,3.2780\nCC-MAIN-2024-42,aar,2239,2231,0.0001\nCC-MAIN-2024-42,abk,12478,12426,0.0005\nCC-MAIN-2024-42,afr,257379,256851,0.0103\nCC-MAIN-2024-42,aka,3245,3243,0.0001\nCC-MAIN-2024-42,amh,75677,75328,0.0030\nCC-MAIN-2024-42,ara,16741132,16677949,0.6709\nCC-MAIN-2024-42,asm,60812,60723,0.0024\nCC-MAIN-2024-42,aym,2268,2251,0.0001\nCC-MAIN-2024-42,aze,1713701,1706040,0.0687\nCC-MAIN-2024-42,bak,72089,72049,0.0029\nCC-MAIN-2024-42,bel,405378,404154,0.0162\nCC-MAIN-2024-42,ben,2959065,2952660,0.1186\nCC-MAIN-2024-42,bih,14127,14089,0.0006\nCC-MAIN-2024-42,bis,3601,3588,0.0001\nCC-MAIN-2024-42,bod,36426,36232,0.0015\nCC-MAIN-2024-42,bos,1306203,1303276,0.0523\nCC-MAIN-2024-42,bre,84216,84167,0.0034\nCC-MAIN-2024-42,bul,7466418,7443423,0.2992\nCC-MAIN-2024-42,cat,5202242,5166138,0.2085\nCC-MAIN-2024-42,ceb,49577,49509,0.0020\nCC-MAIN-2024-42,ces,26523613,26331032,1.0630\nCC-MAIN-2024-42,chr,1137,1137,0.0000\nCC-MAIN-2024-42,cos,50203,50074,0.0020\nCC-MAIN-2024-42,crs,2858,2841,0.0001\nCC-MAIN-2024-42,cym,292253,291219,0.0117\nCC-MAIN-2024-42,dan,11578641,11490004,0.4640\nCC-MAIN-2024-42,deu,132338944,131500938,5.3038\nCC-MAIN-2024-42,div,57520,57472,0.0023\nCC-MAIN-2024-42,dzo,3534,3534,0.0001\nCC-MAIN-2024-42,ell,14293044,14246131,0.5728\nCC-MAIN-2024-42,eng,1083513299,1077124596,43.4241\nCC-MAIN-2024-42,epo,208797,208418,0.0084\nCC-MAIN-2024-42,est,3307831,3288496,0.1326\nCC-MAIN-2024-42,eus,999461,993610,0.0401\nCC-MAIN-2024-42,fao,120324,119958,0.0048\nCC-MAIN-2024-42,fas,17594396,17545147,0.7051\nCC-MAIN-2024-42,fij,2498,2498,0.0001\nCC-MAIN-2024-42,fin,8593516,8541494,0.3444\nCC-MAIN-2024-42,f
ra,109687926,109128005,4.3960\nCC-MAIN-2024-42,fry,71537,71367,0.0029\nCC-MAIN-2024-42,gla,34176,34100,0.0014\nCC-MAIN-2024-42,gle,175974,174578,0.0071\nCC-MAIN-2024-42,glg,909830,903845,0.0365\nCC-MAIN-2024-42,glv,8708,8692,0.0003\nCC-MAIN-2024-42,got,447,447,0.0000\nCC-MAIN-2024-42,grn,16269,16222,0.0007\nCC-MAIN-2024-42,guj,282755,282072,0.0113\nCC-MAIN-2024-42,hat,47165,47059,0.0019\nCC-MAIN-2024-42,hau,68262,67896,0.0027\nCC-MAIN-2024-42,haw,17704,17652,0.0007\nCC-MAIN-2024-42,heb,6169483,6145150,0.2473\nCC-MAIN-2024-42,hin,5211550,5198234,0.2089\nCC-MAIN-2024-42,hmn,14399,14351,0.0006\nCC-MAIN-2024-42,hrv,5362886,5344823,0.2149\nCC-MAIN-2024-42,hun,14096256,14032587,0.5649\nCC-MAIN-2024-42,hye,849092,845053,0.0340\nCC-MAIN-2024-42,ibo,16825,16778,0.0007\nCC-MAIN-2024-42,iku,5706,5703,0.0002\nCC-MAIN-2024-42,ile,9051,9018,0.0004\nCC-MAIN-2024-42,ina,13058,13045,0.0005\nCC-MAIN-2024-42,ind,28033891,27837647,1.1235\nCC-MAIN-2024-42,ipk,1736,1734,0.0001\nCC-MAIN-2024-42,isl,992003,987916,0.0398\nCC-MAIN-2024-42,ita,63082635,62785741,2.5282\nCC-MAIN-2024-42,jav,55212,55142,0.0022\nCC-MAIN-2024-42,jpn,125805829,125404049,5.0419\nCC-MAIN-2024-42,kal,22981,22822,0.0009\nCC-MAIN-2024-42,kan,355203,354744,0.0142\nCC-MAIN-2024-42,kas,15,15,0.0000\nCC-MAIN-2024-42,kat,1053050,1042575,0.0422\nCC-MAIN-2024-42,kaz,703746,701334,0.0282\nCC-MAIN-2024-42,kha,9020,9009,0.0004\nCC-MAIN-2024-42,khm,264291,263214,0.0106\nCC-MAIN-2024-42,kin,56377,56231,0.0023\nCC-MAIN-2024-42,kir,244370,243637,0.0098\nCC-MAIN-2024-42,kor,18435212,18366866,0.7388\nCC-MAIN-2024-42,kur,184030,183746,0.0074\nCC-MAIN-2024-42,lao,93468,92865,0.0037\nCC-MAIN-2024-42,lat,2512878,2508096,0.1007\nCC-MAIN-2024-42,lav,2350056,2334490,0.0942\nCC-MAIN-2024-42,lif,42,42,0.0000\nCC-MAIN-2024-42,lin,7514,7497,0.0003\nCC-MAIN-2024-42,lit,4162556,4141732,0.1668\nCC-MAIN-2024-42,ltz,99637,99363,0.0040\nCC-MAIN-2024-42,lug,5425,5381,0.0002\nCC-MAIN-2024-42,mal,670259,668501,0.0269\nCC-MAIN-2024-42,mar,643695,641895,0.0
258\nCC-MAIN-2024-42,mfe,3742,3735,0.0001\nCC-MAIN-2024-42,mkd,955225,952511,0.0383\nCC-MAIN-2024-42,mlg,90814,90491,0.0036\nCC-MAIN-2024-42,mlt,122428,120509,0.0049\nCC-MAIN-2024-42,mon,401925,400924,0.0161\nCC-MAIN-2024-42,mri,29912,29758,0.0012\nCC-MAIN-2024-42,msa,1963309,1957982,0.0787\nCC-MAIN-2024-42,mya,348788,347874,0.0140\nCC-MAIN-2024-42,nau,1092,1089,0.0000\nCC-MAIN-2024-42,nep,1229976,1227407,0.0493\nCC-MAIN-2024-42,nld,45275645,45000682,1.8145\nCC-MAIN-2024-42,nno,323831,322475,0.0130\nCC-MAIN-2024-42,nor,7636107,7593408,0.3060\nCC-MAIN-2024-42,nso,1346,1345,0.0001\nCC-MAIN-2024-42,nya,14940,14904,0.0006\nCC-MAIN-2024-42,oci,85086,84852,0.0034\nCC-MAIN-2024-42,ori,141619,141222,0.0057\nCC-MAIN-2024-42,orm,12658,12640,0.0005\nCC-MAIN-2024-42,pan,196613,195754,0.0079\nCC-MAIN-2024-42,pol,45076434,44867835,1.8065\nCC-MAIN-2024-42,por,57754152,57512240,2.3146\nCC-MAIN-2024-42,pus,86340,86196,0.0035\nCC-MAIN-2024-42,que,13575,13525,0.0005\nCC-MAIN-2024-42,roh,25137,24968,0.0010\nCC-MAIN-2024-42,ron,14916026,14861884,0.5978\nCC-MAIN-2024-42,run,1670,1664,0.0001\nCC-MAIN-2024-42,rus,150820146,150248225,6.0444\nCC-MAIN-2024-42,sag,10405,10405,0.0004\nCC-MAIN-2024-42,san,83674,83424,0.0034\nCC-MAIN-2024-42,sco,17887,17842,0.0007\nCC-MAIN-2024-42,sin,224196,223888,0.0090\nCC-MAIN-2024-42,slk,9244448,9200711,0.3705\nCC-MAIN-2024-42,slv,3886713,3861262,0.1558\nCC-MAIN-2024-42,smo,16623,16542,0.0007\nCC-MAIN-2024-42,sna,15401,15349,0.0006\nCC-MAIN-2024-42,snd,42464,42342,0.0017\nCC-MAIN-2024-42,som,124950,123993,0.0050\nCC-MAIN-2024-42,sot,15071,15024,0.0006\nCC-MAIN-2024-42,spa,113249321,112711686,4.5387\nCC-MAIN-2024-42,sqi,1239080,1236250,0.0497\nCC-MAIN-2024-42,srp,5391996,5371839,0.2161\nCC-MAIN-2024-42,ssw,799,797,0.0000\nCC-MAIN-2024-42,sun,26131,26061,0.0010\nCC-MAIN-2024-42,sux,314,313,0.0000\nCC-MAIN-2024-42,swa,240410,239627,0.0096\nCC-MAIN-2024-42,swe,16590009,16496719,0.6649\nCC-MAIN-2024-42,syr,7868,7861,0.0003\nCC-MAIN-2024-42,tam,1179123,1176780,0.0
473\nCC-MAIN-2024-42,tat,215926,215677,0.0087\nCC-MAIN-2024-42,tel,548086,547201,0.0220\nCC-MAIN-2024-42,tgk,160623,160335,0.0064\nCC-MAIN-2024-42,tgl,220739,219855,0.0088\nCC-MAIN-2024-42,tha,10158510,10111907,0.4071\nCC-MAIN-2024-42,tir,17881,17747,0.0007\nCC-MAIN-2024-42,ton,1991,1980,0.0001\nCC-MAIN-2024-42,tsn,2808,2802,0.0001\nCC-MAIN-2024-42,tso,1474,1470,0.0001\nCC-MAIN-2024-42,tuk,52562,52462,0.0021\nCC-MAIN-2024-42,tur,30995273,30885982,1.2422\nCC-MAIN-2024-42,uig,25965,25918,0.0010\nCC-MAIN-2024-42,ukr,15063301,14701575,0.6037\nCC-MAIN-2024-42,urd,763665,761940,0.0306\nCC-MAIN-2024-42,uzb,730957,728668,0.0293\nCC-MAIN-2024-42,ven,673,671,0.0000\nCC-MAIN-2024-42,vie,26084993,25900759,1.0454\nCC-MAIN-2024-42,vol,12814,12792,0.0005\nCC-MAIN-2024-42,war,57329,57220,0.0023\nCC-MAIN-2024-42,wol,3500,3496,0.0001\nCC-MAIN-2024-42,xho,57372,57216,0.0023\nCC-MAIN-2024-42,yid,42276,42191,0.0017\nCC-MAIN-2024-42,yor,24547,24265,0.0010\nCC-MAIN-2024-42,zha,2587,2585,0.0001\nCC-MAIN-2024-42,zho,120090598,119635961,4.8129\nCC-MAIN-2024-42,zul,63272,63157,0.0025\nCC-MAIN-2024-46,<unknown>,81132463,81132463,3.0185\nCC-MAIN-2024-46,aar,2942,2923,0.0001\nCC-MAIN-2024-46,abk,13268,13186,0.0005\nCC-MAIN-2024-46,afr,262061,261583,0.0097\nCC-MAIN-2024-46,aka,2289,2288,0.0001\nCC-MAIN-2024-46,amh,74149,73887,0.0028\nCC-MAIN-2024-46,ara,18344689,18274530,0.6825\nCC-MAIN-2024-46,asm,69704,69626,0.0026\nCC-MAIN-2024-46,aym,1774,1773,0.0001\nCC-MAIN-2024-46,aze,1697797,1691472,0.0632\nCC-MAIN-2024-46,bak,75028,74969,0.0028\nCC-MAIN-2024-46,bel,428267,427097,0.0159\nCC-MAIN-2024-46,ben,3109039,3102840,0.1157\nCC-MAIN-2024-46,bih,13998,13978,0.0005\nCC-MAIN-2024-46,bis,3253,3250,0.0001\nCC-MAIN-2024-46,bod,37260,36959,0.0014\nCC-MAIN-2024-46,bos,1390386,1386802,0.0517\nCC-MAIN-2024-46,bre,58576,58481,0.0022\nCC-MAIN-2024-46,bul,7830069,7807909,0.2913\nCC-MAIN-2024-46,cat,5370705,5337676,0.1998\nCC-MAIN-2024-46,ceb,50077,50024,0.0019\nCC-MAIN-2024-46,ces,27367515,27188104,1.0182\nCC-MA
IN-2024-46,chr,825,825,0.0000\nCC-MAIN-2024-46,cos,55103,55011,0.0021\nCC-MAIN-2024-46,crs,2853,2847,0.0001\nCC-MAIN-2024-46,cym,324599,323125,0.0121\nCC-MAIN-2024-46,dan,12637983,12552768,0.4702\nCC-MAIN-2024-46,deu,143428305,142603353,5.3362\nCC-MAIN-2024-46,div,60689,60663,0.0023\nCC-MAIN-2024-46,dzo,4442,4441,0.0002\nCC-MAIN-2024-46,ell,15563778,15515421,0.5791\nCC-MAIN-2024-46,eng,1155554705,1149249615,42.9924\nCC-MAIN-2024-46,epo,234033,233680,0.0087\nCC-MAIN-2024-46,est,3580363,3559960,0.1332\nCC-MAIN-2024-46,eus,966440,961498,0.0360\nCC-MAIN-2024-46,fao,120661,120213,0.0045\nCC-MAIN-2024-46,fas,19854104,19802178,0.7387\nCC-MAIN-2024-46,fij,2847,2841,0.0001\nCC-MAIN-2024-46,fin,9297001,9247224,0.3459\nCC-MAIN-2024-46,fra,117030857,116431650,4.3541\nCC-MAIN-2024-46,fry,55038,54868,0.0020\nCC-MAIN-2024-46,gla,34522,34452,0.0013\nCC-MAIN-2024-46,gle,174162,173328,0.0065\nCC-MAIN-2024-46,glg,874520,868608,0.0325\nCC-MAIN-2024-46,glv,9951,9929,0.0004\nCC-MAIN-2024-46,got,490,490,0.0000\nCC-MAIN-2024-46,grn,21424,21364,0.0008\nCC-MAIN-2024-46,guj,330527,329902,0.0123\nCC-MAIN-2024-46,hat,51031,50898,0.0019\nCC-MAIN-2024-46,hau,71117,70718,0.0026\nCC-MAIN-2024-46,haw,19963,19923,0.0007\nCC-MAIN-2024-46,heb,6767347,6743566,0.2518\nCC-MAIN-2024-46,hin,5552268,5537403,0.2066\nCC-MAIN-2024-46,hmn,16458,16415,0.0006\nCC-MAIN-2024-46,hrv,6043330,6022904,0.2248\nCC-MAIN-2024-46,hun,15266264,15201367,0.5680\nCC-MAIN-2024-46,hye,914074,909665,0.0340\nCC-MAIN-2024-46,ibo,16866,16817,0.0006\nCC-MAIN-2024-46,iku,5635,5621,0.0002\nCC-MAIN-2024-46,ile,10011,9980,0.0004\nCC-MAIN-2024-46,ina,15111,15078,0.0006\nCC-MAIN-2024-46,ind,30066768,29860494,1.1186\nCC-MAIN-2024-46,ipk,1574,1571,0.0001\nCC-MAIN-2024-46,isl,1075904,1071717,0.0400\nCC-MAIN-2024-46,ita,67067190,66779634,2.4952\nCC-MAIN-2024-46,jav,57667,57601,0.0021\nCC-MAIN-2024-46,jpn,138324031,137935609,5.1463\nCC-MAIN-2024-46,kal,23987,23595,0.0009\nCC-MAIN-2024-46,kan,380991,379764,0.0142\nCC-MAIN-2024-46,kas,22,22,0.0000\
nCC-MAIN-2024-46,kat,1107571,1104663,0.0412\nCC-MAIN-2024-46,kaz,731749,726454,0.0272\nCC-MAIN-2024-46,kha,11443,11428,0.0004\nCC-MAIN-2024-46,khm,281981,281338,0.0105\nCC-MAIN-2024-46,kin,56554,56454,0.0021\nCC-MAIN-2024-46,kir,243869,243312,0.0091\nCC-MAIN-2024-46,kor,19426897,19357553,0.7228\nCC-MAIN-2024-46,kur,191223,190658,0.0071\nCC-MAIN-2024-46,lao,93249,92818,0.0035\nCC-MAIN-2024-46,lat,3414580,3407776,0.1270\nCC-MAIN-2024-46,lav,2425212,2407632,0.0902\nCC-MAIN-2024-46,lif,57,57,0.0000\nCC-MAIN-2024-46,lin,7679,7665,0.0003\nCC-MAIN-2024-46,lit,4297823,4275951,0.1599\nCC-MAIN-2024-46,ltz,105435,105179,0.0039\nCC-MAIN-2024-46,lug,4666,4659,0.0002\nCC-MAIN-2024-46,mal,724320,722009,0.0269\nCC-MAIN-2024-46,mar,737173,735227,0.0274\nCC-MAIN-2024-46,mfe,3844,3833,0.0001\nCC-MAIN-2024-46,mkd,1029521,1027149,0.0383\nCC-MAIN-2024-46,mlg,78089,77934,0.0029\nCC-MAIN-2024-46,mlt,117888,116766,0.0044\nCC-MAIN-2024-46,mon,408709,407451,0.0152\nCC-MAIN-2024-46,mri,30461,30319,0.0011\nCC-MAIN-2024-46,msa,2069184,2062440,0.0770\nCC-MAIN-2024-46,mya,350620,349767,0.0130\nCC-MAIN-2024-46,nau,1274,1266,0.0000\nCC-MAIN-2024-46,nep,1404261,1400690,0.0522\nCC-MAIN-2024-46,nld,49108754,48824021,1.8271\nCC-MAIN-2024-46,nno,371114,366165,0.0138\nCC-MAIN-2024-46,nor,8073489,8028744,0.3004\nCC-MAIN-2024-46,nso,2084,2083,0.0001\nCC-MAIN-2024-46,nya,14363,14322,0.0005\nCC-MAIN-2024-46,oci,87494,87302,0.0033\nCC-MAIN-2024-46,ori,155821,155593,0.0058\nCC-MAIN-2024-46,orm,14112,14102,0.0005\nCC-MAIN-2024-46,pan,215558,214671,0.0080\nCC-MAIN-2024-46,pol,49682575,49476253,1.8484\nCC-MAIN-2024-46,por,62603582,62353834,2.3292\nCC-MAIN-2024-46,pus,85512,85386,0.0032\nCC-MAIN-2024-46,que,15601,15584,0.0006\nCC-MAIN-2024-46,roh,29983,29680,0.0011\nCC-MAIN-2024-46,ron,16571613,16516286,0.6165\nCC-MAIN-2024-46,run,2209,2208,0.0001\nCC-MAIN-2024-46,rus,166895517,166264702,6.2093\nCC-MAIN-2024-46,sag,11514,11512,0.0004\nCC-MAIN-2024-46,san,88890,88683,0.0033\nCC-MAIN-2024-46,sco,20076,20028,0.0007\nC
C-MAIN-2024-46,sin,235519,235186,0.0088\nCC-MAIN-2024-46,slk,9967455,9924962,0.3708\nCC-MAIN-2024-46,slv,4368882,4343130,0.1625\nCC-MAIN-2024-46,smo,15912,15830,0.0006\nCC-MAIN-2024-46,sna,14924,14874,0.0006\nCC-MAIN-2024-46,snd,41127,40966,0.0015\nCC-MAIN-2024-46,som,135052,134519,0.0050\nCC-MAIN-2024-46,sot,16176,16072,0.0006\nCC-MAIN-2024-46,spa,124052311,123497642,4.6154\nCC-MAIN-2024-46,sqi,1332983,1329917,0.0496\nCC-MAIN-2024-46,srp,5942774,5919623,0.2211\nCC-MAIN-2024-46,ssw,926,924,0.0000\nCC-MAIN-2024-46,sun,27432,27374,0.0010\nCC-MAIN-2024-46,sux,231,231,0.0000\nCC-MAIN-2024-46,swa,245650,245025,0.0091\nCC-MAIN-2024-46,swe,17679461,17582637,0.6578\nCC-MAIN-2024-46,syr,9836,9811,0.0004\nCC-MAIN-2024-46,tam,1207901,1205534,0.0449\nCC-MAIN-2024-46,tat,204537,204194,0.0076\nCC-MAIN-2024-46,tel,533921,532368,0.0199\nCC-MAIN-2024-46,tgk,181059,180814,0.0067\nCC-MAIN-2024-46,tgl,236197,235032,0.0088\nCC-MAIN-2024-46,tha,11364366,11310769,0.4228\nCC-MAIN-2024-46,tir,19006,18924,0.0007\nCC-MAIN-2024-46,ton,2901,2875,0.0001\nCC-MAIN-2024-46,tsn,2739,2733,0.0001\nCC-MAIN-2024-46,tso,2213,2207,0.0001\nCC-MAIN-2024-46,tuk,55514,55407,0.0021\nCC-MAIN-2024-46,tur,33542246,33425493,1.2479\nCC-MAIN-2024-46,uig,29715,29675,0.0011\nCC-MAIN-2024-46,ukr,16386581,15999151,0.6097\nCC-MAIN-2024-46,urd,807051,804295,0.0300\nCC-MAIN-2024-46,uzb,613046,610977,0.0228\nCC-MAIN-2024-46,ven,993,989,0.0000\nCC-MAIN-2024-46,vie,27811795,27645864,1.0347\nCC-MAIN-2024-46,vol,13253,13227,0.0005\nCC-MAIN-2024-46,war,54186,54106,0.0020\nCC-MAIN-2024-46,wol,3963,3957,0.0001\nCC-MAIN-2024-46,xho,56477,56397,0.0021\nCC-MAIN-2024-46,yid,39441,39290,0.0015\nCC-MAIN-2024-46,yor,23738,23406,0.0009\nCC-MAIN-2024-46,zha,1620,1617,0.0001\nCC-MAIN-2024-46,zho,137756044,137388432,5.1252\nCC-MAIN-2024-46,zul,66260,66158,0.0025\nCC-MAIN-2024-51,<unknown>,80776963,80776963,3.0651\nCC-MAIN-2024-51,aar,1814,1806,0.0001\nCC-MAIN-2024-51,abk,14039,13951,0.0005\nCC-MAIN-2024-51,afr,250545,249778,0.0095\nCC-MAIN-2
024-51,aka,1893,1889,0.0001\nCC-MAIN-2024-51,amh,65659,65437,0.0025\nCC-MAIN-2024-51,ara,18019226,17929766,0.6837\nCC-MAIN-2024-51,asm,64916,64853,0.0025\nCC-MAIN-2024-51,aym,1671,1667,0.0001\nCC-MAIN-2024-51,aze,1619700,1614158,0.0615\nCC-MAIN-2024-51,bak,65212,65174,0.0025\nCC-MAIN-2024-51,bel,391272,389772,0.0148\nCC-MAIN-2024-51,ben,2987498,2981453,0.1134\nCC-MAIN-2024-51,bih,13463,13444,0.0005\nCC-MAIN-2024-51,bis,2352,2350,0.0001\nCC-MAIN-2024-51,bod,39297,39234,0.0015\nCC-MAIN-2024-51,bos,1383800,1380522,0.0525\nCC-MAIN-2024-51,bre,88438,88402,0.0034\nCC-MAIN-2024-51,bul,7861707,7836508,0.2983\nCC-MAIN-2024-51,cat,5244334,5209249,0.1990\nCC-MAIN-2024-51,ceb,47821,47757,0.0018\nCC-MAIN-2024-51,ces,26236025,26038433,0.9955\nCC-MAIN-2024-51,chr,699,696,0.0000\nCC-MAIN-2024-51,cos,49816,49719,0.0019\nCC-MAIN-2024-51,crs,2107,2096,0.0001\nCC-MAIN-2024-51,cym,288839,287466,0.0110\nCC-MAIN-2024-51,dan,11692398,11609735,0.4437\nCC-MAIN-2024-51,deu,142212554,141365379,5.3963\nCC-MAIN-2024-51,div,64678,64635,0.0025\nCC-MAIN-2024-51,dzo,4356,4356,0.0002\nCC-MAIN-2024-51,ell,15230193,15179513,0.5779\nCC-MAIN-2024-51,eng,1127889690,1121417327,42.7983\nCC-MAIN-2024-51,epo,186394,186045,0.0071\nCC-MAIN-2024-51,est,3491199,3471403,0.1325\nCC-MAIN-2024-51,eus,967013,961478,0.0367\nCC-MAIN-2024-51,fao,111317,110863,0.0042\nCC-MAIN-2024-51,fas,19610783,19546172,0.7441\nCC-MAIN-2024-51,fij,2351,2346,0.0001\nCC-MAIN-2024-51,fin,9249456,9198215,0.3510\nCC-MAIN-2024-51,fra,116244890,115627515,4.4110\nCC-MAIN-2024-51,fry,71581,71419,0.0027\nCC-MAIN-2024-51,gla,35298,35203,0.0013\nCC-MAIN-2024-51,gle,182090,181199,0.0069\nCC-MAIN-2024-51,glg,850750,844955,0.0323\nCC-MAIN-2024-51,glv,8991,8979,0.0003\nCC-MAIN-2024-51,got,414,414,0.0000\nCC-MAIN-2024-51,grn,20067,20034,0.0008\nCC-MAIN-2024-51,guj,309619,309029,0.0117\nCC-MAIN-2024-51,hat,49621,49475,0.0019\nCC-MAIN-2024-51,hau,71925,71472,0.0027\nCC-MAIN-2024-51,haw,16859,16802,0.0006\nCC-MAIN-2024-51,heb,6591598,6565396,0.2501\nCC-MAI
N-2024-51,hin,5257321,5244200,0.1995\nCC-MAIN-2024-51,hmn,14854,14765,0.0006\nCC-MAIN-2024-51,hrv,5825383,5803860,0.2210\nCC-MAIN-2024-51,hun,13627221,13568810,0.5171\nCC-MAIN-2024-51,hye,883531,880547,0.0335\nCC-MAIN-2024-51,ibo,17649,17524,0.0007\nCC-MAIN-2024-51,iku,5866,5855,0.0002\nCC-MAIN-2024-51,ile,8919,8885,0.0003\nCC-MAIN-2024-51,ina,13343,13320,0.0005\nCC-MAIN-2024-51,ind,29123660,28912628,1.1051\nCC-MAIN-2024-51,ipk,1875,1872,0.0001\nCC-MAIN-2024-51,isl,1076544,1072025,0.0408\nCC-MAIN-2024-51,ita,63615674,63344106,2.4139\nCC-MAIN-2024-51,jav,61546,61467,0.0023\nCC-MAIN-2024-51,jpn,139196220,138797908,5.2819\nCC-MAIN-2024-51,kal,21369,21160,0.0008\nCC-MAIN-2024-51,kan,349330,348549,0.0133\nCC-MAIN-2024-51,kas,21,21,0.0000\nCC-MAIN-2024-51,kat,1051485,1048894,0.0399\nCC-MAIN-2024-51,kaz,747400,743797,0.0284\nCC-MAIN-2024-51,kha,11332,11319,0.0004\nCC-MAIN-2024-51,khm,269767,268998,0.0102\nCC-MAIN-2024-51,kin,58165,57998,0.0022\nCC-MAIN-2024-51,kir,272303,271748,0.0103\nCC-MAIN-2024-51,kor,19976446,19907529,0.7580\nCC-MAIN-2024-51,kur,179584,178946,0.0068\nCC-MAIN-2024-51,lao,83653,83265,0.0032\nCC-MAIN-2024-51,lat,2737836,2733499,0.1039\nCC-MAIN-2024-51,lav,2365337,2344611,0.0898\nCC-MAIN-2024-51,lif,46,46,0.0000\nCC-MAIN-2024-51,lin,6096,6088,0.0002\nCC-MAIN-2024-51,lit,4264763,4244084,0.1618\nCC-MAIN-2024-51,ltz,101450,101189,0.0038\nCC-MAIN-2024-51,lug,3839,3828,0.0001\nCC-MAIN-2024-51,mal,670361,668243,0.0254\nCC-MAIN-2024-51,mar,713365,711481,0.0271\nCC-MAIN-2024-51,mfe,4071,4060,0.0002\nCC-MAIN-2024-51,mkd,975726,972819,0.0370\nCC-MAIN-2024-51,mlg,84474,84287,0.0032\nCC-MAIN-2024-51,mlt,90182,88541,0.0034\nCC-MAIN-2024-51,mon,407339,406227,0.0155\nCC-MAIN-2024-51,mri,31531,31384,0.0012\nCC-MAIN-2024-51,msa,2032931,2026982,0.0771\nCC-MAIN-2024-51,mya,337196,336470,0.0128\nCC-MAIN-2024-51,nau,1166,1163,0.0000\nCC-MAIN-2024-51,nep,1372719,1369220,0.0521\nCC-MAIN-2024-51,nld,47682015,47405263,1.8093\nCC-MAIN-2024-51,nno,431262,419265,0.0164\nCC-MAIN-2024
-51,nor,7966787,7916825,0.3023\nCC-MAIN-2024-51,nso,2810,2810,0.0001\nCC-MAIN-2024-51,nya,13537,13478,0.0005\nCC-MAIN-2024-51,oci,103005,102805,0.0039\nCC-MAIN-2024-51,ori,160041,159653,0.0061\nCC-MAIN-2024-51,orm,11796,11774,0.0004\nCC-MAIN-2024-51,pan,198448,197606,0.0075\nCC-MAIN-2024-51,pol,50261702,50044646,1.9072\nCC-MAIN-2024-51,por,61565427,61309432,2.3361\nCC-MAIN-2024-51,pus,86341,86183,0.0033\nCC-MAIN-2024-51,que,12951,12943,0.0005\nCC-MAIN-2024-51,roh,29886,29285,0.0011\nCC-MAIN-2024-51,ron,16063213,16007745,0.6095\nCC-MAIN-2024-51,run,1706,1706,0.0001\nCC-MAIN-2024-51,rus,162944109,162235945,6.1830\nCC-MAIN-2024-51,sag,6589,6589,0.0003\nCC-MAIN-2024-51,san,82123,81893,0.0031\nCC-MAIN-2024-51,sco,14716,14564,0.0006\nCC-MAIN-2024-51,sin,246004,245573,0.0093\nCC-MAIN-2024-51,slk,9471646,9429856,0.3594\nCC-MAIN-2024-51,slv,4156336,4126191,0.1577\nCC-MAIN-2024-51,smo,17118,17008,0.0006\nCC-MAIN-2024-51,sna,17871,17783,0.0007\nCC-MAIN-2024-51,snd,37858,37765,0.0014\nCC-MAIN-2024-51,som,124028,123818,0.0047\nCC-MAIN-2024-51,sot,16231,16006,0.0006\nCC-MAIN-2024-51,spa,120762894,120192647,4.5824\nCC-MAIN-2024-51,sqi,1204394,1201119,0.0457\nCC-MAIN-2024-51,srp,5805732,5783509,0.2203\nCC-MAIN-2024-51,ssw,732,727,0.0000\nCC-MAIN-2024-51,sun,27114,27051,0.0010\nCC-MAIN-2024-51,sux,302,302,0.0000\nCC-MAIN-2024-51,swa,219746,219308,0.0083\nCC-MAIN-2024-51,swe,16965363,16862913,0.6438\nCC-MAIN-2024-51,syr,7890,7858,0.0003\nCC-MAIN-2024-51,tam,1152592,1150401,0.0437\nCC-MAIN-2024-51,tat,222649,222411,0.0084\nCC-MAIN-2024-51,tel,529947,528838,0.0201\nCC-MAIN-2024-51,tgk,183732,183430,0.0070\nCC-MAIN-2024-51,tgl,223121,221961,0.0085\nCC-MAIN-2024-51,tha,11068508,11020693,0.4200\nCC-MAIN-2024-51,tir,18037,17968,0.0007\nCC-MAIN-2024-51,ton,2615,2583,0.0001\nCC-MAIN-2024-51,tsn,2460,2452,0.0001\nCC-MAIN-2024-51,tso,1638,1634,0.0001\nCC-MAIN-2024-51,tuk,56441,56323,0.0021\nCC-MAIN-2024-51,tur,33038464,32918864,1.2537\nCC-MAIN-2024-51,uig,32850,32796,0.0012\nCC-MAIN-2024-51,uk
r,16290360,15928561,0.6181\nCC-MAIN-2024-51,urd,770635,768362,0.0292\nCC-MAIN-2024-51,uzb,581198,579241,0.0221\nCC-MAIN-2024-51,ven,718,716,0.0000\nCC-MAIN-2024-51,vie,26704566,26532858,1.0133\nCC-MAIN-2024-51,vol,11301,11291,0.0004\nCC-MAIN-2024-51,war,54220,54132,0.0021\nCC-MAIN-2024-51,wol,3379,3375,0.0001\nCC-MAIN-2024-51,xho,22391,22279,0.0008\nCC-MAIN-2024-51,yid,40798,40705,0.0015\nCC-MAIN-2024-51,yor,22401,22343,0.0009\nCC-MAIN-2024-51,zha,2348,2339,0.0001\nCC-MAIN-2024-51,zho,138935062,138467460,5.2720\nCC-MAIN-2024-51,zul,34122,34023,0.0013\nCC-MAIN-2025-05,<unknown>,81689418,81689418,2.6949\nCC-MAIN-2025-05,aar,2430,2418,0.0001\nCC-MAIN-2025-05,abk,16521,16456,0.0005\nCC-MAIN-2025-05,afr,263072,262399,0.0087\nCC-MAIN-2025-05,aka,4414,4362,0.0001\nCC-MAIN-2025-05,amh,84766,84494,0.0028\nCC-MAIN-2025-05,ara,20128173,20025763,0.6640\nCC-MAIN-2025-05,asm,75614,75461,0.0025\nCC-MAIN-2025-05,aym,1608,1602,0.0001\nCC-MAIN-2025-05,aze,1734307,1727702,0.0572\nCC-MAIN-2025-05,bak,77804,77783,0.0026\nCC-MAIN-2025-05,bel,433342,431735,0.0143\nCC-MAIN-2025-05,ben,3300634,3292407,0.1089\nCC-MAIN-2025-05,bih,16591,16565,0.0005\nCC-MAIN-2025-05,bis,3233,3228,0.0001\nCC-MAIN-2025-05,bod,40941,40919,0.0014\nCC-MAIN-2025-05,bos,1575665,1571389,0.0520\nCC-MAIN-2025-05,bre,54833,54783,0.0018\nCC-MAIN-2025-05,bul,9048470,9018684,0.2985\nCC-MAIN-2025-05,cat,5686590,5650439,0.1876\nCC-MAIN-2025-05,ceb,46597,46555,0.0015\nCC-MAIN-2025-05,ces,30996269,30757320,1.0225\nCC-MAIN-2025-05,chr,1030,1030,0.0000\nCC-MAIN-2025-05,cos,57756,57650,0.0019\nCC-MAIN-2025-05,crs,2485,2474,0.0001\nCC-MAIN-2025-05,cym,331255,330364,0.0109\nCC-MAIN-2025-05,dan,14702983,14597627,0.4850\nCC-MAIN-2025-05,deu,169319555,168287738,5.5857\nCC-MAIN-2025-05,div,67481,67446,0.0022\nCC-MAIN-2025-05,dzo,5874,5873,0.0002\nCC-MAIN-2025-05,ell,17399682,17344350,0.5740\nCC-MAIN-2025-05,eng,1314648153,1306609042,43.3694\nCC-MAIN-2025-05,epo,224109,223675,0.0074\nCC-MAIN-2025-05,est,4077291,4055797,0.1345\nCC-MAIN-2
025-05,eus,1050759,1045440,0.0347\nCC-MAIN-2025-05,fao,134944,134455,0.0045\nCC-MAIN-2025-05,fas,21976765,21905513,0.7250\nCC-MAIN-2025-05,fij,2922,2922,0.0001\nCC-MAIN-2025-05,fin,11148252,11084255,0.3678\nCC-MAIN-2025-05,fra,137076159,136300509,4.5221\nCC-MAIN-2025-05,fry,60979,60820,0.0020\nCC-MAIN-2025-05,gla,40645,40596,0.0013\nCC-MAIN-2025-05,gle,201170,200118,0.0066\nCC-MAIN-2025-05,glg,968585,962432,0.0320\nCC-MAIN-2025-05,glv,15241,15230,0.0005\nCC-MAIN-2025-05,got,685,685,0.0000\nCC-MAIN-2025-05,grn,21264,21214,0.0007\nCC-MAIN-2025-05,guj,363963,363084,0.0120\nCC-MAIN-2025-05,hat,54663,54573,0.0018\nCC-MAIN-2025-05,hau,80117,79813,0.0026\nCC-MAIN-2025-05,haw,18225,18189,0.0006\nCC-MAIN-2025-05,heb,8188855,8157031,0.2701\nCC-MAIN-2025-05,hin,5914757,5898206,0.1951\nCC-MAIN-2025-05,hmn,15118,15044,0.0005\nCC-MAIN-2025-05,hrv,6783374,6757668,0.2238\nCC-MAIN-2025-05,hun,15225085,15166267,0.5023\nCC-MAIN-2025-05,hye,964957,961926,0.0318\nCC-MAIN-2025-05,ibo,19667,19593,0.0006\nCC-MAIN-2025-05,iku,6244,6232,0.0002\nCC-MAIN-2025-05,ile,11205,11155,0.0004\nCC-MAIN-2025-05,ina,16676,16654,0.0006\nCC-MAIN-2025-05,ind,35391827,35152086,1.1676\nCC-MAIN-2025-05,ipk,2007,2005,0.0001\nCC-MAIN-2025-05,isl,1281851,1277222,0.0423\nCC-MAIN-2025-05,ita,73212403,72870606,2.4152\nCC-MAIN-2025-05,jav,65493,65396,0.0022\nCC-MAIN-2025-05,jpn,163827865,163328416,5.4046\nCC-MAIN-2025-05,kal,24438,24301,0.0008\nCC-MAIN-2025-05,kan,380218,379102,0.0125\nCC-MAIN-2025-05,kas,28,28,0.0000\nCC-MAIN-2025-05,kat,1199117,1195929,0.0396\nCC-MAIN-2025-05,kaz,823094,819401,0.0272\nCC-MAIN-2025-05,kha,10796,10790,0.0004\nCC-MAIN-2025-05,khm,315877,314772,0.0104\nCC-MAIN-2025-05,kin,58557,58393,0.0019\nCC-MAIN-2025-05,kir,293976,293432,0.0097\nCC-MAIN-2025-05,kor,21773756,21699098,0.7183\nCC-MAIN-2025-05,kur,190527,190235,0.0063\nCC-MAIN-2025-05,lao,98990,98591,0.0033\nCC-MAIN-2025-05,lat,3620984,3613974,0.1195\nCC-MAIN-2025-05,lav,2690532,2670493,0.0888\nCC-MAIN-2025-05,lif,86,86,0.0000\nCC-MAIN
-2025-05,lin,7821,7794,0.0003\nCC-MAIN-2025-05,lit,5028510,5002779,0.1659\nCC-MAIN-2025-05,ltz,113812,113548,0.0038\nCC-MAIN-2025-05,lug,4772,4706,0.0002\nCC-MAIN-2025-05,mal,692259,690180,0.0228\nCC-MAIN-2025-05,mar,780788,778797,0.0258\nCC-MAIN-2025-05,mfe,2637,2629,0.0001\nCC-MAIN-2025-05,mkd,1095041,1091650,0.0361\nCC-MAIN-2025-05,mlg,85879,85740,0.0028\nCC-MAIN-2025-05,mlt,91219,88784,0.0030\nCC-MAIN-2025-05,mon,441761,440715,0.0146\nCC-MAIN-2025-05,mri,40204,39939,0.0013\nCC-MAIN-2025-05,msa,2366685,2359136,0.0781\nCC-MAIN-2025-05,mya,391556,390762,0.0129\nCC-MAIN-2025-05,nau,1170,1168,0.0000\nCC-MAIN-2025-05,nep,1572438,1568634,0.0519\nCC-MAIN-2025-05,nld,58100470,57760927,1.9167\nCC-MAIN-2025-05,nno,491063,476815,0.0162\nCC-MAIN-2025-05,nor,9524428,9462053,0.3142\nCC-MAIN-2025-05,nso,3394,3394,0.0001\nCC-MAIN-2025-05,nya,15104,15074,0.0005\nCC-MAIN-2025-05,oci,101867,101706,0.0034\nCC-MAIN-2025-05,ori,170948,170681,0.0056\nCC-MAIN-2025-05,orm,18922,18868,0.0006\nCC-MAIN-2025-05,pan,209791,209094,0.0069\nCC-MAIN-2025-05,pol,55314934,55077135,1.8248\nCC-MAIN-2025-05,por,70504093,70215800,2.3259\nCC-MAIN-2025-05,pus,90536,90392,0.0030\nCC-MAIN-2025-05,que,17390,17383,0.0006\nCC-MAIN-2025-05,roh,29361,28696,0.0010\nCC-MAIN-2025-05,ron,18761426,18695225,0.6189\nCC-MAIN-2025-05,run,1515,1514,0.0000\nCC-MAIN-2025-05,rus,183270308,182494228,6.0460\nCC-MAIN-2025-05,sag,17467,17466,0.0006\nCC-MAIN-2025-05,san,90371,90171,0.0030\nCC-MAIN-2025-05,sco,16592,16533,0.0005\nCC-MAIN-2025-05,sin,297173,296625,0.0098\nCC-MAIN-2025-05,slk,10965623,10914391,0.3617\nCC-MAIN-2025-05,slv,4557879,4533626,0.1504\nCC-MAIN-2025-05,smo,18583,18537,0.0006\nCC-MAIN-2025-05,sna,19812,19766,0.0007\nCC-MAIN-2025-05,snd,42434,42383,0.0014\nCC-MAIN-2025-05,som,140859,140385,0.0046\nCC-MAIN-2025-05,sot,17548,17346,0.0006\nCC-MAIN-2025-05,spa,140703803,140014398,4.6417\nCC-MAIN-2025-05,sqi,1370411,1366461,0.0452\nCC-MAIN-2025-05,srp,6588494,6563577,0.2174\nCC-MAIN-2025-05,ssw,857,855,0.0000\nCC-
MAIN-2025-05,sun,29273,29236,0.0010\nCC-MAIN-2025-05,sux,284,284,0.0000\nCC-MAIN-2025-05,swa,257158,256585,0.0085\nCC-MAIN-2025-05,swe,19846451,19732258,0.6547\nCC-MAIN-2025-05,syr,8686,8670,0.0003\nCC-MAIN-2025-05,tam,1278483,1276014,0.0422\nCC-MAIN-2025-05,tat,209100,208887,0.0069\nCC-MAIN-2025-05,tel,545415,544198,0.0180\nCC-MAIN-2025-05,tgk,191261,190928,0.0063\nCC-MAIN-2025-05,tgl,237950,237190,0.0078\nCC-MAIN-2025-05,tha,13804516,13743607,0.4554\nCC-MAIN-2025-05,tir,24771,24664,0.0008\nCC-MAIN-2025-05,ton,2380,2353,0.0001\nCC-MAIN-2025-05,tsn,4181,4172,0.0001\nCC-MAIN-2025-05,tso,2063,2055,0.0001\nCC-MAIN-2025-05,tuk,52763,52637,0.0017\nCC-MAIN-2025-05,tur,35617851,35445329,1.1750\nCC-MAIN-2025-05,uig,31565,31516,0.0010\nCC-MAIN-2025-05,ukr,18326621,17960740,0.6046\nCC-MAIN-2025-05,urd,836857,832985,0.0276\nCC-MAIN-2025-05,uzb,603839,601582,0.0199\nCC-MAIN-2025-05,ven,2588,2584,0.0001\nCC-MAIN-2025-05,vie,31606195,31388970,1.0427\nCC-MAIN-2025-05,vol,16340,16329,0.0005\nCC-MAIN-2025-05,war,56575,56489,0.0019\nCC-MAIN-2025-05,wol,4327,4320,0.0001\nCC-MAIN-2025-05,xho,23081,22985,0.0008\nCC-MAIN-2025-05,yid,42471,42358,0.0014\nCC-MAIN-2025-05,yor,26050,25995,0.0009\nCC-MAIN-2025-05,zha,2106,2101,0.0001\nCC-MAIN-2025-05,zho,141618109,141129917,4.6719\nCC-MAIN-2025-05,zul,36375,36298,0.0012\nCC-MAIN-2025-08,<unknown>,80991840,80991840,3.0224\nCC-MAIN-2025-08,aar,1971,1960,0.0001\nCC-MAIN-2025-08,abk,15197,15135,0.0006\nCC-MAIN-2025-08,afr,265118,264312,0.0099\nCC-MAIN-2025-08,aka,5071,5016,0.0002\nCC-MAIN-2025-08,amh,83548,83068,0.0031\nCC-MAIN-2025-08,ara,18371175,18284068,0.6856\nCC-MAIN-2025-08,asm,67933,67675,0.0025\nCC-MAIN-2025-08,aym,1270,1268,0.0000\nCC-MAIN-2025-08,aze,1687667,1681961,0.0630\nCC-MAIN-2025-08,bak,76667,76642,0.0029\nCC-MAIN-2025-08,bel,399487,398621,0.0149\nCC-MAIN-2025-08,ben,3072881,3066043,0.1147\nCC-MAIN-2025-08,bih,13082,13063,0.0005\nCC-MAIN-2025-08,bis,2230,2225,0.0001\nCC-MAIN-2025-08,bod,39131,39094,0.0015\nCC-MAIN-2025-08,bos,152
8834,1521061,0.0571\nCC-MAIN-2025-08,bre,76845,76775,0.0029\nCC-MAIN-2025-08,bul,8315639,8287437,0.3103\nCC-MAIN-2025-08,cat,4955519,4922177,0.1849\nCC-MAIN-2025-08,ceb,45450,45398,0.0017\nCC-MAIN-2025-08,ces,27019974,26805739,1.0083\nCC-MAIN-2025-08,chr,774,774,0.0000\nCC-MAIN-2025-08,cos,48059,47959,0.0018\nCC-MAIN-2025-08,crs,2610,2598,0.0001\nCC-MAIN-2025-08,cym,286764,285405,0.0107\nCC-MAIN-2025-08,dan,12516299,12422836,0.4671\nCC-MAIN-2025-08,deu,144808766,143916907,5.4039\nCC-MAIN-2025-08,div,67612,67553,0.0025\nCC-MAIN-2025-08,dzo,5283,5279,0.0002\nCC-MAIN-2025-08,ell,15630926,15578551,0.5833\nCC-MAIN-2025-08,eng,1162441440,1155327662,43.3794\nCC-MAIN-2025-08,epo,197337,196744,0.0074\nCC-MAIN-2025-08,est,3499433,3478273,0.1306\nCC-MAIN-2025-08,eus,926037,920860,0.0346\nCC-MAIN-2025-08,fao,115167,114474,0.0043\nCC-MAIN-2025-08,fas,19491131,19425795,0.7274\nCC-MAIN-2025-08,fij,2553,2549,0.0001\nCC-MAIN-2025-08,fin,9546662,9484609,0.3563\nCC-MAIN-2025-08,fra,115094238,114409960,4.2950\nCC-MAIN-2025-08,fry,72058,71929,0.0027\nCC-MAIN-2025-08,gla,35261,35196,0.0013\nCC-MAIN-2025-08,gle,197253,196378,0.0074\nCC-MAIN-2025-08,glg,797173,790973,0.0297\nCC-MAIN-2025-08,glv,9572,9556,0.0004\nCC-MAIN-2025-08,got,496,496,0.0000\nCC-MAIN-2025-08,grn,19034,18990,0.0007\nCC-MAIN-2025-08,guj,332419,331797,0.0124\nCC-MAIN-2025-08,hat,52975,52886,0.0020\nCC-MAIN-2025-08,hau,72963,72583,0.0027\nCC-MAIN-2025-08,haw,17413,17371,0.0006\nCC-MAIN-2025-08,heb,6869349,6838871,0.2563\nCC-MAIN-2025-08,hin,5467538,5450600,0.2040\nCC-MAIN-2025-08,hmn,15204,15062,0.0006\nCC-MAIN-2025-08,hrv,6051707,6027854,0.2258\nCC-MAIN-2025-08,hun,13456047,13402234,0.5021\nCC-MAIN-2025-08,hye,875408,872156,0.0327\nCC-MAIN-2025-08,ibo,16824,16759,0.0006\nCC-MAIN-2025-08,iku,6063,6052,0.0002\nCC-MAIN-2025-08,ile,8635,8590,0.0003\nCC-MAIN-2025-08,ina,13039,13012,0.0005\nCC-MAIN-2025-08,ind,31740773,31516068,1.1845\nCC-MAIN-2025-08,ipk,1987,1984,0.0001\nCC-MAIN-2025-08,isl,1043021,1038726,0.0389\nCC-MAIN-20
25-08,ita,64305725,64008818,2.3997\nCC-MAIN-2025-08,jav,62319,62245,0.0023\nCC-MAIN-2025-08,jpn,138381900,137949264,5.1641\nCC-MAIN-2025-08,kal,21702,21577,0.0008\nCC-MAIN-2025-08,kan,361295,360482,0.0135\nCC-MAIN-2025-08,kas,24,24,0.0000\nCC-MAIN-2025-08,kat,1111095,1108242,0.0415\nCC-MAIN-2025-08,kaz,799032,797005,0.0298\nCC-MAIN-2025-08,kha,9799,9792,0.0004\nCC-MAIN-2025-08,khm,292207,291220,0.0109\nCC-MAIN-2025-08,kin,56223,56085,0.0021\nCC-MAIN-2025-08,kir,243466,242954,0.0091\nCC-MAIN-2025-08,kor,21646756,21570518,0.8078\nCC-MAIN-2025-08,kur,183382,182957,0.0068\nCC-MAIN-2025-08,lao,106528,106074,0.0040\nCC-MAIN-2025-08,lat,2840667,2829323,0.1060\nCC-MAIN-2025-08,lav,2353363,2337930,0.0878\nCC-MAIN-2025-08,lif,55,55,0.0000\nCC-MAIN-2025-08,lin,6909,6895,0.0003\nCC-MAIN-2025-08,lit,4358780,4335633,0.1627\nCC-MAIN-2025-08,ltz,101129,100816,0.0038\nCC-MAIN-2025-08,lug,4843,4779,0.0002\nCC-MAIN-2025-08,mal,672616,670860,0.0251\nCC-MAIN-2025-08,mar,744100,742139,0.0278\nCC-MAIN-2025-08,mfe,3009,2997,0.0001\nCC-MAIN-2025-08,mkd,1017554,1014585,0.0380\nCC-MAIN-2025-08,mlg,92935,92547,0.0035\nCC-MAIN-2025-08,mlt,86171,84765,0.0032\nCC-MAIN-2025-08,mon,434114,433104,0.0162\nCC-MAIN-2025-08,mri,34919,34800,0.0013\nCC-MAIN-2025-08,msa,2102918,2095466,0.0785\nCC-MAIN-2025-08,mya,366841,365965,0.0137\nCC-MAIN-2025-08,nau,1097,1094,0.0000\nCC-MAIN-2025-08,nep,1480299,1476124,0.0552\nCC-MAIN-2025-08,nld,48076024,47778492,1.7941\nCC-MAIN-2025-08,nno,446863,445064,0.0167\nCC-MAIN-2025-08,nor,8150934,8098969,0.3042\nCC-MAIN-2025-08,nso,2614,2611,0.0001\nCC-MAIN-2025-08,nya,13670,13634,0.0005\nCC-MAIN-2025-08,oci,87892,87656,0.0033\nCC-MAIN-2025-08,ori,161575,161249,0.0060\nCC-MAIN-2025-08,orm,13290,13255,0.0005\nCC-MAIN-2025-08,pan,186572,186096,0.0070\nCC-MAIN-2025-08,pol,46815742,46613120,1.7470\nCC-MAIN-2025-08,por,62368181,62104996,2.3274\nCC-MAIN-2025-08,pus,82633,82503,0.0031\nCC-MAIN-2025-08,que,14235,14229,0.0005\nCC-MAIN-2025-08,roh,26550,26434,0.0010\nCC-MAIN-2025-08,
ron,16892255,16828189,0.6304\nCC-MAIN-2025-08,run,1689,1687,0.0001\nCC-MAIN-2025-08,rus,163413027,162694966,6.0982\nCC-MAIN-2025-08,sag,3219,3217,0.0001\nCC-MAIN-2025-08,san,87077,86887,0.0032\nCC-MAIN-2025-08,sco,15202,15143,0.0006\nCC-MAIN-2025-08,sin,252631,252115,0.0094\nCC-MAIN-2025-08,slk,9561089,9517274,0.3568\nCC-MAIN-2025-08,slv,4043928,4022032,0.1509\nCC-MAIN-2025-08,smo,16997,16946,0.0006\nCC-MAIN-2025-08,sna,16948,16838,0.0006\nCC-MAIN-2025-08,snd,41752,41670,0.0016\nCC-MAIN-2025-08,som,138936,138563,0.0052\nCC-MAIN-2025-08,sot,14964,14844,0.0006\nCC-MAIN-2025-08,spa,121822815,121216333,4.5461\nCC-MAIN-2025-08,sqi,1305076,1299344,0.0487\nCC-MAIN-2025-08,srp,5768040,5748186,0.2152\nCC-MAIN-2025-08,ssw,881,876,0.0000\nCC-MAIN-2025-08,sun,26631,26581,0.0010\nCC-MAIN-2025-08,sux,289,285,0.0000\nCC-MAIN-2025-08,swa,222870,222378,0.0083\nCC-MAIN-2025-08,swe,17189696,17087247,0.6415\nCC-MAIN-2025-08,syr,9602,9576,0.0004\nCC-MAIN-2025-08,tam,1223551,1220848,0.0457\nCC-MAIN-2025-08,tat,217345,217138,0.0081\nCC-MAIN-2025-08,tel,530267,529025,0.0198\nCC-MAIN-2025-08,tgk,174198,173839,0.0065\nCC-MAIN-2025-08,tgl,222563,221638,0.0083\nCC-MAIN-2025-08,tha,13497351,13438886,0.5037\nCC-MAIN-2025-08,tir,19312,19159,0.0007\nCC-MAIN-2025-08,ton,2281,2273,0.0001\nCC-MAIN-2025-08,tsn,2945,2939,0.0001\nCC-MAIN-2025-08,tso,1774,1770,0.0001\nCC-MAIN-2025-08,tuk,53314,53215,0.0020\nCC-MAIN-2025-08,tur,30578827,30442115,1.1411\nCC-MAIN-2025-08,uig,32224,32171,0.0012\nCC-MAIN-2025-08,ukr,16280144,15940551,0.6075\nCC-MAIN-2025-08,urd,811181,807013,0.0303\nCC-MAIN-2025-08,uzb,605894,603669,0.0226\nCC-MAIN-2025-08,ven,894,893,0.0000\nCC-MAIN-2025-08,vie,28273761,28091125,1.0551\nCC-MAIN-2025-08,vol,12431,12419,0.0005\nCC-MAIN-2025-08,war,61339,61268,0.0023\nCC-MAIN-2025-08,wol,3208,3204,0.0001\nCC-MAIN-2025-08,xho,20538,20465,0.0008\nCC-MAIN-2025-08,yid,44392,44300,0.0017\nCC-MAIN-2025-08,yor,21006,20956,0.0008\nCC-MAIN-2025-08,zha,4175,4169,0.0002\nCC-MAIN-2025-08,zho,136510537,1361
77689,5.0942\nCC-MAIN-2025-08,zul,34611,34494,0.0013\nCC-MAIN-2025-13,<unknown>,82300022,82300022,3.0027\nCC-MAIN-2025-13,aar,1948,1939,0.0001\nCC-MAIN-2025-13,abk,14155,14095,0.0005\nCC-MAIN-2025-13,afr,261293,260675,0.0095\nCC-MAIN-2025-13,aka,3627,3599,0.0001\nCC-MAIN-2025-13,amh,91459,91082,0.0033\nCC-MAIN-2025-13,ara,18739027,18651235,0.6837\nCC-MAIN-2025-13,asm,64051,63847,0.0023\nCC-MAIN-2025-13,aym,2253,2225,0.0001\nCC-MAIN-2025-13,aze,1677722,1671883,0.0612\nCC-MAIN-2025-13,bak,86601,86597,0.0032\nCC-MAIN-2025-13,bel,451710,450683,0.0165\nCC-MAIN-2025-13,ben,3033293,3024843,0.1107\nCC-MAIN-2025-13,bih,12613,12589,0.0005\nCC-MAIN-2025-13,bis,2151,2140,0.0001\nCC-MAIN-2025-13,bod,40120,40079,0.0015\nCC-MAIN-2025-13,bos,1473804,1463441,0.0538\nCC-MAIN-2025-13,bre,63653,63589,0.0023\nCC-MAIN-2025-13,bul,8296521,8264464,0.3027\nCC-MAIN-2025-13,cat,4841957,4811793,0.1767\nCC-MAIN-2025-13,ceb,49888,49828,0.0018\nCC-MAIN-2025-13,ces,28451138,28227478,1.0380\nCC-MAIN-2025-13,chr,806,805,0.0000\nCC-MAIN-2025-13,cos,56699,56575,0.0021\nCC-MAIN-2025-13,crs,2289,2279,0.0001\nCC-MAIN-2025-13,cym,327827,326478,0.0120\nCC-MAIN-2025-13,dan,12689895,12595398,0.4630\nCC-MAIN-2025-13,deu,140204402,139358953,5.1154\nCC-MAIN-2025-13,div,64431,64377,0.0024\nCC-MAIN-2025-13,dzo,4930,4926,0.0002\nCC-MAIN-2025-13,ell,16175423,16119062,0.5902\nCC-MAIN-2025-13,eng,1204156851,1196822790,43.9338\nCC-MAIN-2025-13,epo,231867,231196,0.0085\nCC-MAIN-2025-13,est,3585717,3562472,0.1308\nCC-MAIN-2025-13,eus,899444,895008,0.0328\nCC-MAIN-2025-13,fao,120230,119653,0.0044\nCC-MAIN-2025-13,fas,20144139,20064242,0.7350\nCC-MAIN-2025-13,fij,2678,2676,0.0001\nCC-MAIN-2025-13,fin,9909858,9844110,0.3616\nCC-MAIN-2025-13,fra,115851868,115153732,4.2269\nCC-MAIN-2025-13,fry,60306,60218,0.0022\nCC-MAIN-2025-13,gla,35342,35288,0.0013\nCC-MAIN-2025-13,gle,201525,200683,0.0074\nCC-MAIN-2025-13,glg,835627,830529,0.0305\nCC-MAIN-2025-13,glv,25967,25933,0.0009\nCC-MAIN-2025-13,got,446,446,0.0000\nCC-MAIN-2025-13
,grn,18029,17991,0.0007\nCC-MAIN-2025-13,guj,342820,341785,0.0125\nCC-MAIN-2025-13,hat,51210,51090,0.0019\nCC-MAIN-2025-13,hau,86698,86434,0.0032\nCC-MAIN-2025-13,haw,15594,15550,0.0006\nCC-MAIN-2025-13,heb,7047083,7016592,0.2571\nCC-MAIN-2025-13,hin,5555621,5538797,0.2027\nCC-MAIN-2025-13,hmn,17127,16949,0.0006\nCC-MAIN-2025-13,hrv,6289022,6263051,0.2295\nCC-MAIN-2025-13,hun,13678095,13624335,0.4990\nCC-MAIN-2025-13,hye,899571,894876,0.0328\nCC-MAIN-2025-13,ibo,17611,17571,0.0006\nCC-MAIN-2025-13,iku,5973,5932,0.0002\nCC-MAIN-2025-13,ile,9202,9183,0.0003\nCC-MAIN-2025-13,ina,13321,13246,0.0005\nCC-MAIN-2025-13,ind,32914493,32695963,1.2009\nCC-MAIN-2025-13,ipk,1749,1747,0.0001\nCC-MAIN-2025-13,isl,1064775,1060814,0.0388\nCC-MAIN-2025-13,ita,66277391,65948986,2.4181\nCC-MAIN-2025-13,jav,62364,62283,0.0023\nCC-MAIN-2025-13,jpn,133271896,132828948,4.8624\nCC-MAIN-2025-13,kal,21598,21450,0.0008\nCC-MAIN-2025-13,kan,378900,378159,0.0138\nCC-MAIN-2025-13,kas,10,10,0.0000\nCC-MAIN-2025-13,kat,1215618,1211500,0.0444\nCC-MAIN-2025-13,kaz,870518,867499,0.0318\nCC-MAIN-2025-13,kha,8963,8948,0.0003\nCC-MAIN-2025-13,khm,290330,289035,0.0106\nCC-MAIN-2025-13,kin,62839,62690,0.0023\nCC-MAIN-2025-13,kir,304398,303877,0.0111\nCC-MAIN-2025-13,kor,22002797,21925284,0.8028\nCC-MAIN-2025-13,kur,188065,187674,0.0069\nCC-MAIN-2025-13,lao,106372,105793,0.0039\nCC-MAIN-2025-13,lat,2906860,2902210,0.1061\nCC-MAIN-2025-13,lav,2340300,2322976,0.0854\nCC-MAIN-2025-13,lif,84,84,0.0000\nCC-MAIN-2025-13,lin,6943,6935,0.0003\nCC-MAIN-2025-13,lit,4548331,4522396,0.1659\nCC-MAIN-2025-13,ltz,112657,112274,0.0041\nCC-MAIN-2025-13,lug,4085,4049,0.0001\nCC-MAIN-2025-13,mal,693416,692062,0.0253\nCC-MAIN-2025-13,mar,794274,791915,0.0290\nCC-MAIN-2025-13,mfe,3266,3258,0.0001\nCC-MAIN-2025-13,mkd,1061290,1057350,0.0387\nCC-MAIN-2025-13,mlg,111908,111008,0.0041\nCC-MAIN-2025-13,mlt,87948,85765,0.0032\nCC-MAIN-2025-13,mon,418968,417680,0.0153\nCC-MAIN-2025-13,mri,34497,34223,0.0013\nCC-MAIN-2025-13,msa,2122021
,2114418,0.0774\nCC-MAIN-2025-13,mya,406971,405605,0.0148\nCC-MAIN-2025-13,nau,1055,1055,0.0000\nCC-MAIN-2025-13,nep,1516502,1512451,0.0553\nCC-MAIN-2025-13,nld,49285101,48973935,1.7982\nCC-MAIN-2025-13,nno,369745,368218,0.0135\nCC-MAIN-2025-13,nor,8548787,8500796,0.3119\nCC-MAIN-2025-13,nso,1887,1885,0.0001\nCC-MAIN-2025-13,nya,13617,13535,0.0005\nCC-MAIN-2025-13,oci,102166,101995,0.0037\nCC-MAIN-2025-13,ori,167708,167418,0.0061\nCC-MAIN-2025-13,orm,20394,20376,0.0007\nCC-MAIN-2025-13,pan,185091,184429,0.0068\nCC-MAIN-2025-13,pol,46382644,46163942,1.6923\nCC-MAIN-2025-13,por,64900965,64620240,2.3679\nCC-MAIN-2025-13,pus,113252,112989,0.0041\nCC-MAIN-2025-13,que,14633,14625,0.0005\nCC-MAIN-2025-13,roh,28099,27961,0.0010\nCC-MAIN-2025-13,ron,17875496,17797740,0.6522\nCC-MAIN-2025-13,run,1918,1918,0.0001\nCC-MAIN-2025-13,rus,162515317,161712840,5.9294\nCC-MAIN-2025-13,sag,20473,20473,0.0007\nCC-MAIN-2025-13,san,87238,87027,0.0032\nCC-MAIN-2025-13,sco,16470,16370,0.0006\nCC-MAIN-2025-13,sin,253454,252927,0.0092\nCC-MAIN-2025-13,slk,10096106,10050368,0.3684\nCC-MAIN-2025-13,slv,4253209,4229357,0.1552\nCC-MAIN-2025-13,smo,17508,17406,0.0006\nCC-MAIN-2025-13,sna,18814,18756,0.0007\nCC-MAIN-2025-13,snd,42762,42547,0.0016\nCC-MAIN-2025-13,som,132910,132634,0.0048\nCC-MAIN-2025-13,sot,14495,14398,0.0005\nCC-MAIN-2025-13,spa,121764776,121151506,4.4426\nCC-MAIN-2025-13,sqi,1349756,1346104,0.0492\nCC-MAIN-2025-13,srp,5910940,5890328,0.2157\nCC-MAIN-2025-13,ssw,825,821,0.0000\nCC-MAIN-2025-13,sun,32604,32490,0.0012\nCC-MAIN-2025-13,sux,266,266,0.0000\nCC-MAIN-2025-13,swa,260579,260144,0.0095\nCC-MAIN-2025-13,swe,18146052,18034925,0.6621\nCC-MAIN-2025-13,syr,9605,9598,0.0004\nCC-MAIN-2025-13,tam,1197822,1195183,0.0437\nCC-MAIN-2025-13,tat,224677,224406,0.0082\nCC-MAIN-2025-13,tel,533488,531650,0.0195\nCC-MAIN-2025-13,tgk,188257,187837,0.0069\nCC-MAIN-2025-13,tgl,238900,237833,0.0087\nCC-MAIN-2025-13,tha,12423595,12363526,0.4533\nCC-MAIN-2025-13,tir,18829,18742,0.0007\nCC-MAIN-202
5-13,ton,2541,2535,0.0001\nCC-MAIN-2025-13,tsn,3854,3849,0.0001\nCC-MAIN-2025-13,tso,1686,1672,0.0001\nCC-MAIN-2025-13,tuk,61581,61447,0.0022\nCC-MAIN-2025-13,tur,31258207,31117563,1.1405\nCC-MAIN-2025-13,uig,34173,34062,0.0012\nCC-MAIN-2025-13,ukr,17102386,16685530,0.6240\nCC-MAIN-2025-13,urd,822344,818268,0.0300\nCC-MAIN-2025-13,uzb,625942,623245,0.0228\nCC-MAIN-2025-13,ven,698,697,0.0000\nCC-MAIN-2025-13,vie,28774150,28556755,1.0498\nCC-MAIN-2025-13,vol,14334,14312,0.0005\nCC-MAIN-2025-13,war,57235,57138,0.0021\nCC-MAIN-2025-13,wol,3754,3748,0.0001\nCC-MAIN-2025-13,xho,19732,19611,0.0007\nCC-MAIN-2025-13,yid,39811,39752,0.0015\nCC-MAIN-2025-13,yor,22000,21965,0.0008\nCC-MAIN-2025-13,zha,2588,2582,0.0001\nCC-MAIN-2025-13,zho,148376315,148049423,5.4135\nCC-MAIN-2025-13,zul,30624,30418,0.0011\nCC-MAIN-2025-18,<unknown>,81917923,81917923,2.9817\nCC-MAIN-2025-18,aar,2433,2414,0.0001\nCC-MAIN-2025-18,abk,13549,13489,0.0005\nCC-MAIN-2025-18,afr,274445,273633,0.0100\nCC-MAIN-2025-18,aka,2965,2964,0.0001\nCC-MAIN-2025-18,amh,85872,85420,0.0031\nCC-MAIN-2025-18,ara,18466909,18370024,0.6722\nCC-MAIN-2025-18,asm,67462,67379,0.0025\nCC-MAIN-2025-18,aym,3524,3475,0.0001\nCC-MAIN-2025-18,aze,1652960,1647697,0.0602\nCC-MAIN-2025-18,bak,51515,51506,0.0019\nCC-MAIN-2025-18,bel,406446,405564,0.0148\nCC-MAIN-2025-18,ben,2922132,2914599,0.1064\nCC-MAIN-2025-18,bih,16244,16197,0.0006\nCC-MAIN-2025-18,bis,2303,2294,0.0001\nCC-MAIN-2025-18,bod,36909,36876,0.0013\nCC-MAIN-2025-18,bos,1535568,1524587,0.0559\nCC-MAIN-2025-18,bre,74704,74581,0.0027\nCC-MAIN-2025-18,bul,8142245,8109405,0.2964\nCC-MAIN-2025-18,cat,5200013,5168685,0.1893\nCC-MAIN-2025-18,ceb,50895,50808,0.0019\nCC-MAIN-2025-18,ces,28790470,28583698,1.0479\nCC-MAIN-2025-18,chr,783,783,0.0000\nCC-MAIN-2025-18,cos,52972,52820,0.0019\nCC-MAIN-2025-18,crs,2282,2273,0.0001\nCC-MAIN-2025-18,cym,312490,310694,0.0114\nCC-MAIN-2025-18,dan,13165631,13069307,0.4792\nCC-MAIN-2025-18,deu,153000641,152010369,5.5691\nCC-MAIN-2025-18,div,69694
,69648,0.0025\nCC-MAIN-2025-18,dzo,5266,5263,0.0002\nCC-MAIN-2025-18,ell,15524989,15470617,0.5651\nCC-MAIN-2025-18,eng,1207452488,1199710507,43.9499\nCC-MAIN-2025-18,epo,201609,201014,0.0073\nCC-MAIN-2025-18,est,3637280,3619046,0.1324\nCC-MAIN-2025-18,eus,920989,916423,0.0335\nCC-MAIN-2025-18,fao,123213,122644,0.0045\nCC-MAIN-2025-18,fas,19470020,19396877,0.7087\nCC-MAIN-2025-18,fij,2520,2518,0.0001\nCC-MAIN-2025-18,fin,10025118,9960036,0.3649\nCC-MAIN-2025-18,fra,118879662,118142069,4.3271\nCC-MAIN-2025-18,fry,70895,70654,0.0026\nCC-MAIN-2025-18,gla,34315,34239,0.0012\nCC-MAIN-2025-18,gle,199710,198814,0.0073\nCC-MAIN-2025-18,glg,919115,914568,0.0335\nCC-MAIN-2025-18,glv,9898,9885,0.0004\nCC-MAIN-2025-18,got,529,529,0.0000\nCC-MAIN-2025-18,grn,17689,17637,0.0006\nCC-MAIN-2025-18,guj,305686,304965,0.0111\nCC-MAIN-2025-18,hat,52578,52424,0.0019\nCC-MAIN-2025-18,hau,79775,79464,0.0029\nCC-MAIN-2025-18,haw,17870,17833,0.0007\nCC-MAIN-2025-18,heb,7291661,7254261,0.2654\nCC-MAIN-2025-18,hin,5506347,5488715,0.2004\nCC-MAIN-2025-18,hmn,15333,15155,0.0006\nCC-MAIN-2025-18,hrv,6426815,6400866,0.2339\nCC-MAIN-2025-18,hun,13960932,13902278,0.5082\nCC-MAIN-2025-18,hye,900168,896269,0.0328\nCC-MAIN-2025-18,ibo,19280,19147,0.0007\nCC-MAIN-2025-18,iku,7181,7142,0.0003\nCC-MAIN-2025-18,ile,16310,16217,0.0006\nCC-MAIN-2025-18,ina,13907,13658,0.0005\nCC-MAIN-2025-18,ind,32306367,32098399,1.1759\nCC-MAIN-2025-18,ipk,1877,1872,0.0001\nCC-MAIN-2025-18,isl,1074507,1070229,0.0391\nCC-MAIN-2025-18,ita,66099736,65788639,2.4060\nCC-MAIN-2025-18,jav,59114,58996,0.0022\nCC-MAIN-2025-18,jpn,135037254,134614082,4.9152\nCC-MAIN-2025-18,kal,22484,22347,0.0008\nCC-MAIN-2025-18,kan,356941,355454,0.0130\nCC-MAIN-2025-18,kas,9,9,0.0000\nCC-MAIN-2025-18,kat,1196062,1192516,0.0435\nCC-MAIN-2025-18,kaz,870689,867110,0.0317\nCC-MAIN-2025-18,kha,8809,8700,0.0003\nCC-MAIN-2025-18,khm,280780,279308,0.0102\nCC-MAIN-2025-18,kin,55482,55382,0.0020\nCC-MAIN-2025-18,kir,264190,261280,0.0096\nCC-MAIN-2025-18,kor,2
1607515,21527166,0.7865\nCC-MAIN-2025-18,kur,187244,186749,0.0068\nCC-MAIN-2025-18,lao,96085,95372,0.0035\nCC-MAIN-2025-18,lat,2815790,2811275,0.1025\nCC-MAIN-2025-18,lav,2462211,2439876,0.0896\nCC-MAIN-2025-18,lif,164,164,0.0000\nCC-MAIN-2025-18,lin,6333,6316,0.0002\nCC-MAIN-2025-18,lit,4597028,4568438,0.1673\nCC-MAIN-2025-18,ltz,104611,104261,0.0038\nCC-MAIN-2025-18,lug,4162,4155,0.0002\nCC-MAIN-2025-18,mal,641389,639430,0.0233\nCC-MAIN-2025-18,mar,749498,747553,0.0273\nCC-MAIN-2025-18,mfe,3373,3362,0.0001\nCC-MAIN-2025-18,mkd,1047943,1043881,0.0381\nCC-MAIN-2025-18,mlg,136042,134858,0.0050\nCC-MAIN-2025-18,mlt,84984,83423,0.0031\nCC-MAIN-2025-18,mon,422013,420184,0.0154\nCC-MAIN-2025-18,mri,39704,39485,0.0014\nCC-MAIN-2025-18,msa,2108445,2100736,0.0767\nCC-MAIN-2025-18,mya,361955,360613,0.0132\nCC-MAIN-2025-18,nau,1036,1031,0.0000\nCC-MAIN-2025-18,nep,1435057,1432074,0.0522\nCC-MAIN-2025-18,nld,49680450,49351675,1.8083\nCC-MAIN-2025-18,nno,394013,392043,0.0143\nCC-MAIN-2025-18,nor,8613103,8561554,0.3135\nCC-MAIN-2025-18,nso,2074,2073,0.0001\nCC-MAIN-2025-18,nya,12349,12256,0.0004\nCC-MAIN-2025-18,oci,89462,89310,0.0033\nCC-MAIN-2025-18,ori,158016,157876,0.0058\nCC-MAIN-2025-18,orm,12024,11985,0.0004\nCC-MAIN-2025-18,pan,187939,187656,0.0068\nCC-MAIN-2025-18,pol,51495096,51234036,1.8744\nCC-MAIN-2025-18,por,64203206,63917214,2.3369\nCC-MAIN-2025-18,pus,108224,108001,0.0039\nCC-MAIN-2025-18,que,14858,14824,0.0005\nCC-MAIN-2025-18,roh,29290,29118,0.0011\nCC-MAIN-2025-18,ron,17511190,17436416,0.6374\nCC-MAIN-2025-18,run,2030,2029,0.0001\nCC-MAIN-2025-18,rus,158285564,157542152,5.7614\nCC-MAIN-2025-18,sag,2251,2250,0.0001\nCC-MAIN-2025-18,san,88706,88199,0.0032\nCC-MAIN-2025-18,sco,17058,16941,0.0006\nCC-MAIN-2025-18,sin,235317,234620,0.0086\nCC-MAIN-2025-18,slk,10182503,10130850,0.3706\nCC-MAIN-2025-18,slv,4408722,4384489,0.1605\nCC-MAIN-2025-18,smo,18117,17979,0.0007\nCC-MAIN-2025-18,sna,18159,18005,0.0007\nCC-MAIN-2025-18,snd,42086,41997,0.0015\nCC-MAIN-2025-18,som
,123917,123562,0.0045\nCC-MAIN-2025-18,sot,14066,13866,0.0005\nCC-MAIN-2025-18,spa,124790463,124133997,4.5422\nCC-MAIN-2025-18,sqi,1334248,1330001,0.0486\nCC-MAIN-2025-18,srp,5861284,5840395,0.2133\nCC-MAIN-2025-18,ssw,778,775,0.0000\nCC-MAIN-2025-18,sun,30382,30186,0.0011\nCC-MAIN-2025-18,sux,262,261,0.0000\nCC-MAIN-2025-18,swa,279362,279018,0.0102\nCC-MAIN-2025-18,swe,18507202,18385286,0.6736\nCC-MAIN-2025-18,syr,8657,8639,0.0003\nCC-MAIN-2025-18,tam,1228242,1224814,0.0447\nCC-MAIN-2025-18,tat,205924,205595,0.0075\nCC-MAIN-2025-18,tel,585158,582127,0.0213\nCC-MAIN-2025-18,tgk,177336,176928,0.0065\nCC-MAIN-2025-18,tgl,230087,229093,0.0084\nCC-MAIN-2025-18,tha,11728246,11665913,0.4269\nCC-MAIN-2025-18,tir,21621,21545,0.0008\nCC-MAIN-2025-18,ton,2748,2743,0.0001\nCC-MAIN-2025-18,tsn,4276,4275,0.0002\nCC-MAIN-2025-18,tso,1324,1319,0.0000\nCC-MAIN-2025-18,tuk,56773,56545,0.0021\nCC-MAIN-2025-18,tur,30972320,30830201,1.1274\nCC-MAIN-2025-18,uig,37926,37727,0.0014\nCC-MAIN-2025-18,ukr,16699737,16365582,0.6079\nCC-MAIN-2025-18,urd,793707,790739,0.0289\nCC-MAIN-2025-18,uzb,595719,592576,0.0217\nCC-MAIN-2025-18,ven,658,657,0.0000\nCC-MAIN-2025-18,vie,28059099,27836254,1.0213\nCC-MAIN-2025-18,vol,13213,13176,0.0005\nCC-MAIN-2025-18,war,55544,55441,0.0020\nCC-MAIN-2025-18,wol,3985,3973,0.0001\nCC-MAIN-2025-18,xho,19689,19501,0.0007\nCC-MAIN-2025-18,yid,37475,37427,0.0014\nCC-MAIN-2025-18,yor,22568,22538,0.0008\nCC-MAIN-2025-18,zha,3308,3300,0.0001\nCC-MAIN-2025-18,zho,134008849,133663921,4.8778\nCC-MAIN-2025-18,zul,30140,30050,0.0011\nCC-MAIN-2025-21,<unknown>,72357739,72357739,2.9210\nCC-MAIN-2025-21,aar,2002,1987,0.0001\nCC-MAIN-2025-21,abk,13029,13013,0.0005\nCC-MAIN-2025-21,afr,246581,246175,0.0100\nCC-MAIN-2025-21,aka,3745,3737,0.0002\nCC-MAIN-2025-21,amh,80484,80205,0.0032\nCC-MAIN-2025-21,ara,17316259,17232658,0.6990\nCC-MAIN-2025-21,asm,65454,65278,0.0026\nCC-MAIN-2025-21,aym,2260,2250,0.0001\nCC-MAIN-2025-21,aze,1586403,1582480,0.0640\nCC-MAIN-2025-21,bak,42097,42090
,0.0017\nCC-MAIN-2025-21,bel,443943,443289,0.0179\nCC-MAIN-2025-21,ben,2895358,2888686,0.1169\nCC-MAIN-2025-21,bih,15310,15222,0.0006\nCC-MAIN-2025-21,bis,2153,2139,0.0001\nCC-MAIN-2025-21,bod,29774,29761,0.0012\nCC-MAIN-2025-21,bos,1416918,1413468,0.0572\nCC-MAIN-2025-21,bre,66112,66053,0.0027\nCC-MAIN-2025-21,bul,6142406,6123810,0.2480\nCC-MAIN-2025-21,cat,4731015,4702217,0.1910\nCC-MAIN-2025-21,ceb,61244,61185,0.0025\nCC-MAIN-2025-21,ces,24557861,24415357,0.9914\nCC-MAIN-2025-21,chr,809,805,0.0000\nCC-MAIN-2025-21,cos,53072,52976,0.0021\nCC-MAIN-2025-21,crs,1721,1714,0.0001\nCC-MAIN-2025-21,cym,299106,297936,0.0121\nCC-MAIN-2025-21,dan,11790699,11713006,0.4760\nCC-MAIN-2025-21,deu,138273839,137418706,5.5819\nCC-MAIN-2025-21,div,57461,57417,0.0023\nCC-MAIN-2025-21,dzo,4303,4303,0.0002\nCC-MAIN-2025-21,ell,14208665,14164830,0.5736\nCC-MAIN-2025-21,eng,1084690386,1078307430,43.7876\nCC-MAIN-2025-21,epo,232547,232209,0.0094\nCC-MAIN-2025-21,est,3333903,3319490,0.1346\nCC-MAIN-2025-21,eus,830339,826129,0.0335\nCC-MAIN-2025-21,fao,114438,113992,0.0046\nCC-MAIN-2025-21,fas,18618206,18562028,0.7516\nCC-MAIN-2025-21,fij,2546,2544,0.0001\nCC-MAIN-2025-21,fin,9036527,8985910,0.3648\nCC-MAIN-2025-21,fra,105371066,104753558,4.2537\nCC-MAIN-2025-21,fry,55941,55808,0.0023\nCC-MAIN-2025-21,gla,36646,36600,0.0015\nCC-MAIN-2025-21,gle,177269,176654,0.0072\nCC-MAIN-2025-21,glg,838794,836476,0.0339\nCC-MAIN-2025-21,glv,9983,9971,0.0004\nCC-MAIN-2025-21,got,568,562,0.0000\nCC-MAIN-2025-21,grn,17226,17170,0.0007\nCC-MAIN-2025-21,guj,284820,284272,0.0115\nCC-MAIN-2025-21,hat,51242,51123,0.0021\nCC-MAIN-2025-21,hau,79260,79057,0.0032\nCC-MAIN-2025-21,haw,18661,18613,0.0008\nCC-MAIN-2025-21,heb,6766972,6739638,0.2732\nCC-MAIN-2025-21,hin,5329569,5312151,0.2151\nCC-MAIN-2025-21,hmn,14429,14360,0.0006\nCC-MAIN-2025-21,hrv,5849854,5829383,0.2362\nCC-MAIN-2025-21,hun,12477442,12431777,0.5037\nCC-MAIN-2025-21,hye,870589,867356,0.0351\nCC-MAIN-2025-21,ibo,18424,18381,0.0007\nCC-MAIN-2025-21,ik
u,6159,6145,0.0002\nCC-MAIN-2025-21,ile,7329,7306,0.0003\nCC-MAIN-2025-21,ina,12666,12630,0.0005\nCC-MAIN-2025-21,ind,28931470,28765763,1.1679\nCC-MAIN-2025-21,ipk,1527,1525,0.0001\nCC-MAIN-2025-21,isl,961845,957769,0.0388\nCC-MAIN-2025-21,ita,58591035,58333588,2.3652\nCC-MAIN-2025-21,jav,54176,54082,0.0022\nCC-MAIN-2025-21,jpn,120138356,119782767,4.8498\nCC-MAIN-2025-21,kal,19580,19460,0.0008\nCC-MAIN-2025-21,kan,352782,352163,0.0142\nCC-MAIN-2025-21,kas,67,67,0.0000\nCC-MAIN-2025-21,kat,1080239,1077113,0.0436\nCC-MAIN-2025-21,kaz,877716,874403,0.0354\nCC-MAIN-2025-21,kha,7846,7834,0.0003\nCC-MAIN-2025-21,khm,271265,269049,0.0110\nCC-MAIN-2025-21,kin,51381,51282,0.0021\nCC-MAIN-2025-21,kir,254291,253826,0.0103\nCC-MAIN-2025-21,kor,18346519,18284974,0.7406\nCC-MAIN-2025-21,kur,141462,141239,0.0057\nCC-MAIN-2025-21,lao,102860,102504,0.0042\nCC-MAIN-2025-21,lat,2825205,2820833,0.1140\nCC-MAIN-2025-21,lav,2235169,2224476,0.0902\nCC-MAIN-2025-21,lif,60,60,0.0000\nCC-MAIN-2025-21,lin,8570,8555,0.0003\nCC-MAIN-2025-21,lit,4235289,4213821,0.1710\nCC-MAIN-2025-21,ltz,92314,92066,0.0037\nCC-MAIN-2025-21,lug,3911,3907,0.0002\nCC-MAIN-2025-21,mal,612754,611868,0.0247\nCC-MAIN-2025-21,mar,729378,728189,0.0294\nCC-MAIN-2025-21,mfe,2366,2359,0.0001\nCC-MAIN-2025-21,mkd,969947,967085,0.0392\nCC-MAIN-2025-21,mlg,116939,116796,0.0047\nCC-MAIN-2025-21,mlt,81923,81616,0.0033\nCC-MAIN-2025-21,mon,367564,365996,0.0148\nCC-MAIN-2025-21,mri,33798,33641,0.0014\nCC-MAIN-2025-21,msa,1950008,1943997,0.0787\nCC-MAIN-2025-21,mya,342723,341810,0.0138\nCC-MAIN-2025-21,nau,797,796,0.0000\nCC-MAIN-2025-21,nep,1290578,1288036,0.0521\nCC-MAIN-2025-21,nld,45511608,45232883,1.8372\nCC-MAIN-2025-21,nno,386405,384401,0.0156\nCC-MAIN-2025-21,nor,7882177,7835639,0.3182\nCC-MAIN-2025-21,nso,2010,2009,0.0001\nCC-MAIN-2025-21,nya,14539,14492,0.0006\nCC-MAIN-2025-21,oci,81115,80952,0.0033\nCC-MAIN-2025-21,ori,148164,148001,0.0060\nCC-MAIN-2025-21,orm,15831,15815,0.0006\nCC-MAIN-2025-21,pan,180975,180674,0.0073
\nCC-MAIN-2025-21,pol,44547870,44357692,1.7983\nCC-MAIN-2025-21,por,57998100,57753092,2.3413\nCC-MAIN-2025-21,pus,97964,97744,0.0040\nCC-MAIN-2025-21,que,13086,13076,0.0005\nCC-MAIN-2025-21,roh,26426,26326,0.0011\nCC-MAIN-2025-21,ron,16328054,16261305,0.6591\nCC-MAIN-2025-21,run,1938,1936,0.0001\nCC-MAIN-2025-21,rus,145957224,145361382,5.8921\nCC-MAIN-2025-21,sag,15199,15196,0.0006\nCC-MAIN-2025-21,san,82727,82571,0.0033\nCC-MAIN-2025-21,sco,17976,17915,0.0007\nCC-MAIN-2025-21,sin,223087,222382,0.0090\nCC-MAIN-2025-21,slk,9057897,9015513,0.3657\nCC-MAIN-2025-21,slv,4176894,4146531,0.1686\nCC-MAIN-2025-21,smo,17584,17531,0.0007\nCC-MAIN-2025-21,sna,17452,17356,0.0007\nCC-MAIN-2025-21,snd,40839,40741,0.0016\nCC-MAIN-2025-21,som,131117,130862,0.0053\nCC-MAIN-2025-21,sot,14541,14484,0.0006\nCC-MAIN-2025-21,spa,116693094,116148862,4.7108\nCC-MAIN-2025-21,sqi,1244774,1241454,0.0502\nCC-MAIN-2025-21,srp,5438904,5420091,0.2196\nCC-MAIN-2025-21,ssw,810,805,0.0000\nCC-MAIN-2025-21,sun,30288,30240,0.0012\nCC-MAIN-2025-21,sux,249,248,0.0000\nCC-MAIN-2025-21,swa,246105,245714,0.0099\nCC-MAIN-2025-21,swe,16122971,16018864,0.6509\nCC-MAIN-2025-21,syr,6484,6478,0.0003\nCC-MAIN-2025-21,tam,1087100,1085226,0.0439\nCC-MAIN-2025-21,tat,188182,187806,0.0076\nCC-MAIN-2025-21,tel,520064,518741,0.0210\nCC-MAIN-2025-21,tgk,150009,149724,0.0061\nCC-MAIN-2025-21,tgl,214633,213824,0.0087\nCC-MAIN-2025-21,tha,10449160,10394749,0.4218\nCC-MAIN-2025-21,tir,20998,20880,0.0008\nCC-MAIN-2025-21,ton,2768,2763,0.0001\nCC-MAIN-2025-21,tsn,3375,3372,0.0001\nCC-MAIN-2025-21,tso,2141,2136,0.0001\nCC-MAIN-2025-21,tuk,55322,55078,0.0022\nCC-MAIN-2025-21,tur,29765668,29639821,1.2016\nCC-MAIN-2025-21,uig,34640,34405,0.0014\nCC-MAIN-2025-21,ukr,16322955,15942847,0.6589\nCC-MAIN-2025-21,urd,734168,731802,0.0296\nCC-MAIN-2025-21,uzb,575530,572892,0.0232\nCC-MAIN-2025-21,ven,630,630,0.0000\nCC-MAIN-2025-21,vie,25742993,25573690,1.0392\nCC-MAIN-2025-21,vol,18420,18398,0.0007\nCC-MAIN-2025-21,war,67809,67751,0.0027
\nCC-MAIN-2025-21,wol,3721,3707,0.0002\nCC-MAIN-2025-21,xho,18172,18087,0.0007\nCC-MAIN-2025-21,yid,34828,34767,0.0014\nCC-MAIN-2025-21,yor,21212,21176,0.0009\nCC-MAIN-2025-21,zha,2763,2755,0.0001\nCC-MAIN-2025-21,zho,120318383,120010602,4.8571\nCC-MAIN-2025-21,zul,32147,32031,0.0013\nCC-MAIN-2025-26,<unknown>,71987411,71987411,3.0176\nCC-MAIN-2025-26,aar,1857,1842,0.0001\nCC-MAIN-2025-26,abk,12586,12576,0.0005\nCC-MAIN-2025-26,afr,205688,205240,0.0086\nCC-MAIN-2025-26,aka,3473,3468,0.0001\nCC-MAIN-2025-26,amh,81209,80972,0.0034\nCC-MAIN-2025-26,ara,16183835,16106401,0.6784\nCC-MAIN-2025-26,asm,68145,68019,0.0029\nCC-MAIN-2025-26,aym,1938,1916,0.0001\nCC-MAIN-2025-26,aze,1459673,1455274,0.0612\nCC-MAIN-2025-26,bak,41091,41089,0.0017\nCC-MAIN-2025-26,bel,399374,398775,0.0167\nCC-MAIN-2025-26,ben,2587500,2581397,0.1085\nCC-MAIN-2025-26,bih,13353,13282,0.0006\nCC-MAIN-2025-26,bis,2217,2203,0.0001\nCC-MAIN-2025-26,bod,31988,31973,0.0013\nCC-MAIN-2025-26,bos,1199230,1196974,0.0503\nCC-MAIN-2025-26,bre,51532,51464,0.0022\nCC-MAIN-2025-26,bul,6102833,6083436,0.2558\nCC-MAIN-2025-26,cat,4277438,4249115,0.1793\nCC-MAIN-2025-26,ceb,57399,57376,0.0024\nCC-MAIN-2025-26,ces,23999798,23844246,1.0060\nCC-MAIN-2025-26,chr,628,628,0.0000\nCC-MAIN-2025-26,cos,52144,52032,0.0022\nCC-MAIN-2025-26,crs,2224,2211,0.0001\nCC-MAIN-2025-26,cym,280692,279319,0.0118\nCC-MAIN-2025-26,dan,10288929,10210092,0.4313\nCC-MAIN-2025-26,deu,131849535,130976647,5.5269\nCC-MAIN-2025-26,div,56342,56302,0.0024\nCC-MAIN-2025-26,dzo,3825,3820,0.0002\nCC-MAIN-2025-26,ell,12038431,11998515,0.5046\nCC-MAIN-2025-26,eng,1080052494,1073945372,45.2738\nCC-MAIN-2025-26,epo,215223,214885,0.0090\nCC-MAIN-2025-26,est,3114544,3098075,0.1306\nCC-MAIN-2025-26,eus,802010,798190,0.0336\nCC-MAIN-2025-26,fao,104034,103636,0.0044\nCC-MAIN-2025-26,fas,12461812,12430485,0.5224\nCC-MAIN-2025-26,fij,2227,2225,0.0001\nCC-MAIN-2025-26,fin,7886498,7839403,0.3306\nCC-MAIN-2025-26,fra,98280758,97654477,4.1197\nCC-MAIN-2025-26,fry,55187
,55112,0.0023\nCC-MAIN-2025-26,gla,35665,35618,0.0015\nCC-MAIN-2025-26,gle,171537,170794,0.0072\nCC-MAIN-2025-26,glg,664612,662651,0.0279\nCC-MAIN-2025-26,glv,14975,14957,0.0006\nCC-MAIN-2025-26,got,569,569,0.0000\nCC-MAIN-2025-26,grn,15357,15314,0.0006\nCC-MAIN-2025-26,guj,277786,277210,0.0116\nCC-MAIN-2025-26,hat,49564,49456,0.0021\nCC-MAIN-2025-26,hau,63959,63768,0.0027\nCC-MAIN-2025-26,haw,17387,17358,0.0007\nCC-MAIN-2025-26,heb,5527983,5505741,0.2317\nCC-MAIN-2025-26,hin,4975648,4963133,0.2086\nCC-MAIN-2025-26,hmn,15398,15346,0.0006\nCC-MAIN-2025-26,hrv,4821681,4802076,0.2021\nCC-MAIN-2025-26,hun,11439504,11393521,0.4795\nCC-MAIN-2025-26,hye,808238,805080,0.0339\nCC-MAIN-2025-26,ibo,19457,19386,0.0008\nCC-MAIN-2025-26,iku,5436,5416,0.0002\nCC-MAIN-2025-26,ile,6425,6401,0.0003\nCC-MAIN-2025-26,ina,11387,11358,0.0005\nCC-MAIN-2025-26,ind,23541252,23375143,0.9868\nCC-MAIN-2025-26,ipk,1668,1665,0.0001\nCC-MAIN-2025-26,isl,876485,872386,0.0367\nCC-MAIN-2025-26,ita,52179604,51922416,2.1873\nCC-MAIN-2025-26,jav,58924,58882,0.0025\nCC-MAIN-2025-26,jpn,119652953,119287237,5.0156\nCC-MAIN-2025-26,kal,18365,18274,0.0008\nCC-MAIN-2025-26,kan,337217,336667,0.0141\nCC-MAIN-2025-26,kas,86,86,0.0000\nCC-MAIN-2025-26,kat,1003584,1001043,0.0421\nCC-MAIN-2025-26,kaz,881819,878607,0.0370\nCC-MAIN-2025-26,kha,8114,8098,0.0003\nCC-MAIN-2025-26,khm,247392,245599,0.0104\nCC-MAIN-2025-26,kin,48374,48296,0.0020\nCC-MAIN-2025-26,kir,248932,248319,0.0104\nCC-MAIN-2025-26,kor,18149103,18080499,0.7608\nCC-MAIN-2025-26,kur,132174,131954,0.0055\nCC-MAIN-2025-26,lao,92051,91649,0.0039\nCC-MAIN-2025-26,lat,2233195,2229636,0.0936\nCC-MAIN-2025-26,lav,2144431,2133555,0.0899\nCC-MAIN-2025-26,lif,108,108,0.0000\nCC-MAIN-2025-26,lin,8107,8091,0.0003\nCC-MAIN-2025-26,lit,3961731,3940526,0.1661\nCC-MAIN-2025-26,ltz,90780,90561,0.0038\nCC-MAIN-2025-26,lug,4858,4853,0.0002\nCC-MAIN-2025-26,mal,564479,563506,0.0237\nCC-MAIN-2025-26,mar,683875,682745,0.0287\nCC-MAIN-2025-26,mfe,3032,3017,0.0001\nCC-MAIN-2
025-26,mkd,847582,844017,0.0355\nCC-MAIN-2025-26,mlg,122428,122234,0.0051\nCC-MAIN-2025-26,mlt,79419,79184,0.0033\nCC-MAIN-2025-26,mon,382344,381172,0.0160\nCC-MAIN-2025-26,mri,30652,30534,0.0013\nCC-MAIN-2025-26,msa,1721744,1716378,0.0722\nCC-MAIN-2025-26,mya,312991,312021,0.0131\nCC-MAIN-2025-26,nau,817,815,0.0000\nCC-MAIN-2025-26,nep,1141885,1140393,0.0479\nCC-MAIN-2025-26,nld,41465055,41201534,1.7381\nCC-MAIN-2025-26,nno,351861,350538,0.0147\nCC-MAIN-2025-26,nor,7315676,7268152,0.3067\nCC-MAIN-2025-26,nso,1706,1705,0.0001\nCC-MAIN-2025-26,nya,15031,15004,0.0006\nCC-MAIN-2025-26,oci,75455,75321,0.0032\nCC-MAIN-2025-26,ori,134358,134252,0.0056\nCC-MAIN-2025-26,orm,12226,12202,0.0005\nCC-MAIN-2025-26,pan,177344,176887,0.0074\nCC-MAIN-2025-26,pol,40763416,40579138,1.7087\nCC-MAIN-2025-26,por,52437717,52202715,2.1981\nCC-MAIN-2025-26,pus,80468,80261,0.0034\nCC-MAIN-2025-26,que,13557,13542,0.0006\nCC-MAIN-2025-26,roh,22476,22375,0.0009\nCC-MAIN-2025-26,ron,11892728,11845955,0.4985\nCC-MAIN-2025-26,run,1613,1613,0.0001\nCC-MAIN-2025-26,rus,142743970,142162713,5.9836\nCC-MAIN-2025-26,sag,8525,8524,0.0004\nCC-MAIN-2025-26,san,77518,77352,0.0032\nCC-MAIN-2025-26,sco,15924,15833,0.0007\nCC-MAIN-2025-26,sin,203585,202564,0.0085\nCC-MAIN-2025-26,slk,9133986,9090001,0.3829\nCC-MAIN-2025-26,slv,3115633,3097734,0.1306\nCC-MAIN-2025-26,smo,16500,16406,0.0007\nCC-MAIN-2025-26,sna,17647,17596,0.0007\nCC-MAIN-2025-26,snd,45991,45936,0.0019\nCC-MAIN-2025-26,som,117480,117262,0.0049\nCC-MAIN-2025-26,sot,14019,13941,0.0006\nCC-MAIN-2025-26,spa,100360474,99848717,4.2069\nCC-MAIN-2025-26,sqi,1116998,1113837,0.0468\nCC-MAIN-2025-26,srp,5114588,5097662,0.2144\nCC-MAIN-2025-26,ssw,618,611,0.0000\nCC-MAIN-2025-26,sun,33879,33829,0.0014\nCC-MAIN-2025-26,sux,300,299,0.0000\nCC-MAIN-2025-26,swa,247600,247209,0.0104\nCC-MAIN-2025-26,swe,14552387,14462055,0.6100\nCC-MAIN-2025-26,syr,6189,6174,0.0003\nCC-MAIN-2025-26,tam,989927,988076,0.0415\nCC-MAIN-2025-26,tat,183434,183102,0.0077\nCC-MAIN-2025
-26,tel,446071,444973,0.0187\nCC-MAIN-2025-26,tgk,162738,162520,0.0068\nCC-MAIN-2025-26,tgl,197809,196928,0.0083\nCC-MAIN-2025-26,tha,9110247,9060638,0.3819\nCC-MAIN-2025-26,tir,18765,18664,0.0008\nCC-MAIN-2025-26,ton,2318,2314,0.0001\nCC-MAIN-2025-26,tsn,4149,4148,0.0002\nCC-MAIN-2025-26,tso,1625,1622,0.0001\nCC-MAIN-2025-26,tuk,63683,63445,0.0027\nCC-MAIN-2025-26,tur,26655492,26505433,1.1173\nCC-MAIN-2025-26,uig,28314,28143,0.0012\nCC-MAIN-2025-26,ukr,16044605,15696607,0.6726\nCC-MAIN-2025-26,urd,697398,695287,0.0292\nCC-MAIN-2025-26,uzb,579054,576240,0.0243\nCC-MAIN-2025-26,ven,526,525,0.0000\nCC-MAIN-2025-26,vie,23751033,23557043,0.9956\nCC-MAIN-2025-26,vol,17148,17132,0.0007\nCC-MAIN-2025-26,war,68681,68622,0.0029\nCC-MAIN-2025-26,wol,3665,3657,0.0002\nCC-MAIN-2025-26,xho,19198,19134,0.0008\nCC-MAIN-2025-26,yid,36994,36935,0.0016\nCC-MAIN-2025-26,yor,22849,22806,0.0010\nCC-MAIN-2025-26,zha,3493,3487,0.0001\nCC-MAIN-2025-26,zho,127689877,127403535,5.3525\nCC-MAIN-2025-26,zul,28130,28058,0.0012\nCC-MAIN-2025-30,<unknown>,72651220,72651220,2.9989\nCC-MAIN-2025-30,aar,1609,1600,0.0001\nCC-MAIN-2025-30,abk,13243,13232,0.0005\nCC-MAIN-2025-30,afr,201390,200735,0.0083\nCC-MAIN-2025-30,aka,4378,4373,0.0002\nCC-MAIN-2025-30,amh,78992,78640,0.0033\nCC-MAIN-2025-30,ara,16534178,16447556,0.6825\nCC-MAIN-2025-30,asm,57278,57185,0.0024\nCC-MAIN-2025-30,aym,1959,1934,0.0001\nCC-MAIN-2025-30,aze,1437131,1433003,0.0593\nCC-MAIN-2025-30,bak,33814,33812,0.0014\nCC-MAIN-2025-30,bel,378223,377655,0.0156\nCC-MAIN-2025-30,ben,2521697,2516670,0.1041\nCC-MAIN-2025-30,bih,13097,13019,0.0005\nCC-MAIN-2025-30,bis,2117,2111,0.0001\nCC-MAIN-2025-30,bod,30567,30526,0.0013\nCC-MAIN-2025-30,bos,1261519,1257936,0.0521\nCC-MAIN-2025-30,bre,36477,36401,0.0015\nCC-MAIN-2025-30,bul,6273396,6253826,0.2590\nCC-MAIN-2025-30,cat,4300178,4269237,0.1775\nCC-MAIN-2025-30,ceb,40603,40548,0.0017\nCC-MAIN-2025-30,ces,24520378,24355216,1.0122\nCC-MAIN-2025-30,chr,535,535,0.0000\nCC-MAIN-2025-30,cos,49572,4948
4,0.0020\nCC-MAIN-2025-30,crs,1826,1811,0.0001\nCC-MAIN-2025-30,cym,256947,255803,0.0106\nCC-MAIN-2025-30,dan,11332827,11252612,0.4678\nCC-MAIN-2025-30,deu,135270240,134378757,5.5837\nCC-MAIN-2025-30,div,56416,56363,0.0023\nCC-MAIN-2025-30,dzo,2478,2470,0.0001\nCC-MAIN-2025-30,ell,12147756,12110965,0.5014\nCC-MAIN-2025-30,eng,1080823891,1074517353,44.6146\nCC-MAIN-2025-30,epo,192532,191869,0.0079\nCC-MAIN-2025-30,est,2885721,2870334,0.1191\nCC-MAIN-2025-30,eus,834080,830371,0.0344\nCC-MAIN-2025-30,fao,114861,114419,0.0047\nCC-MAIN-2025-30,fas,17861774,17812011,0.7373\nCC-MAIN-2025-30,fij,2091,2087,0.0001\nCC-MAIN-2025-30,fin,8124568,8075495,0.3354\nCC-MAIN-2025-30,fra,99164036,98562658,4.0933\nCC-MAIN-2025-30,fry,49238,49172,0.0020\nCC-MAIN-2025-30,gla,39580,39496,0.0016\nCC-MAIN-2025-30,gle,165369,164743,0.0068\nCC-MAIN-2025-30,glg,703102,701138,0.0290\nCC-MAIN-2025-30,glv,10659,10643,0.0004\nCC-MAIN-2025-30,got,603,601,0.0000\nCC-MAIN-2025-30,grn,17124,17064,0.0007\nCC-MAIN-2025-30,guj,269738,269147,0.0111\nCC-MAIN-2025-30,hat,44957,44898,0.0019\nCC-MAIN-2025-30,hau,66281,66051,0.0027\nCC-MAIN-2025-30,haw,17255,17219,0.0007\nCC-MAIN-2025-30,heb,5777061,5753171,0.2385\nCC-MAIN-2025-30,hin,4836654,4823483,0.1996\nCC-MAIN-2025-30,hmn,15246,15205,0.0006\nCC-MAIN-2025-30,hrv,5094517,5070971,0.2103\nCC-MAIN-2025-30,hun,11578388,11525761,0.4779\nCC-MAIN-2025-30,hye,790481,787485,0.0326\nCC-MAIN-2025-30,ibo,18174,18139,0.0008\nCC-MAIN-2025-30,iku,4745,4728,0.0002\nCC-MAIN-2025-30,ile,7306,7284,0.0003\nCC-MAIN-2025-30,ina,10701,10672,0.0004\nCC-MAIN-2025-30,ind,23117204,22965359,0.9542\nCC-MAIN-2025-30,ipk,1815,1812,0.0001\nCC-MAIN-2025-30,isl,943368,939417,0.0389\nCC-MAIN-2025-30,ita,58446265,58168458,2.4126\nCC-MAIN-2025-30,jav,47184,47115,0.0019\nCC-MAIN-2025-30,jpn,127870029,127458543,5.2783\nCC-MAIN-2025-30,kal,19838,19711,0.0008\nCC-MAIN-2025-30,kan,355177,354532,0.0147\nCC-MAIN-2025-30,kas,13,13,0.0000\nCC-MAIN-2025-30,kat,952609,949636,0.0393\nCC-MAIN-2025-30,kaz,8
03027,800356,0.0331\nCC-MAIN-2025-30,kha,7504,7498,0.0003\nCC-MAIN-2025-30,khm,264917,263963,0.0109\nCC-MAIN-2025-30,kin,49524,49397,0.0020\nCC-MAIN-2025-30,kir,244571,243796,0.0101\nCC-MAIN-2025-30,kor,18781578,18710755,0.7753\nCC-MAIN-2025-30,kur,144389,144128,0.0060\nCC-MAIN-2025-30,lao,87109,86614,0.0036\nCC-MAIN-2025-30,lat,2101909,2098475,0.0868\nCC-MAIN-2025-30,lav,2167684,2157958,0.0895\nCC-MAIN-2025-30,lif,136,136,0.0000\nCC-MAIN-2025-30,lin,6418,6404,0.0003\nCC-MAIN-2025-30,lit,3934255,3914120,0.1624\nCC-MAIN-2025-30,ltz,84339,84070,0.0035\nCC-MAIN-2025-30,lug,5233,5229,0.0002\nCC-MAIN-2025-30,mal,575159,574313,0.0237\nCC-MAIN-2025-30,mar,645657,644658,0.0267\nCC-MAIN-2025-30,mfe,1613,1606,0.0001\nCC-MAIN-2025-30,mkd,870752,867580,0.0359\nCC-MAIN-2025-30,mlg,88568,88248,0.0037\nCC-MAIN-2025-30,mlt,77260,76930,0.0032\nCC-MAIN-2025-30,mon,360230,358986,0.0149\nCC-MAIN-2025-30,mri,32192,32089,0.0013\nCC-MAIN-2025-30,msa,1761323,1756367,0.0727\nCC-MAIN-2025-30,mya,309069,307937,0.0128\nCC-MAIN-2025-30,nau,769,768,0.0000\nCC-MAIN-2025-30,nep,1162786,1161607,0.0480\nCC-MAIN-2025-30,nld,41502156,41235541,1.7131\nCC-MAIN-2025-30,nno,325225,323870,0.0134\nCC-MAIN-2025-30,nor,7450245,7401935,0.3075\nCC-MAIN-2025-30,nso,1599,1598,0.0001\nCC-MAIN-2025-30,nya,13991,13974,0.0006\nCC-MAIN-2025-30,oci,72352,72230,0.0030\nCC-MAIN-2025-30,ori,139186,139037,0.0057\nCC-MAIN-2025-30,orm,13090,13074,0.0005\nCC-MAIN-2025-30,pan,162637,162174,0.0067\nCC-MAIN-2025-30,pol,40449338,40275080,1.6697\nCC-MAIN-2025-30,por,52356997,52131067,2.1612\nCC-MAIN-2025-30,pus,78835,78621,0.0033\nCC-MAIN-2025-30,que,13516,13506,0.0006\nCC-MAIN-2025-30,roh,22083,21982,0.0009\nCC-MAIN-2025-30,ron,11973393,11926793,0.4942\nCC-MAIN-2025-30,run,1698,1698,0.0001\nCC-MAIN-2025-30,rus,141360999,140753188,5.8351\nCC-MAIN-2025-30,sag,7628,7627,0.0003\nCC-MAIN-2025-30,san,71466,71319,0.0029\nCC-MAIN-2025-30,sco,15831,15786,0.0007\nCC-MAIN-2025-30,sin,201634,200784,0.0083\nCC-MAIN-2025-30,slk,8956480,8912256
,0.3697\nCC-MAIN-2025-30,slv,3086781,3070939,0.1274\nCC-MAIN-2025-30,smo,16142,16107,0.0007\nCC-MAIN-2025-30,sna,17713,17638,0.0007\nCC-MAIN-2025-30,snd,44550,44517,0.0018\nCC-MAIN-2025-30,som,109394,109164,0.0045\nCC-MAIN-2025-30,sot,14730,14690,0.0006\nCC-MAIN-2025-30,spa,103863352,103330029,4.2873\nCC-MAIN-2025-30,sqi,1102245,1099414,0.0455\nCC-MAIN-2025-30,srp,5126036,5105501,0.2116\nCC-MAIN-2025-30,ssw,635,631,0.0000\nCC-MAIN-2025-30,sun,31962,31936,0.0013\nCC-MAIN-2025-30,sux,221,219,0.0000\nCC-MAIN-2025-30,swa,239948,239539,0.0099\nCC-MAIN-2025-30,swe,14828964,14733326,0.6121\nCC-MAIN-2025-30,syr,6577,6562,0.0003\nCC-MAIN-2025-30,tam,1036263,1034006,0.0428\nCC-MAIN-2025-30,tat,186350,185964,0.0077\nCC-MAIN-2025-30,tel,429713,428999,0.0177\nCC-MAIN-2025-30,tgk,159303,158995,0.0066\nCC-MAIN-2025-30,tgl,197338,196359,0.0081\nCC-MAIN-2025-30,tha,8919966,8876282,0.3682\nCC-MAIN-2025-30,tir,17100,17024,0.0007\nCC-MAIN-2025-30,ton,1725,1720,0.0001\nCC-MAIN-2025-30,tsn,3228,3225,0.0001\nCC-MAIN-2025-30,tso,1385,1382,0.0001\nCC-MAIN-2025-30,tuk,61044,60780,0.0025\nCC-MAIN-2025-30,tur,26663432,26500621,1.1006\nCC-MAIN-2025-30,uig,28772,28604,0.0012\nCC-MAIN-2025-30,ukr,15672731,15401348,0.6469\nCC-MAIN-2025-30,urd,701557,698995,0.0290\nCC-MAIN-2025-30,uzb,575935,573697,0.0238\nCC-MAIN-2025-30,ven,856,855,0.0000\nCC-MAIN-2025-30,vie,23059893,22886566,0.9519\nCC-MAIN-2025-30,vol,15300,15280,0.0006\nCC-MAIN-2025-30,war,61713,61620,0.0025\nCC-MAIN-2025-30,wol,3593,3576,0.0001\nCC-MAIN-2025-30,xho,21494,21388,0.0009\nCC-MAIN-2025-30,yid,41170,41099,0.0017\nCC-MAIN-2025-30,yor,25635,25605,0.0011\nCC-MAIN-2025-30,zha,3454,3447,0.0001\nCC-MAIN-2025-30,zho,135624228,135327269,5.5983\nCC-MAIN-2025-30,zul,33453,33391,0.0014\nCC-MAIN-2025-33,<unknown>,68205678,68205678,2.7925\nCC-MAIN-2025-33,aar,1511,1503,0.0001\nCC-MAIN-2025-33,abk,14340,14325,0.0006\nCC-MAIN-2025-33,afr,209151,208685,0.0086\nCC-MAIN-2025-33,aka,4082,4079,0.0002\nCC-MAIN-2025-33,amh,78830,78549,0.0032\nCC-MAIN-2
025-33,ara,15589993,15510746,0.6383\nCC-MAIN-2025-33,asm,60747,60693,0.0025\nCC-MAIN-2025-33,aym,1528,1510,0.0001\nCC-MAIN-2025-33,aze,1405679,1401020,0.0576\nCC-MAIN-2025-33,bak,35759,35753,0.0015\nCC-MAIN-2025-33,bel,366358,365889,0.0150\nCC-MAIN-2025-33,ben,2541153,2536036,0.1040\nCC-MAIN-2025-33,bih,12425,12407,0.0005\nCC-MAIN-2025-33,bis,2296,2268,0.0001\nCC-MAIN-2025-33,bod,30563,30519,0.0013\nCC-MAIN-2025-33,bos,1294711,1291525,0.0530\nCC-MAIN-2025-33,bre,80937,80850,0.0033\nCC-MAIN-2025-33,bul,6310445,6290240,0.2584\nCC-MAIN-2025-33,cat,4229416,4199364,0.1732\nCC-MAIN-2025-33,ceb,46620,46584,0.0019\nCC-MAIN-2025-33,ces,24917197,24760679,1.0202\nCC-MAIN-2025-33,chr,934,934,0.0000\nCC-MAIN-2025-33,cos,54822,54729,0.0022\nCC-MAIN-2025-33,crs,1637,1635,0.0001\nCC-MAIN-2025-33,cym,244284,243271,0.0100\nCC-MAIN-2025-33,dan,11777135,11694191,0.4822\nCC-MAIN-2025-33,deu,142130573,141220469,5.8191\nCC-MAIN-2025-33,div,59439,59379,0.0024\nCC-MAIN-2025-33,dzo,2361,2361,0.0001\nCC-MAIN-2025-33,ell,12834675,12794801,0.5255\nCC-MAIN-2025-33,eng,1081214884,1075138077,44.2668\nCC-MAIN-2025-33,epo,190041,189670,0.0078\nCC-MAIN-2025-33,est,2887003,2873593,0.1182\nCC-MAIN-2025-33,eus,753354,750021,0.0308\nCC-MAIN-2025-33,fao,115050,114624,0.0047\nCC-MAIN-2025-33,fas,19262528,19205384,0.7886\nCC-MAIN-2025-33,fij,2099,2096,0.0001\nCC-MAIN-2025-33,fin,8357716,8311967,0.3422\nCC-MAIN-2025-33,fra,108835763,108160260,4.4559\nCC-MAIN-2025-33,fry,41408,41302,0.0017\nCC-MAIN-2025-33,gla,37265,37206,0.0015\nCC-MAIN-2025-33,gle,171333,170817,0.0070\nCC-MAIN-2025-33,glg,664327,662102,0.0272\nCC-MAIN-2025-33,glv,9170,9157,0.0004\nCC-MAIN-2025-33,got,633,632,0.0000\nCC-MAIN-2025-33,grn,19245,19211,0.0008\nCC-MAIN-2025-33,guj,258506,257812,0.0106\nCC-MAIN-2025-33,hat,61119,61012,0.0025\nCC-MAIN-2025-33,hau,59616,59433,0.0024\nCC-MAIN-2025-33,haw,17069,17030,0.0007\nCC-MAIN-2025-33,heb,5985208,5960947,0.2450\nCC-MAIN-2025-33,hin,4707810,4697113,0.1927\nCC-MAIN-2025-33,hmn,17871,17826,0.0007\n
CC-MAIN-2025-33,hrv,5327084,5306129,0.2181\nCC-MAIN-2025-33,hun,12010113,11961223,0.4917\nCC-MAIN-2025-33,hye,795438,792324,0.0326\nCC-MAIN-2025-33,ibo,18564,18510,0.0008\nCC-MAIN-2025-33,iku,5072,5024,0.0002\nCC-MAIN-2025-33,ile,9102,9078,0.0004\nCC-MAIN-2025-33,ina,11930,11904,0.0005\nCC-MAIN-2025-33,ind,23668200,23535714,0.9690\nCC-MAIN-2025-33,ipk,1480,1479,0.0001\nCC-MAIN-2025-33,isl,1005186,1001291,0.0412\nCC-MAIN-2025-33,ita,51832253,51576169,2.1221\nCC-MAIN-2025-33,jav,61370,61304,0.0025\nCC-MAIN-2025-33,jpn,124798510,124401364,5.1095\nCC-MAIN-2025-33,kal,19858,19759,0.0008\nCC-MAIN-2025-33,kan,341405,340852,0.0140\nCC-MAIN-2025-33,kas,48,48,0.0000\nCC-MAIN-2025-33,kat,980060,977629,0.0401\nCC-MAIN-2025-33,kaz,851521,848049,0.0349\nCC-MAIN-2025-33,kha,7366,7364,0.0003\nCC-MAIN-2025-33,khm,241044,239920,0.0099\nCC-MAIN-2025-33,kin,48746,48522,0.0020\nCC-MAIN-2025-33,kir,258327,257530,0.0106\nCC-MAIN-2025-33,kor,18476985,18416439,0.7565\nCC-MAIN-2025-33,kur,139344,139142,0.0057\nCC-MAIN-2025-33,lao,91468,91172,0.0037\nCC-MAIN-2025-33,lat,2288359,2284584,0.0937\nCC-MAIN-2025-33,lav,2160419,2151356,0.0885\nCC-MAIN-2025-33,lif,28,28,0.0000\nCC-MAIN-2025-33,lin,6921,6900,0.0003\nCC-MAIN-2025-33,lit,4094243,4073074,0.1676\nCC-MAIN-2025-33,ltz,84001,83673,0.0034\nCC-MAIN-2025-33,lug,2987,2978,0.0001\nCC-MAIN-2025-33,mal,552084,550466,0.0226\nCC-MAIN-2025-33,mar,608961,607796,0.0249\nCC-MAIN-2025-33,mfe,4904,4896,0.0002\nCC-MAIN-2025-33,mkd,910122,906617,0.0373\nCC-MAIN-2025-33,mlg,102343,102099,0.0042\nCC-MAIN-2025-33,mlt,74220,73835,0.0030\nCC-MAIN-2025-33,mon,348023,346807,0.0142\nCC-MAIN-2025-33,mri,30091,29932,0.0012\nCC-MAIN-2025-33,msa,1826212,1821135,0.0748\nCC-MAIN-2025-33,mya,332497,331517,0.0136\nCC-MAIN-2025-33,nau,796,795,0.0000\nCC-MAIN-2025-33,nep,1115432,1113858,0.0457\nCC-MAIN-2025-33,nld,44287771,44005959,1.8132\nCC-MAIN-2025-33,nno,335789,334784,0.0137\nCC-MAIN-2025-33,nor,7649717,7606292,0.3132\nCC-MAIN-2025-33,nso,1967,1961,0.0001\nCC-MAIN-2025-3
3,nya,13469,13421,0.0006\nCC-MAIN-2025-33,oci,74707,74587,0.0031\nCC-MAIN-2025-33,ori,139576,139356,0.0057\nCC-MAIN-2025-33,orm,14098,14075,0.0006\nCC-MAIN-2025-33,pan,173548,173067,0.0071\nCC-MAIN-2025-33,pol,41911861,41741007,1.7159\nCC-MAIN-2025-33,por,53237518,53014053,2.1796\nCC-MAIN-2025-33,pus,92554,92323,0.0038\nCC-MAIN-2025-33,que,15297,15290,0.0006\nCC-MAIN-2025-33,roh,26243,26026,0.0011\nCC-MAIN-2025-33,ron,13001276,12948324,0.5323\nCC-MAIN-2025-33,run,1431,1428,0.0001\nCC-MAIN-2025-33,rus,149267804,148654057,6.1113\nCC-MAIN-2025-33,sag,7712,7712,0.0003\nCC-MAIN-2025-33,san,73276,73121,0.0030\nCC-MAIN-2025-33,sco,14644,14602,0.0006\nCC-MAIN-2025-33,sin,210190,209443,0.0086\nCC-MAIN-2025-33,slk,9593278,9542924,0.3928\nCC-MAIN-2025-33,slv,3280242,3266692,0.1343\nCC-MAIN-2025-33,smo,16815,16771,0.0007\nCC-MAIN-2025-33,sna,17534,17460,0.0007\nCC-MAIN-2025-33,snd,41181,41125,0.0017\nCC-MAIN-2025-33,som,108426,108183,0.0044\nCC-MAIN-2025-33,sot,14273,14201,0.0006\nCC-MAIN-2025-33,spa,106432508,105902987,4.3575\nCC-MAIN-2025-33,sqi,1128056,1125578,0.0462\nCC-MAIN-2025-33,srp,5230180,5212297,0.2141\nCC-MAIN-2025-33,ssw,609,601,0.0000\nCC-MAIN-2025-33,sun,33730,33687,0.0014\nCC-MAIN-2025-33,sux,214,214,0.0000\nCC-MAIN-2025-33,swa,257298,256898,0.0105\nCC-MAIN-2025-33,swe,15306528,15215291,0.6267\nCC-MAIN-2025-33,syr,6059,6049,0.0002\nCC-MAIN-2025-33,tam,1041041,1039359,0.0426\nCC-MAIN-2025-33,tat,181070,180739,0.0074\nCC-MAIN-2025-33,tel,408418,407740,0.0167\nCC-MAIN-2025-33,tgk,162107,161905,0.0066\nCC-MAIN-2025-33,tgl,198930,198100,0.0081\nCC-MAIN-2025-33,tha,9141736,9098250,0.3743\nCC-MAIN-2025-33,tir,17609,17536,0.0007\nCC-MAIN-2025-33,ton,2104,2101,0.0001\nCC-MAIN-2025-33,tsn,3264,3261,0.0001\nCC-MAIN-2025-33,tso,1254,1249,0.0001\nCC-MAIN-2025-33,tuk,26114,25928,0.0011\nCC-MAIN-2025-33,tur,26938192,26790505,1.1029\nCC-MAIN-2025-33,uig,28856,28689,0.0012\nCC-MAIN-2025-33,ukr,16748693,16372540,0.6857\nCC-MAIN-2025-33,urd,670293,667863,0.0274\nCC-MAIN-2025-33,uz
b,578680,576637,0.0237\nCC-MAIN-2025-33,ven,517,513,0.0000\nCC-MAIN-2025-33,vie,25221098,25059809,1.0326\nCC-MAIN-2025-33,vol,15003,14982,0.0006\nCC-MAIN-2025-33,war,57804,57764,0.0024\nCC-MAIN-2025-33,wol,3097,3086,0.0001\nCC-MAIN-2025-33,xho,20562,20496,0.0008\nCC-MAIN-2025-33,yid,41988,41941,0.0017\nCC-MAIN-2025-33,yor,25934,25875,0.0011\nCC-MAIN-2025-33,zha,3398,3390,0.0001\nCC-MAIN-2025-33,zho,127147205,126851559,5.2056\nCC-MAIN-2025-33,zul,33718,33598,0.0014\nCC-MAIN-2025-38,<unknown>,65968491,65968491,2.7649\nCC-MAIN-2025-38,aar,1621,1615,0.0001\nCC-MAIN-2025-38,abk,14374,14365,0.0006\nCC-MAIN-2025-38,afr,195077,194579,0.0082\nCC-MAIN-2025-38,aka,3495,3486,0.0001\nCC-MAIN-2025-38,amh,78701,78377,0.0033\nCC-MAIN-2025-38,ara,15625490,15550969,0.6549\nCC-MAIN-2025-38,asm,59982,59935,0.0025\nCC-MAIN-2025-38,aym,1945,1927,0.0001\nCC-MAIN-2025-38,aze,1488881,1485088,0.0624\nCC-MAIN-2025-38,bak,34134,34132,0.0014\nCC-MAIN-2025-38,bel,364189,363567,0.0153\nCC-MAIN-2025-38,ben,2608568,2603610,0.1093\nCC-MAIN-2025-38,bih,12461,12432,0.0005\nCC-MAIN-2025-38,bis,2117,2107,0.0001\nCC-MAIN-2025-38,bod,20427,20420,0.0009\nCC-MAIN-2025-38,bos,1328186,1324526,0.0557\nCC-MAIN-2025-38,bre,38739,38639,0.0016\nCC-MAIN-2025-38,bul,6775684,6752698,0.2840\nCC-MAIN-2025-38,cat,4154845,4127407,0.1741\nCC-MAIN-2025-38,ceb,50173,50112,0.0021\nCC-MAIN-2025-38,ces,23575841,23447912,0.9881\nCC-MAIN-2025-38,chr,893,893,0.0000\nCC-MAIN-2025-38,cos,52049,51865,0.0022\nCC-MAIN-2025-38,crs,1661,1574,0.0001\nCC-MAIN-2025-38,cym,224249,223122,0.0094\nCC-MAIN-2025-38,dan,10575358,10506504,0.4432\nCC-MAIN-2025-38,deu,143301622,142348472,6.0060\nCC-MAIN-2025-38,div,59600,59500,0.0025\nCC-MAIN-2025-38,dzo,1402,1401,0.0001\nCC-MAIN-2025-38,ell,11685958,11650870,0.4898\nCC-MAIN-2025-38,eng,1057662483,1051537054,44.3285\nCC-MAIN-2025-38,epo,175222,174974,0.0073\nCC-MAIN-2025-38,est,2792272,2779819,0.1170\nCC-MAIN-2025-38,eus,729564,726625,0.0306\nCC-MAIN-2025-38,fao,107715,107404,0.0045\nCC-MAIN-2025-38
,fas,18644214,18591164,0.7814\nCC-MAIN-2025-38,fij,2638,2635,0.0001\nCC-MAIN-2025-38,fin,7597452,7555688,0.3184\nCC-MAIN-2025-38,fra,106425942,105790229,4.4605\nCC-MAIN-2025-38,fry,76355,76216,0.0032\nCC-MAIN-2025-38,gla,34144,34046,0.0014\nCC-MAIN-2025-38,gle,165290,164510,0.0069\nCC-MAIN-2025-38,glg,665518,663378,0.0279\nCC-MAIN-2025-38,glv,10650,10634,0.0004\nCC-MAIN-2025-38,got,541,540,0.0000\nCC-MAIN-2025-38,grn,18195,18036,0.0008\nCC-MAIN-2025-38,guj,261744,261120,0.0110\nCC-MAIN-2025-38,hat,40143,40008,0.0017\nCC-MAIN-2025-38,hau,64265,64113,0.0027\nCC-MAIN-2025-38,haw,19738,19671,0.0008\nCC-MAIN-2025-38,heb,5452239,5432939,0.2285\nCC-MAIN-2025-38,hin,4604613,4594477,0.1930\nCC-MAIN-2025-38,hmn,15881,15816,0.0007\nCC-MAIN-2025-38,hrv,4964667,4943652,0.2081\nCC-MAIN-2025-38,hun,11080924,11034719,0.4644\nCC-MAIN-2025-38,hye,841059,837507,0.0353\nCC-MAIN-2025-38,ibo,19154,19069,0.0008\nCC-MAIN-2025-38,iku,5280,5262,0.0002\nCC-MAIN-2025-38,ile,8250,8216,0.0003\nCC-MAIN-2025-38,ina,11990,11817,0.0005\nCC-MAIN-2025-38,ind,22678559,22537008,0.9505\nCC-MAIN-2025-38,ipk,1346,1344,0.0001\nCC-MAIN-2025-38,isl,989427,984827,0.0415\nCC-MAIN-2025-38,ita,48690497,48454797,2.0407\nCC-MAIN-2025-38,jav,58079,58002,0.0024\nCC-MAIN-2025-38,jpn,124113848,123713572,5.2018\nCC-MAIN-2025-38,kal,21184,21074,0.0009\nCC-MAIN-2025-38,kan,339666,339065,0.0142\nCC-MAIN-2025-38,kas,60,60,0.0000\nCC-MAIN-2025-38,kat,1032197,1029289,0.0433\nCC-MAIN-2025-38,kaz,840783,837918,0.0352\nCC-MAIN-2025-38,kha,6694,6688,0.0003\nCC-MAIN-2025-38,khm,249462,248343,0.0105\nCC-MAIN-2025-38,kin,50606,50352,0.0021\nCC-MAIN-2025-38,kir,245862,245236,0.0103\nCC-MAIN-2025-38,kor,18499657,18445242,0.7754\nCC-MAIN-2025-38,kur,138820,138616,0.0058\nCC-MAIN-2025-38,lao,98512,98067,0.0041\nCC-MAIN-2025-38,lat,2345551,2341960,0.0983\nCC-MAIN-2025-38,lav,2065280,2055827,0.0866\nCC-MAIN-2025-38,lif,53,53,0.0000\nCC-MAIN-2025-38,lin,6435,6428,0.0003\nCC-MAIN-2025-38,lit,3819192,3800623,0.1601\nCC-MAIN-2025-38,ltz,94507
,94179,0.0040\nCC-MAIN-2025-38,lug,3545,3529,0.0001\nCC-MAIN-2025-38,mal,540700,539976,0.0227\nCC-MAIN-2025-38,mar,632447,631134,0.0265\nCC-MAIN-2025-38,mfe,4810,4802,0.0002\nCC-MAIN-2025-38,mkd,894454,891479,0.0375\nCC-MAIN-2025-38,mlg,73254,72993,0.0031\nCC-MAIN-2025-38,mlt,85827,85268,0.0036\nCC-MAIN-2025-38,mon,352161,350885,0.0148\nCC-MAIN-2025-38,mri,34143,33980,0.0014\nCC-MAIN-2025-38,msa,1609531,1604540,0.0675\nCC-MAIN-2025-38,mya,323571,322505,0.0136\nCC-MAIN-2025-38,nau,725,723,0.0000\nCC-MAIN-2025-38,nep,1084307,1083211,0.0454\nCC-MAIN-2025-38,nld,44749673,44451103,1.8755\nCC-MAIN-2025-38,nno,333776,332733,0.0140\nCC-MAIN-2025-38,nor,7667260,7622961,0.3213\nCC-MAIN-2025-38,nso,2134,2133,0.0001\nCC-MAIN-2025-38,nya,13436,13366,0.0006\nCC-MAIN-2025-38,oci,78500,78290,0.0033\nCC-MAIN-2025-38,ori,123441,123193,0.0052\nCC-MAIN-2025-38,orm,11512,11497,0.0005\nCC-MAIN-2025-38,pan,176705,176366,0.0074\nCC-MAIN-2025-38,pol,39611977,39446043,1.6602\nCC-MAIN-2025-38,por,49379728,49179228,2.0696\nCC-MAIN-2025-38,pus,83466,83198,0.0035\nCC-MAIN-2025-38,que,15401,15394,0.0006\nCC-MAIN-2025-38,roh,26775,26638,0.0011\nCC-MAIN-2025-38,ron,11498389,11453641,0.4819\nCC-MAIN-2025-38,run,1510,1501,0.0001\nCC-MAIN-2025-38,rus,145741365,145150267,6.1083\nCC-MAIN-2025-38,sag,8600,8599,0.0004\nCC-MAIN-2025-38,san,57256,57102,0.0024\nCC-MAIN-2025-38,sco,15757,15698,0.0007\nCC-MAIN-2025-38,sin,196749,196162,0.0082\nCC-MAIN-2025-38,slk,9192047,9141983,0.3853\nCC-MAIN-2025-38,slv,3016017,3003729,0.1264\nCC-MAIN-2025-38,smo,17440,17365,0.0007\nCC-MAIN-2025-38,sna,17200,17112,0.0007\nCC-MAIN-2025-38,snd,38482,38399,0.0016\nCC-MAIN-2025-38,som,103999,103746,0.0044\nCC-MAIN-2025-38,sot,15297,15215,0.0006\nCC-MAIN-2025-38,spa,104199271,103587656,4.3672\nCC-MAIN-2025-38,sqi,1131119,1128498,0.0474\nCC-MAIN-2025-38,srp,4899526,4882010,0.2053\nCC-MAIN-2025-38,ssw,663,660,0.0000\nCC-MAIN-2025-38,sun,36168,36091,0.0015\nCC-MAIN-2025-38,sux,265,265,0.0000\nCC-MAIN-2025-38,swa,248037,247668,0.010
4\nCC-MAIN-2025-38,swe,14015640,13933044,0.5874\nCC-MAIN-2025-38,syr,6899,6886,0.0003\nCC-MAIN-2025-38,tam,943952,942281,0.0396\nCC-MAIN-2025-38,tat,190762,190328,0.0080\nCC-MAIN-2025-38,tel,415735,414917,0.0174\nCC-MAIN-2025-38,tgk,168658,168299,0.0071\nCC-MAIN-2025-38,tgl,209435,208731,0.0088\nCC-MAIN-2025-38,tha,9166176,9120203,0.3842\nCC-MAIN-2025-38,tir,22409,22302,0.0009\nCC-MAIN-2025-38,ton,2462,2457,0.0001\nCC-MAIN-2025-38,tsn,3142,3134,0.0001\nCC-MAIN-2025-38,tso,1414,1412,0.0001\nCC-MAIN-2025-38,tuk,28203,27996,0.0012\nCC-MAIN-2025-38,tur,28566927,28425462,1.1973\nCC-MAIN-2025-38,uig,29424,29218,0.0012\nCC-MAIN-2025-38,ukr,16898981,16524477,0.7083\nCC-MAIN-2025-38,urd,675646,673851,0.0283\nCC-MAIN-2025-38,uzb,595623,593288,0.0250\nCC-MAIN-2025-38,ven,953,952,0.0000\nCC-MAIN-2025-38,vie,25169123,24991503,1.0549\nCC-MAIN-2025-38,vol,19413,19395,0.0008\nCC-MAIN-2025-38,war,57658,57547,0.0024\nCC-MAIN-2025-38,wol,3512,3500,0.0001\nCC-MAIN-2025-38,xho,19184,19088,0.0008\nCC-MAIN-2025-38,yid,44404,44316,0.0019\nCC-MAIN-2025-38,yor,26236,26138,0.0011\nCC-MAIN-2025-38,zha,2495,2488,0.0001\nCC-MAIN-2025-38,zho,123110314,122836459,5.1598\nCC-MAIN-2025-38,zul,30381,30277,0.0013\nCC-MAIN-2025-43,<unknown>,67562821,67562821,2.5819\nCC-MAIN-2025-43,aar,1780,1769,0.0001\nCC-MAIN-2025-43,abk,15772,15748,0.0006\nCC-MAIN-2025-43,afr,213848,213089,0.0082\nCC-MAIN-2025-43,aka,3057,3052,0.0001\nCC-MAIN-2025-43,amh,90040,89701,0.0034\nCC-MAIN-2025-43,ara,17280169,17204755,0.6604\nCC-MAIN-2025-43,asm,66498,66433,0.0025\nCC-MAIN-2025-43,aym,1870,1854,0.0001\nCC-MAIN-2025-43,aze,1417566,1413741,0.0542\nCC-MAIN-2025-43,bak,22224,22223,0.0008\nCC-MAIN-2025-43,bel,348256,347251,0.0133\nCC-MAIN-2025-43,ben,2908882,2903545,0.1112\nCC-MAIN-2025-43,bih,15657,15586,0.0006\nCC-MAIN-2025-43,bis,2284,2280,0.0001\nCC-MAIN-2025-43,bod,27802,27728,0.0011\nCC-MAIN-2025-43,bos,1292358,1289600,0.0494\nCC-MAIN-2025-43,bre,81628,81474,0.0031\nCC-MAIN-2025-43,bul,6744174,6722526,0.2577\nCC-MAIN-2025-
43,cat,4643673,4616475,0.1775\nCC-MAIN-2025-43,ceb,46758,46733,0.0018\nCC-MAIN-2025-43,ces,27933042,27783229,1.0675\nCC-MAIN-2025-43,chr,714,712,0.0000\nCC-MAIN-2025-43,cos,54501,54361,0.0021\nCC-MAIN-2025-43,crs,2037,2012,0.0001\nCC-MAIN-2025-43,cym,262368,260891,0.0100\nCC-MAIN-2025-43,dan,13234465,13144519,0.5058\nCC-MAIN-2025-43,deu,147879804,146902440,5.6512\nCC-MAIN-2025-43,div,53839,53767,0.0021\nCC-MAIN-2025-43,dzo,2106,2104,0.0001\nCC-MAIN-2025-43,ell,12818676,12780425,0.4899\nCC-MAIN-2025-43,eng,1173089039,1166625625,44.8292\nCC-MAIN-2025-43,epo,177312,177107,0.0068\nCC-MAIN-2025-43,est,3025935,3010506,0.1156\nCC-MAIN-2025-43,eus,793832,790612,0.0303\nCC-MAIN-2025-43,fao,121977,121551,0.0047\nCC-MAIN-2025-43,fas,19306899,19251032,0.7378\nCC-MAIN-2025-43,fij,2320,2318,0.0001\nCC-MAIN-2025-43,fin,8824460,8775388,0.3372\nCC-MAIN-2025-43,fra,116221365,115514672,4.4414\nCC-MAIN-2025-43,fry,37401,37328,0.0014\nCC-MAIN-2025-43,gla,35665,35614,0.0014\nCC-MAIN-2025-43,gle,150233,149839,0.0057\nCC-MAIN-2025-43,glg,681170,679015,0.0260\nCC-MAIN-2025-43,glv,11376,11358,0.0004\nCC-MAIN-2025-43,got,535,534,0.0000\nCC-MAIN-2025-43,grn,21485,21434,0.0008\nCC-MAIN-2025-43,guj,302728,302019,0.0116\nCC-MAIN-2025-43,hat,60007,59914,0.0023\nCC-MAIN-2025-43,hau,64524,64302,0.0025\nCC-MAIN-2025-43,haw,17715,17636,0.0007\nCC-MAIN-2025-43,heb,6407452,6381547,0.2449\nCC-MAIN-2025-43,hin,5160541,5149330,0.1972\nCC-MAIN-2025-43,hmn,14565,14536,0.0006\nCC-MAIN-2025-43,hrv,5018732,4999264,0.1918\nCC-MAIN-2025-43,hun,12332477,12285101,0.4713\nCC-MAIN-2025-43,hye,775574,772898,0.0296\nCC-MAIN-2025-43,ibo,19280,19233,0.0007\nCC-MAIN-2025-43,iku,5933,5917,0.0002\nCC-MAIN-2025-43,ile,7765,7746,0.0003\nCC-MAIN-2025-43,ina,12478,12441,0.0005\nCC-MAIN-2025-43,ind,26492739,26362781,1.0124\nCC-MAIN-2025-43,ipk,1503,1500,0.0001\nCC-MAIN-2025-43,isl,1006403,1001637,0.0385\nCC-MAIN-2025-43,ita,53250061,53001238,2.0349\nCC-MAIN-2025-43,jav,44071,43979,0.0017\nCC-MAIN-2025-43,jpn,137913697,137498240,
5.2703\nCC-MAIN-2025-43,kal,21167,21066,0.0008\nCC-MAIN-2025-43,kan,368868,368152,0.0141\nCC-MAIN-2025-43,kas,112,112,0.0000\nCC-MAIN-2025-43,kat,1010164,1007249,0.0386\nCC-MAIN-2025-43,kaz,869456,864462,0.0332\nCC-MAIN-2025-43,kha,7050,7040,0.0003\nCC-MAIN-2025-43,khm,278868,278140,0.0107\nCC-MAIN-2025-43,kin,55677,55524,0.0021\nCC-MAIN-2025-43,kir,249748,249049,0.0095\nCC-MAIN-2025-43,kor,18696716,18639278,0.7145\nCC-MAIN-2025-43,kur,158102,157684,0.0060\nCC-MAIN-2025-43,lao,99558,99009,0.0038\nCC-MAIN-2025-43,lat,2612486,2608424,0.0998\nCC-MAIN-2025-43,lav,2249044,2239211,0.0859\nCC-MAIN-2025-43,lif,117,117,0.0000\nCC-MAIN-2025-43,lin,6475,6465,0.0002\nCC-MAIN-2025-43,lit,4254374,4234181,0.1626\nCC-MAIN-2025-43,ltz,73540,73298,0.0028\nCC-MAIN-2025-43,lug,3609,3600,0.0001\nCC-MAIN-2025-43,mal,573042,572302,0.0219\nCC-MAIN-2025-43,mar,698378,696870,0.0267\nCC-MAIN-2025-43,mfe,4553,4549,0.0002\nCC-MAIN-2025-43,mkd,881449,878329,0.0337\nCC-MAIN-2025-43,mlg,97422,97200,0.0037\nCC-MAIN-2025-43,mlt,84008,83673,0.0032\nCC-MAIN-2025-43,mon,372966,371885,0.0143\nCC-MAIN-2025-43,mri,33565,33461,0.0013\nCC-MAIN-2025-43,msa,1871996,1866127,0.0715\nCC-MAIN-2025-43,mya,354913,353855,0.0136\nCC-MAIN-2025-43,nau,1045,1043,0.0000\nCC-MAIN-2025-43,nep,1292666,1291470,0.0494\nCC-MAIN-2025-43,nld,46251677,45953656,1.7675\nCC-MAIN-2025-43,nno,350471,345563,0.0134\nCC-MAIN-2025-43,nor,7813587,7760373,0.2986\nCC-MAIN-2025-43,nso,1906,1905,0.0001\nCC-MAIN-2025-43,nya,14900,14870,0.0006\nCC-MAIN-2025-43,oci,51561,51444,0.0020\nCC-MAIN-2025-43,ori,147182,146625,0.0056\nCC-MAIN-2025-43,orm,15536,15511,0.0006\nCC-MAIN-2025-43,pan,168635,168303,0.0064\nCC-MAIN-2025-43,pol,47680851,47485556,1.8221\nCC-MAIN-2025-43,por,58938573,58697163,2.2523\nCC-MAIN-2025-43,pus,99128,98875,0.0038\nCC-MAIN-2025-43,que,15311,15298,0.0006\nCC-MAIN-2025-43,roh,26657,26478,0.0010\nCC-MAIN-2025-43,ron,13503243,13448256,0.5160\nCC-MAIN-2025-43,run,2335,2334,0.0001\nCC-MAIN-2025-43,rus,152892019,152311119,5.8427\nCC
-MAIN-2025-43,sag,7457,7457,0.0003\nCC-MAIN-2025-43,san,65178,65016,0.0025\nCC-MAIN-2025-43,sco,34732,34688,0.0013\nCC-MAIN-2025-43,sin,218148,217806,0.0083\nCC-MAIN-2025-43,slk,9932512,9874227,0.3796\nCC-MAIN-2025-43,slv,3000399,2988333,0.1147\nCC-MAIN-2025-43,smo,16624,16607,0.0006\nCC-MAIN-2025-43,sna,19686,19628,0.0008\nCC-MAIN-2025-43,snd,37557,37539,0.0014\nCC-MAIN-2025-43,som,119286,118918,0.0046\nCC-MAIN-2025-43,sot,15344,15278,0.0006\nCC-MAIN-2025-43,spa,116759569,116164909,4.4619\nCC-MAIN-2025-43,sqi,1170146,1167713,0.0447\nCC-MAIN-2025-43,srp,5473573,5453091,0.2092\nCC-MAIN-2025-43,ssw,670,664,0.0000\nCC-MAIN-2025-43,sun,30157,30134,0.0012\nCC-MAIN-2025-43,sux,271,271,0.0000\nCC-MAIN-2025-43,swa,253440,252904,0.0097\nCC-MAIN-2025-43,swe,17215601,17110100,0.6579\nCC-MAIN-2025-43,syr,7124,7106,0.0003\nCC-MAIN-2025-43,tam,1127520,1125054,0.0431\nCC-MAIN-2025-43,tat,167204,166867,0.0064\nCC-MAIN-2025-43,tel,483678,482931,0.0185\nCC-MAIN-2025-43,tgk,140528,140299,0.0054\nCC-MAIN-2025-43,tgl,197860,197212,0.0076\nCC-MAIN-2025-43,tha,10081391,10037906,0.3853\nCC-MAIN-2025-43,tir,23354,23290,0.0009\nCC-MAIN-2025-43,ton,2082,2077,0.0001\nCC-MAIN-2025-43,tsn,3156,3152,0.0001\nCC-MAIN-2025-43,tso,1904,1899,0.0001\nCC-MAIN-2025-43,tuk,29589,29475,0.0011\nCC-MAIN-2025-43,tur,30135653,30008253,1.1516\nCC-MAIN-2025-43,uig,32095,31840,0.0012\nCC-MAIN-2025-43,ukr,16829114,16413391,0.6431\nCC-MAIN-2025-43,urd,699139,695941,0.0267\nCC-MAIN-2025-43,uzb,542763,540565,0.0207\nCC-MAIN-2025-43,ven,1167,1167,0.0000\nCC-MAIN-2025-43,vie,26896723,26732629,1.0278\nCC-MAIN-2025-43,vol,18244,18215,0.0007\nCC-MAIN-2025-43,war,40393,40302,0.0015\nCC-MAIN-2025-43,wol,4649,4545,0.0002\nCC-MAIN-2025-43,xho,20486,20447,0.0008\nCC-MAIN-2025-43,yid,46306,46251,0.0018\nCC-MAIN-2025-43,yor,26171,26129,0.0010\nCC-MAIN-2025-43,zha,1827,1822,0.0001\nCC-MAIN-2025-43,zho,133138627,132797805,5.0878\nCC-MAIN-2025-43,zul,35136,35090,0.0013\nCC-MAIN-2025-47,<unknown>,67560732,67560732,2.9445\nCC-MAIN-20
25-47,aar,1767,1758,0.0001\nCC-MAIN-2025-47,abk,14511,14156,0.0006\nCC-MAIN-2025-47,afr,210396,208806,0.0092\nCC-MAIN-2025-47,aka,4022,4009,0.0002\nCC-MAIN-2025-47,amh,82166,81802,0.0036\nCC-MAIN-2025-47,ara,15086615,15015490,0.6575\nCC-MAIN-2025-47,asm,65612,65088,0.0029\nCC-MAIN-2025-47,aym,2085,2067,0.0001\nCC-MAIN-2025-47,aze,1313122,1309357,0.0572\nCC-MAIN-2025-47,bak,60806,59565,0.0027\nCC-MAIN-2025-47,bel,387243,385171,0.0169\nCC-MAIN-2025-47,ben,2615881,2608472,0.1140\nCC-MAIN-2025-47,bih,18073,17847,0.0008\nCC-MAIN-2025-47,bis,1837,1804,0.0001\nCC-MAIN-2025-47,bod,25723,25686,0.0011\nCC-MAIN-2025-47,bos,1257884,1254602,0.0548\nCC-MAIN-2025-47,bre,45832,45283,0.0020\nCC-MAIN-2025-47,bul,6405222,6383924,0.2792\nCC-MAIN-2025-47,cat,4423833,4394810,0.1928\nCC-MAIN-2025-47,ceb,47830,47678,0.0021\nCC-MAIN-2025-47,ces,26026822,25872678,1.1343\nCC-MAIN-2025-47,chr,654,652,0.0000\nCC-MAIN-2025-47,cos,54604,53613,0.0024\nCC-MAIN-2025-47,crs,1648,1626,0.0001\nCC-MAIN-2025-47,cym,236644,235297,0.0103\nCC-MAIN-2025-47,dan,11427081,11346498,0.4980\nCC-MAIN-2025-47,deu,131742497,130888068,5.7417\nCC-MAIN-2025-47,div,49323,49147,0.0021\nCC-MAIN-2025-47,dzo,1446,1444,0.0001\nCC-MAIN-2025-47,ell,11785370,11749957,0.5136\nCC-MAIN-2025-47,eng,965469499,960098965,42.0781\nCC-MAIN-2025-47,epo,173473,171829,0.0076\nCC-MAIN-2025-47,est,3152671,3136924,0.1374\nCC-MAIN-2025-47,eus,816160,812555,0.0356\nCC-MAIN-2025-47,fao,120241,119535,0.0052\nCC-MAIN-2025-47,fas,18452306,18393461,0.8042\nCC-MAIN-2025-47,fij,2705,2687,0.0001\nCC-MAIN-2025-47,fin,8003636,7958698,0.3488\nCC-MAIN-2025-47,fra,100971978,100389684,4.4007\nCC-MAIN-2025-47,fry,78314,76892,0.0034\nCC-MAIN-2025-47,gla,40198,39789,0.0018\nCC-MAIN-2025-47,gle,167372,165752,0.0073\nCC-MAIN-2025-47,glg,667448,663854,0.0291\nCC-MAIN-2025-47,glv,11004,10875,0.0005\nCC-MAIN-2025-47,got,685,640,0.0000\nCC-MAIN-2025-47,grn,18061,17712,0.0008\nCC-MAIN-2025-47,guj,288279,287355,0.0126\nCC-MAIN-2025-47,hat,45628,45502,0.0020\nCC-MAIN-202
5-47,hau,71938,71256,0.0031\nCC-MAIN-2025-47,haw,17568,17511,0.0008\nCC-MAIN-2025-47,heb,5413447,5389436,0.2359\nCC-MAIN-2025-47,hin,4785472,4774995,0.2086\nCC-MAIN-2025-47,hmn,15965,15916,0.0007\nCC-MAIN-2025-47,hrv,4721379,4702808,0.2058\nCC-MAIN-2025-47,hun,11532942,11485483,0.5026\nCC-MAIN-2025-47,hye,708389,705484,0.0309\nCC-MAIN-2025-47,ibo,21313,21077,0.0009\nCC-MAIN-2025-47,iku,5367,5336,0.0002\nCC-MAIN-2025-47,ile,7141,7059,0.0003\nCC-MAIN-2025-47,ina,12036,11905,0.0005\nCC-MAIN-2025-47,ind,24070715,23962179,1.0491\nCC-MAIN-2025-47,ipk,1513,1491,0.0001\nCC-MAIN-2025-47,isl,875859,872231,0.0382\nCC-MAIN-2025-47,ita,50090593,49849171,2.1831\nCC-MAIN-2025-47,jav,87342,86137,0.0038\nCC-MAIN-2025-47,jpn,127911068,127531495,5.5747\nCC-MAIN-2025-47,kal,20483,20364,0.0009\nCC-MAIN-2025-47,kan,369576,368848,0.0161\nCC-MAIN-2025-47,kas,39,39,0.0000\nCC-MAIN-2025-47,kat,954847,951458,0.0416\nCC-MAIN-2025-47,kaz,819156,813290,0.0357\nCC-MAIN-2025-47,kha,8437,8431,0.0004\nCC-MAIN-2025-47,khm,224047,223385,0.0098\nCC-MAIN-2025-47,kin,50517,49997,0.0022\nCC-MAIN-2025-47,kir,228504,227972,0.0100\nCC-MAIN-2025-47,kor,18565489,18514943,0.8091\nCC-MAIN-2025-47,kur,167526,166664,0.0073\nCC-MAIN-2025-47,lao,94118,93840,0.0041\nCC-MAIN-2025-47,lat,2334502,2329554,0.1017\nCC-MAIN-2025-47,lav,2118401,2108974,0.0923\nCC-MAIN-2025-47,lif,81,81,0.0000\nCC-MAIN-2025-47,lin,6979,6917,0.0003\nCC-MAIN-2025-47,lit,3829422,3810773,0.1669\nCC-MAIN-2025-47,ltz,109854,107994,0.0048\nCC-MAIN-2025-47,lug,3349,3340,0.0001\nCC-MAIN-2025-47,mal,594897,593069,0.0259\nCC-MAIN-2025-47,mar,716423,713284,0.0312\nCC-MAIN-2025-47,mfe,3019,3013,0.0001\nCC-MAIN-2025-47,mkd,801278,797839,0.0349\nCC-MAIN-2025-47,mlg,72964,72666,0.0032\nCC-MAIN-2025-47,mlt,63489,63235,0.0028\nCC-MAIN-2025-47,mon,367144,365294,0.0160\nCC-MAIN-2025-47,mri,27989,27793,0.0012\nCC-MAIN-2025-47,msa,1811981,1806222,0.0790\nCC-MAIN-2025-47,mya,354673,353098,0.0155\nCC-MAIN-2025-47,nau,879,877,0.0000\nCC-MAIN-2025-47,nep,1189566,11872
40,0.0518\nCC-MAIN-2025-47,nld,39677760,39434891,1.7293\nCC-MAIN-2025-47,nno,356029,353645,0.0155\nCC-MAIN-2025-47,nor,7042632,7000378,0.3069\nCC-MAIN-2025-47,nso,2218,2152,0.0001\nCC-MAIN-2025-47,nya,15916,15847,0.0007\nCC-MAIN-2025-47,oci,99577,98052,0.0043\nCC-MAIN-2025-47,ori,143939,143127,0.0063\nCC-MAIN-2025-47,orm,15519,15484,0.0007\nCC-MAIN-2025-47,pan,190635,189845,0.0083\nCC-MAIN-2025-47,pol,44297820,44108058,1.9306\nCC-MAIN-2025-47,por,53621847,53399867,2.3370\nCC-MAIN-2025-47,pus,91691,91296,0.0040\nCC-MAIN-2025-47,que,16646,16103,0.0007\nCC-MAIN-2025-47,roh,26944,26664,0.0012\nCC-MAIN-2025-47,ron,12033475,11988735,0.5245\nCC-MAIN-2025-47,run,1981,1979,0.0001\nCC-MAIN-2025-47,rus,148731952,148151161,6.4822\nCC-MAIN-2025-47,sag,8485,8478,0.0004\nCC-MAIN-2025-47,san,57971,56939,0.0025\nCC-MAIN-2025-47,sco,13246,13183,0.0006\nCC-MAIN-2025-47,sin,190043,189613,0.0083\nCC-MAIN-2025-47,slk,9367563,9318461,0.4083\nCC-MAIN-2025-47,slv,2825351,2813309,0.1231\nCC-MAIN-2025-47,smo,16351,16307,0.0007\nCC-MAIN-2025-47,sna,21730,21426,0.0009\nCC-MAIN-2025-47,snd,40164,39920,0.0018\nCC-MAIN-2025-47,som,113114,112778,0.0049\nCC-MAIN-2025-47,sot,14788,14715,0.0006\nCC-MAIN-2025-47,spa,101625930,101108373,4.4292\nCC-MAIN-2025-47,sqi,1048763,1045587,0.0457\nCC-MAIN-2025-47,srp,5398051,5377760,0.2353\nCC-MAIN-2025-47,ssw,704,702,0.0000\nCC-MAIN-2025-47,sun,30668,30250,0.0013\nCC-MAIN-2025-47,sux,274,273,0.0000\nCC-MAIN-2025-47,swa,252894,251859,0.0110\nCC-MAIN-2025-47,swe,14871589,14776428,0.6481\nCC-MAIN-2025-47,syr,6978,6953,0.0003\nCC-MAIN-2025-47,tam,1119029,1115136,0.0488\nCC-MAIN-2025-47,tat,168260,167891,0.0073\nCC-MAIN-2025-47,tel,460155,459412,0.0201\nCC-MAIN-2025-47,tgk,178332,177112,0.0078\nCC-MAIN-2025-47,tgl,214385,212275,0.0093\nCC-MAIN-2025-47,tha,8889333,8850506,0.3874\nCC-MAIN-2025-47,tir,22332,22235,0.0010\nCC-MAIN-2025-47,ton,2332,2298,0.0001\nCC-MAIN-2025-47,tsn,2829,2807,0.0001\nCC-MAIN-2025-47,tso,1495,1487,0.0001\nCC-MAIN-2025-47,tuk,32860,32665,0.001
4\nCC-MAIN-2025-47,tur,26183361,26083224,1.1411\nCC-MAIN-2025-47,uig,34596,34133,0.0015\nCC-MAIN-2025-47,ukr,15529545,15181462,0.6768\nCC-MAIN-2025-47,urd,682475,677905,0.0297\nCC-MAIN-2025-47,uzb,558966,555874,0.0244\nCC-MAIN-2025-47,ven,696,695,0.0000\nCC-MAIN-2025-47,vie,24868458,24697266,1.0838\nCC-MAIN-2025-47,vol,20019,19866,0.0009\nCC-MAIN-2025-47,war,43597,43414,0.0019\nCC-MAIN-2025-47,wol,4071,3991,0.0002\nCC-MAIN-2025-47,xho,22066,22027,0.0010\nCC-MAIN-2025-47,yid,41893,41574,0.0018\nCC-MAIN-2025-47,yor,31754,31569,0.0014\nCC-MAIN-2025-47,zha,1680,1660,0.0001\nCC-MAIN-2025-47,zho,127355169,126732709,5.5505\nCC-MAIN-2025-47,zul,35371,35285,0.0015\nCC-MAIN-2025-51,<unknown>,66656970,66656970,3.0730\nCC-MAIN-2025-51,aar,1772,1760,0.0001\nCC-MAIN-2025-51,abk,14780,14563,0.0007\nCC-MAIN-2025-51,afr,171747,171204,0.0079\nCC-MAIN-2025-51,aka,3999,3991,0.0002\nCC-MAIN-2025-51,amh,75659,75353,0.0035\nCC-MAIN-2025-51,ara,14471252,14401229,0.6672\nCC-MAIN-2025-51,asm,61643,61421,0.0028\nCC-MAIN-2025-51,aym,2048,2031,0.0001\nCC-MAIN-2025-51,aze,1266634,1263388,0.0584\nCC-MAIN-2025-51,bak,20927,20877,0.0010\nCC-MAIN-2025-51,bel,333816,332856,0.0154\nCC-MAIN-2025-51,ben,2385201,2379769,0.1100\nCC-MAIN-2025-51,bih,13699,13620,0.0006\nCC-MAIN-2025-51,bis,2278,2144,0.0001\nCC-MAIN-2025-51,bod,25058,25037,0.0012\nCC-MAIN-2025-51,bos,1185218,1182065,0.0546\nCC-MAIN-2025-51,bre,59890,59074,0.0028\nCC-MAIN-2025-51,bul,5708563,5689490,0.2632\nCC-MAIN-2025-51,cat,3999754,3973027,0.1844\nCC-MAIN-2025-51,ceb,50595,50470,0.0023\nCC-MAIN-2025-51,ces,24046650,23890866,1.1086\nCC-MAIN-2025-51,chr,672,671,0.0000\nCC-MAIN-2025-51,cos,50660,50180,0.0023\nCC-MAIN-2025-51,crs,2305,2080,0.0001\nCC-MAIN-2025-51,cym,226994,225458,0.0105\nCC-MAIN-2025-51,dan,10527581,10448652,0.4853\nCC-MAIN-2025-51,deu,124485737,123668622,5.7391\nCC-MAIN-2025-51,div,53301,53225,0.0025\nCC-MAIN-2025-51,dzo,1196,1195,0.0001\nCC-MAIN-2025-51,ell,11261515,11225462,0.5192\nCC-MAIN-2025-51,eng,898170425,893089456,4
1.4078\nCC-MAIN-2025-51,epo,166704,165243,0.0077\nCC-MAIN-2025-51,est,2946671,2932201,0.1358\nCC-MAIN-2025-51,eus,760889,757375,0.0351\nCC-MAIN-2025-51,fao,107267,106627,0.0049\nCC-MAIN-2025-51,fas,18395273,18337661,0.8481\nCC-MAIN-2025-51,fij,2355,2345,0.0001\nCC-MAIN-2025-51,fin,7345095,7301546,0.3386\nCC-MAIN-2025-51,fra,96498314,95936434,4.4488\nCC-MAIN-2025-51,fry,40084,39945,0.0018\nCC-MAIN-2025-51,gla,38517,38237,0.0018\nCC-MAIN-2025-51,gle,120604,120279,0.0056\nCC-MAIN-2025-51,glg,574935,571621,0.0265\nCC-MAIN-2025-51,glv,10054,10026,0.0005\nCC-MAIN-2025-51,got,726,718,0.0000\nCC-MAIN-2025-51,grn,14707,14610,0.0007\nCC-MAIN-2025-51,guj,267534,266930,0.0123\nCC-MAIN-2025-51,hat,61084,60752,0.0028\nCC-MAIN-2025-51,hau,60277,59973,0.0028\nCC-MAIN-2025-51,haw,15954,15918,0.0007\nCC-MAIN-2025-51,heb,5180882,5156697,0.2389\nCC-MAIN-2025-51,hin,4631762,4621603,0.2135\nCC-MAIN-2025-51,hmn,15262,15246,0.0007\nCC-MAIN-2025-51,hrv,4397105,4379658,0.2027\nCC-MAIN-2025-51,hun,10601463,10555265,0.4888\nCC-MAIN-2025-51,hye,643684,641722,0.0297\nCC-MAIN-2025-51,ibo,20172,20090,0.0009\nCC-MAIN-2025-51,iku,5735,5665,0.0003\nCC-MAIN-2025-51,ile,6190,6139,0.0003\nCC-MAIN-2025-51,ina,11488,11416,0.0005\nCC-MAIN-2025-51,ind,22522599,22425481,1.0383\nCC-MAIN-2025-51,ipk,1695,1693,0.0001\nCC-MAIN-2025-51,isl,823786,819727,0.0380\nCC-MAIN-2025-51,ita,48976415,48749779,2.2579\nCC-MAIN-2025-51,jav,40761,40636,0.0019\nCC-MAIN-2025-51,jpn,118353302,117982410,5.4564\nCC-MAIN-2025-51,kal,19461,19348,0.0009\nCC-MAIN-2025-51,kan,344304,343272,0.0159\nCC-MAIN-2025-51,kas,34,34,0.0000\nCC-MAIN-2025-51,kat,910673,908075,0.0420\nCC-MAIN-2025-51,kaz,844079,837461,0.0389\nCC-MAIN-2025-51,kha,7888,7882,0.0004\nCC-MAIN-2025-51,khm,203044,202411,0.0094\nCC-MAIN-2025-51,kin,51798,51555,0.0024\nCC-MAIN-2025-51,kir,221567,220881,0.0102\nCC-MAIN-2025-51,kor,17286238,17236091,0.7969\nCC-MAIN-2025-51,kur,119658,119381,0.0055\nCC-MAIN-2025-51,lao,92725,92314,0.0043\nCC-MAIN-2025-51,lat,2163196,2159364,0.09
97\nCC-MAIN-2025-51,lav,1957022,1948299,0.0902\nCC-MAIN-2025-51,lif,50,49,0.0000\nCC-MAIN-2025-51,lin,7103,7029,0.0003\nCC-MAIN-2025-51,lit,3590435,3573014,0.1655\nCC-MAIN-2025-51,ltz,66172,65842,0.0031\nCC-MAIN-2025-51,lug,4120,4108,0.0002\nCC-MAIN-2025-51,mal,553483,552434,0.0255\nCC-MAIN-2025-51,mar,637752,635453,0.0294\nCC-MAIN-2025-51,mfe,4241,4236,0.0002\nCC-MAIN-2025-51,mkd,769423,765998,0.0355\nCC-MAIN-2025-51,mlg,100842,100256,0.0046\nCC-MAIN-2025-51,mlt,53943,53806,0.0025\nCC-MAIN-2025-51,mon,317797,317038,0.0147\nCC-MAIN-2025-51,mri,27113,26981,0.0012\nCC-MAIN-2025-51,msa,1721514,1716889,0.0794\nCC-MAIN-2025-51,mya,308537,307579,0.0142\nCC-MAIN-2025-51,nau,700,698,0.0000\nCC-MAIN-2025-51,nep,1172504,1171256,0.0541\nCC-MAIN-2025-51,nld,36743545,36522188,1.6940\nCC-MAIN-2025-51,nno,306351,304864,0.0141\nCC-MAIN-2025-51,nor,6632719,6593394,0.3058\nCC-MAIN-2025-51,nso,2099,2032,0.0001\nCC-MAIN-2025-51,nya,14327,14296,0.0007\nCC-MAIN-2025-51,oci,59012,58591,0.0027\nCC-MAIN-2025-51,ori,141910,141240,0.0065\nCC-MAIN-2025-51,orm,14102,14041,0.0007\nCC-MAIN-2025-51,pan,163840,163611,0.0076\nCC-MAIN-2025-51,pol,41507955,41336680,1.9136\nCC-MAIN-2025-51,por,51070633,50859359,2.3545\nCC-MAIN-2025-51,pus,93855,93555,0.0043\nCC-MAIN-2025-51,que,8101,8055,0.0004\nCC-MAIN-2025-51,roh,31527,31345,0.0015\nCC-MAIN-2025-51,ron,10554874,10517056,0.4866\nCC-MAIN-2025-51,run,2072,2072,0.0001\nCC-MAIN-2025-51,rus,140612963,140060915,6.4826\nCC-MAIN-2025-51,sag,7365,7360,0.0003\nCC-MAIN-2025-51,san,49818,49562,0.0023\nCC-MAIN-2025-51,sco,12185,12150,0.0006\nCC-MAIN-2025-51,sin,201017,200433,0.0093\nCC-MAIN-2025-51,slk,8569863,8524039,0.3951\nCC-MAIN-2025-51,slv,2634238,2623743,0.1214\nCC-MAIN-2025-51,smo,15352,15321,0.0007\nCC-MAIN-2025-51,sna,19916,19782,0.0009\nCC-MAIN-2025-51,snd,39481,39305,0.0018\nCC-MAIN-2025-51,som,103866,103563,0.0048\nCC-MAIN-2025-51,sot,15442,15394,0.0007\nCC-MAIN-2025-51,spa,95694864,95126399,4.4118\nCC-MAIN-2025-51,sqi,1057525,1054625,0.0488\nCC-MAIN-
2025-51,srp,5169688,5149578,0.2383\nCC-MAIN-2025-51,ssw,589,588,0.0000\nCC-MAIN-2025-51,sun,26992,26806,0.0012\nCC-MAIN-2025-51,sux,365,364,0.0000\nCC-MAIN-2025-51,swa,203510,202781,0.0094\nCC-MAIN-2025-51,swe,14114061,14024276,0.6507\nCC-MAIN-2025-51,syr,7061,7029,0.0003\nCC-MAIN-2025-51,tam,1008415,1005147,0.0465\nCC-MAIN-2025-51,tat,156314,156045,0.0072\nCC-MAIN-2025-51,tel,421450,420570,0.0194\nCC-MAIN-2025-51,tgk,133334,132885,0.0061\nCC-MAIN-2025-51,tgl,168889,168037,0.0078\nCC-MAIN-2025-51,tha,8553965,8515605,0.3944\nCC-MAIN-2025-51,tir,19722,19635,0.0009\nCC-MAIN-2025-51,ton,2408,2377,0.0001\nCC-MAIN-2025-51,tsn,2548,2539,0.0001\nCC-MAIN-2025-51,tso,1189,1182,0.0001\nCC-MAIN-2025-51,tuk,32697,32561,0.0015\nCC-MAIN-2025-51,tur,25139068,25049263,1.1590\nCC-MAIN-2025-51,uig,38916,38621,0.0018\nCC-MAIN-2025-51,ukr,16206660,15881346,0.7472\nCC-MAIN-2025-51,urd,641727,639216,0.0296\nCC-MAIN-2025-51,uzb,568813,566740,0.0262\nCC-MAIN-2025-51,ven,553,553,0.0000\nCC-MAIN-2025-51,vie,23371496,23219396,1.0775\nCC-MAIN-2025-51,vol,17690,17594,0.0008\nCC-MAIN-2025-51,war,37934,37778,0.0017\nCC-MAIN-2025-51,wol,3697,3671,0.0002\nCC-MAIN-2025-51,xho,20278,20219,0.0009\nCC-MAIN-2025-51,yid,43298,43072,0.0020\nCC-MAIN-2025-51,yor,28336,28252,0.0013\nCC-MAIN-2025-51,zha,1366,1348,0.0001\nCC-MAIN-2025-51,zho,133978663,133616944,6.1767\nCC-MAIN-2025-51,zul,29470,29422,0.0014\nCC-MAIN-2026-04,<unknown>,68611738,68611738,2.9452\nCC-MAIN-2026-04,aar,1983,1973,0.0001\nCC-MAIN-2026-04,abk,20293,20092,0.0009\nCC-MAIN-2026-04,afr,220320,219590,0.0095\nCC-MAIN-2026-04,aka,10226,10217,0.0004\nCC-MAIN-2026-04,amh,101547,101239,0.0044\nCC-MAIN-2026-04,ara,15444953,15375162,0.6630\nCC-MAIN-2026-04,asm,81061,80950,0.0035\nCC-MAIN-2026-04,aym,3066,3012,0.0001\nCC-MAIN-2026-04,aze,1355060,1350334,0.0582\nCC-MAIN-2026-04,bak,45483,45340,0.0020\nCC-MAIN-2026-04,bel,374657,372511,0.0161\nCC-MAIN-2026-04,ben,2572687,2567578,0.1104\nCC-MAIN-2026-04,bih,29482,29432,0.0013\nCC-MAIN-2026-04,bis,2374,2
355,0.0001\nCC-MAIN-2026-04,bod,45256,45177,0.0019\nCC-MAIN-2026-04,bos,1359058,1356264,0.0583\nCC-MAIN-2026-04,bre,61049,60901,0.0026\nCC-MAIN-2026-04,bul,5982457,5964081,0.2568\nCC-MAIN-2026-04,cat,4749693,4719665,0.2039\nCC-MAIN-2026-04,ceb,46732,46591,0.0020\nCC-MAIN-2026-04,ces,26584343,26409435,1.1411\nCC-MAIN-2026-04,chr,1503,1495,0.0001\nCC-MAIN-2026-04,cos,76852,76514,0.0033\nCC-MAIN-2026-04,crs,2171,2157,0.0001\nCC-MAIN-2026-04,cym,250010,248669,0.0107\nCC-MAIN-2026-04,dan,11839520,11761462,0.5082\nCC-MAIN-2026-04,deu,138788342,137914500,5.9575\nCC-MAIN-2026-04,div,61544,61359,0.0026\nCC-MAIN-2026-04,dzo,4335,4334,0.0002\nCC-MAIN-2026-04,ell,12503859,12465777,0.5367\nCC-MAIN-2026-04,eng,971358233,965898156,41.6958\nCC-MAIN-2026-04,epo,188916,186388,0.0081\nCC-MAIN-2026-04,est,3260542,3243244,0.1400\nCC-MAIN-2026-04,eus,850614,846361,0.0365\nCC-MAIN-2026-04,fao,125277,124758,0.0054\nCC-MAIN-2026-04,fas,4540556,4526464,0.1949\nCC-MAIN-2026-04,fij,3259,3252,0.0001\nCC-MAIN-2026-04,fin,8461724,8411336,0.3632\nCC-MAIN-2026-04,fra,108850506,108240192,4.6724\nCC-MAIN-2026-04,fry,55381,55232,0.0024\nCC-MAIN-2026-04,gla,43570,43283,0.0019\nCC-MAIN-2026-04,gle,144593,143646,0.0062\nCC-MAIN-2026-04,glg,836152,833121,0.0359\nCC-MAIN-2026-04,glv,17380,17347,0.0007\nCC-MAIN-2026-04,got,2271,2267,0.0001\nCC-MAIN-2026-04,grn,21084,20956,0.0009\nCC-MAIN-2026-04,guj,291412,290874,0.0125\nCC-MAIN-2026-04,hat,51844,51710,0.0022\nCC-MAIN-2026-04,hau,91419,91260,0.0039\nCC-MAIN-2026-04,haw,18179,18090,0.0008\nCC-MAIN-2026-04,heb,5925745,5898370,0.2544\nCC-MAIN-2026-04,hin,5214443,5203685,0.2238\nCC-MAIN-2026-04,hmn,14822,14752,0.0006\nCC-MAIN-2026-04,hrv,5042028,5023746,0.2164\nCC-MAIN-2026-04,hun,11971838,11923468,0.5139\nCC-MAIN-2026-04,hye,745330,743528,0.0320\nCC-MAIN-2026-04,ibo,45134,45052,0.0019\nCC-MAIN-2026-04,iku,8557,8473,0.0004\nCC-MAIN-2026-04,ile,7478,7422,0.0003\nCC-MAIN-2026-04,ina,15415,15356,0.0007\nCC-MAIN-2026-04,ind,26756567,26656033,1.1485\nCC-MAIN-2026-04
,ipk,2098,2093,0.0001\nCC-MAIN-2026-04,isl,824952,821620,0.0354\nCC-MAIN-2026-04,ita,56165174,55912941,2.4109\nCC-MAIN-2026-04,jav,104258,104119,0.0045\nCC-MAIN-2026-04,jpn,134495814,134116106,5.7733\nCC-MAIN-2026-04,kal,23313,23139,0.0010\nCC-MAIN-2026-04,kan,454015,453333,0.0195\nCC-MAIN-2026-04,kas,93,93,0.0000\nCC-MAIN-2026-04,kat,1020877,1018374,0.0438\nCC-MAIN-2026-04,kaz,875476,871147,0.0376\nCC-MAIN-2026-04,kha,7561,7549,0.0003\nCC-MAIN-2026-04,khm,261138,260510,0.0112\nCC-MAIN-2026-04,kin,59693,59458,0.0026\nCC-MAIN-2026-04,kir,246384,245994,0.0106\nCC-MAIN-2026-04,kor,18458793,18407805,0.7923\nCC-MAIN-2026-04,kur,151115,150754,0.0065\nCC-MAIN-2026-04,lao,122662,122074,0.0053\nCC-MAIN-2026-04,lat,2712571,2708448,0.1164\nCC-MAIN-2026-04,lav,2095645,2085159,0.0900\nCC-MAIN-2026-04,lif,112,112,0.0000\nCC-MAIN-2026-04,lin,12720,12632,0.0005\nCC-MAIN-2026-04,lit,4073475,4053114,0.1749\nCC-MAIN-2026-04,ltz,89862,89532,0.0039\nCC-MAIN-2026-04,lug,10693,10680,0.0005\nCC-MAIN-2026-04,mal,664813,663436,0.0285\nCC-MAIN-2026-04,mar,760423,755703,0.0326\nCC-MAIN-2026-04,mfe,4288,4282,0.0002\nCC-MAIN-2026-04,mkd,844241,840939,0.0362\nCC-MAIN-2026-04,mlg,87156,86914,0.0037\nCC-MAIN-2026-04,mlt,71552,71331,0.0031\nCC-MAIN-2026-04,mon,388893,387667,0.0167\nCC-MAIN-2026-04,mri,33916,33758,0.0015\nCC-MAIN-2026-04,msa,1935497,1930428,0.0831\nCC-MAIN-2026-04,mya,431868,430906,0.0185\nCC-MAIN-2026-04,nau,697,696,0.0000\nCC-MAIN-2026-04,nep,1336345,1334670,0.0574\nCC-MAIN-2026-04,nld,41754155,41503505,1.7923\nCC-MAIN-2026-04,nno,333993,332410,0.0143\nCC-MAIN-2026-04,nor,7440358,7397336,0.3194\nCC-MAIN-2026-04,nso,2969,2880,0.0001\nCC-MAIN-2026-04,nya,18241,18167,0.0008\nCC-MAIN-2026-04,oci,83071,82858,0.0036\nCC-MAIN-2026-04,ori,189980,189604,0.0082\nCC-MAIN-2026-04,orm,18721,18680,0.0008\nCC-MAIN-2026-04,pan,207443,206927,0.0089\nCC-MAIN-2026-04,pol,47229235,47033201,2.0273\nCC-MAIN-2026-04,por,57220604,56995609,2.4562\nCC-MAIN-2026-04,pus,118209,118006,0.0051\nCC-MAIN-2026-04,q
ue,22711,22459,0.0010\nCC-MAIN-2026-04,roh,35204,35016,0.0015\nCC-MAIN-2026-04,ron,12438097,12394692,0.5339\nCC-MAIN-2026-04,run,2939,2934,0.0001\nCC-MAIN-2026-04,rus,145901486,145356043,6.2629\nCC-MAIN-2026-04,sag,26460,26458,0.0011\nCC-MAIN-2026-04,san,108490,108382,0.0047\nCC-MAIN-2026-04,sco,14300,14265,0.0006\nCC-MAIN-2026-04,sin,240193,239665,0.0103\nCC-MAIN-2026-04,slk,9195693,9150779,0.3947\nCC-MAIN-2026-04,slv,3070632,3058317,0.1318\nCC-MAIN-2026-04,smo,16581,16530,0.0007\nCC-MAIN-2026-04,sna,28694,28502,0.0012\nCC-MAIN-2026-04,snd,50559,50466,0.0022\nCC-MAIN-2026-04,som,137036,136779,0.0059\nCC-MAIN-2026-04,sot,16053,15966,0.0007\nCC-MAIN-2026-04,spa,107641802,107110774,4.6206\nCC-MAIN-2026-04,sqi,1169261,1166383,0.0502\nCC-MAIN-2026-04,srp,5834815,5815583,0.2505\nCC-MAIN-2026-04,ssw,955,953,0.0000\nCC-MAIN-2026-04,sun,38124,37945,0.0016\nCC-MAIN-2026-04,sux,171,171,0.0000\nCC-MAIN-2026-04,swa,294364,293725,0.0126\nCC-MAIN-2026-04,swe,16048273,15947880,0.6889\nCC-MAIN-2026-04,syr,9047,8995,0.0004\nCC-MAIN-2026-04,tam,1158981,1155723,0.0497\nCC-MAIN-2026-04,tat,170609,170292,0.0073\nCC-MAIN-2026-04,tel,512028,510583,0.0220\nCC-MAIN-2026-04,tgk,160462,159975,0.0069\nCC-MAIN-2026-04,tgl,227520,226677,0.0098\nCC-MAIN-2026-04,tha,9151330,9114392,0.3928\nCC-MAIN-2026-04,tir,19462,19300,0.0008\nCC-MAIN-2026-04,ton,4002,3965,0.0002\nCC-MAIN-2026-04,tsn,9656,9641,0.0004\nCC-MAIN-2026-04,tso,2332,2328,0.0001\nCC-MAIN-2026-04,tuk,83072,82817,0.0036\nCC-MAIN-2026-04,tur,27932444,27832031,1.1990\nCC-MAIN-2026-04,uig,47439,47184,0.0020\nCC-MAIN-2026-04,ukr,16204415,15955156,0.6956\nCC-MAIN-2026-04,urd,743860,741643,0.0319\nCC-MAIN-2026-04,uzb,588441,586580,0.0253\nCC-MAIN-2026-04,ven,624,624,0.0000\nCC-MAIN-2026-04,vie,25581840,25428571,1.0981\nCC-MAIN-2026-04,vol,32114,32089,0.0014\nCC-MAIN-2026-04,war,39598,39478,0.0017\nCC-MAIN-2026-04,wol,7244,7208,0.0003\nCC-MAIN-2026-04,xho,22462,22373,0.0010\nCC-MAIN-2026-04,yid,55649,55313,0.0024\nCC-MAIN-2026-04,yor,36632,36561
,0.0016\nCC-MAIN-2026-04,zha,2391,2374,0.0001\nCC-MAIN-2026-04,zho,114812782,114487122,4.9284\nCC-MAIN-2026-04,zul,44341,44242,0.0019\nCC-MAIN-2026-08,<unknown>,68205334,68205334,3.1475\nCC-MAIN-2026-08,aar,1602,1594,0.0001\nCC-MAIN-2026-08,abk,16089,15901,0.0007\nCC-MAIN-2026-08,afr,158131,157355,0.0073\nCC-MAIN-2026-08,aka,5969,5917,0.0003\nCC-MAIN-2026-08,amh,86857,86425,0.0040\nCC-MAIN-2026-08,ara,13796391,13729036,0.6367\nCC-MAIN-2026-08,asm,63670,63532,0.0029\nCC-MAIN-2026-08,aym,1948,1920,0.0001\nCC-MAIN-2026-08,aze,1231452,1227179,0.0568\nCC-MAIN-2026-08,bak,75755,75661,0.0035\nCC-MAIN-2026-08,bel,342463,341226,0.0158\nCC-MAIN-2026-08,ben,2249306,2243058,0.1038\nCC-MAIN-2026-08,bih,14458,14397,0.0007\nCC-MAIN-2026-08,bis,3562,3538,0.0002\nCC-MAIN-2026-08,bod,27627,27584,0.0013\nCC-MAIN-2026-08,bos,1177432,1174740,0.0543\nCC-MAIN-2026-08,bre,69270,68360,0.0032\nCC-MAIN-2026-08,bul,5717863,5699756,0.2639\nCC-MAIN-2026-08,cat,4492478,4465751,0.2073\nCC-MAIN-2026-08,ceb,48041,47873,0.0022\nCC-MAIN-2026-08,ces,24331176,24150159,1.1228\nCC-MAIN-2026-08,chr,662,658,0.0000\nCC-MAIN-2026-08,cos,61050,60431,0.0028\nCC-MAIN-2026-08,crs,1829,1815,0.0001\nCC-MAIN-2026-08,cym,225374,223893,0.0104\nCC-MAIN-2026-08,dan,10619846,10544791,0.4901\nCC-MAIN-2026-08,deu,124929784,124056302,5.7651\nCC-MAIN-2026-08,div,50754,50631,0.0023\nCC-MAIN-2026-08,dzo,1903,1903,0.0001\nCC-MAIN-2026-08,ell,10952561,10916733,0.5054\nCC-MAIN-2026-08,eng,923201168,917743002,42.6029\nCC-MAIN-2026-08,epo,231677,230092,0.0107\nCC-MAIN-2026-08,est,2970851,2955978,0.1371\nCC-MAIN-2026-08,eus,901830,897313,0.0416\nCC-MAIN-2026-08,fao,103972,103573,0.0048\nCC-MAIN-2026-08,fas,19018607,18967302,0.8777\nCC-MAIN-2026-08,fij,2789,2778,0.0001\nCC-MAIN-2026-08,fin,7421283,7372149,0.3425\nCC-MAIN-2026-08,fra,96575739,96005383,4.4567\nCC-MAIN-2026-08,fry,58564,58093,0.0027\nCC-MAIN-2026-08,gla,40391,40062,0.0019\nCC-MAIN-2026-08,gle,141227,140263,0.0065\nCC-MAIN-2026-08,glg,775716,771024,0.0358\nCC-MAIN-2026-0
8,glv,13777,13663,0.0006\nCC-MAIN-2026-08,got,654,649,0.0000\nCC-MAIN-2026-08,grn,18480,18373,0.0009\nCC-MAIN-2026-08,guj,249341,248432,0.0115\nCC-MAIN-2026-08,hat,60719,60427,0.0028\nCC-MAIN-2026-08,hau,72102,71923,0.0033\nCC-MAIN-2026-08,haw,17818,17703,0.0008\nCC-MAIN-2026-08,heb,4991517,4966677,0.2303\nCC-MAIN-2026-08,hin,4564314,4553824,0.2106\nCC-MAIN-2026-08,hmn,14248,14168,0.0007\nCC-MAIN-2026-08,hrv,4196497,4181317,0.1937\nCC-MAIN-2026-08,hun,10731924,10684233,0.4952\nCC-MAIN-2026-08,hye,699723,697867,0.0323\nCC-MAIN-2026-08,ibo,27317,27169,0.0013\nCC-MAIN-2026-08,iku,6589,6533,0.0003\nCC-MAIN-2026-08,ile,8300,8250,0.0004\nCC-MAIN-2026-08,ina,14143,14076,0.0007\nCC-MAIN-2026-08,ind,21797567,21707071,1.0059\nCC-MAIN-2026-08,ipk,2386,2384,0.0001\nCC-MAIN-2026-08,isl,856953,850773,0.0395\nCC-MAIN-2026-08,ita,49456252,49212220,2.2823\nCC-MAIN-2026-08,jav,64383,63984,0.0030\nCC-MAIN-2026-08,jpn,122632999,122249571,5.6591\nCC-MAIN-2026-08,kal,23315,23133,0.0011\nCC-MAIN-2026-08,kan,418199,416449,0.0193\nCC-MAIN-2026-08,kas,78,78,0.0000\nCC-MAIN-2026-08,kat,929644,927036,0.0429\nCC-MAIN-2026-08,kaz,838099,834769,0.0387\nCC-MAIN-2026-08,kha,5548,5540,0.0003\nCC-MAIN-2026-08,khm,206519,205845,0.0095\nCC-MAIN-2026-08,kin,47071,46824,0.0022\nCC-MAIN-2026-08,kir,245640,245041,0.0113\nCC-MAIN-2026-08,kor,17650874,17592271,0.8145\nCC-MAIN-2026-08,kur,142941,142630,0.0066\nCC-MAIN-2026-08,lao,91338,90761,0.0042\nCC-MAIN-2026-08,lat,2206179,2202052,0.1018\nCC-MAIN-2026-08,lav,1853839,1844715,0.0855\nCC-MAIN-2026-08,lif,95,95,0.0000\nCC-MAIN-2026-08,lin,9666,9621,0.0004\nCC-MAIN-2026-08,lit,3668564,3648732,0.1693\nCC-MAIN-2026-08,ltz,74522,74168,0.0034\nCC-MAIN-2026-08,lug,6429,6372,0.0003\nCC-MAIN-2026-08,mal,596056,594749,0.0275\nCC-MAIN-2026-08,mar,679437,676121,0.0314\nCC-MAIN-2026-08,mfe,3953,3949,0.0002\nCC-MAIN-2026-08,mkd,740821,738431,0.0342\nCC-MAIN-2026-08,mlg,122320,121994,0.0056\nCC-MAIN-2026-08,mlt,63464,63206,0.0029\nCC-MAIN-2026-08,mon,334064,333295,0.0154\n
CC-MAIN-2026-08,mri,25370,25207,0.0012\nCC-MAIN-2026-08,msa,1704772,1700237,0.0787\nCC-MAIN-2026-08,mya,386447,385355,0.0178\nCC-MAIN-2026-08,nau,659,656,0.0000\nCC-MAIN-2026-08,nep,1155904,1154149,0.0533\nCC-MAIN-2026-08,nld,36368080,36131931,1.6783\nCC-MAIN-2026-08,nno,302109,300380,0.0139\nCC-MAIN-2026-08,nor,6631135,6591788,0.3060\nCC-MAIN-2026-08,nso,2123,2054,0.0001\nCC-MAIN-2026-08,nya,15692,15577,0.0007\nCC-MAIN-2026-08,oci,78221,77510,0.0036\nCC-MAIN-2026-08,ori,153891,153352,0.0071\nCC-MAIN-2026-08,orm,20381,20322,0.0009\nCC-MAIN-2026-08,pan,165033,164713,0.0076\nCC-MAIN-2026-08,pol,41199760,41022871,1.9012\nCC-MAIN-2026-08,por,52219927,52005048,2.4098\nCC-MAIN-2026-08,pus,95520,95135,0.0044\nCC-MAIN-2026-08,que,22988,22682,0.0011\nCC-MAIN-2026-08,roh,30731,30561,0.0014\nCC-MAIN-2026-08,ron,10102545,10062803,0.4662\nCC-MAIN-2026-08,run,1957,1954,0.0001\nCC-MAIN-2026-08,rus,133435813,132899640,6.1577\nCC-MAIN-2026-08,sag,33720,33672,0.0016\nCC-MAIN-2026-08,san,111906,111701,0.0052\nCC-MAIN-2026-08,sco,14723,14683,0.0007\nCC-MAIN-2026-08,sin,213607,213071,0.0099\nCC-MAIN-2026-08,slk,8503716,8459020,0.3924\nCC-MAIN-2026-08,slv,2663916,2653453,0.1229\nCC-MAIN-2026-08,smo,15794,15707,0.0007\nCC-MAIN-2026-08,sna,17250,17049,0.0008\nCC-MAIN-2026-08,snd,51651,51443,0.0024\nCC-MAIN-2026-08,som,110631,110292,0.0051\nCC-MAIN-2026-08,sot,13752,13620,0.0006\nCC-MAIN-2026-08,spa,96826296,96319701,4.4682\nCC-MAIN-2026-08,sqi,1081227,1078328,0.0499\nCC-MAIN-2026-08,srp,4997642,4978641,0.2306\nCC-MAIN-2026-08,ssw,716,714,0.0000\nCC-MAIN-2026-08,sun,40869,40598,0.0019\nCC-MAIN-2026-08,sux,246,246,0.0000\nCC-MAIN-2026-08,swa,272632,271728,0.0126\nCC-MAIN-2026-08,swe,14122119,14026449,0.6517\nCC-MAIN-2026-08,syr,6689,6665,0.0003\nCC-MAIN-2026-08,tam,1013431,1010443,0.0468\nCC-MAIN-2026-08,tat,178125,177751,0.0082\nCC-MAIN-2026-08,tel,466502,465495,0.0215\nCC-MAIN-2026-08,tgk,138333,137908,0.0064\nCC-MAIN-2026-08,tgl,212143,211344,0.0098\nCC-MAIN-2026-08,tha,8104217,8069956,0.
3740\nCC-MAIN-2026-08,tir,14694,14613,0.0007\nCC-MAIN-2026-08,ton,2686,2666,0.0001\nCC-MAIN-2026-08,tsn,6198,6195,0.0003\nCC-MAIN-2026-08,tso,1277,1267,0.0001\nCC-MAIN-2026-08,tuk,83799,83459,0.0039\nCC-MAIN-2026-08,tur,25172133,25077956,1.1616\nCC-MAIN-2026-08,uig,39122,38915,0.0018\nCC-MAIN-2026-08,ukr,14470796,14256069,0.6678\nCC-MAIN-2026-08,urd,694950,692173,0.0321\nCC-MAIN-2026-08,uzb,551411,549343,0.0254\nCC-MAIN-2026-08,ven,484,483,0.0000\nCC-MAIN-2026-08,vie,22307790,22165420,1.0294\nCC-MAIN-2026-08,vol,16629,16562,0.0008\nCC-MAIN-2026-08,war,40760,40578,0.0019\nCC-MAIN-2026-08,wol,5997,5970,0.0003\nCC-MAIN-2026-08,xho,19447,19325,0.0009\nCC-MAIN-2026-08,yid,48078,47414,0.0022\nCC-MAIN-2026-08,yor,32046,31831,0.0015\nCC-MAIN-2026-08,zha,1738,1725,0.0001\nCC-MAIN-2026-08,zho,108263379,107906890,4.9960\nCC-MAIN-2026-08,zul,26268,26143,0.0012\nCC-MAIN-2026-12,<unknown>,61213059,61213059,3.0996\nCC-MAIN-2026-12,aar,2787,2777,0.0001\nCC-MAIN-2026-12,abk,12213,12041,0.0006\nCC-MAIN-2026-12,afr,178777,177839,0.0091\nCC-MAIN-2026-12,aka,3595,3514,0.0002\nCC-MAIN-2026-12,amh,77198,76957,0.0039\nCC-MAIN-2026-12,ara,12879301,12827210,0.6522\nCC-MAIN-2026-12,asm,74532,74235,0.0038\nCC-MAIN-2026-12,aym,2006,1950,0.0001\nCC-MAIN-2026-12,aze,1194070,1189071,0.0605\nCC-MAIN-2026-12,bak,91398,91147,0.0046\nCC-MAIN-2026-12,bel,355176,350646,0.0180\nCC-MAIN-2026-12,ben,2165825,2160409,0.1097\nCC-MAIN-2026-12,bih,16799,16712,0.0009\nCC-MAIN-2026-12,bis,2308,2300,0.0001\nCC-MAIN-2026-12,bod,28960,28883,0.0015\nCC-MAIN-2026-12,bos,1218126,1214987,0.0617\nCC-MAIN-2026-12,bre,41986,41595,0.0021\nCC-MAIN-2026-12,bul,5354192,5338084,0.2711\nCC-MAIN-2026-12,cat,4122638,4099122,0.2088\nCC-MAIN-2026-12,ceb,40702,40549,0.0021\nCC-MAIN-2026-12,ces,22618462,22404838,1.1453\nCC-MAIN-2026-12,chr,814,805,0.0000\nCC-MAIN-2026-12,cos,53241,52875,0.0027\nCC-MAIN-2026-12,crs,1421,1405,0.0001\nCC-MAIN-2026-12,cym,212859,211719,0.0108\nCC-MAIN-2026-12,dan,10366346,10301022,0.5249\nCC-MAIN-2026-12,
deu,118131124,117311510,5.9818\nCC-MAIN-2026-12,div,45718,45450,0.0023\nCC-MAIN-2026-12,dzo,1668,1666,0.0001\nCC-MAIN-2026-12,ell,10849832,10811904,0.5494\nCC-MAIN-2026-12,eng,810847147,805695437,41.0588\nCC-MAIN-2026-12,epo,206312,204559,0.0104\nCC-MAIN-2026-12,est,2851461,2837426,0.1444\nCC-MAIN-2026-12,eus,776913,772044,0.0393\nCC-MAIN-2026-12,fao,106562,106014,0.0054\nCC-MAIN-2026-12,fas,3913283,3901847,0.1982\nCC-MAIN-2026-12,fij,2655,2642,0.0001\nCC-MAIN-2026-12,fin,7316452,7269121,0.3705\nCC-MAIN-2026-12,fra,90945321,90389603,4.6052\nCC-MAIN-2026-12,fry,50730,50236,0.0026\nCC-MAIN-2026-12,gla,34861,34637,0.0018\nCC-MAIN-2026-12,gle,136418,135682,0.0069\nCC-MAIN-2026-12,glg,642657,639492,0.0325\nCC-MAIN-2026-12,glv,9270,9225,0.0005\nCC-MAIN-2026-12,got,576,573,0.0000\nCC-MAIN-2026-12,grn,14054,13919,0.0007\nCC-MAIN-2026-12,guj,248149,247380,0.0126\nCC-MAIN-2026-12,hat,50328,50098,0.0025\nCC-MAIN-2026-12,hau,79549,79383,0.0040\nCC-MAIN-2026-12,haw,14732,14708,0.0007\nCC-MAIN-2026-12,heb,4678935,4652881,0.2369\nCC-MAIN-2026-12,hin,4294888,4284863,0.2175\nCC-MAIN-2026-12,hmn,12910,12886,0.0007\nCC-MAIN-2026-12,hrv,4234449,4217509,0.2144\nCC-MAIN-2026-12,hun,10465457,10419018,0.5299\nCC-MAIN-2026-12,hye,678532,675998,0.0344\nCC-MAIN-2026-12,ibo,21564,21526,0.0011\nCC-MAIN-2026-12,iku,7184,7145,0.0004\nCC-MAIN-2026-12,ile,6946,6892,0.0004\nCC-MAIN-2026-12,ina,12558,12502,0.0006\nCC-MAIN-2026-12,ind,21709758,21624489,1.0993\nCC-MAIN-2026-12,ipk,1773,1770,0.0001\nCC-MAIN-2026-12,isl,756092,752315,0.0383\nCC-MAIN-2026-12,ita,47046598,46813681,2.3823\nCC-MAIN-2026-12,jav,70902,70551,0.0036\nCC-MAIN-2026-12,jpn,112974803,112618434,5.7207\nCC-MAIN-2026-12,kal,21267,21069,0.0011\nCC-MAIN-2026-12,kan,354341,353366,0.0179\nCC-MAIN-2026-12,kas,92,92,0.0000\nCC-MAIN-2026-12,kat,908493,905806,0.0460\nCC-MAIN-2026-12,kaz,749788,746706,0.0380\nCC-MAIN-2026-12,kha,5000,4993,0.0003\nCC-MAIN-2026-12,khm,185799,185156,0.0094\nCC-MAIN-2026-12,kin,55182,55010,0.0028\nCC-MAIN-2026-12,k
ir,250677,249884,0.0127\nCC-MAIN-2026-12,kor,16544803,16492382,0.8378\nCC-MAIN-2026-12,kur,127938,127648,0.0065\nCC-MAIN-2026-12,lao,82756,82448,0.0042\nCC-MAIN-2026-12,lat,2006983,2002693,0.1016\nCC-MAIN-2026-12,lav,1813569,1804551,0.0918\nCC-MAIN-2026-12,lif,53,53,0.0000\nCC-MAIN-2026-12,lin,8843,8797,0.0004\nCC-MAIN-2026-12,lit,3470053,3452704,0.1757\nCC-MAIN-2026-12,ltz,79566,79027,0.0040\nCC-MAIN-2026-12,lug,3626,3557,0.0002\nCC-MAIN-2026-12,mal,544920,543757,0.0276\nCC-MAIN-2026-12,mar,620748,618578,0.0314\nCC-MAIN-2026-12,mfe,3902,3898,0.0002\nCC-MAIN-2026-12,mkd,784473,781696,0.0397\nCC-MAIN-2026-12,mlg,104841,104124,0.0053\nCC-MAIN-2026-12,mlt,60415,60318,0.0031\nCC-MAIN-2026-12,mon,318633,317599,0.0161\nCC-MAIN-2026-12,mri,23974,23902,0.0012\nCC-MAIN-2026-12,msa,1628012,1623380,0.0824\nCC-MAIN-2026-12,mya,331972,330751,0.0168\nCC-MAIN-2026-12,nau,640,639,0.0000\nCC-MAIN-2026-12,nep,1045331,1043739,0.0529\nCC-MAIN-2026-12,nld,35732496,35500515,1.8094\nCC-MAIN-2026-12,nno,289102,287430,0.0146\nCC-MAIN-2026-12,nor,6654989,6616029,0.3370\nCC-MAIN-2026-12,nso,1871,1817,0.0001\nCC-MAIN-2026-12,nya,13685,13655,0.0007\nCC-MAIN-2026-12,oci,78225,77691,0.0040\nCC-MAIN-2026-12,ori,140593,140225,0.0071\nCC-MAIN-2026-12,orm,12176,12146,0.0006\nCC-MAIN-2026-12,pan,180682,180240,0.0091\nCC-MAIN-2026-12,pol,40337138,40165913,2.0425\nCC-MAIN-2026-12,por,49899895,49690329,2.5268\nCC-MAIN-2026-12,pus,83619,83307,0.0042\nCC-MAIN-2026-12,que,15880,15745,0.0008\nCC-MAIN-2026-12,roh,33737,33521,0.0017\nCC-MAIN-2026-12,ron,11101910,11057508,0.5622\nCC-MAIN-2026-12,run,2376,2372,0.0001\nCC-MAIN-2026-12,rus,128164788,127670405,6.4899\nCC-MAIN-2026-12,sag,13231,13219,0.0007\nCC-MAIN-2026-12,san,72786,72101,0.0037\nCC-MAIN-2026-12,sco,13806,13769,0.0007\nCC-MAIN-2026-12,sin,187060,186599,0.0095\nCC-MAIN-2026-12,slk,8041655,8000128,0.4072\nCC-MAIN-2026-12,slv,2864359,2850126,0.1450\nCC-MAIN-2026-12,smo,15183,15161,0.0008\nCC-MAIN-2026-12,sna,18494,18382,0.0009\nCC-MAIN-2026-12,snd,341
20,34037,0.0017\nCC-MAIN-2026-12,som,110423,110165,0.0056\nCC-MAIN-2026-12,sot,12356,12285,0.0006\nCC-MAIN-2026-12,spa,91990534,91506963,4.6581\nCC-MAIN-2026-12,sqi,1036314,1033555,0.0525\nCC-MAIN-2026-12,srp,5248931,5230286,0.2658\nCC-MAIN-2026-12,ssw,622,618,0.0000\nCC-MAIN-2026-12,sun,32720,32613,0.0017\nCC-MAIN-2026-12,sux,191,190,0.0000\nCC-MAIN-2026-12,swa,275898,275101,0.0140\nCC-MAIN-2026-12,swe,14366618,14267782,0.7275\nCC-MAIN-2026-12,syr,6722,6700,0.0003\nCC-MAIN-2026-12,tam,960842,956801,0.0487\nCC-MAIN-2026-12,tat,176022,175347,0.0089\nCC-MAIN-2026-12,tel,492823,491619,0.0250\nCC-MAIN-2026-12,tgk,138171,137753,0.0070\nCC-MAIN-2026-12,tgl,192516,191551,0.0097\nCC-MAIN-2026-12,tha,7359710,7327012,0.3727\nCC-MAIN-2026-12,tir,12391,12298,0.0006\nCC-MAIN-2026-12,ton,2920,2904,0.0001\nCC-MAIN-2026-12,tsn,2863,2861,0.0001\nCC-MAIN-2026-12,tso,1306,1296,0.0001\nCC-MAIN-2026-12,tuk,81003,80784,0.0041\nCC-MAIN-2026-12,tur,24139547,24044111,1.2224\nCC-MAIN-2026-12,uig,32650,32554,0.0017\nCC-MAIN-2026-12,ukr,14123377,13906240,0.7152\nCC-MAIN-2026-12,urd,620989,618804,0.0314\nCC-MAIN-2026-12,uzb,510419,508706,0.0258\nCC-MAIN-2026-12,ven,475,475,0.0000\nCC-MAIN-2026-12,vie,21553213,21421504,1.0914\nCC-MAIN-2026-12,vol,29400,29292,0.0015\nCC-MAIN-2026-12,war,42765,42549,0.0022\nCC-MAIN-2026-12,wol,3330,3307,0.0002\nCC-MAIN-2026-12,xho,16834,16803,0.0009\nCC-MAIN-2026-12,yid,38302,38092,0.0019\nCC-MAIN-2026-12,yor,33183,32995,0.0017\nCC-MAIN-2026-12,zha,1471,1456,0.0001\nCC-MAIN-2026-12,zho,98455846,98195820,4.9855\nCC-MAIN-2026-12,zul,23079,23037,0.0012\nCC-MAIN-2026-17,<unknown>,68248748,68248748,3.1136\nCC-MAIN-2026-17,aar,1791,1783,0.0001\nCC-MAIN-2026-17,abk,12294,12163,0.0006\nCC-MAIN-2026-17,afr,182499,181682,0.0083\nCC-MAIN-2026-17,aka,4437,4357,0.0002\nCC-MAIN-2026-17,amh,97694,97403,0.0045\nCC-MAIN-2026-17,ara,14461912,14402905,0.6598\nCC-MAIN-2026-17,asm,78386,78146,0.0036\nCC-MAIN-2026-17,aym,2105,2085,0.0001\nCC-MAIN-2026-17,aze,1334602,1331258,0.0609\nCC-
MAIN-2026-17,bak,40037,39904,0.0018\nCC-MAIN-2026-17,bel,360839,356334,0.0165\nCC-MAIN-2026-17,ben,2499860,2492392,0.1140\nCC-MAIN-2026-17,bih,17541,17440,0.0008\nCC-MAIN-2026-17,bis,2568,2538,0.0001\nCC-MAIN-2026-17,bod,27282,27184,0.0012\nCC-MAIN-2026-17,bos,1348616,1344388,0.0615\nCC-MAIN-2026-17,bre,62465,61858,0.0028\nCC-MAIN-2026-17,bul,5784964,5764901,0.2639\nCC-MAIN-2026-17,cat,4406810,4376871,0.2010\nCC-MAIN-2026-17,ceb,43196,43095,0.0020\nCC-MAIN-2026-17,ces,25192086,24915549,1.1493\nCC-MAIN-2026-17,chr,868,864,0.0000\nCC-MAIN-2026-17,cos,61878,61535,0.0028\nCC-MAIN-2026-17,crs,1773,1758,0.0001\nCC-MAIN-2026-17,cym,247934,245778,0.0113\nCC-MAIN-2026-17,dan,11670088,11592997,0.5324\nCC-MAIN-2026-17,deu,129396475,128486272,5.9033\nCC-MAIN-2026-17,div,52978,52748,0.0024\nCC-MAIN-2026-17,dzo,1817,1808,0.0001\nCC-MAIN-2026-17,ell,12684022,12635292,0.5787\nCC-MAIN-2026-17,eng,899140276,893075806,41.0204\nCC-MAIN-2026-17,epo,180684,179028,0.0082\nCC-MAIN-2026-17,est,3106165,3089651,0.1417\nCC-MAIN-2026-17,eus,889582,884576,0.0406\nCC-MAIN-2026-17,fao,116667,116091,0.0053\nCC-MAIN-2026-17,fas,5009907,4995144,0.2286\nCC-MAIN-2026-17,fij,2987,2973,0.0001\nCC-MAIN-2026-17,fin,8400671,8342212,0.3833\nCC-MAIN-2026-17,fra,104228894,103608108,4.7551\nCC-MAIN-2026-17,fry,44890,44736,0.0020\nCC-MAIN-2026-17,gla,41606,41377,0.0019\nCC-MAIN-2026-17,gle,154766,154009,0.0071\nCC-MAIN-2026-17,glg,711984,709455,0.0325\nCC-MAIN-2026-17,glv,13204,13174,0.0006\nCC-MAIN-2026-17,got,530,526,0.0000\nCC-MAIN-2026-17,grn,16806,16683,0.0008\nCC-MAIN-2026-17,guj,282925,282137,0.0129\nCC-MAIN-2026-17,hat,48444,48317,0.0022\nCC-MAIN-2026-17,hau,78109,77851,0.0036\nCC-MAIN-2026-17,haw,16367,16309,0.0007\nCC-MAIN-2026-17,heb,5716016,5687326,0.2608\nCC-MAIN-2026-17,hin,4952172,4940617,0.2259\nCC-MAIN-2026-17,hmn,15623,15568,0.0007\nCC-MAIN-2026-17,hrv,4774087,4754816,0.2178\nCC-MAIN-2026-17,hun,12006252,11947940,0.5477\nCC-MAIN-2026-17,hye,716845,714350,0.0327\nCC-MAIN-2026-17,ibo,27041,26992,
0.0012\nCC-MAIN-2026-17,iku,11757,11724,0.0005\nCC-MAIN-2026-17,ile,7565,7522,0.0003\nCC-MAIN-2026-17,ina,15832,15770,0.0007\nCC-MAIN-2026-17,ind,26699490,26605371,1.2181\nCC-MAIN-2026-17,ipk,1775,1772,0.0001\nCC-MAIN-2026-17,isl,760556,755950,0.0347\nCC-MAIN-2026-17,ita,51036444,50768354,2.3284\nCC-MAIN-2026-17,jav,77656,77401,0.0035\nCC-MAIN-2026-17,jpn,113042841,112603929,5.1572\nCC-MAIN-2026-17,kal,20218,20064,0.0009\nCC-MAIN-2026-17,kan,387889,387011,0.0177\nCC-MAIN-2026-17,kas,187,186,0.0000\nCC-MAIN-2026-17,kat,981749,978753,0.0448\nCC-MAIN-2026-17,kaz,778321,775650,0.0355\nCC-MAIN-2026-17,kha,6885,6875,0.0003\nCC-MAIN-2026-17,khm,232487,231999,0.0106\nCC-MAIN-2026-17,kin,61930,61798,0.0028\nCC-MAIN-2026-17,kir,247261,246225,0.0113\nCC-MAIN-2026-17,kor,18038678,17974981,0.8230\nCC-MAIN-2026-17,kur,148750,148427,0.0068\nCC-MAIN-2026-17,lao,127357,127038,0.0058\nCC-MAIN-2026-17,lat,2568257,2564132,0.1172\nCC-MAIN-2026-17,lav,2019856,2007092,0.0921\nCC-MAIN-2026-17,lif,117,116,0.0000\nCC-MAIN-2026-17,lin,7303,7258,0.0003\nCC-MAIN-2026-17,lit,3841634,3823365,0.1753\nCC-MAIN-2026-17,ltz,76637,76337,0.0035\nCC-MAIN-2026-17,lug,5223,5157,0.0002\nCC-MAIN-2026-17,mal,559447,558192,0.0255\nCC-MAIN-2026-17,mar,691396,689831,0.0315\nCC-MAIN-2026-17,mfe,2785,2779,0.0001\nCC-MAIN-2026-17,mkd,898109,893684,0.0410\nCC-MAIN-2026-17,mlg,123244,121631,0.0056\nCC-MAIN-2026-17,mlt,73570,73327,0.0034\nCC-MAIN-2026-17,mon,331829,330714,0.0151\nCC-MAIN-2026-17,mri,30843,30757,0.0014\nCC-MAIN-2026-17,msa,1839103,1834133,0.0839\nCC-MAIN-2026-17,mya,359779,358861,0.0164\nCC-MAIN-2026-17,nau,795,791,0.0000\nCC-MAIN-2026-17,nep,1372340,1370397,0.0626\nCC-MAIN-2026-17,nld,40375158,40107693,1.8420\nCC-MAIN-2026-17,nno,322659,320530,0.0147\nCC-MAIN-2026-17,nor,7463556,7417204,0.3405\nCC-MAIN-2026-17,nso,2527,2457,0.0001\nCC-MAIN-2026-17,nya,16275,16233,0.0007\nCC-MAIN-2026-17,oci,83617,83138,0.0038\nCC-MAIN-2026-17,ori,159666,159277,0.0073\nCC-MAIN-2026-17,orm,13166,13136,0.0006\nCC-MAIN-20
26-17,pan,208384,207956,0.0095\nCC-MAIN-2026-17,pol,45887634,45683397,2.0935\nCC-MAIN-2026-17,por,55052116,54799306,2.5116\nCC-MAIN-2026-17,pus,88613,88299,0.0040\nCC-MAIN-2026-17,que,21790,21687,0.0010\nCC-MAIN-2026-17,roh,38941,38704,0.0018\nCC-MAIN-2026-17,ron,13292208,13232562,0.6064\nCC-MAIN-2026-17,run,2043,2033,0.0001\nCC-MAIN-2026-17,rus,143050462,142456462,6.5262\nCC-MAIN-2026-17,sag,12675,12659,0.0006\nCC-MAIN-2026-17,san,84351,83857,0.0038\nCC-MAIN-2026-17,sco,16081,16023,0.0007\nCC-MAIN-2026-17,sin,217387,216884,0.0099\nCC-MAIN-2026-17,slk,9026885,8960140,0.4118\nCC-MAIN-2026-17,slv,3364134,3345896,0.1535\nCC-MAIN-2026-17,smo,17882,17863,0.0008\nCC-MAIN-2026-17,sna,17249,17164,0.0008\nCC-MAIN-2026-17,snd,44468,44408,0.0020\nCC-MAIN-2026-17,som,127692,127403,0.0058\nCC-MAIN-2026-17,sot,15709,15689,0.0007\nCC-MAIN-2026-17,spa,103732271,103176589,4.7324\nCC-MAIN-2026-17,sqi,1119749,1116371,0.0511\nCC-MAIN-2026-17,srp,5721990,5698933,0.2610\nCC-MAIN-2026-17,ssw,860,851,0.0000\nCC-MAIN-2026-17,sun,33156,33039,0.0015\nCC-MAIN-2026-17,sux,278,276,0.0000\nCC-MAIN-2026-17,swa,269279,268579,0.0123\nCC-MAIN-2026-17,swe,16019427,15914670,0.7308\nCC-MAIN-2026-17,syr,6853,6827,0.0003\nCC-MAIN-2026-17,tam,1017764,1014591,0.0464\nCC-MAIN-2026-17,tat,155870,155276,0.0071\nCC-MAIN-2026-17,tel,495251,493763,0.0226\nCC-MAIN-2026-17,tgk,147217,146612,0.0067\nCC-MAIN-2026-17,tgl,226333,225451,0.0103\nCC-MAIN-2026-17,tha,8636717,8594090,0.3940\nCC-MAIN-2026-17,tir,26981,26893,0.0012\nCC-MAIN-2026-17,ton,2904,2883,0.0001\nCC-MAIN-2026-17,tsn,3602,3600,0.0002\nCC-MAIN-2026-17,tso,1548,1544,0.0001\nCC-MAIN-2026-17,tuk,79893,79549,0.0036\nCC-MAIN-2026-17,tur,28462464,28356283,1.2985\nCC-MAIN-2026-17,uig,48208,48112,0.0022\nCC-MAIN-2026-17,ukr,17561193,17403579,0.8012\nCC-MAIN-2026-17,urd,705357,702366,0.0322\nCC-MAIN-2026-17,uzb,541363,539353,0.0247\nCC-MAIN-2026-17,ven,529,527,0.0000\nCC-MAIN-2026-17,vie,24734463,24602203,1.1284\nCC-MAIN-2026-17,vol,30277,30210,0.0014\nCC-MAIN-20
26-17,war,43400,43222,0.0020\nCC-MAIN-2026-17,wol,4614,4584,0.0002\nCC-MAIN-2026-17,xho,19636,19586,0.0009\nCC-MAIN-2026-17,yid,37404,37246,0.0017\nCC-MAIN-2026-17,yor,35118,34936,0.0016\nCC-MAIN-2026-17,zha,1629,1615,0.0001\nCC-MAIN-2026-17,zho,106448228,106115897,4.8564\nCC-MAIN-2026-17,zul,31186,31113,0.0014\n"
  },
  {
    "path": "plots/languages.md",
    "content": "---\nlayout: table\ntable_include: languages-top-200.html\ntable_sortlist: \"{sortList: [[1,1]]}\"\n---\n\nDistribution of Languages\n=========================\n\nThe language of a document is identified by [Compact Language Detector 2 (CLD2)](https://github.com/CLD2Owners/cld2). It is able to identify 160 different languages and up to 3 languages per document. The table lists the percentage covered by the primary language of a document (returned first by CLD2). So far, only HTML pages are passed to the language detector. The underlying data including page counts is provided in [languages.csv](./languages.csv).\n\n"
  },
  {
    "path": "plots/mimetypes-top-100.html",
    "content": "<table border=\"1\" class=\"dataframe tablesorter tablepercentage tablesearcher\">\n  <thead>\n    <tr style=\"text-align: right;\">\n      <th>crawl</th>\n      <th>CC-MAIN-2026-08</th>\n      <th>CC-MAIN-2026-12</th>\n      <th>CC-MAIN-2026-17</th>\n    </tr>\n    <tr>\n      <th>mimetype</th>\n      <th></th>\n      <th></th>\n      <th></th>\n    </tr>\n  </thead>\n  <tbody>\n    <tr>\n      <th>&lt;other&gt;</th>\n      <td>0.0642</td>\n      <td>0.0646</td>\n      <td>0.0610</td>\n    </tr>\n    <tr>\n      <th>application/atom+xml</th>\n      <td>0.1461</td>\n      <td>0.1511</td>\n      <td>0.1469</td>\n    </tr>\n    <tr>\n      <th>application/calendar</th>\n      <td>0.0003</td>\n      <td>0.0002</td>\n      <td>0.0002</td>\n    </tr>\n    <tr>\n      <th>application/download</th>\n      <td>0.0020</td>\n      <td>0.0013</td>\n      <td>0.0018</td>\n    </tr>\n    <tr>\n      <th>application/epub+zip</th>\n      <td>0.0017</td>\n      <td>0.0019</td>\n      <td>0.0015</td>\n    </tr>\n    <tr>\n      <th>application/force-download</th>\n      <td>0.0089</td>\n      <td>0.0075</td>\n      <td>0.0073</td>\n    </tr>\n    <tr>\n      <th>application/gpx+xml</th>\n      <td>0.0008</td>\n      <td>0.0008</td>\n      <td>0.0009</td>\n    </tr>\n    <tr>\n      <th>application/ics</th>\n      <td>0.0004</td>\n      <td>0.0004</td>\n      <td>0.0004</td>\n    </tr>\n    <tr>\n      <th>application/javascript</th>\n      <td>0.0008</td>\n      <td>0.0008</td>\n      <td>0.0008</td>\n    </tr>\n    <tr>\n      <th>application/json</th>\n      <td>0.0262</td>\n      <td>0.0256</td>\n      <td>0.0251</td>\n    </tr>\n    <tr>\n      <th>application/ld+json</th>\n      <td>0.0015</td>\n      <td>0.0014</td>\n      <td>0.0015</td>\n    </tr>\n    <tr>\n      <th>application/marc</th>\n      <td>0.0003</td>\n      <td>0.0003</td>\n      <td>0.0003</td>\n    </tr>\n    <tr>\n      <th>application/msword</th>\n      <td>0.0025</td>\n      
<td>0.0023</td>\n      <td>0.0025</td>\n    </tr>\n    <tr>\n      <th>application/octet-stream</th>\n      <td>0.0449</td>\n      <td>0.0487</td>\n      <td>0.0469</td>\n    </tr>\n    <tr>\n      <th>application/octetstream</th>\n      <td>0.0002</td>\n      <td>0.0002</td>\n      <td>0.0002</td>\n    </tr>\n    <tr>\n      <th>application/pdf</th>\n      <td>0.7330</td>\n      <td>0.7988</td>\n      <td>0.8655</td>\n    </tr>\n    <tr>\n      <th>application/pgp-encrypted</th>\n      <td>0.0001</td>\n      <td>0.0001</td>\n      <td>0.0001</td>\n    </tr>\n    <tr>\n      <th>application/pgp-signature</th>\n      <td>0.0014</td>\n      <td>0.0016</td>\n      <td>0.0020</td>\n    </tr>\n    <tr>\n      <th>application/postscript</th>\n      <td>0.0002</td>\n      <td>0.0002</td>\n      <td>0.0002</td>\n    </tr>\n    <tr>\n      <th>application/rdf+xml</th>\n      <td>0.0038</td>\n      <td>0.0036</td>\n      <td>0.0031</td>\n    </tr>\n    <tr>\n      <th>application/rss+xml</th>\n      <td>0.0430</td>\n      <td>0.0439</td>\n      <td>0.0418</td>\n    </tr>\n    <tr>\n      <th>application/rtf</th>\n      <td>0.0008</td>\n      <td>0.0007</td>\n      <td>0.0005</td>\n    </tr>\n    <tr>\n      <th>application/save-to-disk</th>\n      <td>0.0000</td>\n      <td>0.0000</td>\n      <td>0.0000</td>\n    </tr>\n    <tr>\n      <th>application/text</th>\n      <td>0.0001</td>\n      <td>0.0001</td>\n      <td>0.0001</td>\n    </tr>\n    <tr>\n      <th>application/unknown</th>\n      <td>0.0002</td>\n      <td>0.0002</td>\n      <td>0.0002</td>\n    </tr>\n    <tr>\n      <th>application/vnd.android.package-archive</th>\n      <td>0.0000</td>\n      <td>0.0000</td>\n      <td>0.0000</td>\n    </tr>\n    <tr>\n      <th>application/vnd.google-earth.kml+xml</th>\n      <td>0.0012</td>\n      <td>0.0012</td>\n      <td>0.0011</td>\n    </tr>\n    <tr>\n      <th>application/vnd.google-earth.kmz</th>\n      <td>0.0003</td>\n      <td>0.0005</td>\n      <td>0.0005</td>\n  
  </tr>\n    <tr>\n      <th>application/vnd.ms-excel</th>\n      <td>0.0014</td>\n      <td>0.0015</td>\n      <td>0.0012</td>\n    </tr>\n    <tr>\n      <th>application/vnd.ms-powerpoint</th>\n      <td>0.0001</td>\n      <td>0.0001</td>\n      <td>0.0002</td>\n    </tr>\n    <tr>\n      <th>application/vnd.ms-word</th>\n      <td>0.0002</td>\n      <td>0.0001</td>\n      <td>0.0001</td>\n    </tr>\n    <tr>\n      <th>application/vnd.oasis.opendocument.text</th>\n      <td>0.0007</td>\n      <td>0.0008</td>\n      <td>0.0007</td>\n    </tr>\n    <tr>\n      <th>application/vnd.openxmlformats-officedocument.presentationml.presentation</th>\n      <td>0.0002</td>\n      <td>0.0003</td>\n      <td>0.0002</td>\n    </tr>\n    <tr>\n      <th>application/vnd.openxmlformats-officedocument.spreadsheetml.sheet</th>\n      <td>0.0019</td>\n      <td>0.0017</td>\n      <td>0.0016</td>\n    </tr>\n    <tr>\n      <th>application/vnd.openxmlformats-officedocument.wordprocessingml.document</th>\n      <td>0.0024</td>\n      <td>0.0028</td>\n      <td>0.0028</td>\n    </tr>\n    <tr>\n      <th>application/vnd.wap.xhtml+xml</th>\n      <td>0.0005</td>\n      <td>0.0010</td>\n      <td>0.0009</td>\n    </tr>\n    <tr>\n      <th>application/x-bibtex</th>\n      <td>0.0086</td>\n      <td>0.0090</td>\n      <td>0.0088</td>\n    </tr>\n    <tr>\n      <th>application/x-bittorrent</th>\n      <td>0.0001</td>\n      <td>0.0001</td>\n      <td>0.0001</td>\n    </tr>\n    <tr>\n      <th>application/x-debian-package</th>\n      <td>0.0000</td>\n      <td>0.0000</td>\n      <td>0.0000</td>\n    </tr>\n    <tr>\n      <th>application/x-download</th>\n      <td>0.0026</td>\n      <td>0.0025</td>\n      <td>0.0022</td>\n    </tr>\n    <tr>\n      <th>application/x-endnote-refer</th>\n      <td>0.0004</td>\n      <td>0.0004</td>\n      <td>0.0003</td>\n    </tr>\n    <tr>\n      <th>application/x-gzip</th>\n      <td>0.0003</td>\n      <td>0.0002</td>\n      <td>0.0002</td>\n    </tr>\n 
   <tr>\n      <th>application/x-httpd-php</th>\n      <td>0.0003</td>\n      <td>0.0003</td>\n      <td>0.0003</td>\n    </tr>\n    <tr>\n      <th>application/x-java-jnlp-file</th>\n      <td>0.0001</td>\n      <td>0.0001</td>\n      <td>0.0001</td>\n    </tr>\n    <tr>\n      <th>application/x-javascript</th>\n      <td>0.0002</td>\n      <td>0.0002</td>\n      <td>0.0001</td>\n    </tr>\n    <tr>\n      <th>application/x-json</th>\n      <td>0.0000</td>\n      <td>0.0000</td>\n      <td>0.0000</td>\n    </tr>\n    <tr>\n      <th>application/x-mobipocket-ebook</th>\n      <td>0.0005</td>\n      <td>0.0007</td>\n      <td>0.0004</td>\n    </tr>\n    <tr>\n      <th>application/x-msdownload</th>\n      <td>0.0003</td>\n      <td>0.0003</td>\n      <td>0.0003</td>\n    </tr>\n    <tr>\n      <th>application/x-netcdf</th>\n      <td>0.0001</td>\n      <td>0.0003</td>\n      <td>0.0004</td>\n    </tr>\n    <tr>\n      <th>application/x-research-info-systems</th>\n      <td>0.0115</td>\n      <td>0.0117</td>\n      <td>0.0116</td>\n    </tr>\n    <tr>\n      <th>application/x-shockwave-flash</th>\n      <td>0.0001</td>\n      <td>0.0001</td>\n      <td>0.0000</td>\n    </tr>\n    <tr>\n      <th>application/x-tar</th>\n      <td>0.0000</td>\n      <td>0.0001</td>\n      <td>0.0001</td>\n    </tr>\n    <tr>\n      <th>application/x-tex</th>\n      <td>0.0001</td>\n      <td>0.0002</td>\n      <td>0.0001</td>\n    </tr>\n    <tr>\n      <th>application/x-troff-man</th>\n      <td>0.0004</td>\n      <td>0.0003</td>\n      <td>0.0004</td>\n    </tr>\n    <tr>\n      <th>application/x-zip-compressed</th>\n      <td>0.0000</td>\n      <td>0.0000</td>\n      <td>0.0000</td>\n    </tr>\n    <tr>\n      <th>application/xhtml+xml</th>\n      <td>0.0111</td>\n      <td>0.0109</td>\n      <td>0.0104</td>\n    </tr>\n    <tr>\n      <th>application/xml</th>\n      <td>0.0291</td>\n      <td>0.0266</td>\n      <td>0.0254</td>\n    </tr>\n    <tr>\n      <th>application/zip</th>\n  
    <td>0.0001</td>\n      <td>0.0001</td>\n      <td>0.0002</td>\n    </tr>\n    <tr>\n      <th>audio/mpeg</th>\n      <td>0.0001</td>\n      <td>0.0001</td>\n      <td>0.0001</td>\n    </tr>\n    <tr>\n      <th>audio/x-mpegurl</th>\n      <td>0.0005</td>\n      <td>0.0006</td>\n      <td>0.0006</td>\n    </tr>\n    <tr>\n      <th>audio/x-scpls</th>\n      <td>0.0002</td>\n      <td>0.0001</td>\n      <td>0.0001</td>\n    </tr>\n    <tr>\n      <th>audio/x-wav</th>\n      <td>0.0000</td>\n      <td>0.0000</td>\n      <td>0.0000</td>\n    </tr>\n    <tr>\n      <th>binary/octet-stream</th>\n      <td>0.0005</td>\n      <td>0.0005</td>\n      <td>0.0005</td>\n    </tr>\n    <tr>\n      <th>image/gif</th>\n      <td>0.0004</td>\n      <td>0.0003</td>\n      <td>0.0002</td>\n    </tr>\n    <tr>\n      <th>image/jp2</th>\n      <td>NaN</td>\n      <td>0.0000</td>\n      <td>NaN</td>\n    </tr>\n    <tr>\n      <th>image/jpeg</th>\n      <td>0.0003</td>\n      <td>0.0004</td>\n      <td>0.0002</td>\n    </tr>\n    <tr>\n      <th>image/jpg</th>\n      <td>0.0000</td>\n      <td>0.0000</td>\n      <td>0.0000</td>\n    </tr>\n    <tr>\n      <th>image/pjpeg</th>\n      <td>0.0000</td>\n      <td>0.0000</td>\n      <td>0.0000</td>\n    </tr>\n    <tr>\n      <th>image/png</th>\n      <td>0.0002</td>\n      <td>0.0004</td>\n      <td>0.0001</td>\n    </tr>\n    <tr>\n      <th>image/svg+xml</th>\n      <td>0.0000</td>\n      <td>0.0000</td>\n      <td>0.0000</td>\n    </tr>\n    <tr>\n      <th>image/tiff</th>\n      <td>0.0000</td>\n      <td>0.0000</td>\n      <td>0.0000</td>\n    </tr>\n    <tr>\n      <th>image/vnd.djvu</th>\n      <td>0.0006</td>\n      <td>0.0003</td>\n      <td>0.0005</td>\n    </tr>\n    <tr>\n      <th>image/webp</th>\n      <td>0.0000</td>\n      <td>0.0000</td>\n      <td>0.0000</td>\n    </tr>\n    <tr>\n      <th>message/rfc822</th>\n      <td>0.0002</td>\n      <td>0.0003</td>\n      <td>0.0002</td>\n    </tr>\n    <tr>\n      
<th>text/calendar</th>\n      <td>0.0374</td>\n      <td>0.0383</td>\n      <td>0.0354</td>\n    </tr>\n    <tr>\n      <th>text/css</th>\n      <td>0.0006</td>\n      <td>0.0006</td>\n      <td>0.0006</td>\n    </tr>\n    <tr>\n      <th>text/csv</th>\n      <td>0.0034</td>\n      <td>0.0032</td>\n      <td>0.0030</td>\n    </tr>\n    <tr>\n      <th>text/directory</th>\n      <td>0.0002</td>\n      <td>0.0002</td>\n      <td>0.0002</td>\n    </tr>\n    <tr>\n      <th>text/enriched</th>\n      <td>0.0000</td>\n      <td>0.0000</td>\n      <td>0.0000</td>\n    </tr>\n    <tr>\n      <th>text/html</th>\n      <td>98.6720</td>\n      <td>98.5946</td>\n      <td>98.5388</td>\n    </tr>\n    <tr>\n      <th>text/javascript</th>\n      <td>0.0004</td>\n      <td>0.0004</td>\n      <td>0.0004</td>\n    </tr>\n    <tr>\n      <th>text/markdown</th>\n      <td>0.0013</td>\n      <td>0.0034</td>\n      <td>0.0298</td>\n    </tr>\n    <tr>\n      <th>text/pdf</th>\n      <td>0.0001</td>\n      <td>0.0000</td>\n      <td>0.0000</td>\n    </tr>\n    <tr>\n      <th>text/plain</th>\n      <td>0.0521</td>\n      <td>0.0541</td>\n      <td>0.0485</td>\n    </tr>\n    <tr>\n      <th>text/prs.lines.tag</th>\n      <td>0.0025</td>\n      <td>0.0039</td>\n      <td>0.0030</td>\n    </tr>\n    <tr>\n      <th>text/tab-separated-values</th>\n      <td>0.0005</td>\n      <td>0.0004</td>\n      <td>0.0004</td>\n    </tr>\n    <tr>\n      <th>text/turtle</th>\n      <td>0.0014</td>\n      <td>0.0012</td>\n      <td>0.0010</td>\n    </tr>\n    <tr>\n      <th>text/vcard</th>\n      <td>0.0011</td>\n      <td>0.0012</td>\n      <td>0.0012</td>\n    </tr>\n    <tr>\n      <th>text/x-bibtex</th>\n      <td>0.0006</td>\n      <td>0.0005</td>\n      <td>0.0005</td>\n    </tr>\n    <tr>\n      <th>text/x-c</th>\n      <td>0.0001</td>\n      <td>0.0002</td>\n      <td>0.0001</td>\n    </tr>\n    <tr>\n      <th>text/x-csrc</th>\n      <td>0.0001</td>\n      <td>0.0001</td>\n      
<td>0.0001</td>\n    </tr>\n    <tr>\n      <th>text/x-diff</th>\n      <td>0.0002</td>\n      <td>0.0003</td>\n      <td>0.0003</td>\n    </tr>\n    <tr>\n      <th>text/x-patch</th>\n      <td>0.0003</td>\n      <td>0.0003</td>\n      <td>0.0002</td>\n    </tr>\n    <tr>\n      <th>text/x-perl</th>\n      <td>0.0000</td>\n      <td>0.0001</td>\n      <td>0.0000</td>\n    </tr>\n    <tr>\n      <th>text/x-vcalendar</th>\n      <td>0.0003</td>\n      <td>0.0004</td>\n      <td>0.0004</td>\n    </tr>\n    <tr>\n      <th>text/x-vcard</th>\n      <td>0.0020</td>\n      <td>0.0019</td>\n      <td>0.0019</td>\n    </tr>\n    <tr>\n      <th>text/xml</th>\n      <td>0.0622</td>\n      <td>0.0613</td>\n      <td>0.0496</td>\n    </tr>\n    <tr>\n      <th>unknown/unknown</th>\n      <td>0.0000</td>\n      <td>0.0000</td>\n      <td>0.0000</td>\n    </tr>\n    <tr>\n      <th>video/mp4</th>\n      <td>0.0000</td>\n      <td>0.0000</td>\n      <td>0.0000</td>\n    </tr>\n    <tr>\n      <th>video/webm</th>\n      <td>0.0000</td>\n      <td>NaN</td>\n      <td>0.0000</td>\n    </tr>\n    <tr>\n      <th>video/x-ms-asf</th>\n      <td>0.0001</td>\n      <td>0.0002</td>\n      <td>0.0002</td>\n    </tr>\n  </tbody>\n</table>"
  },
  {
    "path": "plots/mimetypes.csv",
    "content": "crawl,mimetype,pages,urls,%pages/crawl\nCC-MAIN-2008-2009,<other>,818049,815434,0.0455\nCC-MAIN-2008-2009,application/atom+xml,520258,518338,0.0289\nCC-MAIN-2008-2009,application/download,198,198,0.0000\nCC-MAIN-2008-2009,application/force-download,448,448,0.0000\nCC-MAIN-2008-2009,application/gpx+xml,756,742,0.0000\nCC-MAIN-2008-2009,application/javascript,2880,2872,0.0002\nCC-MAIN-2008-2009,application/json,30,30,0.0000\nCC-MAIN-2008-2009,application/marc,7,7,0.0000\nCC-MAIN-2008-2009,application/msword,102626,102624,0.0057\nCC-MAIN-2008-2009,application/octet-stream,10739,10739,0.0006\nCC-MAIN-2008-2009,application/octetstream,33,33,0.0000\nCC-MAIN-2008-2009,application/pdf,21192930,21123709,1.1786\nCC-MAIN-2008-2009,application/pgp-encrypted,2,2,0.0000\nCC-MAIN-2008-2009,application/pgp-signature,390,390,0.0000\nCC-MAIN-2008-2009,application/postscript,489,489,0.0000\nCC-MAIN-2008-2009,application/rdf+xml,213121,212730,0.0119\nCC-MAIN-2008-2009,application/rss+xml,1622341,1615587,0.0902\nCC-MAIN-2008-2009,application/rtf,35261,35101,0.0020\nCC-MAIN-2008-2009,application/text,3168,3148,0.0002\nCC-MAIN-2008-2009,application/unknown,166,166,0.0000\nCC-MAIN-2008-2009,application/vnd.google-earth.kml+xml,93062,92819,0.0052\nCC-MAIN-2008-2009,application/vnd.google-earth.kmz,458,458,0.0000\nCC-MAIN-2008-2009,application/vnd.ms-excel,303,303,0.0000\nCC-MAIN-2008-2009,application/vnd.ms-powerpoint,24064,23965,0.0013\nCC-MAIN-2008-2009,application/vnd.ms-word,64,64,0.0000\nCC-MAIN-2008-2009,application/vnd.oasis.opendocument.text,2914,2903,0.0002\nCC-MAIN-2008-2009,application/vnd.openxmlformats-officedocument.presentationml.presentation,2,2,0.0000\nCC-MAIN-2008-2009,application/vnd.openxmlformats-officedocument.wordprocessingml.document,4,4,0.0000\nCC-MAIN-2008-2009,application/vnd.wap.xhtml+xml,844,843,0.0000\nCC-MAIN-2008-2009,application/x-bittorrent,2291,2291,0.0001\nCC-MAIN-2008-2009,application/x-debian-package,1,1,0.0000\nCC-MAIN-2008-2009,applica
tion/x-download,124,124,0.0000\nCC-MAIN-2008-2009,application/x-endnote-refer,20,20,0.0000\nCC-MAIN-2008-2009,application/x-gzip,306,306,0.0000\nCC-MAIN-2008-2009,application/x-httpd-php,1409,1409,0.0001\nCC-MAIN-2008-2009,application/x-java-jnlp-file,166,166,0.0000\nCC-MAIN-2008-2009,application/x-javascript,162713,162291,0.0090\nCC-MAIN-2008-2009,application/x-msdownload,86,86,0.0000\nCC-MAIN-2008-2009,application/x-netcdf,90,90,0.0000\nCC-MAIN-2008-2009,application/x-research-info-systems,48,48,0.0000\nCC-MAIN-2008-2009,application/x-shockwave-flash,32085,32085,0.0018\nCC-MAIN-2008-2009,application/x-tar,1708,1708,0.0001\nCC-MAIN-2008-2009,application/x-tex,11368,11334,0.0006\nCC-MAIN-2008-2009,application/x-troff-man,21,21,0.0000\nCC-MAIN-2008-2009,application/x-zip-compressed,96,96,0.0000\nCC-MAIN-2008-2009,application/xhtml+xml,719150,716477,0.0400\nCC-MAIN-2008-2009,application/xml,2987620,2977275,0.1661\nCC-MAIN-2008-2009,application/zip,285,285,0.0000\nCC-MAIN-2008-2009,audio/mpeg,289,289,0.0000\nCC-MAIN-2008-2009,audio/x-mpegurl,16517,16517,0.0009\nCC-MAIN-2008-2009,audio/x-scpls,766,766,0.0000\nCC-MAIN-2008-2009,audio/x-wav,35,35,0.0000\nCC-MAIN-2008-2009,binary/octet-stream,33,33,0.0000\nCC-MAIN-2008-2009,image/gif,27388,27388,0.0015\nCC-MAIN-2008-2009,image/jp2,51,51,0.0000\nCC-MAIN-2008-2009,image/jpeg,66920,66919,0.0037\nCC-MAIN-2008-2009,image/jpg,615,615,0.0000\nCC-MAIN-2008-2009,image/pjpeg,1897,1897,0.0001\nCC-MAIN-2008-2009,image/png,8926,8925,0.0005\nCC-MAIN-2008-2009,image/svg+xml,679,679,0.0000\nCC-MAIN-2008-2009,image/tiff,39,39,0.0000\nCC-MAIN-2008-2009,image/vnd.djvu,159,159,0.0000\nCC-MAIN-2008-2009,message/rfc822,21464,21362,0.0012\nCC-MAIN-2008-2009,text/calendar,71950,71475,0.0040\nCC-MAIN-2008-2009,text/css,79129,78835,0.0044\nCC-MAIN-2008-2009,text/csv,4895,4873,0.0003\nCC-MAIN-2008-2009,text/directory,1456,1415,0.0001\nCC-MAIN-2008-2009,text/enriched,64,64,0.0000\nCC-MAIN-2008-2009,text/html,1752379890,1745330892,97.4542\nCC-MAIN-200
8-2009,text/javascript,74988,74776,0.0042\nCC-MAIN-2008-2009,text/pdf,114,114,0.0000\nCC-MAIN-2008-2009,text/plain,5150776,5134374,0.2864\nCC-MAIN-2008-2009,text/prs.lines.tag,99,95,0.0000\nCC-MAIN-2008-2009,text/tab-separated-values,383,383,0.0000\nCC-MAIN-2008-2009,text/turtle,104,104,0.0000\nCC-MAIN-2008-2009,text/vcard,4397,4394,0.0002\nCC-MAIN-2008-2009,text/x-bibtex,2791,2786,0.0002\nCC-MAIN-2008-2009,text/x-c,7855,7805,0.0004\nCC-MAIN-2008-2009,text/x-csrc,8942,8898,0.0005\nCC-MAIN-2008-2009,text/x-diff,7269,7228,0.0004\nCC-MAIN-2008-2009,text/x-patch,395,394,0.0000\nCC-MAIN-2008-2009,text/x-perl,3657,3642,0.0002\nCC-MAIN-2008-2009,text/x-vcalendar,20131,20027,0.0011\nCC-MAIN-2008-2009,text/x-vcard,42555,42471,0.0024\nCC-MAIN-2008-2009,text/xml,11576732,11513141,0.6438\nCC-MAIN-2008-2009,unknown/unknown,2509,2508,0.0001\nCC-MAIN-2008-2009,video/mp4,1209,1209,0.0001\nCC-MAIN-2008-2009,video/x-ms-asf,4829,4829,0.0003\nCC-MAIN-2009-2010,<other>,1278619,1185296,0.0447\nCC-MAIN-2009-2010,application/atom+xml,2963111,2682964,0.1035\nCC-MAIN-2009-2010,application/gpx+xml,234,215,0.0000\nCC-MAIN-2009-2010,application/javascript,7712363,7558783,0.2693\nCC-MAIN-2009-2010,application/octet-stream,1750877,1620751,0.0611\nCC-MAIN-2009-2010,application/pdf,47086416,44891743,1.6444\nCC-MAIN-2009-2010,application/rdf+xml,499681,453511,0.0175\nCC-MAIN-2009-2010,application/rss+xml,3868122,3501841,0.1351\nCC-MAIN-2009-2010,application/rtf,116462,112178,0.0041\nCC-MAIN-2009-2010,application/text,16106,15980,0.0006\nCC-MAIN-2009-2010,application/vnd.google-earth.kml+xml,231326,202826,0.0081\nCC-MAIN-2009-2010,application/vnd.google-earth.kmz,28104,26463,0.0010\nCC-MAIN-2009-2010,application/vnd.ms-excel,637242,621361,0.0223\nCC-MAIN-2009-2010,application/vnd.ms-powerpoint,81553,76984,0.0028\nCC-MAIN-2009-2010,application/vnd.oasis.opendocument.text,6657,6441,0.0002\nCC-MAIN-2009-2010,application/vnd.wap.xhtml+xml,5319,3435,0.0002\nCC-MAIN-2009-2010,application/x-javascript,25198
745,24550069,0.8800\nCC-MAIN-2009-2010,application/x-tar,219935,217021,0.0077\nCC-MAIN-2009-2010,application/x-tex,12966,12812,0.0005\nCC-MAIN-2009-2010,application/xhtml+xml,8940011,6997137,0.3122\nCC-MAIN-2009-2010,application/xml,8767027,7437607,0.3062\nCC-MAIN-2009-2010,message/rfc822,45178,43809,0.0016\nCC-MAIN-2009-2010,text/calendar,190076,175389,0.0066\nCC-MAIN-2009-2010,text/css,25554279,25495830,0.8924\nCC-MAIN-2009-2010,text/csv,31717,30960,0.0011\nCC-MAIN-2009-2010,text/directory,5875,5769,0.0002\nCC-MAIN-2009-2010,text/enriched,634,465,0.0000\nCC-MAIN-2009-2010,text/html,2609478137,2076939999,91.1291\nCC-MAIN-2009-2010,text/javascript,3154591,2894644,0.1102\nCC-MAIN-2009-2010,text/pdf,304,281,0.0000\nCC-MAIN-2009-2010,text/plain,67578620,49275974,2.3600\nCC-MAIN-2009-2010,text/prs.lines.tag,310,309,0.0000\nCC-MAIN-2009-2010,text/tab-separated-values,1974,1966,0.0001\nCC-MAIN-2009-2010,text/turtle,180,172,0.0000\nCC-MAIN-2009-2010,text/vcard,364,362,0.0000\nCC-MAIN-2009-2010,text/x-bibtex,4504,4370,0.0002\nCC-MAIN-2009-2010,text/x-c,12356,12098,0.0004\nCC-MAIN-2009-2010,text/x-csrc,8886,8669,0.0003\nCC-MAIN-2009-2010,text/x-diff,9334,9070,0.0003\nCC-MAIN-2009-2010,text/x-patch,3771,3702,0.0001\nCC-MAIN-2009-2010,text/x-perl,5742,5543,0.0002\nCC-MAIN-2009-2010,text/x-vcalendar,32803,32285,0.0011\nCC-MAIN-2009-2010,text/x-vcard,150568,140520,0.0053\nCC-MAIN-2009-2010,text/xml,47799382,43873601,1.6693\nCC-MAIN-2009-2010,unknown/unknown,4750,4676,0.0002\nCC-MAIN-2012,<other>,3213662,3155612,0.0839\nCC-MAIN-2012,application/atom+xml,3416865,2268176,0.0892\nCC-MAIN-2012,application/calendar,907,906,0.0000\nCC-MAIN-2012,application/download,41631,40318,0.0011\nCC-MAIN-2012,application/epub+zip,21817,20317,0.0006\nCC-MAIN-2012,application/force-download,107775,104675,0.0028\nCC-MAIN-2012,application/gpx+xml,1803,1802,0.0000\nCC-MAIN-2012,application/ics,372,363,0.0000\nCC-MAIN-2012,application/javascript,11534877,11439978,0.3013\nCC-MAIN-2012,application/json,59
572,57852,0.0016\nCC-MAIN-2012,application/marc,25792,23164,0.0007\nCC-MAIN-2012,application/msword,6639825,6593489,0.1734\nCC-MAIN-2012,application/octet-stream,1874679,1843384,0.0490\nCC-MAIN-2012,application/octetstream,20451,20276,0.0005\nCC-MAIN-2012,application/pdf,92567905,91522066,2.4178\nCC-MAIN-2012,application/pgp-encrypted,972,972,0.0000\nCC-MAIN-2012,application/pgp-signature,46327,46175,0.0012\nCC-MAIN-2012,application/postscript,38345,37910,0.0010\nCC-MAIN-2012,application/rdf+xml,135494,126123,0.0035\nCC-MAIN-2012,application/rss+xml,4216661,3880824,0.1101\nCC-MAIN-2012,application/rtf,295308,291228,0.0077\nCC-MAIN-2012,application/save-to-disk,3,3,0.0000\nCC-MAIN-2012,application/text,7840,7761,0.0002\nCC-MAIN-2012,application/unknown,62555,62337,0.0016\nCC-MAIN-2012,application/vnd.android.package-archive,4492,4404,0.0001\nCC-MAIN-2012,application/vnd.google-earth.kml+xml,119328,116997,0.0031\nCC-MAIN-2012,application/vnd.google-earth.kmz,54432,53610,0.0014\nCC-MAIN-2012,application/vnd.ms-excel,1381181,1366233,0.0361\nCC-MAIN-2012,application/vnd.ms-powerpoint,984185,981169,0.0257\nCC-MAIN-2012,application/vnd.ms-word,20001,19924,0.0005\nCC-MAIN-2012,application/vnd.oasis.opendocument.text,16473,16207,0.0004\nCC-MAIN-2012,application/vnd.openxmlformats-officedocument.presentationml.presentation,38672,38341,0.0010\nCC-MAIN-2012,application/vnd.openxmlformats-officedocument.spreadsheetml.sheet,27214,27040,0.0007\nCC-MAIN-2012,application/vnd.openxmlformats-officedocument.wordprocessingml.document,151358,150626,0.0040\nCC-MAIN-2012,application/vnd.wap.xhtml+xml,30850,28700,0.0008\nCC-MAIN-2012,application/x-bibtex,185,184,0.0000\nCC-MAIN-2012,application/x-bittorrent,155973,154651,0.0041\nCC-MAIN-2012,application/x-debian-package,95469,95283,0.0025\nCC-MAIN-2012,application/x-download,37255,36811,0.0010\nCC-MAIN-2012,application/x-endnote-refer,5765,5686,0.0002\nCC-MAIN-2012,application/x-gzip,559197,554962,0.0146\nCC-MAIN-2012,application/x-httpd-ph
p,172430,169721,0.0045\nCC-MAIN-2012,application/x-java-jnlp-file,7906,7617,0.0002\nCC-MAIN-2012,application/x-javascript,21166615,20995252,0.5529\nCC-MAIN-2012,application/x-json,76,76,0.0000\nCC-MAIN-2012,application/x-mobipocket-ebook,14801,14352,0.0004\nCC-MAIN-2012,application/x-msdownload,26458,25154,0.0007\nCC-MAIN-2012,application/x-netcdf,4464,4425,0.0001\nCC-MAIN-2012,application/x-research-info-systems,341,339,0.0000\nCC-MAIN-2012,application/x-shockwave-flash,848694,834015,0.0222\nCC-MAIN-2012,application/x-tar,82765,82091,0.0022\nCC-MAIN-2012,application/x-tex,24961,24707,0.0007\nCC-MAIN-2012,application/x-troff-man,11980,11929,0.0003\nCC-MAIN-2012,application/x-zip-compressed,426199,424310,0.0111\nCC-MAIN-2012,application/xhtml+xml,2814799,2650293,0.0735\nCC-MAIN-2012,application/xml,5008141,4684319,0.1308\nCC-MAIN-2012,application/zip,1585432,1567787,0.0414\nCC-MAIN-2012,audio/mpeg,203080,199300,0.0053\nCC-MAIN-2012,audio/x-mpegurl,420104,416988,0.0110\nCC-MAIN-2012,audio/x-scpls,18416,17650,0.0005\nCC-MAIN-2012,audio/x-wav,28500,28379,0.0007\nCC-MAIN-2012,binary/octet-stream,99942,92075,0.0026\nCC-MAIN-2012,image/gif,1106754,1084096,0.0289\nCC-MAIN-2012,image/jp2,184,184,0.0000\nCC-MAIN-2012,image/jpeg,14090322,13945877,0.3680\nCC-MAIN-2012,image/jpg,119061,118093,0.0031\nCC-MAIN-2012,image/pjpeg,122955,121096,0.0032\nCC-MAIN-2012,image/png,1205276,1182794,0.0315\nCC-MAIN-2012,image/svg+xml,34266,33439,0.0009\nCC-MAIN-2012,image/tiff,16354,16328,0.0004\nCC-MAIN-2012,image/vnd.djvu,42972,42700,0.0011\nCC-MAIN-2012,image/webp,14377,14374,0.0004\nCC-MAIN-2012,message/rfc822,79249,78778,0.0021\nCC-MAIN-2012,text/calendar,337508,330475,0.0088\nCC-MAIN-2012,text/css,22831268,22745136,0.5963\nCC-MAIN-2012,text/csv,35875,35174,0.0009\nCC-MAIN-2012,text/directory,14497,12674,0.0004\nCC-MAIN-2012,text/enriched,526,522,0.0000\nCC-MAIN-2012,text/html,3533120134,3322995305,92.2837\nCC-MAIN-2012,text/javascript,2744495,2715954,0.0717\nCC-MAIN-2012,text/pdf,590,589
,0.0000\nCC-MAIN-2012,text/plain,10699434,10507977,0.2795\nCC-MAIN-2012,text/prs.lines.tag,3961,3941,0.0001\nCC-MAIN-2012,text/tab-separated-values,776,765,0.0000\nCC-MAIN-2012,text/turtle,584,501,0.0000\nCC-MAIN-2012,text/vcard,1488,1434,0.0000\nCC-MAIN-2012,text/x-bibtex,20344,20231,0.0005\nCC-MAIN-2012,text/x-c,37948,37377,0.0010\nCC-MAIN-2012,text/x-csrc,20525,20162,0.0005\nCC-MAIN-2012,text/x-diff,26716,26168,0.0007\nCC-MAIN-2012,text/x-patch,1997,1993,0.0001\nCC-MAIN-2012,text/x-perl,10567,10382,0.0003\nCC-MAIN-2012,text/x-vcalendar,56974,54642,0.0015\nCC-MAIN-2012,text/x-vcard,151185,148298,0.0039\nCC-MAIN-2012,text/xml,80074779,63065590,2.0915\nCC-MAIN-2012,unknown/unknown,11085,10933,0.0003\nCC-MAIN-2012,video/mp4,300424,285876,0.0078\nCC-MAIN-2012,video/webm,4114,4092,0.0001\nCC-MAIN-2012,video/x-ms-asf,220741,217061,0.0058\nCC-MAIN-2013-20,<other>,1794120,1713390,0.0999\nCC-MAIN-2013-20,application/atom+xml,2683814,2649369,0.1494\nCC-MAIN-2013-20,application/calendar,6510,5239,0.0004\nCC-MAIN-2013-20,application/download,30547,29866,0.0017\nCC-MAIN-2013-20,application/epub+zip,35274,34361,0.0020\nCC-MAIN-2013-20,application/force-download,44903,42965,0.0025\nCC-MAIN-2013-20,application/gpx+xml,602,601,0.0000\nCC-MAIN-2013-20,application/ics,1641,1630,0.0001\nCC-MAIN-2013-20,application/javascript,186,182,0.0000\nCC-MAIN-2013-20,application/json,139341,132552,0.0078\nCC-MAIN-2013-20,application/ld+json,5,5,0.0000\nCC-MAIN-2013-20,application/marc,9861,9785,0.0005\nCC-MAIN-2013-20,application/msword,92771,89728,0.0052\nCC-MAIN-2013-20,application/octet-stream,735440,716240,0.0409\nCC-MAIN-2013-20,application/octetstream,12736,12648,0.0007\nCC-MAIN-2013-20,application/pdf,2911626,2768018,0.1621\nCC-MAIN-2013-20,application/pgp-encrypted,2461,2449,0.0001\nCC-MAIN-2013-20,application/pgp-signature,25296,24969,0.0014\nCC-MAIN-2013-20,application/postscript,7071,6952,0.0004\nCC-MAIN-2013-20,application/rdf+xml,68517,67805,0.0038\nCC-MAIN-2013-20,application/rss+
xml,3109748,2934616,0.1731\nCC-MAIN-2013-20,application/rtf,2209,2173,0.0001\nCC-MAIN-2013-20,application/save-to-disk,32894,32763,0.0018\nCC-MAIN-2013-20,application/text,27585,27219,0.0015\nCC-MAIN-2013-20,application/unknown,12190,11925,0.0007\nCC-MAIN-2013-20,application/vnd.android.package-archive,2120,2094,0.0001\nCC-MAIN-2013-20,application/vnd.google-earth.kml+xml,150822,143737,0.0084\nCC-MAIN-2013-20,application/vnd.google-earth.kmz,36513,36184,0.0020\nCC-MAIN-2013-20,application/vnd.ms-excel,51246,50169,0.0029\nCC-MAIN-2013-20,application/vnd.ms-powerpoint,58991,51631,0.0033\nCC-MAIN-2013-20,application/vnd.ms-word,14047,13596,0.0008\nCC-MAIN-2013-20,application/vnd.oasis.opendocument.text,2936,2882,0.0002\nCC-MAIN-2013-20,application/vnd.openxmlformats-officedocument.presentationml.presentation,2215,2140,0.0001\nCC-MAIN-2013-20,application/vnd.openxmlformats-officedocument.spreadsheetml.sheet,2487,2280,0.0001\nCC-MAIN-2013-20,application/vnd.openxmlformats-officedocument.wordprocessingml.document,14276,13657,0.0008\nCC-MAIN-2013-20,application/vnd.wap.xhtml+xml,71372,66624,0.0040\nCC-MAIN-2013-20,application/x-bibtex,22336,22246,0.0012\nCC-MAIN-2013-20,application/x-bittorrent,19361,19207,0.0011\nCC-MAIN-2013-20,application/x-debian-package,112500,111690,0.0063\nCC-MAIN-2013-20,application/x-download,17485,16379,0.0010\nCC-MAIN-2013-20,application/x-endnote-refer,42226,41608,0.0024\nCC-MAIN-2013-20,application/x-gzip,38993,38555,0.0022\nCC-MAIN-2013-20,application/x-httpd-php,9463,9334,0.0005\nCC-MAIN-2013-20,application/x-java-jnlp-file,10316,9354,0.0006\nCC-MAIN-2013-20,application/x-javascript,2194,2086,0.0001\nCC-MAIN-2013-20,application/x-json,20684,20548,0.0012\nCC-MAIN-2013-20,application/x-mobipocket-ebook,11214,10589,0.0006\nCC-MAIN-2013-20,application/x-msdownload,4288,3925,0.0002\nCC-MAIN-2013-20,application/x-netcdf,12329,12224,0.0007\nCC-MAIN-2013-20,application/x-research-info-systems,40871,40665,0.0023\nCC-MAIN-2013-20,application/x-shockwa
ve-flash,24818,24108,0.0014\nCC-MAIN-2013-20,application/x-tar,6149,6075,0.0003\nCC-MAIN-2013-20,application/x-tex,19448,19153,0.0011\nCC-MAIN-2013-20,application/x-troff-man,9391,9303,0.0005\nCC-MAIN-2013-20,application/x-zip-compressed,17909,16290,0.0010\nCC-MAIN-2013-20,application/xhtml+xml,1694954,1572684,0.0944\nCC-MAIN-2013-20,application/xml,1592456,1552675,0.0887\nCC-MAIN-2013-20,application/zip,97191,95726,0.0054\nCC-MAIN-2013-20,audio/mpeg,107302,102608,0.0060\nCC-MAIN-2013-20,audio/x-mpegurl,47189,26404,0.0026\nCC-MAIN-2013-20,audio/x-scpls,43973,43384,0.0024\nCC-MAIN-2013-20,audio/x-wav,169835,168936,0.0095\nCC-MAIN-2013-20,binary/octet-stream,23197,23005,0.0013\nCC-MAIN-2013-20,image/gif,654415,646598,0.0364\nCC-MAIN-2013-20,image/jp2,11736,11662,0.0007\nCC-MAIN-2013-20,image/jpeg,8489582,8391675,0.4727\nCC-MAIN-2013-20,image/jpg,114719,114042,0.0064\nCC-MAIN-2013-20,image/pjpeg,51600,49635,0.0029\nCC-MAIN-2013-20,image/png,732441,722926,0.0408\nCC-MAIN-2013-20,image/svg+xml,1776,1759,0.0001\nCC-MAIN-2013-20,image/tiff,14754,14583,0.0008\nCC-MAIN-2013-20,image/vnd.djvu,7093,7042,0.0004\nCC-MAIN-2013-20,image/webp,37,36,0.0000\nCC-MAIN-2013-20,message/rfc822,22397,21990,0.0012\nCC-MAIN-2013-20,text/calendar,993011,958607,0.0553\nCC-MAIN-2013-20,text/css,492,475,0.0000\nCC-MAIN-2013-20,text/csv,67459,65697,0.0038\nCC-MAIN-2013-20,text/directory,19966,19411,0.0011\nCC-MAIN-2013-20,text/enriched,14138,13854,0.0008\nCC-MAIN-2013-20,text/html,1754393474,1626550439,97.6780\nCC-MAIN-2013-20,text/javascript,12490,11944,0.0007\nCC-MAIN-2013-20,text/pdf,288,288,0.0000\nCC-MAIN-2013-20,text/plain,3479510,3300101,0.1937\nCC-MAIN-2013-20,text/prs.lines.tag,655,652,0.0000\nCC-MAIN-2013-20,text/tab-separated-values,48268,46769,0.0027\nCC-MAIN-2013-20,text/turtle,455,442,0.0000\nCC-MAIN-2013-20,text/vcard,1490,1434,0.0001\nCC-MAIN-2013-20,text/x-bibtex,24374,24210,0.0014\nCC-MAIN-2013-20,text/x-c,5023,4888,0.0003\nCC-MAIN-2013-20,text/x-csrc,5938,5865,0.0003\nCC-MAIN-2
013-20,text/x-diff,19403,19028,0.0011\nCC-MAIN-2013-20,text/x-patch,70795,70185,0.0039\nCC-MAIN-2013-20,text/x-perl,21864,21723,0.0012\nCC-MAIN-2013-20,text/x-vcalendar,81742,79297,0.0046\nCC-MAIN-2013-20,text/x-vcard,48237,46951,0.0027\nCC-MAIN-2013-20,text/xml,9857229,9516945,0.5488\nCC-MAIN-2013-20,unknown/unknown,278946,271527,0.0155\nCC-MAIN-2013-20,video/mp4,5171,5047,0.0003\nCC-MAIN-2013-20,video/webm,4407,4266,0.0002\nCC-MAIN-2013-20,video/x-ms-asf,130823,114508,0.0073\nCC-MAIN-2013-48,<other>,1979014,1885820,0.0881\nCC-MAIN-2013-48,application/atom+xml,2438365,2414438,0.1086\nCC-MAIN-2013-48,application/calendar,10162,9678,0.0005\nCC-MAIN-2013-48,application/download,56758,54904,0.0025\nCC-MAIN-2013-48,application/epub+zip,65482,59149,0.0029\nCC-MAIN-2013-48,application/force-download,30325,28619,0.0014\nCC-MAIN-2013-48,application/gpx+xml,520,518,0.0000\nCC-MAIN-2013-48,application/ics,2116,2103,0.0001\nCC-MAIN-2013-48,application/javascript,414,372,0.0000\nCC-MAIN-2013-48,application/json,256056,248509,0.0114\nCC-MAIN-2013-48,application/ld+json,5,5,0.0000\nCC-MAIN-2013-48,application/marc,22395,22316,0.0010\nCC-MAIN-2013-48,application/msword,103656,97445,0.0046\nCC-MAIN-2013-48,application/octet-stream,809094,782347,0.0360\nCC-MAIN-2013-48,application/octetstream,14431,14181,0.0006\nCC-MAIN-2013-48,application/pdf,3508137,3278175,0.1562\nCC-MAIN-2013-48,application/pgp-encrypted,34639,32783,0.0015\nCC-MAIN-2013-48,application/pgp-signature,16390,16180,0.0007\nCC-MAIN-2013-48,application/postscript,5634,5482,0.0003\nCC-MAIN-2013-48,application/rdf+xml,82396,81307,0.0037\nCC-MAIN-2013-48,application/rss+xml,3766716,3576283,0.1677\nCC-MAIN-2013-48,application/rtf,1316,1248,0.0001\nCC-MAIN-2013-48,application/save-to-disk,37006,36650,0.0016\nCC-MAIN-2013-48,application/text,22293,22116,0.0010\nCC-MAIN-2013-48,application/unknown,9902,9733,0.0004\nCC-MAIN-2013-48,application/vnd.android.package-archive,1079,1062,0.0000\nCC-MAIN-2013-48,application/vnd.google
-earth.kml+xml,194922,187921,0.0087\nCC-MAIN-2013-48,application/vnd.google-earth.kmz,35606,35101,0.0016\nCC-MAIN-2013-48,application/vnd.ms-excel,83815,81698,0.0037\nCC-MAIN-2013-48,application/vnd.ms-powerpoint,92892,79824,0.0041\nCC-MAIN-2013-48,application/vnd.ms-word,20416,19607,0.0009\nCC-MAIN-2013-48,application/vnd.oasis.opendocument.text,2242,2162,0.0001\nCC-MAIN-2013-48,application/vnd.openxmlformats-officedocument.presentationml.presentation,2959,2673,0.0001\nCC-MAIN-2013-48,application/vnd.openxmlformats-officedocument.spreadsheetml.sheet,3485,3014,0.0002\nCC-MAIN-2013-48,application/vnd.openxmlformats-officedocument.wordprocessingml.document,19593,17852,0.0009\nCC-MAIN-2013-48,application/vnd.wap.xhtml+xml,61544,60045,0.0027\nCC-MAIN-2013-48,application/x-bibtex,31421,31247,0.0014\nCC-MAIN-2013-48,application/x-bittorrent,8070,8011,0.0004\nCC-MAIN-2013-48,application/x-debian-package,86052,85386,0.0038\nCC-MAIN-2013-48,application/x-download,12532,12302,0.0006\nCC-MAIN-2013-48,application/x-endnote-refer,45451,45160,0.0020\nCC-MAIN-2013-48,application/x-gzip,36699,36187,0.0016\nCC-MAIN-2013-48,application/x-httpd-php,6886,6724,0.0003\nCC-MAIN-2013-48,application/x-java-jnlp-file,11946,11136,0.0005\nCC-MAIN-2013-48,application/x-javascript,13289,13249,0.0006\nCC-MAIN-2013-48,application/x-json,62393,62298,0.0028\nCC-MAIN-2013-48,application/x-mobipocket-ebook,34281,32717,0.0015\nCC-MAIN-2013-48,application/x-msdownload,1693,1647,0.0001\nCC-MAIN-2013-48,application/x-netcdf,24610,24432,0.0011\nCC-MAIN-2013-48,application/x-research-info-systems,86789,84519,0.0039\nCC-MAIN-2013-48,application/x-shockwave-flash,7691,7348,0.0003\nCC-MAIN-2013-48,application/x-tar,5571,5518,0.0002\nCC-MAIN-2013-48,application/x-tex,16637,16462,0.0007\nCC-MAIN-2013-48,application/x-troff-man,20280,18152,0.0009\nCC-MAIN-2013-48,application/x-zip-compressed,12466,11817,0.0006\nCC-MAIN-2013-48,application/xhtml+xml,1474364,1411435,0.0657\nCC-MAIN-2013-48,application/xml,2102144,2
061509,0.0936\nCC-MAIN-2013-48,application/zip,109452,107778,0.0049\nCC-MAIN-2013-48,audio/mpeg,103975,89108,0.0046\nCC-MAIN-2013-48,audio/x-mpegurl,32652,32456,0.0015\nCC-MAIN-2013-48,audio/x-scpls,62043,61299,0.0028\nCC-MAIN-2013-48,audio/x-wav,363535,360691,0.0162\nCC-MAIN-2013-48,binary/octet-stream,21233,21046,0.0009\nCC-MAIN-2013-48,image/gif,796425,785610,0.0355\nCC-MAIN-2013-48,image/jp2,43937,43559,0.0020\nCC-MAIN-2013-48,image/jpeg,12104266,11930487,0.5390\nCC-MAIN-2013-48,image/jpg,135361,133488,0.0060\nCC-MAIN-2013-48,image/pjpeg,49062,46307,0.0022\nCC-MAIN-2013-48,image/png,868667,856897,0.0387\nCC-MAIN-2013-48,image/svg+xml,1517,1501,0.0001\nCC-MAIN-2013-48,image/tiff,24059,23884,0.0011\nCC-MAIN-2013-48,image/vnd.djvu,9115,9073,0.0004\nCC-MAIN-2013-48,image/webp,42,42,0.0000\nCC-MAIN-2013-48,message/rfc822,20859,20279,0.0009\nCC-MAIN-2013-48,text/calendar,1556809,1510898,0.0693\nCC-MAIN-2013-48,text/css,623,604,0.0000\nCC-MAIN-2013-48,text/csv,85916,84387,0.0038\nCC-MAIN-2013-48,text/directory,10703,10490,0.0005\nCC-MAIN-2013-48,text/enriched,12267,11816,0.0005\nCC-MAIN-2013-48,text/html,2196648300,2037889035,97.8125\nCC-MAIN-2013-48,text/javascript,18203,18035,0.0008\nCC-MAIN-2013-48,text/pdf,91,91,0.0000\nCC-MAIN-2013-48,text/plain,3734584,3556575,0.1663\nCC-MAIN-2013-48,text/prs.lines.tag,105,104,0.0000\nCC-MAIN-2013-48,text/tab-separated-values,52712,51575,0.0023\nCC-MAIN-2013-48,text/turtle,1325,1036,0.0001\nCC-MAIN-2013-48,text/vcard,1586,1462,0.0001\nCC-MAIN-2013-48,text/x-bibtex,22346,22203,0.0010\nCC-MAIN-2013-48,text/x-c,4412,4196,0.0002\nCC-MAIN-2013-48,text/x-csrc,4309,4245,0.0002\nCC-MAIN-2013-48,text/x-diff,21450,20807,0.0010\nCC-MAIN-2013-48,text/x-patch,103119,101376,0.0046\nCC-MAIN-2013-48,text/x-perl,31344,30933,0.0014\nCC-MAIN-2013-48,text/x-vcalendar,108561,104086,0.0048\nCC-MAIN-2013-48,text/x-vcard,46372,45445,0.0021\nCC-MAIN-2013-48,text/xml,10069428,9803236,0.4484\nCC-MAIN-2013-48,unknown/unknown,320180,272298,0.0143\nCC-MAIN-20
13-48,video/mp4,3643,3565,0.0002\nCC-MAIN-2013-48,video/webm,5973,5805,0.0003\nCC-MAIN-2013-48,video/x-ms-asf,270066,264977,0.0120\nCC-MAIN-2014-10,<other>,2405722,2185033,0.1045\nCC-MAIN-2014-10,application/atom+xml,2437858,2302238,0.1059\nCC-MAIN-2014-10,application/calendar,11879,10833,0.0005\nCC-MAIN-2014-10,application/download,66339,62042,0.0029\nCC-MAIN-2014-10,application/epub+zip,55109,46654,0.0024\nCC-MAIN-2014-10,application/force-download,29609,25431,0.0013\nCC-MAIN-2014-10,application/gpx+xml,329,311,0.0000\nCC-MAIN-2014-10,application/ics,2319,2197,0.0001\nCC-MAIN-2014-10,application/javascript,461,395,0.0000\nCC-MAIN-2014-10,application/json,263578,247072,0.0115\nCC-MAIN-2014-10,application/ld+json,5,5,0.0000\nCC-MAIN-2014-10,application/marc,7663,7360,0.0003\nCC-MAIN-2014-10,application/msword,113833,100693,0.0049\nCC-MAIN-2014-10,application/octet-stream,905819,834343,0.0394\nCC-MAIN-2014-10,application/octetstream,15731,14789,0.0007\nCC-MAIN-2014-10,application/pdf,3955642,3490211,0.1719\nCC-MAIN-2014-10,application/pgp-encrypted,18520,17262,0.0008\nCC-MAIN-2014-10,application/pgp-signature,18753,17793,0.0008\nCC-MAIN-2014-10,application/postscript,6636,6159,0.0003\nCC-MAIN-2014-10,application/rdf+xml,81176,76811,0.0035\nCC-MAIN-2014-10,application/rss+xml,3727174,3375650,0.1620\nCC-MAIN-2014-10,application/rtf,1663,1521,0.0001\nCC-MAIN-2014-10,application/save-to-disk,40968,38886,0.0018\nCC-MAIN-2014-10,application/text,19310,18373,0.0008\nCC-MAIN-2014-10,application/unknown,8645,7948,0.0004\nCC-MAIN-2014-10,application/vnd.android.package-archive,1280,1189,0.0001\nCC-MAIN-2014-10,application/vnd.google-earth.kml+xml,156845,142468,0.0068\nCC-MAIN-2014-10,application/vnd.google-earth.kmz,37173,34908,0.0016\nCC-MAIN-2014-10,application/vnd.ms-excel,89447,83109,0.0039\nCC-MAIN-2014-10,application/vnd.ms-powerpoint,93014,83473,0.0040\nCC-MAIN-2014-10,application/vnd.ms-word,22468,20733,0.0010\nCC-MAIN-2014-10,application/vnd.oasis.opendocument.text,20
88,1885,0.0001\nCC-MAIN-2014-10,application/vnd.openxmlformats-officedocument.presentationml.presentation,3990,3380,0.0002\nCC-MAIN-2014-10,application/vnd.openxmlformats-officedocument.spreadsheetml.sheet,4407,3571,0.0002\nCC-MAIN-2014-10,application/vnd.openxmlformats-officedocument.wordprocessingml.document,25250,21542,0.0011\nCC-MAIN-2014-10,application/vnd.wap.xhtml+xml,54807,50965,0.0024\nCC-MAIN-2014-10,application/x-bibtex,30237,28720,0.0013\nCC-MAIN-2014-10,application/x-bittorrent,5893,5547,0.0003\nCC-MAIN-2014-10,application/x-debian-package,81973,77514,0.0036\nCC-MAIN-2014-10,application/x-download,14669,13922,0.0006\nCC-MAIN-2014-10,application/x-endnote-refer,37715,35830,0.0016\nCC-MAIN-2014-10,application/x-gzip,41940,39366,0.0018\nCC-MAIN-2014-10,application/x-httpd-php,6487,6034,0.0003\nCC-MAIN-2014-10,application/x-java-jnlp-file,9654,8389,0.0004\nCC-MAIN-2014-10,application/x-javascript,7762,7363,0.0003\nCC-MAIN-2014-10,application/x-json,72135,69526,0.0031\nCC-MAIN-2014-10,application/x-mobipocket-ebook,20410,18072,0.0009\nCC-MAIN-2014-10,application/x-msdownload,1984,1791,0.0001\nCC-MAIN-2014-10,application/x-netcdf,15711,14975,0.0007\nCC-MAIN-2014-10,application/x-research-info-systems,99609,94472,0.0043\nCC-MAIN-2014-10,application/x-shockwave-flash,61607,59084,0.0027\nCC-MAIN-2014-10,application/x-tar,5754,5412,0.0003\nCC-MAIN-2014-10,application/x-tex,17010,16002,0.0007\nCC-MAIN-2014-10,application/x-troff-man,27782,23914,0.0012\nCC-MAIN-2014-10,application/x-zip-compressed,14269,12804,0.0006\nCC-MAIN-2014-10,application/xhtml+xml,1588669,1453835,0.0690\nCC-MAIN-2014-10,application/xml,1771232,1654156,0.0770\nCC-MAIN-2014-10,application/zip,129575,121349,0.0056\nCC-MAIN-2014-10,audio/mpeg,104953,87283,0.0046\nCC-MAIN-2014-10,audio/x-mpegurl,26029,24685,0.0011\nCC-MAIN-2014-10,audio/x-scpls,73419,69404,0.0032\nCC-MAIN-2014-10,audio/x-wav,432329,412070,0.0188\nCC-MAIN-2014-10,binary/octet-stream,6326,5890,0.0003\nCC-MAIN-2014-10,image/gif,8129
61,771001,0.0353\nCC-MAIN-2014-10,image/jp2,53926,51098,0.0023\nCC-MAIN-2014-10,image/jpeg,12147867,11497259,0.5279\nCC-MAIN-2014-10,image/jpg,159030,149812,0.0069\nCC-MAIN-2014-10,image/pjpeg,55796,50153,0.0024\nCC-MAIN-2014-10,image/png,885026,831909,0.0385\nCC-MAIN-2014-10,image/svg+xml,1417,1335,0.0001\nCC-MAIN-2014-10,image/tiff,37514,35723,0.0016\nCC-MAIN-2014-10,image/vnd.djvu,18770,17733,0.0008\nCC-MAIN-2014-10,image/webp,66,63,0.0000\nCC-MAIN-2014-10,message/rfc822,20711,19314,0.0009\nCC-MAIN-2014-10,text/calendar,1757154,1634368,0.0764\nCC-MAIN-2014-10,text/css,693,645,0.0000\nCC-MAIN-2014-10,text/csv,118879,110767,0.0052\nCC-MAIN-2014-10,text/directory,5289,4661,0.0002\nCC-MAIN-2014-10,text/enriched,10277,9467,0.0004\nCC-MAIN-2014-10,text/html,2250799620,1985398996,97.8088\nCC-MAIN-2014-10,text/javascript,18033,17198,0.0008\nCC-MAIN-2014-10,text/pdf,29328,28331,0.0013\nCC-MAIN-2014-10,text/plain,3871322,3544651,0.1682\nCC-MAIN-2014-10,text/prs.lines.tag,68,65,0.0000\nCC-MAIN-2014-10,text/tab-separated-values,75971,69531,0.0033\nCC-MAIN-2014-10,text/turtle,1273,988,0.0001\nCC-MAIN-2014-10,text/vcard,2909,1834,0.0001\nCC-MAIN-2014-10,text/x-bibtex,23930,22560,0.0010\nCC-MAIN-2014-10,text/x-c,4891,4423,0.0002\nCC-MAIN-2014-10,text/x-csrc,4243,3973,0.0002\nCC-MAIN-2014-10,text/x-diff,22779,21196,0.0010\nCC-MAIN-2014-10,text/x-patch,93694,88224,0.0041\nCC-MAIN-2014-10,text/x-perl,38315,36235,0.0017\nCC-MAIN-2014-10,text/x-vcalendar,123715,114224,0.0054\nCC-MAIN-2014-10,text/x-vcard,54164,50198,0.0024\nCC-MAIN-2014-10,text/xml,9925574,9190807,0.4313\nCC-MAIN-2014-10,unknown/unknown,396443,320294,0.0172\nCC-MAIN-2014-10,video/mp4,4444,4159,0.0002\nCC-MAIN-2014-10,video/webm,8818,8217,0.0004\nCC-MAIN-2014-10,video/x-ms-asf,247921,234557,0.0108\nCC-MAIN-2014-15,<other>,3410056,2153653,0.1291\nCC-MAIN-2014-15,application/atom+xml,3335685,2105066,0.1263\nCC-MAIN-2014-15,application/calendar,9331,6483,0.0004\nCC-MAIN-2014-15,application/download,57639,40502,0.0022\nC
C-MAIN-2014-15,application/epub+zip,66114,38186,0.0025\nCC-MAIN-2014-15,application/force-download,45246,24444,0.0017\nCC-MAIN-2014-15,application/gpx+xml,248,157,0.0000\nCC-MAIN-2014-15,application/ics,3297,2248,0.0001\nCC-MAIN-2014-15,application/javascript,694,410,0.0000\nCC-MAIN-2014-15,application/json,346272,243047,0.0131\nCC-MAIN-2014-15,application/ld+json,8,5,0.0000\nCC-MAIN-2014-15,application/marc,9322,8646,0.0004\nCC-MAIN-2014-15,application/msword,165724,95470,0.0063\nCC-MAIN-2014-15,application/octet-stream,1226939,805576,0.0465\nCC-MAIN-2014-15,application/octetstream,25170,15200,0.0010\nCC-MAIN-2014-15,application/pdf,5561389,3195186,0.2105\nCC-MAIN-2014-15,application/pgp-encrypted,20210,16707,0.0008\nCC-MAIN-2014-15,application/pgp-signature,29840,18021,0.0011\nCC-MAIN-2014-15,application/postscript,8773,5616,0.0003\nCC-MAIN-2014-15,application/rdf+xml,74600,55488,0.0028\nCC-MAIN-2014-15,application/rss+xml,3917534,2624567,0.1483\nCC-MAIN-2014-15,application/rtf,4096,2914,0.0002\nCC-MAIN-2014-15,application/save-to-disk,43448,38623,0.0016\nCC-MAIN-2014-15,application/text,28165,18562,0.0011\nCC-MAIN-2014-15,application/unknown,13186,8152,0.0005\nCC-MAIN-2014-15,application/vnd.android.package-archive,2267,1441,0.0001\nCC-MAIN-2014-15,application/vnd.google-earth.kml+xml,171463,123296,0.0065\nCC-MAIN-2014-15,application/vnd.google-earth.kmz,56050,36139,0.0021\nCC-MAIN-2014-15,application/vnd.ms-excel,114006,76677,0.0043\nCC-MAIN-2014-15,application/vnd.ms-powerpoint,99859,71793,0.0038\nCC-MAIN-2014-15,application/vnd.ms-word,27634,19276,0.0010\nCC-MAIN-2014-15,application/vnd.oasis.opendocument.text,2931,1758,0.0001\nCC-MAIN-2014-15,application/vnd.openxmlformats-officedocument.presentationml.presentation,6271,3225,0.0002\nCC-MAIN-2014-15,application/vnd.openxmlformats-officedocument.spreadsheetml.sheet,6592,3118,0.0002\nCC-MAIN-2014-15,application/vnd.openxmlformats-officedocument.wordprocessingml.document,40808,21055,0.0015\nCC-MAIN-2014-15,applic
ation/vnd.wap.xhtml+xml,95163,51696,0.0036\nCC-MAIN-2014-15,application/x-bibtex,36263,26136,0.0014\nCC-MAIN-2014-15,application/x-bittorrent,12586,5657,0.0005\nCC-MAIN-2014-15,application/x-debian-package,131421,77057,0.0050\nCC-MAIN-2014-15,application/x-download,18962,11609,0.0007\nCC-MAIN-2014-15,application/x-endnote-refer,46990,35973,0.0018\nCC-MAIN-2014-15,application/x-gzip,39707,29358,0.0015\nCC-MAIN-2014-15,application/x-httpd-php,9252,5518,0.0004\nCC-MAIN-2014-15,application/x-java-jnlp-file,15282,8047,0.0006\nCC-MAIN-2014-15,application/x-javascript,2757,1855,0.0001\nCC-MAIN-2014-15,application/x-json,43265,39883,0.0016\nCC-MAIN-2014-15,application/x-mobipocket-ebook,20826,15067,0.0008\nCC-MAIN-2014-15,application/x-msdownload,3513,1832,0.0001\nCC-MAIN-2014-15,application/x-netcdf,5765,4310,0.0002\nCC-MAIN-2014-15,application/x-research-info-systems,72970,57476,0.0028\nCC-MAIN-2014-15,application/x-shockwave-flash,112137,57888,0.0042\nCC-MAIN-2014-15,application/x-tar,9116,5833,0.0003\nCC-MAIN-2014-15,application/x-tex,30862,18028,0.0012\nCC-MAIN-2014-15,application/x-troff-man,37908,24944,0.0014\nCC-MAIN-2014-15,application/x-zip-compressed,21817,12644,0.0008\nCC-MAIN-2014-15,application/xhtml+xml,1685823,1100133,0.0638\nCC-MAIN-2014-15,application/xml,1958185,1390637,0.0741\nCC-MAIN-2014-15,application/zip,175695,108015,0.0067\nCC-MAIN-2014-15,audio/mpeg,155498,85472,0.0059\nCC-MAIN-2014-15,audio/x-mpegurl,40797,28508,0.0015\nCC-MAIN-2014-15,audio/x-scpls,108057,68999,0.0041\nCC-MAIN-2014-15,audio/x-wav,549998,355908,0.0208\nCC-MAIN-2014-15,binary/octet-stream,10798,6046,0.0004\nCC-MAIN-2014-15,image/gif,943488,622540,0.0357\nCC-MAIN-2014-15,image/jp2,24552,21879,0.0009\nCC-MAIN-2014-15,image/jpeg,13879319,9095219,0.5255\nCC-MAIN-2014-15,image/jpg,242325,149025,0.0092\nCC-MAIN-2014-15,image/pjpeg,83501,49369,0.0032\nCC-MAIN-2014-15,image/png,1223821,773704,0.0463\nCC-MAIN-2014-15,image/svg+xml,1854,1213,0.0001\nCC-MAIN-2014-15,image/tiff,40925,31211,0.
0015\nCC-MAIN-2014-15,image/vnd.djvu,36857,18201,0.0014\nCC-MAIN-2014-15,image/webp,116,72,0.0000\nCC-MAIN-2014-15,message/rfc822,37025,19431,0.0014\nCC-MAIN-2014-15,text/calendar,1991744,1415839,0.0754\nCC-MAIN-2014-15,text/css,1049,593,0.0000\nCC-MAIN-2014-15,text/csv,95716,70865,0.0036\nCC-MAIN-2014-15,text/directory,8094,4599,0.0003\nCC-MAIN-2014-15,text/enriched,12658,9478,0.0005\nCC-MAIN-2014-15,text/html,2578854193,1678331216,97.6332\nCC-MAIN-2014-15,text/javascript,20948,15525,0.0008\nCC-MAIN-2014-15,text/pdf,15985,14779,0.0006\nCC-MAIN-2014-15,text/plain,5054040,3281336,0.1913\nCC-MAIN-2014-15,text/prs.lines.tag,108,69,0.0000\nCC-MAIN-2014-15,text/tab-separated-values,66889,48033,0.0025\nCC-MAIN-2014-15,text/turtle,572,428,0.0000\nCC-MAIN-2014-15,text/vcard,3717,1630,0.0001\nCC-MAIN-2014-15,text/x-bibtex,31473,22735,0.0012\nCC-MAIN-2014-15,text/x-c,7702,4517,0.0003\nCC-MAIN-2014-15,text/x-csrc,6582,4146,0.0002\nCC-MAIN-2014-15,text/x-diff,20870,14025,0.0008\nCC-MAIN-2014-15,text/x-patch,123586,94077,0.0047\nCC-MAIN-2014-15,text/x-perl,61600,34316,0.0023\nCC-MAIN-2014-15,text/x-vcalendar,152256,96923,0.0058\nCC-MAIN-2014-15,text/x-vcard,75536,47040,0.0029\nCC-MAIN-2014-15,text/xml,13404080,8509269,0.5075\nCC-MAIN-2014-15,unknown/unknown,205621,133011,0.0078\nCC-MAIN-2014-15,video/mp4,7899,4018,0.0003\nCC-MAIN-2014-15,video/webm,14602,8348,0.0006\nCC-MAIN-2014-15,video/x-ms-asf,237733,182847,0.0090\nCC-MAIN-2014-23,<other>,4765101,2991171,0.1320\nCC-MAIN-2014-23,application/atom+xml,3760881,2190052,0.1042\nCC-MAIN-2014-23,application/calendar,13986,8806,0.0004\nCC-MAIN-2014-23,application/download,100016,70989,0.0028\nCC-MAIN-2014-23,application/epub+zip,109845,64779,0.0030\nCC-MAIN-2014-23,application/force-download,43669,23129,0.0012\nCC-MAIN-2014-23,application/gpx+xml,407,222,0.0000\nCC-MAIN-2014-23,application/ics,5422,3196,0.0002\nCC-MAIN-2014-23,application/javascript,752,378,0.0000\nCC-MAIN-2014-23,application/json,685214,442907,0.0190\nCC-MAIN-2014-2
3,application/ld+json,8222,7954,0.0002\nCC-MAIN-2014-23,application/marc,33982,22093,0.0009\nCC-MAIN-2014-23,application/msword,184522,98997,0.0051\nCC-MAIN-2014-23,application/octet-stream,1452455,861465,0.0402\nCC-MAIN-2014-23,application/octetstream,30780,15683,0.0009\nCC-MAIN-2014-23,application/pdf,6272079,3434030,0.1738\nCC-MAIN-2014-23,application/pgp-encrypted,10075,6090,0.0003\nCC-MAIN-2014-23,application/pgp-signature,33399,19968,0.0009\nCC-MAIN-2014-23,application/postscript,11091,6522,0.0003\nCC-MAIN-2014-23,application/rdf+xml,119561,80500,0.0033\nCC-MAIN-2014-23,application/rss+xml,5383812,3276668,0.1492\nCC-MAIN-2014-23,application/rtf,2614,1366,0.0001\nCC-MAIN-2014-23,application/save-to-disk,56239,38726,0.0016\nCC-MAIN-2014-23,application/text,43163,26882,0.0012\nCC-MAIN-2014-23,application/unknown,16286,8941,0.0005\nCC-MAIN-2014-23,application/vnd.android.package-archive,2662,1457,0.0001\nCC-MAIN-2014-23,application/vnd.google-earth.kml+xml,287718,176166,0.0080\nCC-MAIN-2014-23,application/vnd.google-earth.kmz,60993,36527,0.0017\nCC-MAIN-2014-23,application/vnd.ms-excel,150193,91825,0.0042\nCC-MAIN-2014-23,application/vnd.ms-powerpoint,150205,97872,0.0042\nCC-MAIN-2014-23,application/vnd.ms-word,36574,23001,0.0010\nCC-MAIN-2014-23,application/vnd.oasis.opendocument.text,3287,1751,0.0001\nCC-MAIN-2014-23,application/vnd.openxmlformats-officedocument.presentationml.presentation,6460,3242,0.0002\nCC-MAIN-2014-23,application/vnd.openxmlformats-officedocument.spreadsheetml.sheet,6841,3411,0.0002\nCC-MAIN-2014-23,application/vnd.openxmlformats-officedocument.wordprocessingml.document,42302,21625,0.0012\nCC-MAIN-2014-23,application/vnd.wap.xhtml+xml,89126,51947,0.0025\nCC-MAIN-2014-23,application/x-bibtex,54787,34064,0.0015\nCC-MAIN-2014-23,application/x-bittorrent,11591,5982,0.0003\nCC-MAIN-2014-23,application/x-debian-package,98039,52439,0.0027\nCC-MAIN-2014-23,application/x-download,23025,12744,0.0006\nCC-MAIN-2014-23,application/x-endnote-refer,69776,
47724,0.0019\nCC-MAIN-2014-23,application/x-gzip,18346,10319,0.0005\nCC-MAIN-2014-23,application/x-httpd-php,173095,168203,0.0048\nCC-MAIN-2014-23,application/x-java-jnlp-file,25634,12588,0.0007\nCC-MAIN-2014-23,application/x-javascript,8485,6871,0.0002\nCC-MAIN-2014-23,application/x-json,111151,93375,0.0031\nCC-MAIN-2014-23,application/x-mobipocket-ebook,43570,30767,0.0012\nCC-MAIN-2014-23,application/x-msdownload,3442,1891,0.0001\nCC-MAIN-2014-23,application/x-netcdf,17874,11951,0.0005\nCC-MAIN-2014-23,application/x-research-info-systems,147675,108365,0.0041\nCC-MAIN-2014-23,application/x-shockwave-flash,64704,42959,0.0018\nCC-MAIN-2014-23,application/x-tar,9876,6201,0.0003\nCC-MAIN-2014-23,application/x-tex,31848,17679,0.0009\nCC-MAIN-2014-23,application/x-troff-man,45156,23716,0.0013\nCC-MAIN-2014-23,application/x-zip-compressed,21367,13117,0.0006\nCC-MAIN-2014-23,application/xhtml+xml,1980391,1297456,0.0549\nCC-MAIN-2014-23,application/xml,2682697,1690358,0.0743\nCC-MAIN-2014-23,application/zip,184432,105155,0.0051\nCC-MAIN-2014-23,audio/mpeg,141200,68097,0.0039\nCC-MAIN-2014-23,audio/x-mpegurl,68678,40036,0.0019\nCC-MAIN-2014-23,audio/x-scpls,118837,71771,0.0033\nCC-MAIN-2014-23,audio/x-wav,742914,438546,0.0206\nCC-MAIN-2014-23,binary/octet-stream,11605,6557,0.0003\nCC-MAIN-2014-23,image/gif,1291243,860635,0.0358\nCC-MAIN-2014-23,image/jp2,54737,39721,0.0015\nCC-MAIN-2014-23,image/jpeg,18204051,11360620,0.5044\nCC-MAIN-2014-23,image/jpg,257658,145637,0.0071\nCC-MAIN-2014-23,image/pjpeg,83248,46048,0.0023\nCC-MAIN-2014-23,image/png,1354931,786496,0.0375\nCC-MAIN-2014-23,image/svg+xml,2410,1346,0.0001\nCC-MAIN-2014-23,image/tiff,69157,49739,0.0019\nCC-MAIN-2014-23,image/vnd.djvu,84809,48677,0.0024\nCC-MAIN-2014-23,image/webp,88,49,0.0000\nCC-MAIN-2014-23,message/rfc822,37234,20036,0.0010\nCC-MAIN-2014-23,text/calendar,3072946,1832652,0.0852\nCC-MAIN-2014-23,text/css,1269,658,0.0000\nCC-MAIN-2014-23,text/csv,111818,74348,0.0031\nCC-MAIN-2014-23,text/directory,860
7,4848,0.0002\nCC-MAIN-2014-23,text/enriched,16234,11167,0.0004\nCC-MAIN-2014-23,text/html,3529062423,2068347457,97.7926\nCC-MAIN-2014-23,text/javascript,40238,30240,0.0011\nCC-MAIN-2014-23,text/pdf,10040,9979,0.0003\nCC-MAIN-2014-23,text/plain,6360140,3886191,0.1762\nCC-MAIN-2014-23,text/prs.lines.tag,140,77,0.0000\nCC-MAIN-2014-23,text/tab-separated-values,56762,35415,0.0016\nCC-MAIN-2014-23,text/turtle,10033,9034,0.0003\nCC-MAIN-2014-23,text/vcard,1672,955,0.0000\nCC-MAIN-2014-23,text/x-bibtex,37531,23011,0.0010\nCC-MAIN-2014-23,text/x-c,8883,4908,0.0002\nCC-MAIN-2014-23,text/x-csrc,5973,3545,0.0002\nCC-MAIN-2014-23,text/x-diff,16113,9285,0.0004\nCC-MAIN-2014-23,text/x-patch,158254,96260,0.0044\nCC-MAIN-2014-23,text/x-perl,58593,35395,0.0016\nCC-MAIN-2014-23,text/x-vcalendar,144656,80408,0.0040\nCC-MAIN-2014-23,text/x-vcard,88064,49568,0.0024\nCC-MAIN-2014-23,text/xml,16236686,9508904,0.4499\nCC-MAIN-2014-23,unknown/unknown,360537,203218,0.0100\nCC-MAIN-2014-23,video/mp4,7598,4401,0.0002\nCC-MAIN-2014-23,video/webm,14245,7578,0.0004\nCC-MAIN-2014-23,video/x-ms-asf,501726,382478,0.0139\nCC-MAIN-2014-35,<other>,4499417,3004778,0.1567\nCC-MAIN-2014-35,application/atom+xml,3293966,2070045,0.1147\nCC-MAIN-2014-35,application/calendar,12630,8242,0.0004\nCC-MAIN-2014-35,application/download,76778,57041,0.0027\nCC-MAIN-2014-35,application/epub+zip,81076,50473,0.0028\nCC-MAIN-2014-35,application/force-download,37820,22263,0.0013\nCC-MAIN-2014-35,application/gpx+xml,365,233,0.0000\nCC-MAIN-2014-35,application/ics,5059,3109,0.0002\nCC-MAIN-2014-35,application/javascript,653,356,0.0000\nCC-MAIN-2014-35,application/json,534425,368747,0.0186\nCC-MAIN-2014-35,application/ld+json,6834,6654,0.0002\nCC-MAIN-2014-35,application/marc,18740,16791,0.0007\nCC-MAIN-2014-35,application/msword,155639,93092,0.0054\nCC-MAIN-2014-35,application/octet-stream,1246095,824072,0.0434\nCC-MAIN-2014-35,application/octetstream,25869,15267,0.0009\nCC-MAIN-2014-35,application/pdf,5434404,3200291,0.189
3\nCC-MAIN-2014-35,application/pgp-encrypted,8352,5551,0.0003\nCC-MAIN-2014-35,application/pgp-signature,28826,18286,0.0010\nCC-MAIN-2014-35,application/postscript,9750,6451,0.0003\nCC-MAIN-2014-35,application/rdf+xml,105136,79957,0.0037\nCC-MAIN-2014-35,application/rss+xml,4274663,2829496,0.1489\nCC-MAIN-2014-35,application/rtf,2316,1356,0.0001\nCC-MAIN-2014-35,application/save-to-disk,54600,38826,0.0019\nCC-MAIN-2014-35,application/text,36236,23353,0.0013\nCC-MAIN-2014-35,application/unknown,14849,8649,0.0005\nCC-MAIN-2014-35,application/vnd.android.package-archive,2302,1405,0.0001\nCC-MAIN-2014-35,application/vnd.google-earth.kml+xml,235817,165950,0.0082\nCC-MAIN-2014-35,application/vnd.google-earth.kmz,58830,35434,0.0020\nCC-MAIN-2014-35,application/vnd.ms-excel,129975,87002,0.0045\nCC-MAIN-2014-35,application/vnd.ms-powerpoint,120212,89376,0.0042\nCC-MAIN-2014-35,application/vnd.ms-word,31769,20406,0.0011\nCC-MAIN-2014-35,application/vnd.oasis.opendocument.text,2904,1674,0.0001\nCC-MAIN-2014-35,application/vnd.openxmlformats-officedocument.presentationml.presentation,5729,3084,0.0002\nCC-MAIN-2014-35,application/vnd.openxmlformats-officedocument.spreadsheetml.sheet,5704,3028,0.0002\nCC-MAIN-2014-35,application/vnd.openxmlformats-officedocument.wordprocessingml.document,37579,20633,0.0013\nCC-MAIN-2014-35,application/vnd.wap.xhtml+xml,78909,48612,0.0027\nCC-MAIN-2014-35,application/x-bibtex,46341,32240,0.0016\nCC-MAIN-2014-35,application/x-bittorrent,6639,5223,0.0002\nCC-MAIN-2014-35,application/x-debian-package,85670,50590,0.0030\nCC-MAIN-2014-35,application/x-download,20266,12540,0.0007\nCC-MAIN-2014-35,application/x-endnote-refer,50859,38372,0.0018\nCC-MAIN-2014-35,application/x-gzip,65060,38399,0.0023\nCC-MAIN-2014-35,application/x-httpd-php,12504,7092,0.0004\nCC-MAIN-2014-35,application/x-java-jnlp-file,22189,12323,0.0008\nCC-MAIN-2014-35,application/x-javascript,5547,4752,0.0002\nCC-MAIN-2014-35,application/x-json,60278,57312,0.0021\nCC-MAIN-2014-35,applic
ation/x-mobipocket-ebook,29244,21456,0.0010\nCC-MAIN-2014-35,application/x-msdownload,3113,1850,0.0001\nCC-MAIN-2014-35,application/x-netcdf,22309,17127,0.0008\nCC-MAIN-2014-35,application/x-research-info-systems,98888,82453,0.0034\nCC-MAIN-2014-35,application/x-shockwave-flash,24423,18943,0.0009\nCC-MAIN-2014-35,application/x-tar,8878,5878,0.0003\nCC-MAIN-2014-35,application/x-tex,27531,17302,0.0010\nCC-MAIN-2014-35,application/x-troff-man,34815,21914,0.0012\nCC-MAIN-2014-35,application/x-zip-compressed,18695,12527,0.0007\nCC-MAIN-2014-35,application/xhtml+xml,1408480,991530,0.0491\nCC-MAIN-2014-35,application/xml,2097943,1471549,0.0731\nCC-MAIN-2014-35,application/zip,146153,96105,0.0051\nCC-MAIN-2014-35,audio/mpeg,126250,67331,0.0044\nCC-MAIN-2014-35,audio/x-mpegurl,55557,37572,0.0019\nCC-MAIN-2014-35,audio/x-scpls,117088,70164,0.0041\nCC-MAIN-2014-35,audio/x-wav,635617,417943,0.0221\nCC-MAIN-2014-35,binary/octet-stream,10351,6040,0.0004\nCC-MAIN-2014-35,image/gif,1116133,785917,0.0389\nCC-MAIN-2014-35,image/jp2,37479,33260,0.0013\nCC-MAIN-2014-35,image/jpeg,16433557,11106850,0.5725\nCC-MAIN-2014-35,image/jpg,229372,140505,0.0080\nCC-MAIN-2014-35,image/pjpeg,66803,38506,0.0023\nCC-MAIN-2014-35,image/png,1190157,741412,0.0415\nCC-MAIN-2014-35,image/svg+xml,2120,1297,0.0001\nCC-MAIN-2014-35,image/tiff,53592,40919,0.0019\nCC-MAIN-2014-35,image/vnd.djvu,78856,47099,0.0027\nCC-MAIN-2014-35,image/webp,82,48,0.0000\nCC-MAIN-2014-35,message/rfc822,32758,19316,0.0011\nCC-MAIN-2014-35,text/calendar,2250679,1565332,0.0784\nCC-MAIN-2014-35,text/css,1037,615,0.0000\nCC-MAIN-2014-35,text/csv,83478,61045,0.0029\nCC-MAIN-2014-35,text/directory,8308,4699,0.0003\nCC-MAIN-2014-35,text/enriched,12668,10145,0.0004\nCC-MAIN-2014-35,text/html,2802737236,1833191386,97.6328\nCC-MAIN-2014-35,text/javascript,31365,25661,0.0011\nCC-MAIN-2014-35,text/pdf,129,73,0.0000\nCC-MAIN-2014-35,text/plain,5195005,3405543,0.1810\nCC-MAIN-2014-35,text/prs.lines.tag,128,74,0.0000\nCC-MAIN-2014-35,text/ta
b-separated-values,46414,31764,0.0016\nCC-MAIN-2014-35,text/turtle,8308,7745,0.0003\nCC-MAIN-2014-35,text/vcard,1525,914,0.0001\nCC-MAIN-2014-35,text/x-bibtex,36852,22381,0.0013\nCC-MAIN-2014-35,text/x-c,8099,4790,0.0003\nCC-MAIN-2014-35,text/x-csrc,5225,3433,0.0002\nCC-MAIN-2014-35,text/x-diff,14387,8398,0.0005\nCC-MAIN-2014-35,text/x-patch,133928,91643,0.0047\nCC-MAIN-2014-35,text/x-perl,40811,26648,0.0014\nCC-MAIN-2014-35,text/x-vcalendar,127566,78241,0.0044\nCC-MAIN-2014-35,text/x-vcard,78186,46565,0.0027\nCC-MAIN-2014-35,text/xml,14147028,8941218,0.4928\nCC-MAIN-2014-35,unknown/unknown,269707,179823,0.0094\nCC-MAIN-2014-35,video/mp4,7195,4265,0.0003\nCC-MAIN-2014-35,video/webm,12816,7441,0.0004\nCC-MAIN-2014-35,video/x-ms-asf,278518,225398,0.0097\nCC-MAIN-2014-41,<other>,4214446,3034506,0.1414\nCC-MAIN-2014-41,application/atom+xml,3232057,2171954,0.1085\nCC-MAIN-2014-41,application/calendar,13231,8765,0.0004\nCC-MAIN-2014-41,application/download,77729,60257,0.0026\nCC-MAIN-2014-41,application/epub+zip,84510,61881,0.0028\nCC-MAIN-2014-41,application/force-download,36903,23260,0.0012\nCC-MAIN-2014-41,application/gpx+xml,384,261,0.0000\nCC-MAIN-2014-41,application/ics,5527,3539,0.0002\nCC-MAIN-2014-41,application/javascript,645,380,0.0000\nCC-MAIN-2014-41,application/json,591509,414454,0.0199\nCC-MAIN-2014-41,application/ld+json,11701,11141,0.0004\nCC-MAIN-2014-41,application/marc,21884,18813,0.0007\nCC-MAIN-2014-41,application/msword,158269,99955,0.0053\nCC-MAIN-2014-41,application/octet-stream,1268695,872172,0.0426\nCC-MAIN-2014-41,application/octetstream,24796,15883,0.0008\nCC-MAIN-2014-41,application/pdf,5466329,3426220,0.1834\nCC-MAIN-2014-41,application/pgp-encrypted,8514,5847,0.0003\nCC-MAIN-2014-41,application/pgp-signature,29287,19569,0.0010\nCC-MAIN-2014-41,application/postscript,10134,6926,0.0003\nCC-MAIN-2014-41,application/rdf+xml,118480,88880,0.0040\nCC-MAIN-2014-41,application/rss+xml,4431144,3002734,0.1487\nCC-MAIN-2014-41,application/rtf,2266,1448
,0.0001\nCC-MAIN-2014-41,application/save-to-disk,63286,41456,0.0021\nCC-MAIN-2014-41,application/text,31060,23360,0.0010\nCC-MAIN-2014-41,application/unknown,13730,8636,0.0005\nCC-MAIN-2014-41,application/vnd.android.package-archive,2258,1516,0.0001\nCC-MAIN-2014-41,application/vnd.google-earth.kml+xml,241006,172444,0.0081\nCC-MAIN-2014-41,application/vnd.google-earth.kmz,57543,37423,0.0019\nCC-MAIN-2014-41,application/vnd.ms-excel,131628,90999,0.0044\nCC-MAIN-2014-41,application/vnd.ms-powerpoint,134107,97467,0.0045\nCC-MAIN-2014-41,application/vnd.ms-word,32698,22107,0.0011\nCC-MAIN-2014-41,application/vnd.oasis.opendocument.text,2975,1894,0.0001\nCC-MAIN-2014-41,application/vnd.openxmlformats-officedocument.presentationml.presentation,5789,3404,0.0002\nCC-MAIN-2014-41,application/vnd.openxmlformats-officedocument.spreadsheetml.sheet,6007,3432,0.0002\nCC-MAIN-2014-41,application/vnd.openxmlformats-officedocument.wordprocessingml.document,38179,22557,0.0013\nCC-MAIN-2014-41,application/vnd.wap.xhtml+xml,71119,45841,0.0024\nCC-MAIN-2014-41,application/x-bibtex,56845,38148,0.0019\nCC-MAIN-2014-41,application/x-bittorrent,8492,5689,0.0003\nCC-MAIN-2014-41,application/x-debian-package,81988,53304,0.0028\nCC-MAIN-2014-41,application/x-download,19295,12930,0.0006\nCC-MAIN-2014-41,application/x-endnote-refer,59992,44007,0.0020\nCC-MAIN-2014-41,application/x-gzip,61656,39595,0.0021\nCC-MAIN-2014-41,application/x-httpd-php,10314,6735,0.0003\nCC-MAIN-2014-41,application/x-java-jnlp-file,21594,13459,0.0007\nCC-MAIN-2014-41,application/x-javascript,5615,4921,0.0002\nCC-MAIN-2014-41,application/x-json,36941,36214,0.0012\nCC-MAIN-2014-41,application/x-mobipocket-ebook,37131,28711,0.0012\nCC-MAIN-2014-41,application/x-msdownload,3093,1963,0.0001\nCC-MAIN-2014-41,application/x-netcdf,24244,18541,0.0008\nCC-MAIN-2014-41,application/x-research-info-systems,104284,85973,0.0035\nCC-MAIN-2014-41,application/x-shockwave-flash,62070,46494,0.0021\nCC-MAIN-2014-41,application/x-tar,8906,6
187,0.0003\nCC-MAIN-2014-41,application/x-tex,26371,17892,0.0009\nCC-MAIN-2014-41,application/x-troff-man,47241,26001,0.0016\nCC-MAIN-2014-41,application/x-zip-compressed,19444,13102,0.0007\nCC-MAIN-2014-41,application/xhtml+xml,1514890,1030740,0.0508\nCC-MAIN-2014-41,application/xml,2176637,1544597,0.0730\nCC-MAIN-2014-41,application/zip,164762,111427,0.0055\nCC-MAIN-2014-41,audio/mpeg,128984,70400,0.0043\nCC-MAIN-2014-41,audio/x-mpegurl,61242,41299,0.0021\nCC-MAIN-2014-41,audio/x-scpls,111133,71845,0.0037\nCC-MAIN-2014-41,audio/x-wav,632576,434536,0.0212\nCC-MAIN-2014-41,binary/octet-stream,9883,6333,0.0003\nCC-MAIN-2014-41,image/gif,1121785,828361,0.0376\nCC-MAIN-2014-41,image/jp2,53374,45218,0.0018\nCC-MAIN-2014-41,image/jpeg,16861809,11765490,0.5659\nCC-MAIN-2014-41,image/jpg,225535,147455,0.0076\nCC-MAIN-2014-41,image/pjpeg,64106,40103,0.0022\nCC-MAIN-2014-41,image/png,1147733,766427,0.0385\nCC-MAIN-2014-41,image/svg+xml,2027,1350,0.0001\nCC-MAIN-2014-41,image/tiff,58472,45331,0.0020\nCC-MAIN-2014-41,image/vnd.djvu,78995,51560,0.0027\nCC-MAIN-2014-41,image/webp,73,51,0.0000\nCC-MAIN-2014-41,message/rfc822,30495,19712,0.0010\nCC-MAIN-2014-41,text/calendar,2838174,1930665,0.0952\nCC-MAIN-2014-41,text/css,1002,677,0.0000\nCC-MAIN-2014-41,text/csv,90479,67182,0.0030\nCC-MAIN-2014-41,text/directory,8979,5257,0.0003\nCC-MAIN-2014-41,text/enriched,14851,11331,0.0005\nCC-MAIN-2014-41,text/html,2910392456,1933315429,97.6726\nCC-MAIN-2014-41,text/javascript,46001,39246,0.0015\nCC-MAIN-2014-41,text/pdf,117,73,0.0000\nCC-MAIN-2014-41,text/plain,5281349,3601243,0.1772\nCC-MAIN-2014-41,text/prs.lines.tag,111,75,0.0000\nCC-MAIN-2014-41,text/tab-separated-values,49078,33706,0.0016\nCC-MAIN-2014-41,text/turtle,13034,11992,0.0004\nCC-MAIN-2014-41,text/vcard,1937,1220,0.0001\nCC-MAIN-2014-41,text/x-bibtex,36274,23289,0.0012\nCC-MAIN-2014-41,text/x-c,7785,5074,0.0003\nCC-MAIN-2014-41,text/x-csrc,5096,3481,0.0002\nCC-MAIN-2014-41,text/x-diff,13643,8669,0.0005\nCC-MAIN-2014-41,text
/x-patch,146193,97113,0.0049\nCC-MAIN-2014-41,text/x-perl,32870,21491,0.0011\nCC-MAIN-2014-41,text/x-vcalendar,127908,81860,0.0043\nCC-MAIN-2014-41,text/x-vcard,75357,49769,0.0025\nCC-MAIN-2014-41,text/xml,14063695,9337103,0.4720\nCC-MAIN-2014-41,unknown/unknown,320947,206636,0.0108\nCC-MAIN-2014-41,video/mp4,7196,4638,0.0002\nCC-MAIN-2014-41,video/webm,13308,8534,0.0004\nCC-MAIN-2014-41,video/x-ms-asf,375851,311610,0.0126\nCC-MAIN-2014-42,<other>,5294339,2143699,0.1422\nCC-MAIN-2014-42,application/atom+xml,5412175,1983515,0.1454\nCC-MAIN-2014-42,application/calendar,19044,7954,0.0005\nCC-MAIN-2014-42,application/download,106249,51784,0.0029\nCC-MAIN-2014-42,application/epub+zip,113658,44503,0.0031\nCC-MAIN-2014-42,application/force-download,66031,22396,0.0018\nCC-MAIN-2014-42,application/gpx+xml,731,260,0.0000\nCC-MAIN-2014-42,application/ics,9208,3464,0.0002\nCC-MAIN-2014-42,application/javascript,1099,355,0.0000\nCC-MAIN-2014-42,application/json,723032,344951,0.0194\nCC-MAIN-2014-42,application/ld+json,6921,6428,0.0002\nCC-MAIN-2014-42,application/marc,10728,9336,0.0003\nCC-MAIN-2014-42,application/msword,256046,87448,0.0069\nCC-MAIN-2014-42,application/octet-stream,1825470,813749,0.0490\nCC-MAIN-2014-42,application/octetstream,49612,15874,0.0013\nCC-MAIN-2014-42,application/pdf,9010631,3185272,0.2421\nCC-MAIN-2014-42,application/pgp-encrypted,12299,5019,0.0003\nCC-MAIN-2014-42,application/pgp-signature,50196,19175,0.0013\nCC-MAIN-2014-42,application/postscript,15315,5726,0.0004\nCC-MAIN-2014-42,application/rdf+xml,131970,69921,0.0035\nCC-MAIN-2014-42,application/rss+xml,5470520,2410358,0.1470\nCC-MAIN-2014-42,application/rtf,4333,1440,0.0001\nCC-MAIN-2014-42,application/save-to-disk,71781,40144,0.0019\nCC-MAIN-2014-42,application/text,38943,17155,0.0010\nCC-MAIN-2014-42,application/unknown,24557,8495,0.0007\nCC-MAIN-2014-42,application/vnd.android.package-archive,4544,1661,0.0001\nCC-MAIN-2014-42,application/vnd.google-earth.kml+xml,305893,137240,0.0082\nCC-MAIN
-2014-42,application/vnd.google-earth.kmz,96075,36897,0.0026\nCC-MAIN-2014-42,application/vnd.ms-excel,192106,85106,0.0052\nCC-MAIN-2014-42,application/vnd.ms-powerpoint,94529,59069,0.0025\nCC-MAIN-2014-42,application/vnd.ms-word,52294,20045,0.0014\nCC-MAIN-2014-42,application/vnd.oasis.opendocument.text,5463,1855,0.0001\nCC-MAIN-2014-42,application/vnd.openxmlformats-officedocument.presentationml.presentation,10601,3245,0.0003\nCC-MAIN-2014-42,application/vnd.openxmlformats-officedocument.spreadsheetml.sheet,10771,3261,0.0003\nCC-MAIN-2014-42,application/vnd.openxmlformats-officedocument.wordprocessingml.document,69088,21683,0.0019\nCC-MAIN-2014-42,application/vnd.wap.xhtml+xml,141357,45995,0.0038\nCC-MAIN-2014-42,application/x-bibtex,76901,32445,0.0021\nCC-MAIN-2014-42,application/x-bittorrent,17759,5790,0.0005\nCC-MAIN-2014-42,application/x-debian-package,168679,53930,0.0045\nCC-MAIN-2014-42,application/x-download,37891,13675,0.0010\nCC-MAIN-2014-42,application/x-endnote-refer,61866,32915,0.0017\nCC-MAIN-2014-42,application/x-gzip,101746,39344,0.0027\nCC-MAIN-2014-42,application/x-httpd-php,19194,6909,0.0005\nCC-MAIN-2014-42,application/x-java-jnlp-file,40163,12514,0.0011\nCC-MAIN-2014-42,application/x-javascript,7452,5109,0.0002\nCC-MAIN-2014-42,application/x-json,31471,29926,0.0008\nCC-MAIN-2014-42,application/x-mobipocket-ebook,30816,16032,0.0008\nCC-MAIN-2014-42,application/x-msdownload,4556,1581,0.0001\nCC-MAIN-2014-42,application/x-netcdf,29664,15352,0.0008\nCC-MAIN-2014-42,application/x-research-info-systems,108265,62830,0.0029\nCC-MAIN-2014-42,application/x-shockwave-flash,55379,32678,0.0015\nCC-MAIN-2014-42,application/x-tar,15898,6892,0.0004\nCC-MAIN-2014-42,application/x-tex,50110,18778,0.0013\nCC-MAIN-2014-42,application/x-troff-man,63125,28562,0.0017\nCC-MAIN-2014-42,application/x-zip-compressed,30225,13400,0.0008\nCC-MAIN-2014-42,application/xhtml+xml,2046045,999956,0.0550\nCC-MAIN-2014-42,application/xml,2653286,1227930,0.0713\nCC-MAIN-2014-42,appl
ication/zip,261842,104036,0.0070\nCC-MAIN-2014-42,audio/mpeg,198264,64770,0.0053\nCC-MAIN-2014-42,audio/x-mpegurl,88275,35962,0.0024\nCC-MAIN-2014-42,audio/x-scpls,211343,71828,0.0057\nCC-MAIN-2014-42,audio/x-wav,977943,368879,0.0263\nCC-MAIN-2014-42,binary/octet-stream,19498,6301,0.0005\nCC-MAIN-2014-42,image/gif,1412105,587236,0.0379\nCC-MAIN-2014-42,image/jp2,31416,25234,0.0008\nCC-MAIN-2014-42,image/jpeg,22155091,8723037,0.5952\nCC-MAIN-2014-42,image/jpg,379767,137801,0.0102\nCC-MAIN-2014-42,image/pjpeg,114300,38545,0.0031\nCC-MAIN-2014-42,image/png,3959738,2481047,0.1064\nCC-MAIN-2014-42,image/svg+xml,3842,1297,0.0001\nCC-MAIN-2014-42,image/tiff,63129,33200,0.0017\nCC-MAIN-2014-42,image/vnd.djvu,124614,50289,0.0033\nCC-MAIN-2014-42,image/webp,126,41,0.0000\nCC-MAIN-2014-42,message/rfc822,60166,19590,0.0016\nCC-MAIN-2014-42,text/calendar,3427213,1573174,0.0921\nCC-MAIN-2014-42,text/css,2102,710,0.0001\nCC-MAIN-2014-42,text/csv,108135,52546,0.0029\nCC-MAIN-2014-42,text/directory,17792,5936,0.0005\nCC-MAIN-2014-42,text/enriched,12118,7319,0.0003\nCC-MAIN-2014-42,text/html,3622771534,1561159392,97.3306\nCC-MAIN-2014-42,text/javascript,25397,16119,0.0007\nCC-MAIN-2014-42,text/pdf,232,75,0.0000\nCC-MAIN-2014-42,text/plain,7457484,3097704,0.2004\nCC-MAIN-2014-42,text/prs.lines.tag,220,73,0.0000\nCC-MAIN-2014-42,text/tab-separated-values,63691,28500,0.0017\nCC-MAIN-2014-42,text/turtle,8316,7164,0.0002\nCC-MAIN-2014-42,text/vcard,2464,1021,0.0001\nCC-MAIN-2014-42,text/x-bibtex,64743,23246,0.0017\nCC-MAIN-2014-42,text/x-c,14262,4977,0.0004\nCC-MAIN-2014-42,text/x-csrc,8256,3287,0.0002\nCC-MAIN-2014-42,text/x-diff,23863,8262,0.0006\nCC-MAIN-2014-42,text/x-patch,155683,77865,0.0042\nCC-MAIN-2014-42,text/x-perl,67504,21537,0.0018\nCC-MAIN-2014-42,text/x-vcalendar,184868,71604,0.0050\nCC-MAIN-2014-42,text/x-vcard,120871,45420,0.0032\nCC-MAIN-2014-42,text/xml,21446092,8460067,0.5762\nCC-MAIN-2014-42,unknown/unknown,359094,193260,0.0096\nCC-MAIN-2014-42,video/mp4,13887,4567,0.
0004\nCC-MAIN-2014-42,video/webm,27069,8816,0.0007\nCC-MAIN-2014-42,video/x-ms-asf,329229,182489,0.0088\nCC-MAIN-2014-49,<other>,2734412,1855078,0.1403\nCC-MAIN-2014-49,application/atom+xml,2533569,1718743,0.1300\nCC-MAIN-2014-49,application/calendar,10284,6968,0.0005\nCC-MAIN-2014-49,application/download,56670,42063,0.0029\nCC-MAIN-2014-49,application/epub+zip,57529,37763,0.0030\nCC-MAIN-2014-49,application/force-download,30235,19390,0.0016\nCC-MAIN-2014-49,application/gpx+xml,351,232,0.0000\nCC-MAIN-2014-49,application/ics,4606,3091,0.0002\nCC-MAIN-2014-49,application/javascript,547,332,0.0000\nCC-MAIN-2014-49,application/json,391504,277409,0.0201\nCC-MAIN-2014-49,application/ld+json,4566,4431,0.0002\nCC-MAIN-2014-49,application/marc,8239,7531,0.0004\nCC-MAIN-2014-49,application/msword,119943,75623,0.0062\nCC-MAIN-2014-49,application/octet-stream,924691,650656,0.0475\nCC-MAIN-2014-49,application/octetstream,22370,14380,0.0011\nCC-MAIN-2014-49,application/pdf,4290813,2745567,0.2202\nCC-MAIN-2014-49,application/pgp-encrypted,6565,4474,0.0003\nCC-MAIN-2014-49,application/pgp-signature,24438,16476,0.0013\nCC-MAIN-2014-49,application/postscript,7191,4857,0.0004\nCC-MAIN-2014-49,application/rdf+xml,68792,51543,0.0035\nCC-MAIN-2014-49,application/rss+xml,2977792,2044454,0.1528\nCC-MAIN-2014-49,application/rtf,1510,1008,0.0001\nCC-MAIN-2014-49,application/save-to-disk,44725,33082,0.0023\nCC-MAIN-2014-49,application/text,20679,14976,0.0011\nCC-MAIN-2014-49,application/unknown,11584,7480,0.0006\nCC-MAIN-2014-49,application/vnd.android.package-archive,1991,1350,0.0001\nCC-MAIN-2014-49,application/vnd.google-earth.kml+xml,165031,117926,0.0085\nCC-MAIN-2014-49,application/vnd.google-earth.kmz,48389,32232,0.0025\nCC-MAIN-2014-49,application/vnd.ms-excel,101570,70965,0.0052\nCC-MAIN-2014-49,application/vnd.ms-powerpoint,40182,31778,0.0021\nCC-MAIN-2014-49,application/vnd.ms-word,26652,17770,0.0014\nCC-MAIN-2014-49,application/vnd.oasis.opendocument.text,2683,1687,0.0001\nCC-MAIN
-2014-49,application/vnd.openxmlformats-officedocument.presentationml.presentation,4757,2853,0.0002\nCC-MAIN-2014-49,application/vnd.openxmlformats-officedocument.spreadsheetml.sheet,4869,2807,0.0002\nCC-MAIN-2014-49,application/vnd.openxmlformats-officedocument.wordprocessingml.document,31751,19202,0.0016\nCC-MAIN-2014-49,application/vnd.wap.xhtml+xml,63614,41126,0.0033\nCC-MAIN-2014-49,application/x-bibtex,41207,28197,0.0021\nCC-MAIN-2014-49,application/x-bittorrent,6560,4586,0.0003\nCC-MAIN-2014-49,application/x-debian-package,73457,47902,0.0038\nCC-MAIN-2014-49,application/x-download,17431,11852,0.0009\nCC-MAIN-2014-49,application/x-endnote-refer,37716,28390,0.0019\nCC-MAIN-2014-49,application/x-gzip,53418,34609,0.0027\nCC-MAIN-2014-49,application/x-httpd-php,8447,5495,0.0004\nCC-MAIN-2014-49,application/x-java-jnlp-file,18124,11185,0.0009\nCC-MAIN-2014-49,application/x-javascript,5416,4641,0.0003\nCC-MAIN-2014-49,application/x-json,22742,21967,0.0012\nCC-MAIN-2014-49,application/x-mobipocket-ebook,18048,13594,0.0009\nCC-MAIN-2014-49,application/x-msdownload,2098,1360,0.0001\nCC-MAIN-2014-49,application/x-netcdf,19658,14683,0.0010\nCC-MAIN-2014-49,application/x-research-info-systems,58705,46828,0.0030\nCC-MAIN-2014-49,application/x-shockwave-flash,22694,18332,0.0012\nCC-MAIN-2014-49,application/x-tar,6336,4494,0.0003\nCC-MAIN-2014-49,application/x-tex,23464,15833,0.0012\nCC-MAIN-2014-49,application/x-troff-man,36873,24213,0.0019\nCC-MAIN-2014-49,application/x-zip-compressed,16654,11120,0.0009\nCC-MAIN-2014-49,application/xhtml+xml,1120239,807437,0.0575\nCC-MAIN-2014-49,application/xml,1424832,1024128,0.0731\nCC-MAIN-2014-49,application/zip,132955,89546,0.0068\nCC-MAIN-2014-49,audio/mpeg,98467,57436,0.0051\nCC-MAIN-2014-49,audio/x-mpegurl,45014,31495,0.0023\nCC-MAIN-2014-49,audio/x-scpls,94743,63016,0.0049\nCC-MAIN-2014-49,audio/x-wav,465723,320900,0.0239\nCC-MAIN-2014-49,binary/octet-stream,8569,5540,0.0004\nCC-MAIN-2014-49,image/gif,720028,508823,0.0370\nCC-MAI
N-2014-49,image/jp2,18847,16960,0.0010\nCC-MAIN-2014-49,image/jpeg,11130461,7585359,0.5712\nCC-MAIN-2014-49,image/jpg,182283,122486,0.0094\nCC-MAIN-2014-49,image/pjpeg,53310,33980,0.0027\nCC-MAIN-2014-49,image/png,2167992,1772199,0.1113\nCC-MAIN-2014-49,image/svg+xml,1678,1117,0.0001\nCC-MAIN-2014-49,image/tiff,37165,27689,0.0019\nCC-MAIN-2014-49,image/vnd.djvu,68747,45209,0.0035\nCC-MAIN-2014-49,image/webp,60,41,0.0000\nCC-MAIN-2014-49,message/rfc822,26450,17208,0.0014\nCC-MAIN-2014-49,text/calendar,1841184,1308709,0.0945\nCC-MAIN-2014-49,text/css,947,628,0.0000\nCC-MAIN-2014-49,text/csv,61071,44149,0.0031\nCC-MAIN-2014-49,text/directory,8507,5305,0.0004\nCC-MAIN-2014-49,text/enriched,7721,6075,0.0004\nCC-MAIN-2014-49,text/html,1898524211,1287495053,97.4346\nCC-MAIN-2014-49,text/javascript,16992,14334,0.0009\nCC-MAIN-2014-49,text/pdf,97,67,0.0000\nCC-MAIN-2014-49,text/plain,3849121,2655017,0.1975\nCC-MAIN-2014-49,text/prs.lines.tag,103,68,0.0000\nCC-MAIN-2014-49,text/tab-separated-values,36971,26024,0.0019\nCC-MAIN-2014-49,text/turtle,5663,5285,0.0003\nCC-MAIN-2014-49,text/vcard,1286,854,0.0001\nCC-MAIN-2014-49,text/x-bibtex,31535,20640,0.0016\nCC-MAIN-2014-49,text/x-c,5856,3896,0.0003\nCC-MAIN-2014-49,text/x-csrc,3985,2780,0.0002\nCC-MAIN-2014-49,text/x-diff,11496,7432,0.0006\nCC-MAIN-2014-49,text/x-patch,89027,65360,0.0046\nCC-MAIN-2014-49,text/x-perl,30653,19559,0.0016\nCC-MAIN-2014-49,text/x-vcalendar,96555,63093,0.0050\nCC-MAIN-2014-49,text/x-vcard,58621,39061,0.0030\nCC-MAIN-2014-49,text/xml,10286054,6936751,0.5279\nCC-MAIN-2014-49,unknown/unknown,230997,160878,0.0119\nCC-MAIN-2014-49,video/mp4,6148,4007,0.0003\nCC-MAIN-2014-49,video/webm,11858,7658,0.0006\nCC-MAIN-2014-49,video/x-ms-asf,162069,126137,0.0083\nCC-MAIN-2014-52,<other>,2566086,2449767,0.1230\nCC-MAIN-2014-52,application/atom+xml,2167647,2148479,0.1039\nCC-MAIN-2014-52,application/calendar,8195,7848,0.0004\nCC-MAIN-2014-52,application/download,66356,64676,0.0032\nCC-MAIN-2014-52,application/epub+
zip,72755,64678,0.0035\nCC-MAIN-2014-52,application/force-download,24819,23442,0.0012\nCC-MAIN-2014-52,application/gpx+xml,273,272,0.0000\nCC-MAIN-2014-52,application/ics,3559,3538,0.0002\nCC-MAIN-2014-52,application/javascript,416,369,0.0000\nCC-MAIN-2014-52,application/json,421611,412174,0.0202\nCC-MAIN-2014-52,application/ld+json,10860,10836,0.0005\nCC-MAIN-2014-52,application/marc,17864,17812,0.0009\nCC-MAIN-2014-52,application/msword,102505,93334,0.0049\nCC-MAIN-2014-52,application/octet-stream,811790,779331,0.0389\nCC-MAIN-2014-52,application/octetstream,15799,15654,0.0008\nCC-MAIN-2014-52,application/pdf,3494807,3231125,0.1675\nCC-MAIN-2014-52,application/pgp-encrypted,5728,5696,0.0003\nCC-MAIN-2014-52,application/pgp-signature,19482,19331,0.0009\nCC-MAIN-2014-52,application/postscript,6696,6491,0.0003\nCC-MAIN-2014-52,application/rdf+xml,80137,79231,0.0038\nCC-MAIN-2014-52,application/rss+xml,3146015,2964237,0.1508\nCC-MAIN-2014-52,application/rtf,1219,1175,0.0001\nCC-MAIN-2014-52,application/save-to-disk,41913,41641,0.0020\nCC-MAIN-2014-52,application/text,21152,21056,0.0010\nCC-MAIN-2014-52,application/unknown,8514,8241,0.0004\nCC-MAIN-2014-52,application/vnd.android.package-archive,1391,1375,0.0001\nCC-MAIN-2014-52,application/vnd.google-earth.kml+xml,169690,167607,0.0081\nCC-MAIN-2014-52,application/vnd.google-earth.kmz,35949,35451,0.0017\nCC-MAIN-2014-52,application/vnd.ms-excel,90510,87164,0.0043\nCC-MAIN-2014-52,application/vnd.ms-powerpoint,57086,53514,0.0027\nCC-MAIN-2014-52,application/vnd.ms-word,21751,21559,0.0010\nCC-MAIN-2014-52,application/vnd.oasis.opendocument.text,2048,1925,0.0001\nCC-MAIN-2014-52,application/vnd.openxmlformats-officedocument.presentationml.presentation,3538,3119,0.0002\nCC-MAIN-2014-52,application/vnd.openxmlformats-officedocument.spreadsheetml.sheet,3661,3099,0.0002\nCC-MAIN-2014-52,application/vnd.openxmlformats-officedocument.wordprocessingml.document,23663,21047,0.0011\nCC-MAIN-2014-52,application/vnd.wap.xhtml+xml,464
75,45911,0.0022\nCC-MAIN-2014-52,application/x-bibtex,38648,37722,0.0019\nCC-MAIN-2014-52,application/x-bittorrent,5667,5613,0.0003\nCC-MAIN-2014-52,application/x-debian-package,53736,53316,0.0026\nCC-MAIN-2014-52,application/x-download,13323,13187,0.0006\nCC-MAIN-2014-52,application/x-endnote-refer,42247,42031,0.0020\nCC-MAIN-2014-52,application/x-gzip,40834,39792,0.0020\nCC-MAIN-2014-52,application/x-httpd-php,7550,7286,0.0004\nCC-MAIN-2014-52,application/x-java-jnlp-file,13696,12713,0.0007\nCC-MAIN-2014-52,application/x-javascript,8531,8471,0.0004\nCC-MAIN-2014-52,application/x-json,54686,54513,0.0026\nCC-MAIN-2014-52,application/x-mobipocket-ebook,31098,29186,0.0015\nCC-MAIN-2014-52,application/x-msdownload,1529,1405,0.0001\nCC-MAIN-2014-52,application/x-netcdf,19881,19742,0.0010\nCC-MAIN-2014-52,application/x-research-info-systems,86803,85162,0.0042\nCC-MAIN-2014-52,application/x-shockwave-flash,8416,8246,0.0004\nCC-MAIN-2014-52,application/x-tar,4830,4727,0.0002\nCC-MAIN-2014-52,application/x-tex,16798,16564,0.0008\nCC-MAIN-2014-52,application/x-troff-man,36093,31729,0.0017\nCC-MAIN-2014-52,application/x-zip-compressed,13432,12649,0.0006\nCC-MAIN-2014-52,application/xhtml+xml,1205247,1151134,0.0578\nCC-MAIN-2014-52,application/xml,1505230,1473417,0.0722\nCC-MAIN-2014-52,application/zip,108845,106880,0.0052\nCC-MAIN-2014-52,audio/mpeg,84458,67918,0.0040\nCC-MAIN-2014-52,audio/x-mpegurl,40831,40574,0.0020\nCC-MAIN-2014-52,audio/x-scpls,72423,71882,0.0035\nCC-MAIN-2014-52,audio/x-wav,449190,446747,0.0215\nCC-MAIN-2014-52,binary/octet-stream,6344,6242,0.0003\nCC-MAIN-2014-52,image/gif,709470,702190,0.0340\nCC-MAIN-2014-52,image/jp2,47915,47776,0.0023\nCC-MAIN-2014-52,image/jpeg,9484897,9340670,0.4547\nCC-MAIN-2014-52,image/jpg,129873,127833,0.0062\nCC-MAIN-2014-52,image/pjpeg,41468,39081,0.0020\nCC-MAIN-2014-52,image/png,3676931,3660369,0.1763\nCC-MAIN-2014-52,image/svg+xml,1384,1366,0.0001\nCC-MAIN-2014-52,image/tiff,43254,42458,0.0021\nCC-MAIN-2014-52,image/vnd.
djvu,8749,8693,0.0004\nCC-MAIN-2014-52,image/webp,52,52,0.0000\nCC-MAIN-2014-52,message/rfc822,19875,19461,0.0010\nCC-MAIN-2014-52,text/calendar,1951809,1898218,0.0936\nCC-MAIN-2014-52,text/css,796,776,0.0000\nCC-MAIN-2014-52,text/csv,69069,68048,0.0033\nCC-MAIN-2014-52,text/directory,6358,5967,0.0003\nCC-MAIN-2014-52,text/enriched,11510,10779,0.0006\nCC-MAIN-2014-52,text/html,2038395047,1859432700,97.7190\nCC-MAIN-2014-52,text/javascript,25753,25408,0.0012\nCC-MAIN-2014-52,text/pdf,75,73,0.0000\nCC-MAIN-2014-52,text/plain,3759804,3616547,0.1802\nCC-MAIN-2014-52,text/prs.lines.tag,77,77,0.0000\nCC-MAIN-2014-52,text/tab-separated-values,33578,32811,0.0016\nCC-MAIN-2014-52,text/turtle,12110,11810,0.0006\nCC-MAIN-2014-52,text/vcard,1385,1286,0.0001\nCC-MAIN-2014-52,text/x-bibtex,23509,23292,0.0011\nCC-MAIN-2014-52,text/x-c,4350,4305,0.0002\nCC-MAIN-2014-52,text/x-csrc,3435,3358,0.0002\nCC-MAIN-2014-52,text/x-diff,9096,8676,0.0004\nCC-MAIN-2014-52,text/x-patch,97016,95888,0.0047\nCC-MAIN-2014-52,text/x-perl,21708,21546,0.0010\nCC-MAIN-2014-52,text/x-vcalendar,81850,77566,0.0039\nCC-MAIN-2014-52,text/x-vcard,48939,47334,0.0023\nCC-MAIN-2014-52,text/xml,9125408,8831069,0.4375\nCC-MAIN-2014-52,unknown/unknown,324369,265521,0.0155\nCC-MAIN-2014-52,video/mp4,4698,4600,0.0002\nCC-MAIN-2014-52,video/webm,8646,8572,0.0004\nCC-MAIN-2014-52,video/x-ms-asf,250618,245922,0.0120\nCC-MAIN-2015-06,<other>,1826024103,1679287071,100.0000\nCC-MAIN-2015-11,<other>,1837196089,1685659195,100.0000\nCC-MAIN-2015-14,<other>,2237119,2148722,0.1359\nCC-MAIN-2015-14,application/atom+xml,1781801,1769716,0.1082\nCC-MAIN-2015-14,application/calendar,6176,5829,0.0004\nCC-MAIN-2015-14,application/download,43785,43132,0.0027\nCC-MAIN-2015-14,application/epub+zip,45712,41044,0.0028\nCC-MAIN-2015-14,application/force-download,21605,20385,0.0013\nCC-MAIN-2015-14,application/gpx+xml,227,227,0.0000\nCC-MAIN-2015-14,application/ics,3153,3153,0.0002\nCC-MAIN-2015-14,application/javascript,570,534,0.0000\nCC-M
AIN-2015-14,application/json,323653,317256,0.0197\nCC-MAIN-2015-14,application/ld+json,5539,5539,0.0003\nCC-MAIN-2015-14,application/marc,8362,8362,0.0005\nCC-MAIN-2015-14,application/msword,89418,82400,0.0054\nCC-MAIN-2015-14,application/octet-stream,686404,662455,0.0417\nCC-MAIN-2015-14,application/octetstream,14239,14187,0.0009\nCC-MAIN-2015-14,application/pdf,3195676,2962826,0.1941\nCC-MAIN-2015-14,application/pgp-encrypted,13841,13502,0.0008\nCC-MAIN-2015-14,application/pgp-signature,13797,13771,0.0008\nCC-MAIN-2015-14,application/postscript,5851,5727,0.0004\nCC-MAIN-2015-14,application/rdf+xml,58939,58513,0.0036\nCC-MAIN-2015-14,application/rss+xml,2386034,2245214,0.1449\nCC-MAIN-2015-14,application/rtf,982,956,0.0001\nCC-MAIN-2015-14,application/save-to-disk,37758,37758,0.0023\nCC-MAIN-2015-14,application/text,14283,13981,0.0009\nCC-MAIN-2015-14,application/unknown,7628,7479,0.0005\nCC-MAIN-2015-14,application/vnd.android.package-archive,1345,1331,0.0001\nCC-MAIN-2015-14,application/vnd.google-earth.kml+xml,134209,133192,0.0082\nCC-MAIN-2015-14,application/vnd.google-earth.kmz,34945,34710,0.0021\nCC-MAIN-2015-14,application/vnd.ms-excel,73731,71476,0.0045\nCC-MAIN-2015-14,application/vnd.ms-powerpoint,34865,33301,0.0021\nCC-MAIN-2015-14,application/vnd.ms-word,18383,18335,0.0011\nCC-MAIN-2015-14,application/vnd.oasis.opendocument.text,1848,1746,0.0001\nCC-MAIN-2015-14,application/vnd.openxmlformats-officedocument.presentationml.presentation,3506,3125,0.0002\nCC-MAIN-2015-14,application/vnd.openxmlformats-officedocument.spreadsheetml.sheet,3796,3319,0.0002\nCC-MAIN-2015-14,application/vnd.openxmlformats-officedocument.wordprocessingml.document,22876,20347,0.0014\nCC-MAIN-2015-14,application/vnd.wap.xhtml+xml,42645,42307,0.0026\nCC-MAIN-2015-14,application/x-bibtex,32026,31121,0.0019\nCC-MAIN-2015-14,application/x-bittorrent,4930,4916,0.0003\nCC-MAIN-2015-14,application/x-debian-package,47079,47008,0.0029\nCC-MAIN-2015-14,application/x-download,13384,13341,0.00
08\nCC-MAIN-2015-14,application/x-endnote-refer,33216,32917,0.0020\nCC-MAIN-2015-14,application/x-gzip,36396,35657,0.0022\nCC-MAIN-2015-14,application/x-httpd-php,10723,10319,0.0007\nCC-MAIN-2015-14,application/x-java-jnlp-file,9580,9553,0.0006\nCC-MAIN-2015-14,application/x-javascript,4002,3986,0.0002\nCC-MAIN-2015-14,application/x-json,29391,29341,0.0018\nCC-MAIN-2015-14,application/x-mobipocket-ebook,17991,16599,0.0011\nCC-MAIN-2015-14,application/x-msdownload,2581,2444,0.0002\nCC-MAIN-2015-14,application/x-netcdf,17222,17207,0.0010\nCC-MAIN-2015-14,application/x-research-info-systems,56912,56449,0.0035\nCC-MAIN-2015-14,application/x-shockwave-flash,35086,34868,0.0021\nCC-MAIN-2015-14,application/x-tar,3573,3542,0.0002\nCC-MAIN-2015-14,application/x-tex,15293,15172,0.0009\nCC-MAIN-2015-14,application/x-troff-man,31218,27585,0.0019\nCC-MAIN-2015-14,application/x-zip-compressed,12392,11647,0.0008\nCC-MAIN-2015-14,application/xhtml+xml,1022890,984161,0.0621\nCC-MAIN-2015-14,application/xml,1174447,1147234,0.0713\nCC-MAIN-2015-14,application/zip,103875,101980,0.0063\nCC-MAIN-2015-14,audio/mpeg,73156,60604,0.0044\nCC-MAIN-2015-14,audio/x-mpegurl,34617,34592,0.0021\nCC-MAIN-2015-14,audio/x-scpls,64408,64363,0.0039\nCC-MAIN-2015-14,audio/x-wav,359624,359482,0.0218\nCC-MAIN-2015-14,binary/octet-stream,5815,5742,0.0004\nCC-MAIN-2015-14,image/gif,542469,539369,0.0329\nCC-MAIN-2015-14,image/jp2,26525,26370,0.0016\nCC-MAIN-2015-14,image/jpeg,7975589,7898261,0.4843\nCC-MAIN-2015-14,image/jpg,101050,100690,0.0061\nCC-MAIN-2015-14,image/pjpeg,38424,36634,0.0023\nCC-MAIN-2015-14,image/png,2599454,2595213,0.1579\nCC-MAIN-2015-14,image/svg+xml,1272,1247,0.0001\nCC-MAIN-2015-14,image/tiff,31155,30748,0.0019\nCC-MAIN-2015-14,image/vnd.djvu,5234,5230,0.0003\nCC-MAIN-2015-14,image/webp,76,76,0.0000\nCC-MAIN-2015-14,message/rfc822,16209,15866,0.0010\nCC-MAIN-2015-14,text/calendar,1475916,1444536,0.0896\nCC-MAIN-2015-14,text/css,670,656,0.0000\nCC-MAIN-2015-14,text/csv,83557,80702,0.005
1\nCC-MAIN-2015-14,text/directory,5286,4992,0.0003\nCC-MAIN-2015-14,text/enriched,6385,6066,0.0004\nCC-MAIN-2015-14,text/html,1607660300,1476960095,97.6294\nCC-MAIN-2015-14,text/javascript,17666,17433,0.0011\nCC-MAIN-2015-14,text/pdf,28162,28162,0.0017\nCC-MAIN-2015-14,text/plain,3038748,2933352,0.1845\nCC-MAIN-2015-14,text/prs.lines.tag,59,59,0.0000\nCC-MAIN-2015-14,text/tab-separated-values,55458,52825,0.0034\nCC-MAIN-2015-14,text/turtle,6612,6446,0.0004\nCC-MAIN-2015-14,text/vcard,2274,1540,0.0001\nCC-MAIN-2015-14,text/x-bibtex,21123,21061,0.0013\nCC-MAIN-2015-14,text/x-c,4171,4010,0.0003\nCC-MAIN-2015-14,text/x-csrc,3069,3012,0.0002\nCC-MAIN-2015-14,text/x-diff,13009,12618,0.0008\nCC-MAIN-2015-14,text/x-patch,98400,97739,0.0060\nCC-MAIN-2015-14,text/x-perl,19276,19260,0.0012\nCC-MAIN-2015-14,text/x-vcalendar,68680,64667,0.0042\nCC-MAIN-2015-14,text/x-vcard,42121,40386,0.0026\nCC-MAIN-2015-14,text/xml,7736085,7502422,0.4698\nCC-MAIN-2015-14,unknown/unknown,197565,165402,0.0120\nCC-MAIN-2015-14,video/mp4,4421,4378,0.0003\nCC-MAIN-2015-14,video/webm,9455,9435,0.0006\nCC-MAIN-2015-14,video/x-ms-asf,135081,131328,0.0082\nCC-MAIN-2015-18,<other>,2686508,2574336,0.1270\nCC-MAIN-2015-18,application/atom+xml,2111340,2096286,0.0998\nCC-MAIN-2015-18,application/calendar,7792,7275,0.0004\nCC-MAIN-2015-18,application/download,68038,66390,0.0032\nCC-MAIN-2015-18,application/epub+zip,63240,57392,0.0030\nCC-MAIN-2015-18,application/force-download,23715,22353,0.0011\nCC-MAIN-2015-18,application/gpx+xml,259,259,0.0000\nCC-MAIN-2015-18,application/ics,3518,3518,0.0002\nCC-MAIN-2015-18,application/javascript,657,618,0.0000\nCC-MAIN-2015-18,application/json,421710,412238,0.0199\nCC-MAIN-2015-18,application/ld+json,12415,12414,0.0006\nCC-MAIN-2015-18,application/marc,19419,19419,0.0009\nCC-MAIN-2015-18,application/msword,104249,96481,0.0049\nCC-MAIN-2015-18,application/octet-stream,801893,775576,0.0379\nCC-MAIN-2015-18,application/octetstream,15759,15704,0.0007\nCC-MAIN-2015-18,appli
cation/pdf,3643080,3377225,0.1722\nCC-MAIN-2015-18,application/pgp-encrypted,23731,22278,0.0011\nCC-MAIN-2015-18,application/pgp-signature,16318,16286,0.0008\nCC-MAIN-2015-18,application/postscript,7494,7357,0.0004\nCC-MAIN-2015-18,application/rdf+xml,85244,84722,0.0040\nCC-MAIN-2015-18,application/rss+xml,3070205,2896459,0.1451\nCC-MAIN-2015-18,application/rtf,1101,1067,0.0001\nCC-MAIN-2015-18,application/save-to-disk,41306,41306,0.0020\nCC-MAIN-2015-18,application/text,19160,18734,0.0009\nCC-MAIN-2015-18,application/unknown,8376,8212,0.0004\nCC-MAIN-2015-18,application/vnd.android.package-archive,1483,1467,0.0001\nCC-MAIN-2015-18,application/vnd.google-earth.kml+xml,164545,163416,0.0078\nCC-MAIN-2015-18,application/vnd.google-earth.kmz,38340,38082,0.0018\nCC-MAIN-2015-18,application/vnd.ms-excel,86503,83645,0.0041\nCC-MAIN-2015-18,application/vnd.ms-powerpoint,40570,38090,0.0019\nCC-MAIN-2015-18,application/vnd.ms-word,21993,21922,0.0010\nCC-MAIN-2015-18,application/vnd.oasis.opendocument.text,2098,1983,0.0001\nCC-MAIN-2015-18,application/vnd.openxmlformats-officedocument.presentationml.presentation,3982,3544,0.0002\nCC-MAIN-2015-18,application/vnd.openxmlformats-officedocument.spreadsheetml.sheet,4257,3723,0.0002\nCC-MAIN-2015-18,application/vnd.openxmlformats-officedocument.wordprocessingml.document,25111,22388,0.0012\nCC-MAIN-2015-18,application/vnd.wap.xhtml+xml,45992,45591,0.0022\nCC-MAIN-2015-18,application/x-bibtex,40797,39820,0.0019\nCC-MAIN-2015-18,application/x-bittorrent,5487,5470,0.0003\nCC-MAIN-2015-18,application/x-debian-package,47082,47012,0.0022\nCC-MAIN-2015-18,application/x-download,14877,14830,0.0007\nCC-MAIN-2015-18,application/x-endnote-refer,44043,43599,0.0021\nCC-MAIN-2015-18,application/x-gzip,41155,40251,0.0019\nCC-MAIN-2015-18,application/x-httpd-php,11399,11011,0.0005\nCC-MAIN-2015-18,application/x-java-jnlp-file,14892,14105,0.0007\nCC-MAIN-2015-18,application/x-javascript,5900,5882,0.0003\nCC-MAIN-2015-18,application/x-json,61058,60924
,0.0029\nCC-MAIN-2015-18,application/x-mobipocket-ebook,26953,25193,0.0013\nCC-MAIN-2015-18,application/x-msdownload,2880,2708,0.0001\nCC-MAIN-2015-18,application/x-netcdf,19469,19453,0.0009\nCC-MAIN-2015-18,application/x-research-info-systems,97751,95937,0.0046\nCC-MAIN-2015-18,application/x-shockwave-flash,53258,52957,0.0025\nCC-MAIN-2015-18,application/x-tar,3966,3906,0.0002\nCC-MAIN-2015-18,application/x-tex,16578,16442,0.0008\nCC-MAIN-2015-18,application/x-troff-man,35249,30974,0.0017\nCC-MAIN-2015-18,application/x-zip-compressed,14386,13432,0.0007\nCC-MAIN-2015-18,application/xhtml+xml,1231107,1185747,0.0582\nCC-MAIN-2015-18,application/xml,1554906,1514258,0.0735\nCC-MAIN-2015-18,application/zip,125675,122900,0.0059\nCC-MAIN-2015-18,audio/mpeg,80937,67231,0.0038\nCC-MAIN-2015-18,audio/x-mpegurl,40045,40004,0.0019\nCC-MAIN-2015-18,audio/x-scpls,71385,71316,0.0034\nCC-MAIN-2015-18,audio/x-wav,443589,443404,0.0210\nCC-MAIN-2015-18,binary/octet-stream,6480,6309,0.0003\nCC-MAIN-2015-18,image/gif,722817,719003,0.0342\nCC-MAIN-2015-18,image/jp2,48159,47830,0.0023\nCC-MAIN-2015-18,image/jpeg,9121820,9040605,0.4311\nCC-MAIN-2015-18,image/jpg,116763,116336,0.0055\nCC-MAIN-2015-18,image/pjpeg,42872,41290,0.0020\nCC-MAIN-2015-18,image/png,4733630,4727506,0.2237\nCC-MAIN-2015-18,image/svg+xml,1420,1395,0.0001\nCC-MAIN-2015-18,image/tiff,44608,43916,0.0021\nCC-MAIN-2015-18,image/vnd.djvu,6928,6923,0.0003\nCC-MAIN-2015-18,image/webp,81,81,0.0000\nCC-MAIN-2015-18,message/rfc822,17986,17634,0.0009\nCC-MAIN-2015-18,text/calendar,1843975,1806610,0.0872\nCC-MAIN-2015-18,text/css,681,668,0.0000\nCC-MAIN-2015-18,text/csv,110977,107750,0.0052\nCC-MAIN-2015-18,text/directory,5930,5606,0.0003\nCC-MAIN-2015-18,text/enriched,8406,8274,0.0004\nCC-MAIN-2015-18,text/html,2067330597,1887431497,97.7083\nCC-MAIN-2015-18,text/javascript,26952,26706,0.0013\nCC-MAIN-2015-18,text/pdf,39710,39710,0.0019\nCC-MAIN-2015-18,text/plain,3784490,3656496,0.1789\nCC-MAIN-2015-18,text/prs.lines.tag,72,72,0.
0000\nCC-MAIN-2015-18,text/tab-separated-values,67742,64806,0.0032\nCC-MAIN-2015-18,text/turtle,13508,13310,0.0006\nCC-MAIN-2015-18,text/vcard,2473,1712,0.0001\nCC-MAIN-2015-18,text/x-bibtex,23316,23253,0.0011\nCC-MAIN-2015-18,text/x-c,4585,4418,0.0002\nCC-MAIN-2015-18,text/x-csrc,3584,3522,0.0002\nCC-MAIN-2015-18,text/x-diff,15771,15320,0.0007\nCC-MAIN-2015-18,text/x-patch,111010,110202,0.0052\nCC-MAIN-2015-18,text/x-perl,20981,20965,0.0010\nCC-MAIN-2015-18,text/x-vcalendar,76614,72161,0.0036\nCC-MAIN-2015-18,text/x-vcard,48113,46257,0.0023\nCC-MAIN-2015-18,text/xml,9085389,8802535,0.4294\nCC-MAIN-2015-18,unknown/unknown,268051,220982,0.0127\nCC-MAIN-2015-18,video/mp4,6309,6238,0.0003\nCC-MAIN-2015-18,video/webm,10345,10321,0.0005\nCC-MAIN-2015-18,video/x-ms-asf,248689,244606,0.0118\nCC-MAIN-2015-22,<other>,2593956,2478632,0.1287\nCC-MAIN-2015-22,application/atom+xml,2068900,2052473,0.1027\nCC-MAIN-2015-22,application/calendar,7719,6958,0.0004\nCC-MAIN-2015-22,application/download,61952,60856,0.0031\nCC-MAIN-2015-22,application/epub+zip,60516,54196,0.0030\nCC-MAIN-2015-22,application/force-download,23342,21994,0.0012\nCC-MAIN-2015-22,application/gpx+xml,261,261,0.0000\nCC-MAIN-2015-22,application/ics,3545,3545,0.0002\nCC-MAIN-2015-22,application/javascript,678,634,0.0000\nCC-MAIN-2015-22,application/json,404739,394475,0.0201\nCC-MAIN-2015-22,application/ld+json,9356,9355,0.0005\nCC-MAIN-2015-22,application/marc,17680,17680,0.0009\nCC-MAIN-2015-22,application/msword,101632,93433,0.0050\nCC-MAIN-2015-22,application/octet-stream,784006,756453,0.0389\nCC-MAIN-2015-22,application/octetstream,15892,15825,0.0008\nCC-MAIN-2015-22,application/pdf,3575034,3292080,0.1774\nCC-MAIN-2015-22,application/pgp-encrypted,20744,19752,0.0010\nCC-MAIN-2015-22,application/pgp-signature,16290,16249,0.0008\nCC-MAIN-2015-22,application/postscript,7584,7430,0.0004\nCC-MAIN-2015-22,application/rdf+xml,78596,78005,0.0039\nCC-MAIN-2015-22,application/rss+xml,2851715,2664248,0.1415\nCC-MAIN-2015
-22,application/rtf,1089,1053,0.0001\nCC-MAIN-2015-22,application/save-to-disk,41649,41649,0.0021\nCC-MAIN-2015-22,application/text,18705,18239,0.0009\nCC-MAIN-2015-22,application/unknown,8127,7934,0.0004\nCC-MAIN-2015-22,application/vnd.android.package-archive,1478,1447,0.0001\nCC-MAIN-2015-22,application/vnd.google-earth.kml+xml,158217,156932,0.0079\nCC-MAIN-2015-22,application/vnd.google-earth.kmz,38786,38496,0.0019\nCC-MAIN-2015-22,application/vnd.ms-excel,83437,80433,0.0041\nCC-MAIN-2015-22,application/vnd.ms-powerpoint,37598,35209,0.0019\nCC-MAIN-2015-22,application/vnd.ms-word,21862,21776,0.0011\nCC-MAIN-2015-22,application/vnd.oasis.opendocument.text,2074,1955,0.0001\nCC-MAIN-2015-22,application/vnd.openxmlformats-officedocument.presentationml.presentation,3833,3430,0.0002\nCC-MAIN-2015-22,application/vnd.openxmlformats-officedocument.spreadsheetml.sheet,4319,3725,0.0002\nCC-MAIN-2015-22,application/vnd.openxmlformats-officedocument.wordprocessingml.document,25148,22235,0.0012\nCC-MAIN-2015-22,application/vnd.wap.xhtml+xml,46221,45985,0.0023\nCC-MAIN-2015-22,application/x-bibtex,39582,38581,0.0020\nCC-MAIN-2015-22,application/x-bittorrent,5466,5449,0.0003\nCC-MAIN-2015-22,application/x-debian-package,45555,45475,0.0023\nCC-MAIN-2015-22,application/x-download,14595,14547,0.0007\nCC-MAIN-2015-22,application/x-endnote-refer,43231,42718,0.0021\nCC-MAIN-2015-22,application/x-gzip,40483,39590,0.0020\nCC-MAIN-2015-22,application/x-httpd-php,9428,9033,0.0005\nCC-MAIN-2015-22,application/x-java-jnlp-file,14734,14052,0.0007\nCC-MAIN-2015-22,application/x-javascript,5036,5013,0.0002\nCC-MAIN-2015-22,application/x-json,40935,40848,0.0020\nCC-MAIN-2015-22,application/x-mobipocket-ebook,25006,22933,0.0012\nCC-MAIN-2015-22,application/x-msdownload,3010,2826,0.0001\nCC-MAIN-2015-22,application/x-netcdf,16634,16618,0.0008\nCC-MAIN-2015-22,application/x-research-info-systems,82522,81070,0.0041\nCC-MAIN-2015-22,application/x-shockwave-flash,53253,52922,0.0026\nCC-MAIN-2015-22,
application/x-tar,3889,3827,0.0002\nCC-MAIN-2015-22,application/x-tex,16878,16735,0.0008\nCC-MAIN-2015-22,application/x-troff-man,35866,31176,0.0018\nCC-MAIN-2015-22,application/x-zip-compressed,14962,13970,0.0007\nCC-MAIN-2015-22,application/xhtml+xml,1137090,1091203,0.0564\nCC-MAIN-2015-22,application/xml,1473201,1432218,0.0731\nCC-MAIN-2015-22,application/zip,119790,116874,0.0059\nCC-MAIN-2015-22,audio/mpeg,77995,64051,0.0039\nCC-MAIN-2015-22,audio/x-mpegurl,40787,40751,0.0020\nCC-MAIN-2015-22,audio/x-scpls,71931,71847,0.0036\nCC-MAIN-2015-22,audio/x-wav,401777,401612,0.0199\nCC-MAIN-2015-22,binary/octet-stream,6521,6329,0.0003\nCC-MAIN-2015-22,image/gif,703410,699369,0.0349\nCC-MAIN-2015-22,image/jp2,43503,43348,0.0022\nCC-MAIN-2015-22,image/jpeg,9118029,9008831,0.4524\nCC-MAIN-2015-22,image/jpg,116626,116170,0.0058\nCC-MAIN-2015-22,image/pjpeg,42590,40818,0.0021\nCC-MAIN-2015-22,image/png,4166719,4160673,0.2067\nCC-MAIN-2015-22,image/svg+xml,1440,1413,0.0001\nCC-MAIN-2015-22,image/tiff,42450,41768,0.0021\nCC-MAIN-2015-22,image/vnd.djvu,7462,7193,0.0004\nCC-MAIN-2015-22,image/webp,84,84,0.0000\nCC-MAIN-2015-22,message/rfc822,18099,17706,0.0009\nCC-MAIN-2015-22,text/calendar,1742042,1702948,0.0864\nCC-MAIN-2015-22,text/css,617,603,0.0000\nCC-MAIN-2015-22,text/csv,96531,93907,0.0048\nCC-MAIN-2015-22,text/directory,5890,5531,0.0003\nCC-MAIN-2015-22,text/enriched,8101,7985,0.0004\nCC-MAIN-2015-22,text/html,1968735332,1791214035,97.6816\nCC-MAIN-2015-22,text/javascript,23672,23436,0.0012\nCC-MAIN-2015-22,text/pdf,35770,35770,0.0018\nCC-MAIN-2015-22,text/plain,3639018,3508960,0.1806\nCC-MAIN-2015-22,text/prs.lines.tag,69,69,0.0000\nCC-MAIN-2015-22,text/tab-separated-values,59605,57240,0.0030\nCC-MAIN-2015-22,text/turtle,10533,10326,0.0005\nCC-MAIN-2015-22,text/vcard,2566,1699,0.0001\nCC-MAIN-2015-22,text/x-bibtex,23444,23371,0.0012\nCC-MAIN-2015-22,text/x-c,4633,4447,0.0002\nCC-MAIN-2015-22,text/x-csrc,3425,3359,0.0002\nCC-MAIN-2015-22,text/x-diff,15078,14655,0.0007\n
CC-MAIN-2015-22,text/x-patch,107476,106747,0.0053\nCC-MAIN-2015-22,text/x-perl,21299,21278,0.0011\nCC-MAIN-2015-22,text/x-vcalendar,73796,69436,0.0037\nCC-MAIN-2015-22,text/x-vcard,49060,46857,0.0024\nCC-MAIN-2015-22,text/xml,9031180,8726610,0.4481\nCC-MAIN-2015-22,unknown/unknown,241752,200226,0.0120\nCC-MAIN-2015-22,video/mp4,6348,6275,0.0003\nCC-MAIN-2015-22,video/webm,10468,10436,0.0005\nCC-MAIN-2015-22,video/x-ms-asf,216494,212027,0.0107\nCC-MAIN-2015-27,<other>,2812640,2720566,0.1679\nCC-MAIN-2015-27,application/atom+xml,1772121,1758202,0.1058\nCC-MAIN-2015-27,application/calendar,6732,6115,0.0004\nCC-MAIN-2015-27,application/download,50435,49698,0.0030\nCC-MAIN-2015-27,application/epub+zip,44698,39705,0.0027\nCC-MAIN-2015-27,application/force-download,20158,19050,0.0012\nCC-MAIN-2015-27,application/gpx+xml,250,250,0.0000\nCC-MAIN-2015-27,application/ics,3046,3046,0.0002\nCC-MAIN-2015-27,application/javascript,815,783,0.0000\nCC-MAIN-2015-27,application/json,269397,261907,0.0161\nCC-MAIN-2015-27,application/ld+json,6796,6795,0.0004\nCC-MAIN-2015-27,application/marc,12071,12071,0.0007\nCC-MAIN-2015-27,application/msword,87373,80675,0.0052\nCC-MAIN-2015-27,application/octet-stream,677006,654042,0.0404\nCC-MAIN-2015-27,application/octetstream,14449,14399,0.0009\nCC-MAIN-2015-27,application/pdf,2968417,2752620,0.1772\nCC-MAIN-2015-27,application/pgp-encrypted,18504,17698,0.0011\nCC-MAIN-2015-27,application/pgp-signature,14318,14276,0.0009\nCC-MAIN-2015-27,application/postscript,6314,6192,0.0004\nCC-MAIN-2015-27,application/rdf+xml,66556,66089,0.0040\nCC-MAIN-2015-27,application/rss+xml,2364909,2218258,0.1411\nCC-MAIN-2015-27,application/rtf,938,910,0.0001\nCC-MAIN-2015-27,application/save-to-disk,36917,36917,0.0022\nCC-MAIN-2015-27,application/text,14468,14130,0.0009\nCC-MAIN-2015-27,application/unknown,7714,7582,0.0005\nCC-MAIN-2015-27,application/vnd.android.package-archive,1311,1276,0.0001\nCC-MAIN-2015-27,application/vnd.google-earth.kml+xml,135088,134784,0.00
81\nCC-MAIN-2015-27,application/vnd.google-earth.kmz,34863,34629,0.0021\nCC-MAIN-2015-27,application/vnd.ms-excel,70976,68702,0.0042\nCC-MAIN-2015-27,application/vnd.ms-powerpoint,31626,29977,0.0019\nCC-MAIN-2015-27,application/vnd.ms-word,9439,9380,0.0006\nCC-MAIN-2015-27,application/vnd.oasis.opendocument.text,1729,1630,0.0001\nCC-MAIN-2015-27,application/vnd.openxmlformats-officedocument.presentationml.presentation,3501,3139,0.0002\nCC-MAIN-2015-27,application/vnd.openxmlformats-officedocument.spreadsheetml.sheet,3756,3286,0.0002\nCC-MAIN-2015-27,application/vnd.openxmlformats-officedocument.wordprocessingml.document,22311,19903,0.0013\nCC-MAIN-2015-27,application/vnd.wap.xhtml+xml,41390,41229,0.0025\nCC-MAIN-2015-27,application/x-bibtex,35646,34747,0.0021\nCC-MAIN-2015-27,application/x-bittorrent,4735,4719,0.0003\nCC-MAIN-2015-27,application/x-debian-package,36039,35978,0.0022\nCC-MAIN-2015-27,application/x-download,12747,12724,0.0008\nCC-MAIN-2015-27,application/x-endnote-refer,37087,36703,0.0022\nCC-MAIN-2015-27,application/x-gzip,28397,28114,0.0017\nCC-MAIN-2015-27,application/x-httpd-php,14367,14025,0.0009\nCC-MAIN-2015-27,application/x-java-jnlp-file,13059,12393,0.0008\nCC-MAIN-2015-27,application/x-javascript,3944,3931,0.0002\nCC-MAIN-2015-27,application/x-json,35784,35703,0.0021\nCC-MAIN-2015-27,application/x-mobipocket-ebook,16053,14372,0.0010\nCC-MAIN-2015-27,application/x-msdownload,2483,2332,0.0001\nCC-MAIN-2015-27,application/x-netcdf,15862,15850,0.0009\nCC-MAIN-2015-27,application/x-research-info-systems,64966,64139,0.0039\nCC-MAIN-2015-27,application/x-shockwave-flash,40233,40016,0.0024\nCC-MAIN-2015-27,application/x-tar,3458,3418,0.0002\nCC-MAIN-2015-27,application/x-tex,14276,14164,0.0009\nCC-MAIN-2015-27,application/x-troff-man,32944,29381,0.0020\nCC-MAIN-2015-27,application/x-zip-compressed,13233,12423,0.0008\nCC-MAIN-2015-27,application/xhtml+xml,973867,936652,0.0581\nCC-MAIN-2015-27,application/xml,1223595,1191711,0.0730\nCC-MAIN-2015-27,appl
ication/zip,103143,100882,0.0062\nCC-MAIN-2015-27,audio/mpeg,66344,55378,0.0040\nCC-MAIN-2015-27,audio/x-mpegurl,35842,35820,0.0021\nCC-MAIN-2015-27,audio/x-scpls,63819,63754,0.0038\nCC-MAIN-2015-27,audio/x-wav,302099,301969,0.0180\nCC-MAIN-2015-27,binary/octet-stream,5877,5720,0.0004\nCC-MAIN-2015-27,image/gif,593658,590256,0.0354\nCC-MAIN-2015-27,image/jp2,32745,32538,0.0020\nCC-MAIN-2015-27,image/jpeg,7605850,7521555,0.4539\nCC-MAIN-2015-27,image/jpg,111911,111606,0.0067\nCC-MAIN-2015-27,image/pjpeg,32967,31595,0.0020\nCC-MAIN-2015-27,image/png,3199558,3194502,0.1909\nCC-MAIN-2015-27,image/svg+xml,1288,1262,0.0001\nCC-MAIN-2015-27,image/tiff,35254,34688,0.0021\nCC-MAIN-2015-27,image/vnd.djvu,6128,5877,0.0004\nCC-MAIN-2015-27,image/webp,78,78,0.0000\nCC-MAIN-2015-27,message/rfc822,16049,15736,0.0010\nCC-MAIN-2015-27,text/calendar,1403176,1373774,0.0837\nCC-MAIN-2015-27,text/css,590,579,0.0000\nCC-MAIN-2015-27,text/csv,88844,85626,0.0053\nCC-MAIN-2015-27,text/directory,5059,4804,0.0003\nCC-MAIN-2015-27,text/enriched,7118,7041,0.0004\nCC-MAIN-2015-27,text/html,1636065696,1492616771,97.6395\nCC-MAIN-2015-27,text/javascript,18145,17963,0.0011\nCC-MAIN-2015-27,text/pdf,27587,27587,0.0016\nCC-MAIN-2015-27,text/plain,3053844,2959525,0.1823\nCC-MAIN-2015-27,text/prs.lines.tag,62,62,0.0000\nCC-MAIN-2015-27,text/tab-separated-values,60393,57333,0.0036\nCC-MAIN-2015-27,text/turtle,7822,7657,0.0005\nCC-MAIN-2015-27,text/vcard,2261,1555,0.0001\nCC-MAIN-2015-27,text/x-bibtex,20858,20804,0.0012\nCC-MAIN-2015-27,text/x-c,3917,3788,0.0002\nCC-MAIN-2015-27,text/x-csrc,3286,3229,0.0002\nCC-MAIN-2015-27,text/x-diff,14291,13829,0.0009\nCC-MAIN-2015-27,text/x-patch,92701,91777,0.0055\nCC-MAIN-2015-27,text/x-perl,39546,39531,0.0024\nCC-MAIN-2015-27,text/x-vcalendar,62359,58744,0.0037\nCC-MAIN-2015-27,text/x-vcard,40378,38176,0.0024\nCC-MAIN-2015-27,text/xml,7735987,7496309,0.4617\nCC-MAIN-2015-27,unknown/unknown,182441,150017,0.0109\nCC-MAIN-2015-27,video/mp4,5757,5691,0.0003\nCC-MAIN-2
015-27,video/webm,9167,8524,0.0005\nCC-MAIN-2015-27,video/x-ms-asf,199396,195681,0.0119\nCC-MAIN-2015-32,<other>,2217869,2137250,0.1222\nCC-MAIN-2015-32,application/atom+xml,1890523,1874892,0.1041\nCC-MAIN-2015-32,application/calendar,7336,6644,0.0004\nCC-MAIN-2015-32,application/download,43653,42595,0.0024\nCC-MAIN-2015-32,application/epub+zip,57106,51429,0.0031\nCC-MAIN-2015-32,application/force-download,21267,20024,0.0012\nCC-MAIN-2015-32,application/gpx+xml,248,248,0.0000\nCC-MAIN-2015-32,application/ics,3330,3330,0.0002\nCC-MAIN-2015-32,application/javascript,646,610,0.0000\nCC-MAIN-2015-32,application/json,306840,295667,0.0169\nCC-MAIN-2015-32,application/ld+json,8286,8286,0.0005\nCC-MAIN-2015-32,application/marc,17593,17593,0.0010\nCC-MAIN-2015-32,application/msword,92405,84924,0.0051\nCC-MAIN-2015-32,application/octet-stream,691954,667548,0.0381\nCC-MAIN-2015-32,application/octetstream,14452,14415,0.0008\nCC-MAIN-2015-32,application/pdf,3102659,2867207,0.1709\nCC-MAIN-2015-32,application/pgp-encrypted,19452,18604,0.0011\nCC-MAIN-2015-32,application/pgp-signature,15158,15106,0.0008\nCC-MAIN-2015-32,application/postscript,6367,6237,0.0004\nCC-MAIN-2015-32,application/rdf+xml,72956,72376,0.0040\nCC-MAIN-2015-32,application/rss+xml,3090099,2883660,0.1702\nCC-MAIN-2015-32,application/rtf,999,965,0.0001\nCC-MAIN-2015-32,application/save-to-disk,38364,38364,0.0021\nCC-MAIN-2015-32,application/text,15924,15485,0.0009\nCC-MAIN-2015-32,application/unknown,8293,8121,0.0005\nCC-MAIN-2015-32,application/vnd.android.package-archive,1384,1344,0.0001\nCC-MAIN-2015-32,application/vnd.google-earth.kml+xml,145792,145483,0.0080\nCC-MAIN-2015-32,application/vnd.google-earth.kmz,35931,35695,0.0020\nCC-MAIN-2015-32,application/vnd.ms-excel,76736,74076,0.0042\nCC-MAIN-2015-32,application/vnd.ms-powerpoint,35116,32823,0.0019\nCC-MAIN-2015-32,application/vnd.ms-word,10320,10246,0.0006\nCC-MAIN-2015-32,application/vnd.oasis.opendocument.text,1766,1659,0.0001\nCC-MAIN-2015-32,applicati
on/vnd.openxmlformats-officedocument.presentationml.presentation,3707,3306,0.0002\nCC-MAIN-2015-32,application/vnd.openxmlformats-officedocument.spreadsheetml.sheet,4043,3498,0.0002\nCC-MAIN-2015-32,application/vnd.openxmlformats-officedocument.wordprocessingml.document,23636,20987,0.0013\nCC-MAIN-2015-32,application/vnd.wap.xhtml+xml,43629,43424,0.0024\nCC-MAIN-2015-32,application/x-bibtex,37990,37029,0.0021\nCC-MAIN-2015-32,application/x-bittorrent,4418,4414,0.0002\nCC-MAIN-2015-32,application/x-debian-package,38539,38468,0.0021\nCC-MAIN-2015-32,application/x-download,14031,13449,0.0008\nCC-MAIN-2015-32,application/x-endnote-refer,42464,41981,0.0023\nCC-MAIN-2015-32,application/x-gzip,31262,30938,0.0017\nCC-MAIN-2015-32,application/x-httpd-php,14112,13811,0.0008\nCC-MAIN-2015-32,application/x-java-jnlp-file,14027,13229,0.0008\nCC-MAIN-2015-32,application/x-javascript,4547,4532,0.0003\nCC-MAIN-2015-32,application/x-json,50762,50762,0.0028\nCC-MAIN-2015-32,application/x-mobipocket-ebook,24385,22639,0.0013\nCC-MAIN-2015-32,application/x-msdownload,2653,2488,0.0001\nCC-MAIN-2015-32,application/x-netcdf,16871,16859,0.0009\nCC-MAIN-2015-32,application/x-research-info-systems,74657,73605,0.0041\nCC-MAIN-2015-32,application/x-shockwave-flash,46620,46383,0.0026\nCC-MAIN-2015-32,application/x-tar,4547,4500,0.0003\nCC-MAIN-2015-32,application/x-tex,15758,15637,0.0009\nCC-MAIN-2015-32,application/x-troff-man,36376,32265,0.0020\nCC-MAIN-2015-32,application/x-zip-compressed,13552,12704,0.0007\nCC-MAIN-2015-32,application/xhtml+xml,1007669,969049,0.0555\nCC-MAIN-2015-32,application/xml,1340441,1301637,0.0738\nCC-MAIN-2015-32,application/zip,113561,110762,0.0063\nCC-MAIN-2015-32,audio/mpeg,69553,57331,0.0038\nCC-MAIN-2015-32,audio/x-mpegurl,38265,38243,0.0021\nCC-MAIN-2015-32,audio/x-scpls,67635,67565,0.0037\nCC-MAIN-2015-32,audio/x-wav,244080,243935,0.0134\nCC-MAIN-2015-32,binary/octet-stream,6738,6195,0.0004\nCC-MAIN-2015-32,image/gif,658904,655126,0.0363\nCC-MAIN-2015-32,image
/jp2,39149,38643,0.0022\nCC-MAIN-2015-32,image/jpeg,7771581,7675608,0.4281\nCC-MAIN-2015-32,image/jpg,119403,119204,0.0066\nCC-MAIN-2015-32,image/pjpeg,37592,36075,0.0021\nCC-MAIN-2015-32,image/png,4366391,4360734,0.2405\nCC-MAIN-2015-32,image/svg+xml,643,617,0.0000\nCC-MAIN-2015-32,image/tiff,38989,38257,0.0021\nCC-MAIN-2015-32,image/vnd.djvu,7090,6800,0.0004\nCC-MAIN-2015-32,image/webp,82,82,0.0000\nCC-MAIN-2015-32,message/rfc822,16730,16415,0.0009\nCC-MAIN-2015-32,text/calendar,1512985,1476865,0.0833\nCC-MAIN-2015-32,text/css,1062,1050,0.0001\nCC-MAIN-2015-32,text/csv,98431,94858,0.0054\nCC-MAIN-2015-32,text/directory,5290,4993,0.0003\nCC-MAIN-2015-32,text/enriched,7548,7466,0.0004\nCC-MAIN-2015-32,text/html,1773328721,1608324379,97.6776\nCC-MAIN-2015-32,text/javascript,21093,20866,0.0012\nCC-MAIN-2015-32,text/pdf,31225,31225,0.0017\nCC-MAIN-2015-32,text/plain,3437651,3330134,0.1894\nCC-MAIN-2015-32,text/prs.lines.tag,65,65,0.0000\nCC-MAIN-2015-32,text/tab-separated-values,66219,62879,0.0036\nCC-MAIN-2015-32,text/turtle,9452,9258,0.0005\nCC-MAIN-2015-32,text/vcard,2401,1635,0.0001\nCC-MAIN-2015-32,text/x-bibtex,10876,10809,0.0006\nCC-MAIN-2015-32,text/x-c,4202,4037,0.0002\nCC-MAIN-2015-32,text/x-csrc,3448,3384,0.0002\nCC-MAIN-2015-32,text/x-diff,15270,14746,0.0008\nCC-MAIN-2015-32,text/x-patch,102234,101132,0.0056\nCC-MAIN-2015-32,text/x-perl,40711,40695,0.0022\nCC-MAIN-2015-32,text/x-vcalendar,64960,60969,0.0036\nCC-MAIN-2015-32,text/x-vcard,41992,39721,0.0023\nCC-MAIN-2015-32,text/xml,7706521,7474594,0.4245\nCC-MAIN-2015-32,unknown/unknown,182423,156382,0.0100\nCC-MAIN-2015-32,video/mp4,6057,5999,0.0003\nCC-MAIN-2015-32,video/webm,9832,9103,0.0005\nCC-MAIN-2015-32,video/x-ms-asf,223834,219490,0.0123\nCC-MAIN-2015-35,<other>,2344317,2264824,0.1269\nCC-MAIN-2015-35,application/atom+xml,1911959,1895821,0.1035\nCC-MAIN-2015-35,application/calendar,6828,6176,0.0004\nCC-MAIN-2015-35,application/download,40464,39633,0.0022\nCC-MAIN-2015-35,application/epub+zip,43616,3
7729,0.0024\nCC-MAIN-2015-35,application/force-download,22159,20863,0.0012\nCC-MAIN-2015-35,application/gpx+xml,259,259,0.0000\nCC-MAIN-2015-35,application/ics,3488,3488,0.0002\nCC-MAIN-2015-35,application/javascript,650,608,0.0000\nCC-MAIN-2015-35,application/json,318381,306338,0.0172\nCC-MAIN-2015-35,application/ld+json,7088,7087,0.0004\nCC-MAIN-2015-35,application/marc,17980,17980,0.0010\nCC-MAIN-2015-35,application/msword,91358,83463,0.0049\nCC-MAIN-2015-35,application/octet-stream,706775,680734,0.0382\nCC-MAIN-2015-35,application/octetstream,15249,15214,0.0008\nCC-MAIN-2015-35,application/pdf,3088285,2841601,0.1671\nCC-MAIN-2015-35,application/pgp-encrypted,5906,5903,0.0003\nCC-MAIN-2015-35,application/pgp-signature,14685,14634,0.0008\nCC-MAIN-2015-35,application/postscript,7161,7008,0.0004\nCC-MAIN-2015-35,application/rdf+xml,72613,72012,0.0039\nCC-MAIN-2015-35,application/rss+xml,4068129,3816239,0.2201\nCC-MAIN-2015-35,application/rtf,990,954,0.0001\nCC-MAIN-2015-35,application/save-to-disk,40272,40272,0.0022\nCC-MAIN-2015-35,application/text,16853,16389,0.0009\nCC-MAIN-2015-35,application/unknown,8258,8087,0.0004\nCC-MAIN-2015-35,application/vnd.android.package-archive,1389,1350,0.0001\nCC-MAIN-2015-35,application/vnd.google-earth.kml+xml,151617,150995,0.0082\nCC-MAIN-2015-35,application/vnd.google-earth.kmz,37846,37558,0.0020\nCC-MAIN-2015-35,application/vnd.ms-excel,79086,76347,0.0043\nCC-MAIN-2015-35,application/vnd.ms-powerpoint,36497,34071,0.0020\nCC-MAIN-2015-35,application/vnd.ms-word,8053,8039,0.0004\nCC-MAIN-2015-35,application/vnd.oasis.opendocument.text,1831,1716,0.0001\nCC-MAIN-2015-35,application/vnd.openxmlformats-officedocument.presentationml.presentation,3847,3420,0.0002\nCC-MAIN-2015-35,application/vnd.openxmlformats-officedocument.spreadsheetml.sheet,4303,3729,0.0002\nCC-MAIN-2015-35,application/vnd.openxmlformats-officedocument.wordprocessingml.document,24666,21601,0.0013\nCC-MAIN-2015-35,application/vnd.wap.xhtml+xml,44846,44597,0.0024\nC
C-MAIN-2015-35,application/x-bibtex,39141,38062,0.0021\nCC-MAIN-2015-35,application/x-bittorrent,4589,4585,0.0002\nCC-MAIN-2015-35,application/x-debian-package,37300,37223,0.0020\nCC-MAIN-2015-35,application/x-download,14722,14093,0.0008\nCC-MAIN-2015-35,application/x-endnote-refer,43692,43172,0.0024\nCC-MAIN-2015-35,application/x-gzip,33417,32944,0.0018\nCC-MAIN-2015-35,application/x-httpd-php,10719,10374,0.0006\nCC-MAIN-2015-35,application/x-java-jnlp-file,14728,13842,0.0008\nCC-MAIN-2015-35,application/x-javascript,4357,4340,0.0002\nCC-MAIN-2015-35,application/x-json,44444,44444,0.0024\nCC-MAIN-2015-35,application/x-mobipocket-ebook,12069,10109,0.0007\nCC-MAIN-2015-35,application/x-msdownload,2750,2578,0.0001\nCC-MAIN-2015-35,application/x-netcdf,13319,13308,0.0007\nCC-MAIN-2015-35,application/x-research-info-systems,70291,69378,0.0038\nCC-MAIN-2015-35,application/x-shockwave-flash,44219,43998,0.0024\nCC-MAIN-2015-35,application/x-tar,4873,4798,0.0003\nCC-MAIN-2015-35,application/x-tex,16217,16088,0.0009\nCC-MAIN-2015-35,application/x-troff-man,38581,34129,0.0021\nCC-MAIN-2015-35,application/x-zip-compressed,14102,13209,0.0008\nCC-MAIN-2015-35,application/xhtml+xml,1057183,1014766,0.0572\nCC-MAIN-2015-35,application/xml,1344259,1306241,0.0727\nCC-MAIN-2015-35,application/zip,114009,111121,0.0062\nCC-MAIN-2015-35,audio/mpeg,71775,58787,0.0039\nCC-MAIN-2015-35,audio/x-mpegurl,39090,39065,0.0021\nCC-MAIN-2015-35,audio/x-scpls,70502,70423,0.0038\nCC-MAIN-2015-35,audio/x-wav,244905,244748,0.0133\nCC-MAIN-2015-35,binary/octet-stream,6823,6328,0.0004\nCC-MAIN-2015-35,image/gif,666528,662608,0.0361\nCC-MAIN-2015-35,image/jp2,31122,30640,0.0017\nCC-MAIN-2015-35,image/jpeg,8051817,7941491,0.4357\nCC-MAIN-2015-35,image/jpg,123527,123296,0.0067\nCC-MAIN-2015-35,image/pjpeg,37913,36437,0.0021\nCC-MAIN-2015-35,image/png,4297528,4291626,0.2325\nCC-MAIN-2015-35,image/svg+xml,479,453,0.0000\nCC-MAIN-2015-35,image/tiff,40921,40167,0.0022\nCC-MAIN-2015-35,image/vnd.djvu,49930,49617
,0.0027\nCC-MAIN-2015-35,image/webp,84,84,0.0000\nCC-MAIN-2015-35,message/rfc822,17289,16949,0.0009\nCC-MAIN-2015-35,text/calendar,1357351,1323389,0.0734\nCC-MAIN-2015-35,text/css,588,577,0.0000\nCC-MAIN-2015-35,text/csv,98643,94923,0.0053\nCC-MAIN-2015-35,text/directory,5415,5089,0.0003\nCC-MAIN-2015-35,text/enriched,7844,7720,0.0004\nCC-MAIN-2015-35,text/html,1805339707,1631822186,97.6904\nCC-MAIN-2015-35,text/javascript,20953,20736,0.0011\nCC-MAIN-2015-35,text/pdf,16610,16610,0.0009\nCC-MAIN-2015-35,text/plain,3432114,3317167,0.1857\nCC-MAIN-2015-35,text/prs.lines.tag,68,68,0.0000\nCC-MAIN-2015-35,text/tab-separated-values,67143,63632,0.0036\nCC-MAIN-2015-35,text/turtle,8219,8011,0.0004\nCC-MAIN-2015-35,text/vcard,2565,1743,0.0001\nCC-MAIN-2015-35,text/x-bibtex,12325,12258,0.0007\nCC-MAIN-2015-35,text/x-c,4351,4177,0.0002\nCC-MAIN-2015-35,text/x-csrc,18178,18104,0.0010\nCC-MAIN-2015-35,text/x-diff,15556,15014,0.0008\nCC-MAIN-2015-35,text/x-patch,105978,104874,0.0057\nCC-MAIN-2015-35,text/x-perl,42389,42370,0.0023\nCC-MAIN-2015-35,text/x-vcalendar,68179,63940,0.0037\nCC-MAIN-2015-35,text/x-vcard,42312,39720,0.0023\nCC-MAIN-2015-35,text/xml,6951091,6736528,0.3761\nCC-MAIN-2015-35,unknown/unknown,180679,154760,0.0098\nCC-MAIN-2015-35,video/mp4,6208,6139,0.0003\nCC-MAIN-2015-35,video/webm,10255,9469,0.0006\nCC-MAIN-2015-35,video/x-ms-asf,230836,226078,0.0125\nCC-MAIN-2015-40,<other>,2045089,1970273,0.1547\nCC-MAIN-2015-40,application/atom+xml,1394134,1385759,0.1055\nCC-MAIN-2015-40,application/calendar,4383,4160,0.0003\nCC-MAIN-2015-40,application/download,32455,31912,0.0025\nCC-MAIN-2015-40,application/epub+zip,31733,28542,0.0024\nCC-MAIN-2015-40,application/force-download,16041,15259,0.0012\nCC-MAIN-2015-40,application/gpx+xml,242,242,0.0000\nCC-MAIN-2015-40,application/ics,2624,2624,0.0002\nCC-MAIN-2015-40,application/javascript,451,431,0.0000\nCC-MAIN-2015-40,application/json,246716,239582,0.0187\nCC-MAIN-2015-40,application/ld+json,6697,6697,0.0005\nCC-MAIN-2015
-40,application/marc,12105,12105,0.0009\nCC-MAIN-2015-40,application/msword,62536,57900,0.0047\nCC-MAIN-2015-40,application/octet-stream,522892,506064,0.0396\nCC-MAIN-2015-40,application/octetstream,11742,11719,0.0009\nCC-MAIN-2015-40,application/pdf,2218713,2068527,0.1678\nCC-MAIN-2015-40,application/pgp-encrypted,4287,4286,0.0003\nCC-MAIN-2015-40,application/pgp-signature,11552,11530,0.0009\nCC-MAIN-2015-40,application/postscript,4913,4824,0.0004\nCC-MAIN-2015-40,application/rdf+xml,56489,56196,0.0043\nCC-MAIN-2015-40,application/rss+xml,3481554,3317183,0.2634\nCC-MAIN-2015-40,application/rtf,712,694,0.0001\nCC-MAIN-2015-40,application/save-to-disk,28529,28529,0.0022\nCC-MAIN-2015-40,application/text,11862,11633,0.0009\nCC-MAIN-2015-40,application/unknown,5353,5332,0.0004\nCC-MAIN-2015-40,application/vnd.android.package-archive,1170,1149,0.0001\nCC-MAIN-2015-40,application/vnd.google-earth.kml+xml,118362,117769,0.0090\nCC-MAIN-2015-40,application/vnd.google-earth.kmz,30358,30221,0.0023\nCC-MAIN-2015-40,application/vnd.ms-excel,57501,55933,0.0043\nCC-MAIN-2015-40,application/vnd.ms-powerpoint,23391,22455,0.0018\nCC-MAIN-2015-40,application/vnd.ms-word,6336,6323,0.0005\nCC-MAIN-2015-40,application/vnd.oasis.opendocument.text,1391,1330,0.0001\nCC-MAIN-2015-40,application/vnd.openxmlformats-officedocument.presentationml.presentation,2907,2623,0.0002\nCC-MAIN-2015-40,application/vnd.openxmlformats-officedocument.spreadsheetml.sheet,3183,2814,0.0002\nCC-MAIN-2015-40,application/vnd.openxmlformats-officedocument.wordprocessingml.document,18035,16205,0.0014\nCC-MAIN-2015-40,application/vnd.wap.xhtml+xml,30106,29893,0.0023\nCC-MAIN-2015-40,application/x-bibtex,27565,26809,0.0021\nCC-MAIN-2015-40,application/x-bittorrent,3105,3103,0.0002\nCC-MAIN-2015-40,application/x-debian-package,28658,28615,0.0022\nCC-MAIN-2015-40,application/x-download,9915,9900,0.0008\nCC-MAIN-2015-40,application/x-endnote-refer,30595,30318,0.0023\nCC-MAIN-2015-40,application/x-gzip,23358,23131,0.0018
\nCC-MAIN-2015-40,application/x-httpd-php,6796,6582,0.0005\nCC-MAIN-2015-40,application/x-java-jnlp-file,6670,6655,0.0005\nCC-MAIN-2015-40,application/x-javascript,3558,3548,0.0003\nCC-MAIN-2015-40,application/x-json,22445,22445,0.0017\nCC-MAIN-2015-40,application/x-mobipocket-ebook,8625,7712,0.0007\nCC-MAIN-2015-40,application/x-msdownload,1007,895,0.0001\nCC-MAIN-2015-40,application/x-netcdf,11470,11460,0.0009\nCC-MAIN-2015-40,application/x-research-info-systems,56960,56400,0.0043\nCC-MAIN-2015-40,application/x-shockwave-flash,26944,26805,0.0020\nCC-MAIN-2015-40,application/x-tar,3052,3033,0.0002\nCC-MAIN-2015-40,application/x-tex,12932,12846,0.0010\nCC-MAIN-2015-40,application/x-troff-man,26739,24624,0.0020\nCC-MAIN-2015-40,application/x-zip-compressed,10577,10027,0.0008\nCC-MAIN-2015-40,application/xhtml+xml,740343,716204,0.0560\nCC-MAIN-2015-40,application/xml,944292,925292,0.0714\nCC-MAIN-2015-40,application/zip,87844,86414,0.0066\nCC-MAIN-2015-40,audio/mpeg,57204,49290,0.0043\nCC-MAIN-2015-40,audio/x-mpegurl,29554,29538,0.0022\nCC-MAIN-2015-40,audio/x-scpls,47751,47712,0.0036\nCC-MAIN-2015-40,audio/x-wav,173672,173591,0.0131\nCC-MAIN-2015-40,binary/octet-stream,4844,4514,0.0004\nCC-MAIN-2015-40,image/gif,510533,507849,0.0386\nCC-MAIN-2015-40,image/jp2,28599,28433,0.0022\nCC-MAIN-2015-40,image/jpeg,5945602,5874932,0.4497\nCC-MAIN-2015-40,image/jpg,88763,88614,0.0067\nCC-MAIN-2015-40,image/pjpeg,25918,25067,0.0020\nCC-MAIN-2015-40,image/png,3215767,3211817,0.2433\nCC-MAIN-2015-40,image/svg+xml,384,365,0.0000\nCC-MAIN-2015-40,image/tiff,28648,28283,0.0022\nCC-MAIN-2015-40,image/vnd.djvu,34101,33923,0.0026\nCC-MAIN-2015-40,image/webp,69,69,0.0000\nCC-MAIN-2015-40,message/rfc822,11877,11669,0.0009\nCC-MAIN-2015-40,text/calendar,947154,930085,0.0716\nCC-MAIN-2015-40,text/css,384,379,0.0000\nCC-MAIN-2015-40,text/csv,72200,70160,0.0055\nCC-MAIN-2015-40,text/directory,4130,3939,0.0003\nCC-MAIN-2015-40,text/enriched,6206,5930,0.0005\nCC-MAIN-2015-40,text/html,129057284
8,1184479338,97.6237\nCC-MAIN-2015-40,text/javascript,14451,14321,0.0011\nCC-MAIN-2015-40,text/pdf,13859,13859,0.0010\nCC-MAIN-2015-40,text/plain,2473187,2413710,0.1871\nCC-MAIN-2015-40,text/prs.lines.tag,50,50,0.0000\nCC-MAIN-2015-40,text/tab-separated-values,48390,46528,0.0037\nCC-MAIN-2015-40,text/turtle,7387,7280,0.0006\nCC-MAIN-2015-40,text/vcard,1937,1422,0.0001\nCC-MAIN-2015-40,text/x-bibtex,10690,10685,0.0008\nCC-MAIN-2015-40,text/x-c,3108,3022,0.0002\nCC-MAIN-2015-40,text/x-csrc,13429,13382,0.0010\nCC-MAIN-2015-40,text/x-diff,11363,11039,0.0009\nCC-MAIN-2015-40,text/x-patch,77064,76461,0.0058\nCC-MAIN-2015-40,text/x-perl,32938,32931,0.0025\nCC-MAIN-2015-40,text/x-vcalendar,50207,47774,0.0038\nCC-MAIN-2015-40,text/x-vcard,29019,27592,0.0022\nCC-MAIN-2015-40,text/xml,4496974,4396848,0.3402\nCC-MAIN-2015-40,unknown/unknown,128309,113649,0.0097\nCC-MAIN-2015-40,video/mp4,4586,4541,0.0003\nCC-MAIN-2015-40,video/webm,8260,7662,0.0006\nCC-MAIN-2015-40,video/x-ms-asf,155969,153032,0.0118\nCC-MAIN-2015-48,<other>,2721577,2571480,0.1492\nCC-MAIN-2015-48,application/atom+xml,1884123,1869344,0.1033\nCC-MAIN-2015-48,application/calendar,7603,7163,0.0004\nCC-MAIN-2015-48,application/download,44860,43569,0.0025\nCC-MAIN-2015-48,application/epub+zip,45514,39502,0.0025\nCC-MAIN-2015-48,application/force-download,21079,19749,0.0012\nCC-MAIN-2015-48,application/gpx+xml,302,302,0.0000\nCC-MAIN-2015-48,application/ics,3527,3527,0.0002\nCC-MAIN-2015-48,application/javascript,621,576,0.0000\nCC-MAIN-2015-48,application/json,316469,304307,0.0173\nCC-MAIN-2015-48,application/ld+json,8243,8243,0.0005\nCC-MAIN-2015-48,application/marc,17940,17940,0.0010\nCC-MAIN-2015-48,application/msword,87647,80086,0.0048\nCC-MAIN-2015-48,application/octet-stream,1476259,1444917,0.0809\nCC-MAIN-2015-48,application/octetstream,15144,15109,0.0008\nCC-MAIN-2015-48,application/pdf,2898533,2668978,0.1589\nCC-MAIN-2015-48,application/pgp-encrypted,6164,6161,0.0003\nCC-MAIN-2015-48,application/pgp-signatu
re,15500,15455,0.0008\nCC-MAIN-2015-48,application/postscript,7252,7088,0.0004\nCC-MAIN-2015-48,application/rdf+xml,74161,73562,0.0041\nCC-MAIN-2015-48,application/rss+xml,5243127,4925799,0.2874\nCC-MAIN-2015-48,application/rtf,955,913,0.0001\nCC-MAIN-2015-48,application/save-to-disk,32961,32961,0.0018\nCC-MAIN-2015-48,application/text,16838,16453,0.0009\nCC-MAIN-2015-48,application/unknown,7396,7356,0.0004\nCC-MAIN-2015-48,application/vnd.android.package-archive,1690,1647,0.0001\nCC-MAIN-2015-48,application/vnd.google-earth.kml+xml,156888,155623,0.0086\nCC-MAIN-2015-48,application/vnd.google-earth.kmz,37419,37137,0.0021\nCC-MAIN-2015-48,application/vnd.ms-excel,66506,63683,0.0036\nCC-MAIN-2015-48,application/vnd.ms-powerpoint,32490,30435,0.0018\nCC-MAIN-2015-48,application/vnd.ms-word,8139,8123,0.0004\nCC-MAIN-2015-48,application/vnd.oasis.opendocument.text,1796,1680,0.0001\nCC-MAIN-2015-48,application/vnd.openxmlformats-officedocument.presentationml.presentation,3739,3330,0.0002\nCC-MAIN-2015-48,application/vnd.openxmlformats-officedocument.spreadsheetml.sheet,4086,3575,0.0002\nCC-MAIN-2015-48,application/vnd.openxmlformats-officedocument.wordprocessingml.document,23745,20897,0.0013\nCC-MAIN-2015-48,application/vnd.wap.xhtml+xml,43916,43612,0.0024\nCC-MAIN-2015-48,application/x-bibtex,33692,32617,0.0018\nCC-MAIN-2015-48,application/x-bittorrent,4509,4506,0.0002\nCC-MAIN-2015-48,application/x-debian-package,38501,38425,0.0021\nCC-MAIN-2015-48,application/x-download,13484,13453,0.0007\nCC-MAIN-2015-48,application/x-endnote-refer,41991,41545,0.0023\nCC-MAIN-2015-48,application/x-gzip,32777,32458,0.0018\nCC-MAIN-2015-48,application/x-httpd-php,9265,8945,0.0005\nCC-MAIN-2015-48,application/x-java-jnlp-file,9461,9438,0.0005\nCC-MAIN-2015-48,application/x-javascript,4458,4441,0.0002\nCC-MAIN-2015-48,application/x-json,54099,53981,0.0030\nCC-MAIN-2015-48,application/x-mobipocket-ebook,12175,10148,0.0007\nCC-MAIN-2015-48,application/x-msdownload,5291,5107,0.0003\nCC-MAIN-2
015-48,application/x-netcdf,16836,16823,0.0009\nCC-MAIN-2015-48,application/x-research-info-systems,76584,75380,0.0042\nCC-MAIN-2015-48,application/x-shockwave-flash,49601,49404,0.0027\nCC-MAIN-2015-48,application/x-tar,9094,9051,0.0005\nCC-MAIN-2015-48,application/x-tex,16225,16093,0.0009\nCC-MAIN-2015-48,application/x-troff-man,38231,33626,0.0021\nCC-MAIN-2015-48,application/x-zip-compressed,13908,13020,0.0008\nCC-MAIN-2015-48,application/xhtml+xml,1000325,958913,0.0548\nCC-MAIN-2015-48,application/xml,1293430,1251390,0.0709\nCC-MAIN-2015-48,application/zip,109128,106867,0.0060\nCC-MAIN-2015-48,audio/mpeg,66662,54470,0.0037\nCC-MAIN-2015-48,audio/x-mpegurl,39494,39471,0.0022\nCC-MAIN-2015-48,audio/x-scpls,71126,71042,0.0039\nCC-MAIN-2015-48,audio/x-wav,220477,220325,0.0121\nCC-MAIN-2015-48,binary/octet-stream,7303,6743,0.0004\nCC-MAIN-2015-48,image/gif,1021938,1017997,0.0560\nCC-MAIN-2015-48,image/jp2,41979,41581,0.0023\nCC-MAIN-2015-48,image/jpeg,8067933,7949198,0.4423\nCC-MAIN-2015-48,image/jpg,111023,110789,0.0061\nCC-MAIN-2015-48,image/pjpeg,33890,32261,0.0019\nCC-MAIN-2015-48,image/png,4435890,4430075,0.2432\nCC-MAIN-2015-48,image/svg+xml,508,479,0.0000\nCC-MAIN-2015-48,image/tiff,38537,37689,0.0021\nCC-MAIN-2015-48,image/vnd.djvu,50102,49786,0.0027\nCC-MAIN-2015-48,image/webp,83,83,0.0000\nCC-MAIN-2015-48,message/rfc822,17052,16714,0.0009\nCC-MAIN-2015-48,text/calendar,1223500,1199284,0.0671\nCC-MAIN-2015-48,text/css,583,569,0.0000\nCC-MAIN-2015-48,text/csv,93885,90585,0.0051\nCC-MAIN-2015-48,text/directory,5086,4786,0.0003\nCC-MAIN-2015-48,text/enriched,10291,9698,0.0006\nCC-MAIN-2015-48,text/html,1781368298,1602716151,97.6536\nCC-MAIN-2015-48,text/javascript,21031,20788,0.0012\nCC-MAIN-2015-48,text/pdf,31128,31128,0.0017\nCC-MAIN-2015-48,text/plain,3347808,3219492,0.1835\nCC-MAIN-2015-48,text/prs.lines.tag,69,69,0.0000\nCC-MAIN-2015-48,text/tab-separated-values,62677,59574,0.0034\nCC-MAIN-2015-48,text/turtle,9537,9340,0.0005\nCC-MAIN-2015-48,text/vcard,224
2,1574,0.0001\nCC-MAIN-2015-48,text/x-bibtex,12166,12155,0.0007\nCC-MAIN-2015-48,text/x-c,4366,4194,0.0002\nCC-MAIN-2015-48,text/x-csrc,18327,18257,0.0010\nCC-MAIN-2015-48,text/x-diff,15152,14675,0.0008\nCC-MAIN-2015-48,text/x-patch,104622,103774,0.0057\nCC-MAIN-2015-48,text/x-perl,41497,41480,0.0023\nCC-MAIN-2015-48,text/x-vcalendar,47763,45949,0.0026\nCC-MAIN-2015-48,text/x-vcard,41380,38750,0.0023\nCC-MAIN-2015-48,text/xml,4901272,4771217,0.2687\nCC-MAIN-2015-48,unknown/unknown,156223,140872,0.0086\nCC-MAIN-2015-48,video/mp4,6240,6150,0.0003\nCC-MAIN-2015-48,video/webm,10203,9401,0.0006\nCC-MAIN-2015-48,video/x-ms-asf,193910,189210,0.0106\nCC-MAIN-2016-07,<other>,2454516,2296966,0.1416\nCC-MAIN-2016-07,application/atom+xml,1840413,1826051,0.1062\nCC-MAIN-2016-07,application/calendar,7407,7240,0.0004\nCC-MAIN-2016-07,application/download,40609,38262,0.0023\nCC-MAIN-2016-07,application/epub+zip,42751,36829,0.0025\nCC-MAIN-2016-07,application/force-download,19672,18376,0.0011\nCC-MAIN-2016-07,application/gpx+xml,295,295,0.0000\nCC-MAIN-2016-07,application/ics,3484,3484,0.0002\nCC-MAIN-2016-07,application/javascript,625,581,0.0000\nCC-MAIN-2016-07,application/json,387623,366385,0.0224\nCC-MAIN-2016-07,application/ld+json,7835,7835,0.0005\nCC-MAIN-2016-07,application/marc,15098,15098,0.0009\nCC-MAIN-2016-07,application/msword,82105,74698,0.0047\nCC-MAIN-2016-07,application/octet-stream,1337672,1311815,0.0772\nCC-MAIN-2016-07,application/octetstream,15402,15366,0.0009\nCC-MAIN-2016-07,application/pdf,2727331,2511102,0.1574\nCC-MAIN-2016-07,application/pgp-encrypted,22565,22563,0.0013\nCC-MAIN-2016-07,application/pgp-signature,14220,14175,0.0008\nCC-MAIN-2016-07,application/postscript,6747,6589,0.0004\nCC-MAIN-2016-07,application/rdf+xml,71249,70724,0.0041\nCC-MAIN-2016-07,application/rss+xml,5431616,5093288,0.3134\nCC-MAIN-2016-07,application/rtf,819,787,0.0000\nCC-MAIN-2016-07,application/save-to-disk,12345,12345,0.0007\nCC-MAIN-2016-07,application/text,16285,15861,0.
0009\nCC-MAIN-2016-07,application/unknown,7276,6431,0.0004\nCC-MAIN-2016-07,application/vnd.android.package-archive,1662,1618,0.0001\nCC-MAIN-2016-07,application/vnd.google-earth.kml+xml,155668,154412,0.0090\nCC-MAIN-2016-07,application/vnd.google-earth.kmz,37108,36854,0.0021\nCC-MAIN-2016-07,application/vnd.ms-excel,65565,63185,0.0038\nCC-MAIN-2016-07,application/vnd.ms-powerpoint,35184,33012,0.0020\nCC-MAIN-2016-07,application/vnd.ms-word,8078,8062,0.0005\nCC-MAIN-2016-07,application/vnd.oasis.opendocument.text,1670,1560,0.0001\nCC-MAIN-2016-07,application/vnd.openxmlformats-officedocument.presentationml.presentation,3324,2911,0.0002\nCC-MAIN-2016-07,application/vnd.openxmlformats-officedocument.spreadsheetml.sheet,4911,4434,0.0003\nCC-MAIN-2016-07,application/vnd.openxmlformats-officedocument.wordprocessingml.document,22768,19946,0.0013\nCC-MAIN-2016-07,application/vnd.wap.xhtml+xml,43886,43622,0.0025\nCC-MAIN-2016-07,application/x-bibtex,36383,35845,0.0021\nCC-MAIN-2016-07,application/x-bittorrent,3866,3863,0.0002\nCC-MAIN-2016-07,application/x-debian-package,37340,37277,0.0022\nCC-MAIN-2016-07,application/x-download,12232,12201,0.0007\nCC-MAIN-2016-07,application/x-endnote-refer,44644,44180,0.0026\nCC-MAIN-2016-07,application/x-gzip,37883,37035,0.0022\nCC-MAIN-2016-07,application/x-httpd-php,9763,9488,0.0006\nCC-MAIN-2016-07,application/x-java-jnlp-file,9342,9321,0.0005\nCC-MAIN-2016-07,application/x-javascript,3207,3191,0.0002\nCC-MAIN-2016-07,application/x-json,47080,46969,0.0027\nCC-MAIN-2016-07,application/x-mobipocket-ebook,12036,10080,0.0007\nCC-MAIN-2016-07,application/x-msdownload,5258,5076,0.0003\nCC-MAIN-2016-07,application/x-netcdf,16998,16983,0.0010\nCC-MAIN-2016-07,application/x-research-info-systems,73882,72902,0.0043\nCC-MAIN-2016-07,application/x-shockwave-flash,42849,42650,0.0025\nCC-MAIN-2016-07,application/x-tar,8474,8426,0.0005\nCC-MAIN-2016-07,application/x-tex,16035,15916,0.0009\nCC-MAIN-2016-07,application/x-troff-man,36871,32377,0.0021\n
CC-MAIN-2016-07,application/x-zip-compressed,13147,12392,0.0008\nCC-MAIN-2016-07,application/xhtml+xml,1040903,1002452,0.0601\nCC-MAIN-2016-07,application/xml,1175673,1137137,0.0678\nCC-MAIN-2016-07,application/zip,101263,99696,0.0058\nCC-MAIN-2016-07,audio/mpeg,66871,54885,0.0039\nCC-MAIN-2016-07,audio/x-mpegurl,27784,27762,0.0016\nCC-MAIN-2016-07,audio/x-scpls,70897,70811,0.0041\nCC-MAIN-2016-07,audio/x-wav,224004,223863,0.0129\nCC-MAIN-2016-07,binary/octet-stream,7273,6746,0.0004\nCC-MAIN-2016-07,image/gif,947248,942895,0.0547\nCC-MAIN-2016-07,image/jp2,36254,35794,0.0021\nCC-MAIN-2016-07,image/jpeg,7396703,7274620,0.4267\nCC-MAIN-2016-07,image/jpg,112322,112094,0.0065\nCC-MAIN-2016-07,image/pjpeg,34944,33345,0.0020\nCC-MAIN-2016-07,image/png,4268192,4263164,0.2462\nCC-MAIN-2016-07,image/svg+xml,485,458,0.0000\nCC-MAIN-2016-07,image/tiff,34740,33989,0.0020\nCC-MAIN-2016-07,image/vnd.djvu,49254,48942,0.0028\nCC-MAIN-2016-07,image/webp,84,84,0.0000\nCC-MAIN-2016-07,message/rfc822,16513,16242,0.0010\nCC-MAIN-2016-07,text/calendar,1196133,1166961,0.0690\nCC-MAIN-2016-07,text/css,548,533,0.0000\nCC-MAIN-2016-07,text/csv,94875,91176,0.0055\nCC-MAIN-2016-07,text/directory,5005,4649,0.0003\nCC-MAIN-2016-07,text/enriched,9927,9361,0.0006\nCC-MAIN-2016-07,text/html,1692652107,1520893306,97.6557\nCC-MAIN-2016-07,text/javascript,15883,15665,0.0009\nCC-MAIN-2016-07,text/pdf,30454,30454,0.0018\nCC-MAIN-2016-07,text/plain,3164912,3053579,0.1826\nCC-MAIN-2016-07,text/prs.lines.tag,67,67,0.0000\nCC-MAIN-2016-07,text/tab-separated-values,64444,61051,0.0037\nCC-MAIN-2016-07,text/turtle,8870,8674,0.0005\nCC-MAIN-2016-07,text/vcard,2266,1607,0.0001\nCC-MAIN-2016-07,text/x-bibtex,12250,12239,0.0007\nCC-MAIN-2016-07,text/x-c,4274,4101,0.0002\nCC-MAIN-2016-07,text/x-csrc,18587,18460,0.0011\nCC-MAIN-2016-07,text/x-diff,15802,15280,0.0009\nCC-MAIN-2016-07,text/x-patch,105646,104628,0.0061\nCC-MAIN-2016-07,text/x-perl,15189,15174,0.0009\nCC-MAIN-2016-07,text/x-vcalendar,47260,45625,0.0027\
nCC-MAIN-2016-07,text/x-vcard,38944,36625,0.0022\nCC-MAIN-2016-07,text/xml,4370706,4253197,0.2522\nCC-MAIN-2016-07,unknown/unknown,146077,123957,0.0084\nCC-MAIN-2016-07,video/mp4,6285,6181,0.0004\nCC-MAIN-2016-07,video/webm,10184,9373,0.0006\nCC-MAIN-2016-07,video/x-ms-asf,223946,219935,0.0129\nCC-MAIN-2016-18,<other>,2195885,2195885,0.1645\nCC-MAIN-2016-18,application/atom+xml,1768306,1768306,0.1325\nCC-MAIN-2016-18,application/calendar,6948,6948,0.0005\nCC-MAIN-2016-18,application/download,15446,15446,0.0012\nCC-MAIN-2016-18,application/epub+zip,35490,35490,0.0027\nCC-MAIN-2016-18,application/force-download,15159,15159,0.0011\nCC-MAIN-2016-18,application/gpx+xml,294,294,0.0000\nCC-MAIN-2016-18,application/ics,3504,3504,0.0003\nCC-MAIN-2016-18,application/javascript,687,687,0.0001\nCC-MAIN-2016-18,application/json,343899,343899,0.0258\nCC-MAIN-2016-18,application/ld+json,7845,7845,0.0006\nCC-MAIN-2016-18,application/marc,14348,14348,0.0011\nCC-MAIN-2016-18,application/msword,66067,66067,0.0049\nCC-MAIN-2016-18,application/octet-stream,1843360,1843360,0.1381\nCC-MAIN-2016-18,application/octetstream,13960,13960,0.0010\nCC-MAIN-2016-18,application/pdf,2285417,2285417,0.1712\nCC-MAIN-2016-18,application/pgp-encrypted,70347,70347,0.0053\nCC-MAIN-2016-18,application/pgp-signature,15735,15735,0.0012\nCC-MAIN-2016-18,application/postscript,5776,5776,0.0004\nCC-MAIN-2016-18,application/rdf+xml,68226,68226,0.0051\nCC-MAIN-2016-18,application/rss+xml,4863206,4863206,0.3643\nCC-MAIN-2016-18,application/rtf,568,568,0.0000\nCC-MAIN-2016-18,application/save-to-disk,4873,4873,0.0004\nCC-MAIN-2016-18,application/text,14482,14482,0.0011\nCC-MAIN-2016-18,application/unknown,2735,2735,0.0002\nCC-MAIN-2016-18,application/vnd.android.package-archive,1247,1247,0.0001\nCC-MAIN-2016-18,application/vnd.google-earth.kml+xml,156349,156349,0.0117\nCC-MAIN-2016-18,application/vnd.google-earth.kmz,35936,35936,0.0027\nCC-MAIN-2016-18,application/vnd.ms-excel,45279,45279,0.0034\nCC-MAIN-2016-18,ap
plication/vnd.ms-powerpoint,11845,11845,0.0009\nCC-MAIN-2016-18,application/vnd.ms-word,11176,11176,0.0008\nCC-MAIN-2016-18,application/vnd.oasis.opendocument.text,1484,1484,0.0001\nCC-MAIN-2016-18,application/vnd.openxmlformats-officedocument.presentationml.presentation,2681,2681,0.0002\nCC-MAIN-2016-18,application/vnd.openxmlformats-officedocument.spreadsheetml.sheet,4245,4245,0.0003\nCC-MAIN-2016-18,application/vnd.openxmlformats-officedocument.wordprocessingml.document,18123,18123,0.0014\nCC-MAIN-2016-18,application/vnd.wap.xhtml+xml,43861,43861,0.0033\nCC-MAIN-2016-18,application/x-bibtex,35683,35683,0.0027\nCC-MAIN-2016-18,application/x-bittorrent,1202,1202,0.0001\nCC-MAIN-2016-18,application/x-debian-package,36132,36132,0.0027\nCC-MAIN-2016-18,application/x-download,10377,10377,0.0008\nCC-MAIN-2016-18,application/x-endnote-refer,42063,42063,0.0032\nCC-MAIN-2016-18,application/x-gzip,37385,37385,0.0028\nCC-MAIN-2016-18,application/x-httpd-php,9908,9908,0.0007\nCC-MAIN-2016-18,application/x-java-jnlp-file,9347,9347,0.0007\nCC-MAIN-2016-18,application/x-javascript,3123,3123,0.0002\nCC-MAIN-2016-18,application/x-json,95,95,0.0000\nCC-MAIN-2016-18,application/x-mobipocket-ebook,9170,9170,0.0007\nCC-MAIN-2016-18,application/x-msdownload,4400,4400,0.0003\nCC-MAIN-2016-18,application/x-netcdf,16054,16054,0.0012\nCC-MAIN-2016-18,application/x-research-info-systems,38995,38995,0.0029\nCC-MAIN-2016-18,application/x-shockwave-flash,2915,2915,0.0002\nCC-MAIN-2016-18,application/x-tar,7060,7060,0.0005\nCC-MAIN-2016-18,application/x-tex,15847,15847,0.0012\nCC-MAIN-2016-18,application/x-troff-man,29111,29111,0.0022\nCC-MAIN-2016-18,application/x-zip-compressed,11412,11412,0.0009\nCC-MAIN-2016-18,application/xhtml+xml,888924,888924,0.0666\nCC-MAIN-2016-18,application/xml,1006490,1006490,0.0754\nCC-MAIN-2016-18,application/zip,68561,68561,0.0051\nCC-MAIN-2016-18,audio/mpeg,49785,49785,0.0037\nCC-MAIN-2016-18,audio/x-mpegurl,29956,29956,0.0022\nCC-MAIN-2016-18,audio/x-scpls,698
79,69879,0.0052\nCC-MAIN-2016-18,audio/x-wav,171179,171179,0.0128\nCC-MAIN-2016-18,binary/octet-stream,7502,7502,0.0006\nCC-MAIN-2016-18,image/gif,926740,926740,0.0694\nCC-MAIN-2016-18,image/jp2,41327,41327,0.0031\nCC-MAIN-2016-18,image/jpeg,6636869,6636869,0.4971\nCC-MAIN-2016-18,image/jpg,112538,112538,0.0084\nCC-MAIN-2016-18,image/pjpeg,33023,33023,0.0025\nCC-MAIN-2016-18,image/png,4240410,4240410,0.3176\nCC-MAIN-2016-18,image/svg+xml,434,434,0.0000\nCC-MAIN-2016-18,image/tiff,14070,14070,0.0011\nCC-MAIN-2016-18,image/vnd.djvu,45354,45354,0.0034\nCC-MAIN-2016-18,image/webp,82,82,0.0000\nCC-MAIN-2016-18,message/rfc822,15392,15392,0.0012\nCC-MAIN-2016-18,text/calendar,1111187,1111187,0.0832\nCC-MAIN-2016-18,text/css,573,573,0.0000\nCC-MAIN-2016-18,text/csv,84142,84142,0.0063\nCC-MAIN-2016-18,text/directory,4622,4622,0.0003\nCC-MAIN-2016-18,text/enriched,7848,7848,0.0006\nCC-MAIN-2016-18,text/html,1298313206,1298313206,97.2485\nCC-MAIN-2016-18,text/javascript,13360,13360,0.0010\nCC-MAIN-2016-18,text/pdf,30807,30807,0.0023\nCC-MAIN-2016-18,text/plain,2759169,2759169,0.2067\nCC-MAIN-2016-18,text/prs.lines.tag,70,70,0.0000\nCC-MAIN-2016-18,text/tab-separated-values,54916,54916,0.0041\nCC-MAIN-2016-18,text/turtle,8634,8634,0.0006\nCC-MAIN-2016-18,text/vcard,1763,1763,0.0001\nCC-MAIN-2016-18,text/x-bibtex,19139,19139,0.0014\nCC-MAIN-2016-18,text/x-c,3965,3965,0.0003\nCC-MAIN-2016-18,text/x-csrc,18179,18179,0.0014\nCC-MAIN-2016-18,text/x-diff,14797,14797,0.0011\nCC-MAIN-2016-18,text/x-patch,98875,98875,0.0074\nCC-MAIN-2016-18,text/x-perl,23549,23549,0.0018\nCC-MAIN-2016-18,text/x-vcalendar,41121,41121,0.0031\nCC-MAIN-2016-18,text/x-vcard,36142,36142,0.0027\nCC-MAIN-2016-18,text/xml,3377012,3377012,0.2530\nCC-MAIN-2016-18,unknown/unknown,87990,87990,0.0066\nCC-MAIN-2016-18,video/mp4,6046,6046,0.0005\nCC-MAIN-2016-18,video/webm,9071,9071,0.0007\nCC-MAIN-2016-18,video/x-ms-asf,247157,247157,0.0185\nCC-MAIN-2016-22,<other>,2301554,2301554,0.1570\nCC-MAIN-2016-22,application/a
tom+xml,1768320,1768320,0.1206\nCC-MAIN-2016-22,application/calendar,6817,6817,0.0005\nCC-MAIN-2016-22,application/download,15821,15821,0.0011\nCC-MAIN-2016-22,application/epub+zip,31467,31467,0.0021\nCC-MAIN-2016-22,application/force-download,16671,16671,0.0011\nCC-MAIN-2016-22,application/gpx+xml,194,194,0.0000\nCC-MAIN-2016-22,application/ics,3495,3495,0.0002\nCC-MAIN-2016-22,application/javascript,804,804,0.0001\nCC-MAIN-2016-22,application/json,323473,323473,0.0221\nCC-MAIN-2016-22,application/ld+json,7771,7771,0.0005\nCC-MAIN-2016-22,application/marc,15079,15079,0.0010\nCC-MAIN-2016-22,application/msword,576352,576352,0.0393\nCC-MAIN-2016-22,application/octet-stream,2219528,2219528,0.1514\nCC-MAIN-2016-22,application/octetstream,15517,15517,0.0011\nCC-MAIN-2016-22,application/pdf,3687625,3687625,0.2515\nCC-MAIN-2016-22,application/pgp-encrypted,69157,69157,0.0047\nCC-MAIN-2016-22,application/pgp-signature,17127,17127,0.0012\nCC-MAIN-2016-22,application/postscript,8048,8048,0.0005\nCC-MAIN-2016-22,application/rdf+xml,67831,67831,0.0046\nCC-MAIN-2016-22,application/rss+xml,4891492,4891492,0.3336\nCC-MAIN-2016-22,application/rtf,2212,2212,0.0002\nCC-MAIN-2016-22,application/save-to-disk,5250,5250,0.0004\nCC-MAIN-2016-22,application/text,13510,13510,0.0009\nCC-MAIN-2016-22,application/unknown,2869,2869,0.0002\nCC-MAIN-2016-22,application/vnd.android.package-archive,1439,1439,0.0001\nCC-MAIN-2016-22,application/vnd.google-earth.kml+xml,285282,285282,0.0195\nCC-MAIN-2016-22,application/vnd.google-earth.kmz,38222,38222,0.0026\nCC-MAIN-2016-22,application/vnd.ms-excel,162044,162044,0.0111\nCC-MAIN-2016-22,application/vnd.ms-powerpoint,125903,125903,0.0086\nCC-MAIN-2016-22,application/vnd.ms-word,11711,11711,0.0008\nCC-MAIN-2016-22,application/vnd.oasis.opendocument.text,1605,1605,0.0001\nCC-MAIN-2016-22,application/vnd.openxmlformats-officedocument.presentationml.presentation,3389,3389,0.0002\nCC-MAIN-2016-22,application/vnd.openxmlformats-officedocument.spreadsheetml
.sheet,5740,5740,0.0004\nCC-MAIN-2016-22,application/vnd.openxmlformats-officedocument.wordprocessingml.document,21861,21861,0.0015\nCC-MAIN-2016-22,application/vnd.wap.xhtml+xml,43763,43763,0.0030\nCC-MAIN-2016-22,application/x-bibtex,23639,23639,0.0016\nCC-MAIN-2016-22,application/x-bittorrent,870,870,0.0001\nCC-MAIN-2016-22,application/x-debian-package,36166,36166,0.0025\nCC-MAIN-2016-22,application/x-download,10768,10768,0.0007\nCC-MAIN-2016-22,application/x-endnote-refer,28673,28673,0.0020\nCC-MAIN-2016-22,application/x-gzip,38998,38998,0.0027\nCC-MAIN-2016-22,application/x-httpd-php,32441,32441,0.0022\nCC-MAIN-2016-22,application/x-java-jnlp-file,9413,9413,0.0006\nCC-MAIN-2016-22,application/x-javascript,3319,3319,0.0002\nCC-MAIN-2016-22,application/x-json,94,94,0.0000\nCC-MAIN-2016-22,application/x-mobipocket-ebook,7105,7105,0.0005\nCC-MAIN-2016-22,application/x-msdownload,9085,9085,0.0006\nCC-MAIN-2016-22,application/x-netcdf,11074,11074,0.0008\nCC-MAIN-2016-22,application/x-research-info-systems,27869,27869,0.0019\nCC-MAIN-2016-22,application/x-shockwave-flash,19424,19424,0.0013\nCC-MAIN-2016-22,application/x-tar,7743,7743,0.0005\nCC-MAIN-2016-22,application/x-tex,15758,15758,0.0011\nCC-MAIN-2016-22,application/x-troff-man,30657,30657,0.0021\nCC-MAIN-2016-22,application/x-zip-compressed,22768,22768,0.0016\nCC-MAIN-2016-22,application/xhtml+xml,926057,926057,0.0632\nCC-MAIN-2016-22,application/xml,980236,980236,0.0669\nCC-MAIN-2016-22,application/zip,90892,90892,0.0062\nCC-MAIN-2016-22,audio/mpeg,96927,96927,0.0066\nCC-MAIN-2016-22,audio/x-mpegurl,30981,30981,0.0021\nCC-MAIN-2016-22,audio/x-scpls,68357,68357,0.0047\nCC-MAIN-2016-22,audio/x-wav,145015,145015,0.0099\nCC-MAIN-2016-22,binary/octet-stream,7575,7575,0.0005\nCC-MAIN-2016-22,image/gif,899655,899655,0.0614\nCC-MAIN-2016-22,image/jp2,39585,39585,0.0027\nCC-MAIN-2016-22,image/jpeg,9606892,9606892,0.6552\nCC-MAIN-2016-22,image/jpg,126744,126744,0.0086\nCC-MAIN-2016-22,image/pjpeg,32303,32303,0.0022\nCC-
MAIN-2016-22,image/png,4385118,4385118,0.2991\nCC-MAIN-2016-22,image/svg+xml,507,507,0.0000\nCC-MAIN-2016-22,image/tiff,16854,16854,0.0011\nCC-MAIN-2016-22,image/vnd.djvu,6441,6441,0.0004\nCC-MAIN-2016-22,image/webp,82,82,0.0000\nCC-MAIN-2016-22,message/rfc822,15186,15186,0.0010\nCC-MAIN-2016-22,text/calendar,1032325,1032325,0.0704\nCC-MAIN-2016-22,text/css,706,706,0.0000\nCC-MAIN-2016-22,text/csv,73971,73971,0.0050\nCC-MAIN-2016-22,text/directory,4349,4349,0.0003\nCC-MAIN-2016-22,text/enriched,7165,7165,0.0005\nCC-MAIN-2016-22,text/html,1423652589,1423652589,97.0967\nCC-MAIN-2016-22,text/javascript,12745,12745,0.0009\nCC-MAIN-2016-22,text/pdf,33107,33107,0.0023\nCC-MAIN-2016-22,text/plain,2821340,2821340,0.1924\nCC-MAIN-2016-22,text/prs.lines.tag,75,75,0.0000\nCC-MAIN-2016-22,text/tab-separated-values,57491,57491,0.0039\nCC-MAIN-2016-22,text/turtle,8546,8546,0.0006\nCC-MAIN-2016-22,text/vcard,1703,1703,0.0001\nCC-MAIN-2016-22,text/x-bibtex,23226,23226,0.0016\nCC-MAIN-2016-22,text/x-c,4047,4047,0.0003\nCC-MAIN-2016-22,text/x-csrc,18379,18379,0.0013\nCC-MAIN-2016-22,text/x-diff,13874,13874,0.0009\nCC-MAIN-2016-22,text/x-patch,102079,102079,0.0070\nCC-MAIN-2016-22,text/x-perl,21999,21999,0.0015\nCC-MAIN-2016-22,text/x-vcalendar,43952,43952,0.0030\nCC-MAIN-2016-22,text/x-vcard,35256,35256,0.0024\nCC-MAIN-2016-22,text/xml,3324638,3324638,0.2267\nCC-MAIN-2016-22,unknown/unknown,92683,92683,0.0063\nCC-MAIN-2016-22,video/mp4,29976,29976,0.0020\nCC-MAIN-2016-22,video/webm,9289,9289,0.0006\nCC-MAIN-2016-22,video/x-ms-asf,215074,215074,0.0147\nCC-MAIN-2016-26,<other>,1909876,1909876,0.1544\nCC-MAIN-2016-26,application/atom+xml,1655623,1655623,0.1339\nCC-MAIN-2016-26,application/calendar,6541,6541,0.0005\nCC-MAIN-2016-26,application/download,11740,11740,0.0009\nCC-MAIN-2016-26,application/epub+zip,25486,25486,0.0021\nCC-MAIN-2016-26,application/force-download,15965,15965,0.0013\nCC-MAIN-2016-26,application/gpx+xml,203,203,0.0000\nCC-MAIN-2016-26,application/ics,3515,3515,0.000
3\nCC-MAIN-2016-26,application/javascript,774,774,0.0001\nCC-MAIN-2016-26,application/json,309305,309305,0.0250\nCC-MAIN-2016-26,application/ld+json,9,9,0.0000\nCC-MAIN-2016-26,application/marc,18733,18733,0.0015\nCC-MAIN-2016-26,application/msword,71700,71700,0.0058\nCC-MAIN-2016-26,application/octet-stream,2336120,2336120,0.1889\nCC-MAIN-2016-26,application/octetstream,15483,15483,0.0013\nCC-MAIN-2016-26,application/pdf,3273925,3273925,0.2647\nCC-MAIN-2016-26,application/pgp-encrypted,68854,68854,0.0056\nCC-MAIN-2016-26,application/pgp-signature,13007,13007,0.0011\nCC-MAIN-2016-26,application/postscript,5630,5630,0.0005\nCC-MAIN-2016-26,application/rdf+xml,66546,66546,0.0054\nCC-MAIN-2016-26,application/rss+xml,4053207,4053207,0.3277\nCC-MAIN-2016-26,application/rtf,2115,2115,0.0002\nCC-MAIN-2016-26,application/save-to-disk,5248,5248,0.0004\nCC-MAIN-2016-26,application/text,12003,12003,0.0010\nCC-MAIN-2016-26,application/unknown,2710,2710,0.0002\nCC-MAIN-2016-26,application/vnd.android.package-archive,1334,1334,0.0001\nCC-MAIN-2016-26,application/vnd.google-earth.kml+xml,157098,157098,0.0127\nCC-MAIN-2016-26,application/vnd.google-earth.kmz,37603,37603,0.0030\nCC-MAIN-2016-26,application/vnd.ms-excel,38838,38838,0.0031\nCC-MAIN-2016-26,application/vnd.ms-powerpoint,14043,14043,0.0011\nCC-MAIN-2016-26,application/vnd.ms-word,11587,11587,0.0009\nCC-MAIN-2016-26,application/vnd.oasis.opendocument.text,1423,1423,0.0001\nCC-MAIN-2016-26,application/vnd.openxmlformats-officedocument.presentationml.presentation,2613,2613,0.0002\nCC-MAIN-2016-26,application/vnd.openxmlformats-officedocument.spreadsheetml.sheet,4595,4595,0.0004\nCC-MAIN-2016-26,application/vnd.openxmlformats-officedocument.wordprocessingml.document,18419,18419,0.0015\nCC-MAIN-2016-26,application/vnd.wap.xhtml+xml,42438,42438,0.0034\nCC-MAIN-2016-26,application/x-bibtex,22256,22256,0.0018\nCC-MAIN-2016-26,application/x-bittorrent,813,813,0.0001\nCC-MAIN-2016-26,application/x-debian-package,32309,32309,0.002
6\nCC-MAIN-2016-26,application/x-download,10615,10615,0.0009\nCC-MAIN-2016-26,application/x-endnote-refer,24598,24598,0.0020\nCC-MAIN-2016-26,application/x-gzip,8869,8869,0.0007\nCC-MAIN-2016-26,application/x-httpd-php,32325,32325,0.0026\nCC-MAIN-2016-26,application/x-java-jnlp-file,9734,9734,0.0008\nCC-MAIN-2016-26,application/x-javascript,10722,10722,0.0009\nCC-MAIN-2016-26,application/x-json,95,95,0.0000\nCC-MAIN-2016-26,application/x-mobipocket-ebook,4625,4625,0.0004\nCC-MAIN-2016-26,application/x-msdownload,4577,4577,0.0004\nCC-MAIN-2016-26,application/x-netcdf,10856,10856,0.0009\nCC-MAIN-2016-26,application/x-research-info-systems,24931,24931,0.0020\nCC-MAIN-2016-26,application/x-shockwave-flash,8402,8402,0.0007\nCC-MAIN-2016-26,application/x-tar,2694,2694,0.0002\nCC-MAIN-2016-26,application/x-tex,13965,13965,0.0011\nCC-MAIN-2016-26,application/x-troff-man,27591,27591,0.0022\nCC-MAIN-2016-26,application/x-zip-compressed,13815,13815,0.0011\nCC-MAIN-2016-26,application/xhtml+xml,862947,862947,0.0698\nCC-MAIN-2016-26,application/xml,958782,958782,0.0775\nCC-MAIN-2016-26,application/zip,71482,71482,0.0058\nCC-MAIN-2016-26,audio/mpeg,76694,76694,0.0062\nCC-MAIN-2016-26,audio/x-mpegurl,28501,28501,0.0023\nCC-MAIN-2016-26,audio/x-scpls,68606,68606,0.0055\nCC-MAIN-2016-26,audio/x-wav,140420,140420,0.0114\nCC-MAIN-2016-26,binary/octet-stream,6553,6553,0.0005\nCC-MAIN-2016-26,image/gif,915870,915870,0.0741\nCC-MAIN-2016-26,image/jp2,41149,41149,0.0033\nCC-MAIN-2016-26,image/jpeg,9120813,9120813,0.7374\nCC-MAIN-2016-26,image/jpg,115130,115130,0.0093\nCC-MAIN-2016-26,image/pjpeg,31521,31521,0.0025\nCC-MAIN-2016-26,image/png,4342103,4342103,0.3511\nCC-MAIN-2016-26,image/svg+xml,507,507,0.0000\nCC-MAIN-2016-26,image/tiff,13686,13686,0.0011\nCC-MAIN-2016-26,image/vnd.djvu,3255,3255,0.0003\nCC-MAIN-2016-26,image/webp,82,82,0.0000\nCC-MAIN-2016-26,message/rfc822,8649,8649,0.0007\nCC-MAIN-2016-26,text/calendar,979591,979591,0.0792\nCC-MAIN-2016-26,text/css,679,679,0.0001\nCC-MA
IN-2016-26,text/csv,54989,54989,0.0044\nCC-MAIN-2016-26,text/directory,3982,3982,0.0003\nCC-MAIN-2016-26,text/enriched,4705,4705,0.0004\nCC-MAIN-2016-26,text/html,1198156764,1198156764,96.8743\nCC-MAIN-2016-26,text/javascript,12324,12324,0.0010\nCC-MAIN-2016-26,text/pdf,37638,37638,0.0030\nCC-MAIN-2016-26,text/plain,2446487,2446487,0.1978\nCC-MAIN-2016-26,text/prs.lines.tag,64,64,0.0000\nCC-MAIN-2016-26,text/tab-separated-values,43608,43608,0.0035\nCC-MAIN-2016-26,text/turtle,1081,1081,0.0001\nCC-MAIN-2016-26,text/vcard,1679,1679,0.0001\nCC-MAIN-2016-26,text/x-bibtex,22857,22857,0.0018\nCC-MAIN-2016-26,text/x-c,3676,3676,0.0003\nCC-MAIN-2016-26,text/x-csrc,17092,17092,0.0014\nCC-MAIN-2016-26,text/x-diff,8508,8508,0.0007\nCC-MAIN-2016-26,text/x-patch,87310,87310,0.0071\nCC-MAIN-2016-26,text/x-perl,23742,23742,0.0019\nCC-MAIN-2016-26,text/x-vcalendar,41304,41304,0.0033\nCC-MAIN-2016-26,text/x-vcard,30340,30340,0.0025\nCC-MAIN-2016-26,text/xml,3266988,3266988,0.2641\nCC-MAIN-2016-26,unknown/unknown,2219,2219,0.0002\nCC-MAIN-2016-26,video/mp4,27184,27184,0.0022\nCC-MAIN-2016-26,video/webm,7444,7444,0.0006\nCC-MAIN-2016-26,video/x-ms-asf,248554,248554,0.0201\nCC-MAIN-2016-30,<other>,2458570,2364554,0.1415\nCC-MAIN-2016-30,application/atom+xml,1788425,1775938,0.1029\nCC-MAIN-2016-30,application/calendar,7382,7226,0.0004\nCC-MAIN-2016-30,application/download,40564,39572,0.0023\nCC-MAIN-2016-30,application/epub+zip,33945,32912,0.0020\nCC-MAIN-2016-30,application/force-download,19975,19445,0.0011\nCC-MAIN-2016-30,application/gpx+xml,209,209,0.0000\nCC-MAIN-2016-30,application/ics,3408,3408,0.0002\nCC-MAIN-2016-30,application/javascript,916,865,0.0001\nCC-MAIN-2016-30,application/json,416939,397107,0.0240\nCC-MAIN-2016-30,application/ld+json,9827,9827,0.0006\nCC-MAIN-2016-30,application/marc,16661,16661,0.0010\nCC-MAIN-2016-30,application/msword,96041,92203,0.0055\nCC-MAIN-2016-30,application/octet-stream,2423927,2391470,0.1395\nCC-MAIN-2016-30,application/octetstream,15512,1
5485,0.0009\nCC-MAIN-2016-30,application/pdf,3940996,3797986,0.2268\nCC-MAIN-2016-30,application/pgp-encrypted,70929,70918,0.0041\nCC-MAIN-2016-30,application/pgp-signature,21648,20498,0.0012\nCC-MAIN-2016-30,application/postscript,8945,8782,0.0005\nCC-MAIN-2016-30,application/rdf+xml,84246,83681,0.0048\nCC-MAIN-2016-30,application/rss+xml,5666218,5409178,0.3261\nCC-MAIN-2016-30,application/rtf,2306,2290,0.0001\nCC-MAIN-2016-30,application/save-to-disk,5136,5136,0.0003\nCC-MAIN-2016-30,application/text,16645,16310,0.0010\nCC-MAIN-2016-30,application/unknown,2958,2934,0.0002\nCC-MAIN-2016-30,application/vnd.android.package-archive,1590,1565,0.0001\nCC-MAIN-2016-30,application/vnd.google-earth.kml+xml,158179,157827,0.0091\nCC-MAIN-2016-30,application/vnd.google-earth.kmz,39249,39035,0.0023\nCC-MAIN-2016-30,application/vnd.ms-excel,65412,64251,0.0038\nCC-MAIN-2016-30,application/vnd.ms-powerpoint,23192,21794,0.0013\nCC-MAIN-2016-30,application/vnd.ms-word,13345,13256,0.0008\nCC-MAIN-2016-30,application/vnd.oasis.opendocument.text,1855,1785,0.0001\nCC-MAIN-2016-30,application/vnd.openxmlformats-officedocument.presentationml.presentation,4298,4082,0.0002\nCC-MAIN-2016-30,application/vnd.openxmlformats-officedocument.spreadsheetml.sheet,6770,6297,0.0004\nCC-MAIN-2016-30,application/vnd.openxmlformats-officedocument.wordprocessingml.document,25479,23850,0.0015\nCC-MAIN-2016-30,application/vnd.wap.xhtml+xml,44345,44224,0.0026\nCC-MAIN-2016-30,application/x-bibtex,25132,25132,0.0014\nCC-MAIN-2016-30,application/x-bittorrent,874,868,0.0001\nCC-MAIN-2016-30,application/x-debian-package,25492,25453,0.0015\nCC-MAIN-2016-30,application/x-download,11441,11415,0.0007\nCC-MAIN-2016-30,application/x-endnote-refer,32958,32558,0.0019\nCC-MAIN-2016-30,application/x-gzip,12118,11893,0.0007\nCC-MAIN-2016-30,application/x-httpd-php,37105,36923,0.0021\nCC-MAIN-2016-30,application/x-java-jnlp-file,9928,9893,0.0006\nCC-MAIN-2016-30,application/x-javascript,16310,16293,0.0009\nCC-MAIN-2016-30,
application/x-json,95,95,0.0000\nCC-MAIN-2016-30,application/x-mobipocket-ebook,8436,7680,0.0005\nCC-MAIN-2016-30,application/x-msdownload,9906,9773,0.0006\nCC-MAIN-2016-30,application/x-netcdf,11775,11771,0.0007\nCC-MAIN-2016-30,application/x-research-info-systems,64046,63277,0.0037\nCC-MAIN-2016-30,application/x-shockwave-flash,53790,53654,0.0031\nCC-MAIN-2016-30,application/x-tar,8527,8480,0.0005\nCC-MAIN-2016-30,application/x-tex,16031,15938,0.0009\nCC-MAIN-2016-30,application/x-troff-man,35703,31059,0.0021\nCC-MAIN-2016-30,application/x-zip-compressed,22760,22577,0.0013\nCC-MAIN-2016-30,application/xhtml+xml,1231960,1198924,0.0709\nCC-MAIN-2016-30,application/xml,1298621,1272622,0.0747\nCC-MAIN-2016-30,application/zip,140247,138930,0.0081\nCC-MAIN-2016-30,audio/mpeg,108859,101353,0.0063\nCC-MAIN-2016-30,audio/x-mpegurl,41762,40354,0.0024\nCC-MAIN-2016-30,audio/x-scpls,70295,70150,0.0040\nCC-MAIN-2016-30,audio/x-wav,143800,143789,0.0083\nCC-MAIN-2016-30,binary/octet-stream,9147,8627,0.0005\nCC-MAIN-2016-30,image/gif,1034362,1032898,0.0595\nCC-MAIN-2016-30,image/jp2,31757,31307,0.0018\nCC-MAIN-2016-30,image/jpeg,9801292,9714824,0.5642\nCC-MAIN-2016-30,image/jpg,124186,123968,0.0071\nCC-MAIN-2016-30,image/pjpeg,33928,32442,0.0020\nCC-MAIN-2016-30,image/png,4411402,4408019,0.2539\nCC-MAIN-2016-30,image/svg+xml,647,624,0.0000\nCC-MAIN-2016-30,image/tiff,54098,52282,0.0031\nCC-MAIN-2016-30,image/vnd.djvu,6015,5972,0.0003\nCC-MAIN-2016-30,image/webp,80,80,0.0000\nCC-MAIN-2016-30,message/rfc822,14714,14496,0.0008\nCC-MAIN-2016-30,text/calendar,992801,971741,0.0571\nCC-MAIN-2016-30,text/css,754,742,0.0000\nCC-MAIN-2016-30,text/csv,116234,113088,0.0067\nCC-MAIN-2016-30,text/directory,5778,5405,0.0003\nCC-MAIN-2016-30,text/enriched,8437,8408,0.0005\nCC-MAIN-2016-30,text/html,1692068745,1588170343,97.3952\nCC-MAIN-2016-30,text/javascript,16746,16601,0.0010\nCC-MAIN-2016-30,text/pdf,37831,37831,0.0022\nCC-MAIN-2016-30,text/plain,2955773,2874440,0.1701\nCC-MAIN-2016-30,text/
prs.lines.tag,70,70,0.0000\nCC-MAIN-2016-30,text/tab-separated-values,68273,65198,0.0039\nCC-MAIN-2016-30,text/turtle,11369,11095,0.0007\nCC-MAIN-2016-30,text/vcard,2267,1779,0.0001\nCC-MAIN-2016-30,text/x-bibtex,23305,23299,0.0013\nCC-MAIN-2016-30,text/x-c,4171,4053,0.0002\nCC-MAIN-2016-30,text/x-csrc,18319,18251,0.0011\nCC-MAIN-2016-30,text/x-diff,15750,15458,0.0009\nCC-MAIN-2016-30,text/x-patch,103968,103472,0.0060\nCC-MAIN-2016-30,text/x-perl,22421,22406,0.0013\nCC-MAIN-2016-30,text/x-vcalendar,45063,44151,0.0026\nCC-MAIN-2016-30,text/x-vcard,37470,36220,0.0022\nCC-MAIN-2016-30,text/xml,3690109,3620001,0.2124\nCC-MAIN-2016-30,unknown/unknown,255968,222995,0.0147\nCC-MAIN-2016-30,video/mp4,33794,33727,0.0019\nCC-MAIN-2016-30,video/webm,9634,9016,0.0006\nCC-MAIN-2016-30,video/x-ms-asf,281613,278430,0.0162\nCC-MAIN-2016-36,<other>,2489092,2390396,0.1544\nCC-MAIN-2016-36,application/atom+xml,1791851,1787078,0.1112\nCC-MAIN-2016-36,application/calendar,7083,7082,0.0004\nCC-MAIN-2016-36,application/download,24381,24354,0.0015\nCC-MAIN-2016-36,application/epub+zip,32503,32480,0.0020\nCC-MAIN-2016-36,application/force-download,16588,16566,0.0010\nCC-MAIN-2016-36,application/gpx+xml,209,209,0.0000\nCC-MAIN-2016-36,application/ics,3478,3478,0.0002\nCC-MAIN-2016-36,application/javascript,888,887,0.0001\nCC-MAIN-2016-36,application/json,318696,318209,0.0198\nCC-MAIN-2016-36,application/ld+json,39609,39609,0.0025\nCC-MAIN-2016-36,application/marc,18395,18395,0.0011\nCC-MAIN-2016-36,application/msword,85650,84870,0.0053\nCC-MAIN-2016-36,application/octet-stream,2417285,2415603,0.1500\nCC-MAIN-2016-36,application/octetstream,15674,15671,0.0010\nCC-MAIN-2016-36,application/pdf,3579276,3551400,0.2221\nCC-MAIN-2016-36,application/pgp-encrypted,71161,71161,0.0044\nCC-MAIN-2016-36,application/pgp-signature,18463,18448,0.0011\nCC-MAIN-2016-36,application/postscript,8688,8676,0.0005\nCC-MAIN-2016-36,application/rdf+xml,112495,112454,0.0070\nCC-MAIN-2016-36,application/rss+xml,5391858
,5338147,0.3346\nCC-MAIN-2016-36,application/rtf,2178,2170,0.0001\nCC-MAIN-2016-36,application/save-to-disk,5059,5059,0.0003\nCC-MAIN-2016-36,application/text,18584,18573,0.0012\nCC-MAIN-2016-36,application/unknown,2895,2893,0.0002\nCC-MAIN-2016-36,application/vnd.android.package-archive,1182,1178,0.0001\nCC-MAIN-2016-36,application/vnd.google-earth.kml+xml,162682,162652,0.0101\nCC-MAIN-2016-36,application/vnd.google-earth.kmz,38715,38684,0.0024\nCC-MAIN-2016-36,application/vnd.ms-excel,63701,63603,0.0040\nCC-MAIN-2016-36,application/vnd.ms-powerpoint,19058,18662,0.0012\nCC-MAIN-2016-36,application/vnd.ms-word,13735,13733,0.0009\nCC-MAIN-2016-36,application/vnd.oasis.opendocument.text,1709,1704,0.0001\nCC-MAIN-2016-36,application/vnd.openxmlformats-officedocument.presentationml.presentation,3716,3702,0.0002\nCC-MAIN-2016-36,application/vnd.openxmlformats-officedocument.spreadsheetml.sheet,5880,5867,0.0004\nCC-MAIN-2016-36,application/vnd.openxmlformats-officedocument.wordprocessingml.document,21500,21423,0.0013\nCC-MAIN-2016-36,application/vnd.wap.xhtml+xml,44657,44630,0.0028\nCC-MAIN-2016-36,application/x-bibtex,23672,23672,0.0015\nCC-MAIN-2016-36,application/x-bittorrent,879,879,0.0001\nCC-MAIN-2016-36,application/x-debian-package,24463,24441,0.0015\nCC-MAIN-2016-36,application/x-download,10956,10956,0.0007\nCC-MAIN-2016-36,application/x-endnote-refer,37191,37177,0.0023\nCC-MAIN-2016-36,application/x-gzip,13718,13137,0.0009\nCC-MAIN-2016-36,application/x-httpd-php,38525,38429,0.0024\nCC-MAIN-2016-36,application/x-java-jnlp-file,9485,9471,0.0006\nCC-MAIN-2016-36,application/x-javascript,12895,12894,0.0008\nCC-MAIN-2016-36,application/x-json,94,94,0.0000\nCC-MAIN-2016-36,application/x-mobipocket-ebook,7819,7804,0.0005\nCC-MAIN-2016-36,application/x-msdownload,9017,8970,0.0006\nCC-MAIN-2016-36,application/x-netcdf,11886,11886,0.0007\nCC-MAIN-2016-36,application/x-research-info-systems,40952,40948,0.0025\nCC-MAIN-2016-36,application/x-shockwave-flash,16191,16110,0.001
0\nCC-MAIN-2016-36,application/x-tar,8161,8030,0.0005\nCC-MAIN-2016-36,application/x-tex,15852,15852,0.0010\nCC-MAIN-2016-36,application/x-troff-man,36888,32813,0.0023\nCC-MAIN-2016-36,application/x-zip-compressed,22931,22875,0.0014\nCC-MAIN-2016-36,application/xhtml+xml,1175101,1161656,0.0729\nCC-MAIN-2016-36,application/xml,1217035,1210679,0.0755\nCC-MAIN-2016-36,application/zip,151530,151304,0.0094\nCC-MAIN-2016-36,audio/mpeg,96522,95063,0.0060\nCC-MAIN-2016-36,audio/x-mpegurl,42192,42184,0.0026\nCC-MAIN-2016-36,audio/x-scpls,70134,70115,0.0044\nCC-MAIN-2016-36,audio/x-wav,131728,131728,0.0082\nCC-MAIN-2016-36,binary/octet-stream,8875,8658,0.0006\nCC-MAIN-2016-36,image/gif,924423,923916,0.0574\nCC-MAIN-2016-36,image/jp2,38833,38822,0.0024\nCC-MAIN-2016-36,image/jpeg,9441245,9431637,0.5858\nCC-MAIN-2016-36,image/jpg,123228,123190,0.0076\nCC-MAIN-2016-36,image/pjpeg,32028,32002,0.0020\nCC-MAIN-2016-36,image/png,4341831,4340668,0.2694\nCC-MAIN-2016-36,image/svg+xml,681,661,0.0000\nCC-MAIN-2016-36,image/tiff,42940,42904,0.0027\nCC-MAIN-2016-36,image/vnd.djvu,6907,6907,0.0004\nCC-MAIN-2016-36,image/webp,82,82,0.0000\nCC-MAIN-2016-36,message/rfc822,15385,15361,0.0010\nCC-MAIN-2016-36,text/calendar,941912,940235,0.0584\nCC-MAIN-2016-36,text/css,754,747,0.0000\nCC-MAIN-2016-36,text/csv,82920,82865,0.0051\nCC-MAIN-2016-36,text/directory,4970,4798,0.0003\nCC-MAIN-2016-36,text/enriched,8038,8034,0.0005\nCC-MAIN-2016-36,text/html,1568091931,1515332924,97.2995\nCC-MAIN-2016-36,text/javascript,15229,15221,0.0009\nCC-MAIN-2016-36,text/pdf,38250,38250,0.0024\nCC-MAIN-2016-36,text/plain,3042489,3013757,0.1888\nCC-MAIN-2016-36,text/prs.lines.tag,66,66,0.0000\nCC-MAIN-2016-36,text/tab-separated-values,64159,64116,0.0040\nCC-MAIN-2016-36,text/turtle,40836,40836,0.0025\nCC-MAIN-2016-36,text/vcard,1766,1747,0.0001\nCC-MAIN-2016-36,text/x-bibtex,23449,23395,0.0015\nCC-MAIN-2016-36,text/x-c,2217,2212,0.0001\nCC-MAIN-2016-36,text/x-csrc,17001,16990,0.0011\nCC-MAIN-2016-36,text/x-diff,162
79,16270,0.0010\nCC-MAIN-2016-36,text/x-patch,104471,104465,0.0065\nCC-MAIN-2016-36,text/x-perl,22969,22963,0.0014\nCC-MAIN-2016-36,text/x-vcalendar,44019,43490,0.0027\nCC-MAIN-2016-36,text/x-vcard,34413,34371,0.0021\nCC-MAIN-2016-36,text/xml,3369795,3354326,0.2091\nCC-MAIN-2016-36,unknown/unknown,245875,219041,0.0153\nCC-MAIN-2016-36,video/mp4,33599,33510,0.0021\nCC-MAIN-2016-36,video/webm,9324,9322,0.0006\nCC-MAIN-2016-36,video/x-ms-asf,305510,305423,0.0190\nCC-MAIN-2016-40,<other>,2476401,2464116,0.1438\nCC-MAIN-2016-40,application/atom+xml,1777111,1775982,0.1032\nCC-MAIN-2016-40,application/calendar,7221,7218,0.0004\nCC-MAIN-2016-40,application/download,21351,20952,0.0012\nCC-MAIN-2016-40,application/epub+zip,33240,33164,0.0019\nCC-MAIN-2016-40,application/force-download,15439,15423,0.0009\nCC-MAIN-2016-40,application/gpx+xml,204,204,0.0000\nCC-MAIN-2016-40,application/ics,3527,3527,0.0002\nCC-MAIN-2016-40,application/javascript,2330,2330,0.0001\nCC-MAIN-2016-40,application/json,367618,366803,0.0213\nCC-MAIN-2016-40,application/ld+json,44505,44505,0.0026\nCC-MAIN-2016-40,application/marc,16596,16596,0.0010\nCC-MAIN-2016-40,application/msword,106271,105094,0.0062\nCC-MAIN-2016-40,application/octet-stream,2404104,2401154,0.1396\nCC-MAIN-2016-40,application/octetstream,15687,15686,0.0009\nCC-MAIN-2016-40,application/pdf,4336876,4280220,0.2518\nCC-MAIN-2016-40,application/pgp-encrypted,71161,71151,0.0041\nCC-MAIN-2016-40,application/pgp-signature,19907,19902,0.0012\nCC-MAIN-2016-40,application/postscript,10178,10163,0.0006\nCC-MAIN-2016-40,application/rdf+xml,117432,117421,0.0068\nCC-MAIN-2016-40,application/rss+xml,5458773,5430540,0.3169\nCC-MAIN-2016-40,application/rtf,3050,3049,0.0002\nCC-MAIN-2016-40,application/save-to-disk,5244,5244,0.0003\nCC-MAIN-2016-40,application/text,17991,17988,0.0010\nCC-MAIN-2016-40,application/unknown,2531,2529,0.0001\nCC-MAIN-2016-40,application/vnd.android.package-archive,1035,1032,0.0001\nCC-MAIN-2016-40,application/vnd.google-ear
th.kml+xml,160156,159486,0.0093\nCC-MAIN-2016-40,application/vnd.google-earth.kmz,35817,35800,0.0021\nCC-MAIN-2016-40,application/vnd.ms-excel,70057,69088,0.0041\nCC-MAIN-2016-40,application/vnd.ms-powerpoint,19902,19808,0.0012\nCC-MAIN-2016-40,application/vnd.ms-word,14832,14832,0.0009\nCC-MAIN-2016-40,application/vnd.oasis.opendocument.text,1777,1763,0.0001\nCC-MAIN-2016-40,application/vnd.openxmlformats-officedocument.presentationml.presentation,4441,4327,0.0003\nCC-MAIN-2016-40,application/vnd.openxmlformats-officedocument.spreadsheetml.sheet,7392,7283,0.0004\nCC-MAIN-2016-40,application/vnd.openxmlformats-officedocument.wordprocessingml.document,25553,25137,0.0015\nCC-MAIN-2016-40,application/vnd.wap.xhtml+xml,45091,45088,0.0026\nCC-MAIN-2016-40,application/x-bibtex,21464,21464,0.0012\nCC-MAIN-2016-40,application/x-bittorrent,867,867,0.0001\nCC-MAIN-2016-40,application/x-debian-package,24648,24644,0.0014\nCC-MAIN-2016-40,application/x-download,13251,13251,0.0008\nCC-MAIN-2016-40,application/x-endnote-refer,36180,36171,0.0021\nCC-MAIN-2016-40,application/x-gzip,16961,16702,0.0010\nCC-MAIN-2016-40,application/x-httpd-php,38089,38046,0.0022\nCC-MAIN-2016-40,application/x-java-jnlp-file,9611,9609,0.0006\nCC-MAIN-2016-40,application/x-javascript,16441,16441,0.0010\nCC-MAIN-2016-40,application/x-json,94,94,0.0000\nCC-MAIN-2016-40,application/x-mobipocket-ebook,7539,7504,0.0004\nCC-MAIN-2016-40,application/x-msdownload,9048,9041,0.0005\nCC-MAIN-2016-40,application/x-netcdf,12045,12045,0.0007\nCC-MAIN-2016-40,application/x-research-info-systems,36416,36411,0.0021\nCC-MAIN-2016-40,application/x-shockwave-flash,19910,19836,0.0012\nCC-MAIN-2016-40,application/x-tar,8059,8004,0.0005\nCC-MAIN-2016-40,application/x-tex,15979,15968,0.0009\nCC-MAIN-2016-40,application/x-troff-man,33036,33036,0.0019\nCC-MAIN-2016-40,application/x-zip-compressed,23391,23326,0.0014\nCC-MAIN-2016-40,application/xhtml+xml,1226537,1213301,0.0712\nCC-MAIN-2016-40,application/xml,1193892,1182260,0.069
3\nCC-MAIN-2016-40,application/zip,152317,152072,0.0088\nCC-MAIN-2016-40,audio/mpeg,105650,104398,0.0061\nCC-MAIN-2016-40,audio/x-mpegurl,42526,42183,0.0025\nCC-MAIN-2016-40,audio/x-scpls,70148,70111,0.0041\nCC-MAIN-2016-40,audio/x-wav,137346,137345,0.0080\nCC-MAIN-2016-40,binary/octet-stream,9370,9177,0.0005\nCC-MAIN-2016-40,image/gif,1120744,1120271,0.0651\nCC-MAIN-2016-40,image/jp2,41563,41562,0.0024\nCC-MAIN-2016-40,image/jpeg,10145910,10141088,0.5890\nCC-MAIN-2016-40,image/jpg,122441,122423,0.0071\nCC-MAIN-2016-40,image/pjpeg,34192,33982,0.0020\nCC-MAIN-2016-40,image/png,4490507,4489779,0.2607\nCC-MAIN-2016-40,image/svg+xml,1962,1957,0.0001\nCC-MAIN-2016-40,image/tiff,31465,31364,0.0018\nCC-MAIN-2016-40,image/vnd.djvu,6639,6639,0.0004\nCC-MAIN-2016-40,image/webp,1414,1414,0.0001\nCC-MAIN-2016-40,message/rfc822,15632,15623,0.0009\nCC-MAIN-2016-40,text/calendar,943145,942515,0.0547\nCC-MAIN-2016-40,text/css,3594,3585,0.0002\nCC-MAIN-2016-40,text/csv,89479,89401,0.0052\nCC-MAIN-2016-40,text/directory,4890,4712,0.0003\nCC-MAIN-2016-40,text/enriched,7537,7537,0.0004\nCC-MAIN-2016-40,text/html,1676919246,1645246264,97.3450\nCC-MAIN-2016-40,text/javascript,22340,22325,0.0013\nCC-MAIN-2016-40,text/pdf,38913,38913,0.0023\nCC-MAIN-2016-40,text/plain,3232624,3226099,0.1877\nCC-MAIN-2016-40,text/prs.lines.tag,74,74,0.0000\nCC-MAIN-2016-40,text/tab-separated-values,68875,68837,0.0040\nCC-MAIN-2016-40,text/turtle,45707,45707,0.0027\nCC-MAIN-2016-40,text/vcard,1815,1815,0.0001\nCC-MAIN-2016-40,text/x-bibtex,23390,23386,0.0014\nCC-MAIN-2016-40,text/x-c,3237,3151,0.0002\nCC-MAIN-2016-40,text/x-csrc,18472,18417,0.0011\nCC-MAIN-2016-40,text/x-diff,16427,16397,0.0010\nCC-MAIN-2016-40,text/x-patch,105435,105182,0.0061\nCC-MAIN-2016-40,text/x-perl,23140,23139,0.0013\nCC-MAIN-2016-40,text/x-vcalendar,42798,42498,0.0025\nCC-MAIN-2016-40,text/x-vcard,35675,35236,0.0021\nCC-MAIN-2016-40,text/xml,3481533,3471860,0.2021\nCC-MAIN-2016-40,unknown/unknown,198062,183431,0.0115\nCC-MAIN-2016-4
0,video/mp4,33807,33796,0.0020\nCC-MAIN-2016-40,video/webm,9272,9266,0.0005\nCC-MAIN-2016-40,video/x-ms-asf,272821,272698,0.0158\nCC-MAIN-2016-44,<other>,3551040,3525226,0.1091\nCC-MAIN-2016-44,application/atom+xml,1864549,1862622,0.0573\nCC-MAIN-2016-44,application/calendar,4456,4453,0.0001\nCC-MAIN-2016-44,application/download,32546,31915,0.0010\nCC-MAIN-2016-44,application/epub+zip,32682,32597,0.0010\nCC-MAIN-2016-44,application/force-download,14588,14499,0.0004\nCC-MAIN-2016-44,application/gpx+xml,208,208,0.0000\nCC-MAIN-2016-44,application/ics,3519,3519,0.0001\nCC-MAIN-2016-44,application/javascript,12441,12441,0.0004\nCC-MAIN-2016-44,application/json,359880,358232,0.0111\nCC-MAIN-2016-44,application/ld+json,37661,37661,0.0012\nCC-MAIN-2016-44,application/marc,19573,19573,0.0006\nCC-MAIN-2016-44,application/msword,199165,197170,0.0061\nCC-MAIN-2016-44,application/octet-stream,2110313,2106076,0.0648\nCC-MAIN-2016-44,application/octetstream,18229,18227,0.0006\nCC-MAIN-2016-44,application/pdf,6316656,6211625,0.1941\nCC-MAIN-2016-44,application/pgp-encrypted,70616,70606,0.0022\nCC-MAIN-2016-44,application/pgp-signature,13314,13301,0.0004\nCC-MAIN-2016-44,application/postscript,10420,10385,0.0003\nCC-MAIN-2016-44,application/rdf+xml,159204,159191,0.0049\nCC-MAIN-2016-44,application/rss+xml,5638895,5579724,0.1732\nCC-MAIN-2016-44,application/rtf,4867,4860,0.0001\nCC-MAIN-2016-44,application/save-to-disk,5238,5238,0.0002\nCC-MAIN-2016-44,application/text,18791,18791,0.0006\nCC-MAIN-2016-44,application/unknown,2545,2544,0.0001\nCC-MAIN-2016-44,application/vnd.android.package-archive,1060,1057,0.0000\nCC-MAIN-2016-44,application/vnd.google-earth.kml+xml,212111,212066,0.0065\nCC-MAIN-2016-44,application/vnd.google-earth.kmz,36714,36689,0.0011\nCC-MAIN-2016-44,application/vnd.ms-excel,73141,70200,0.0022\nCC-MAIN-2016-44,application/vnd.ms-powerpoint,26310,26232,0.0008\nCC-MAIN-2016-44,application/vnd.ms-word,14551,14551,0.0004\nCC-MAIN-2016-44,application/vnd.oasis.opendo
cument.text,1908,1888,0.0001\nCC-MAIN-2016-44,application/vnd.openxmlformats-officedocument.presentationml.presentation,5530,5487,0.0002\nCC-MAIN-2016-44,application/vnd.openxmlformats-officedocument.spreadsheetml.sheet,21023,20901,0.0006\nCC-MAIN-2016-44,application/vnd.openxmlformats-officedocument.wordprocessingml.document,32006,31627,0.0010\nCC-MAIN-2016-44,application/vnd.wap.xhtml+xml,44852,44834,0.0014\nCC-MAIN-2016-44,application/x-bibtex,21340,21316,0.0007\nCC-MAIN-2016-44,application/x-bittorrent,1640,1640,0.0001\nCC-MAIN-2016-44,application/x-debian-package,23393,23386,0.0007\nCC-MAIN-2016-44,application/x-download,13009,13009,0.0004\nCC-MAIN-2016-44,application/x-endnote-refer,38468,38442,0.0012\nCC-MAIN-2016-44,application/x-gzip,18621,18161,0.0006\nCC-MAIN-2016-44,application/x-httpd-php,39752,39719,0.0012\nCC-MAIN-2016-44,application/x-java-jnlp-file,9489,9484,0.0003\nCC-MAIN-2016-44,application/x-javascript,19740,19735,0.0006\nCC-MAIN-2016-44,application/x-json,95,95,0.0000\nCC-MAIN-2016-44,application/x-mobipocket-ebook,6381,6340,0.0002\nCC-MAIN-2016-44,application/x-msdownload,9647,9640,0.0003\nCC-MAIN-2016-44,application/x-netcdf,12002,12002,0.0004\nCC-MAIN-2016-44,application/x-research-info-systems,47582,47582,0.0015\nCC-MAIN-2016-44,application/x-shockwave-flash,41857,41729,0.0013\nCC-MAIN-2016-44,application/x-tar,8268,8183,0.0003\nCC-MAIN-2016-44,application/x-tex,15686,15676,0.0005\nCC-MAIN-2016-44,application/x-troff-man,32991,32971,0.0010\nCC-MAIN-2016-44,application/x-zip-compressed,24364,24287,0.0007\nCC-MAIN-2016-44,application/xhtml+xml,1235986,1211197,0.0380\nCC-MAIN-2016-44,application/xml,1331576,1324129,0.0409\nCC-MAIN-2016-44,application/zip,162710,162440,0.0050\nCC-MAIN-2016-44,audio/mpeg,111698,109986,0.0034\nCC-MAIN-2016-44,audio/x-mpegurl,42805,42457,0.0013\nCC-MAIN-2016-44,audio/x-scpls,57253,57214,0.0018\nCC-MAIN-2016-44,audio/x-wav,135065,135065,0.0041\nCC-MAIN-2016-44,binary/octet-stream,17790,17521,0.0005\nCC-MAIN-2016-44
,image/gif,1471562,1469079,0.0452\nCC-MAIN-2016-44,image/jp2,17654,17654,0.0005\nCC-MAIN-2016-44,image/jpeg,12093981,12089974,0.3716\nCC-MAIN-2016-44,image/jpg,180517,180500,0.0055\nCC-MAIN-2016-44,image/pjpeg,53954,53804,0.0017\nCC-MAIN-2016-44,image/png,4022702,4021778,0.1236\nCC-MAIN-2016-44,image/svg+xml,13730,13723,0.0004\nCC-MAIN-2016-44,image/tiff,42073,42008,0.0013\nCC-MAIN-2016-44,image/vnd.djvu,7623,7623,0.0002\nCC-MAIN-2016-44,image/webp,32409,32409,0.0010\nCC-MAIN-2016-44,message/rfc822,15611,15599,0.0005\nCC-MAIN-2016-44,text/calendar,958300,957427,0.0294\nCC-MAIN-2016-44,text/css,28450,28418,0.0009\nCC-MAIN-2016-44,text/csv,85693,84943,0.0026\nCC-MAIN-2016-44,text/directory,4819,4792,0.0001\nCC-MAIN-2016-44,text/enriched,7870,7868,0.0002\nCC-MAIN-2016-44,text/html,3203619009,3149584579,98.4222\nCC-MAIN-2016-44,text/javascript,42173,42155,0.0013\nCC-MAIN-2016-44,text/pdf,37413,37413,0.0011\nCC-MAIN-2016-44,text/plain,3256006,3246727,0.1000\nCC-MAIN-2016-44,text/prs.lines.tag,71,71,0.0000\nCC-MAIN-2016-44,text/tab-separated-values,63988,63985,0.0020\nCC-MAIN-2016-44,text/turtle,38782,38782,0.0012\nCC-MAIN-2016-44,text/vcard,1742,1742,0.0001\nCC-MAIN-2016-44,text/x-bibtex,23418,23414,0.0007\nCC-MAIN-2016-44,text/x-c,6116,5952,0.0002\nCC-MAIN-2016-44,text/x-csrc,18611,18557,0.0006\nCC-MAIN-2016-44,text/x-diff,16211,16183,0.0005\nCC-MAIN-2016-44,text/x-patch,105054,104639,0.0032\nCC-MAIN-2016-44,text/x-perl,21924,21922,0.0007\nCC-MAIN-2016-44,text/x-vcalendar,40673,40255,0.0012\nCC-MAIN-2016-44,text/x-vcard,35163,34780,0.0011\nCC-MAIN-2016-44,text/xml,3670826,3662691,0.1128\nCC-MAIN-2016-44,unknown/unknown,212474,193598,0.0065\nCC-MAIN-2016-44,video/mp4,34684,34676,0.0011\nCC-MAIN-2016-44,video/webm,9405,9399,0.0003\nCC-MAIN-2016-44,video/x-ms-asf,236230,236165,0.0073\nCC-MAIN-2016-50,<other>,2093070,2073463,0.0730\nCC-MAIN-2016-50,application/atom+xml,1928772,1918511,0.0673\nCC-MAIN-2016-50,application/calendar,2615,2585,0.0001\nCC-MAIN-2016-50,application
/download,13277,13222,0.0005\nCC-MAIN-2016-50,application/epub+zip,24890,24770,0.0009\nCC-MAIN-2016-50,application/force-download,11372,11318,0.0004\nCC-MAIN-2016-50,application/gpx+xml,198,198,0.0000\nCC-MAIN-2016-50,application/ics,3112,3105,0.0001\nCC-MAIN-2016-50,application/javascript,5981,5943,0.0002\nCC-MAIN-2016-50,application/json,223143,221669,0.0078\nCC-MAIN-2016-50,application/ld+json,23906,23782,0.0008\nCC-MAIN-2016-50,application/marc,22521,22416,0.0008\nCC-MAIN-2016-50,application/msword,165063,163822,0.0058\nCC-MAIN-2016-50,application/octet-stream,896106,891212,0.0313\nCC-MAIN-2016-50,application/octetstream,11877,11803,0.0004\nCC-MAIN-2016-50,application/pdf,5610808,5551939,0.1958\nCC-MAIN-2016-50,application/pgp-encrypted,38492,38302,0.0013\nCC-MAIN-2016-50,application/pgp-signature,18659,18576,0.0007\nCC-MAIN-2016-50,application/postscript,9652,9613,0.0003\nCC-MAIN-2016-50,application/rdf+xml,139375,138654,0.0049\nCC-MAIN-2016-50,application/rss+xml,5105288,5067412,0.1781\nCC-MAIN-2016-50,application/rtf,5269,5255,0.0002\nCC-MAIN-2016-50,application/save-to-disk,45,45,0.0000\nCC-MAIN-2016-50,application/text,12325,12254,0.0004\nCC-MAIN-2016-50,application/unknown,1494,1493,0.0001\nCC-MAIN-2016-50,application/vnd.android.package-archive,1006,990,0.0000\nCC-MAIN-2016-50,application/vnd.google-earth.kml+xml,179316,178346,0.0063\nCC-MAIN-2016-50,application/vnd.google-earth.kmz,35435,35284,0.0012\nCC-MAIN-2016-50,application/vnd.ms-excel,59634,58817,0.0021\nCC-MAIN-2016-50,application/vnd.ms-powerpoint,26164,25973,0.0009\nCC-MAIN-2016-50,application/vnd.ms-word,5339,5318,0.0002\nCC-MAIN-2016-50,application/vnd.oasis.opendocument.text,1520,1505,0.0001\nCC-MAIN-2016-50,application/vnd.openxmlformats-officedocument.presentationml.presentation,5220,5117,0.0002\nCC-MAIN-2016-50,application/vnd.openxmlformats-officedocument.spreadsheetml.sheet,20085,19941,0.0007\nCC-MAIN-2016-50,application/vnd.openxmlformats-officedocument.wordprocessingml.document,25400,
25132,0.0009\nCC-MAIN-2016-50,application/vnd.wap.xhtml+xml,44839,44601,0.0016\nCC-MAIN-2016-50,application/x-bibtex,19452,19341,0.0007\nCC-MAIN-2016-50,application/x-bittorrent,1608,1592,0.0001\nCC-MAIN-2016-50,application/x-debian-package,11948,11901,0.0004\nCC-MAIN-2016-50,application/x-download,6103,5985,0.0002\nCC-MAIN-2016-50,application/x-endnote-refer,29599,29408,0.0010\nCC-MAIN-2016-50,application/x-gzip,17569,17176,0.0006\nCC-MAIN-2016-50,application/x-httpd-php,9445,9369,0.0003\nCC-MAIN-2016-50,application/x-java-jnlp-file,5764,5736,0.0002\nCC-MAIN-2016-50,application/x-javascript,5206,5166,0.0002\nCC-MAIN-2016-50,application/x-mobipocket-ebook,6266,6219,0.0002\nCC-MAIN-2016-50,application/x-msdownload,9445,9395,0.0003\nCC-MAIN-2016-50,application/x-netcdf,11755,11690,0.0004\nCC-MAIN-2016-50,application/x-research-info-systems,30272,30129,0.0011\nCC-MAIN-2016-50,application/x-shockwave-flash,35181,35044,0.0012\nCC-MAIN-2016-50,application/x-tar,7338,7274,0.0003\nCC-MAIN-2016-50,application/x-tex,13719,13667,0.0005\nCC-MAIN-2016-50,application/x-troff-man,12363,12297,0.0004\nCC-MAIN-2016-50,application/x-zip-compressed,23047,22949,0.0008\nCC-MAIN-2016-50,application/xhtml+xml,1083585,1073555,0.0378\nCC-MAIN-2016-50,application/xml,1153253,1144726,0.0402\nCC-MAIN-2016-50,application/zip,97755,97131,0.0034\nCC-MAIN-2016-50,audio/mpeg,92892,92404,0.0032\nCC-MAIN-2016-50,audio/x-mpegurl,38269,38037,0.0013\nCC-MAIN-2016-50,audio/x-scpls,5463,5424,0.0002\nCC-MAIN-2016-50,audio/x-wav,116769,116167,0.0041\nCC-MAIN-2016-50,binary/octet-stream,14911,14841,0.0005\nCC-MAIN-2016-50,image/gif,634545,630686,0.0221\nCC-MAIN-2016-50,image/jp2,28937,28823,0.0010\nCC-MAIN-2016-50,image/jpeg,10570148,10514671,0.3688\nCC-MAIN-2016-50,image/jpg,122724,122169,0.0043\nCC-MAIN-2016-50,image/pjpeg,44334,44054,0.0015\nCC-MAIN-2016-50,image/png,3004150,2986320,0.1048\nCC-MAIN-2016-50,image/svg+xml,12586,12526,0.0004\nCC-MAIN-2016-50,image/tiff,34950,34789,0.0012\nCC-MAIN-2016-50,imag
e/vnd.djvu,6535,6507,0.0002\nCC-MAIN-2016-50,image/webp,31418,31232,0.0011\nCC-MAIN-2016-50,message/rfc822,14650,14565,0.0005\nCC-MAIN-2016-50,text/calendar,453396,450104,0.0158\nCC-MAIN-2016-50,text/css,6298,6260,0.0002\nCC-MAIN-2016-50,text/csv,67132,66697,0.0023\nCC-MAIN-2016-50,text/directory,4364,4351,0.0002\nCC-MAIN-2016-50,text/enriched,7969,7932,0.0003\nCC-MAIN-2016-50,text/html,2824483627,2781363126,98.5417\nCC-MAIN-2016-50,text/javascript,7115,7079,0.0002\nCC-MAIN-2016-50,text/markdown,7,5,0.0000\nCC-MAIN-2016-50,text/pdf,37607,37385,0.0013\nCC-MAIN-2016-50,text/plain,2859637,2840655,0.0998\nCC-MAIN-2016-50,text/prs.lines.tag,59,59,0.0000\nCC-MAIN-2016-50,text/tab-separated-values,53700,53389,0.0019\nCC-MAIN-2016-50,text/turtle,24387,24257,0.0009\nCC-MAIN-2016-50,text/vcard,1609,1600,0.0001\nCC-MAIN-2016-50,text/x-bibtex,7037,7004,0.0002\nCC-MAIN-2016-50,text/x-c,98691,98040,0.0034\nCC-MAIN-2016-50,text/x-csrc,7765,7733,0.0003\nCC-MAIN-2016-50,text/x-diff,18509,18424,0.0006\nCC-MAIN-2016-50,text/x-patch,96048,95572,0.0034\nCC-MAIN-2016-50,text/x-perl,3234,3227,0.0001\nCC-MAIN-2016-50,text/x-vcalendar,35379,35172,0.0012\nCC-MAIN-2016-50,text/x-vcard,25072,24940,0.0009\nCC-MAIN-2016-50,text/xml,3299998,3279608,0.1151\nCC-MAIN-2016-50,unknown/unknown,143359,140287,0.0050\nCC-MAIN-2016-50,video/mp4,37279,37048,0.0013\nCC-MAIN-2016-50,video/webm,9427,9307,0.0003\nCC-MAIN-2016-50,video/x-ms-asf,358463,356516,0.0125\nCC-MAIN-2017-04,<other>,2117057,2105397,0.0673\nCC-MAIN-2017-04,application/atom+xml,2218852,2218358,0.0705\nCC-MAIN-2017-04,application/calendar,1889,1889,0.0001\nCC-MAIN-2017-04,application/download,12401,12384,0.0004\nCC-MAIN-2017-04,application/epub+zip,37966,37936,0.0012\nCC-MAIN-2017-04,application/force-download,23481,23463,0.0007\nCC-MAIN-2017-04,application/gpx+xml,265,265,0.0000\nCC-MAIN-2017-04,application/ics,2985,2985,0.0001\nCC-MAIN-2017-04,application/javascript,6605,6604,0.0002\nCC-MAIN-2017-04,application/json,206442,206417,0.0066\nC
C-MAIN-2017-04,application/ld+json,31831,31831,0.0010\nCC-MAIN-2017-04,application/marc,22161,22161,0.0007\nCC-MAIN-2017-04,application/msword,164906,164376,0.0052\nCC-MAIN-2017-04,application/octet-stream,767295,766027,0.0244\nCC-MAIN-2017-04,application/octetstream,12964,12962,0.0004\nCC-MAIN-2017-04,application/pdf,7472067,7436392,0.2375\nCC-MAIN-2017-04,application/pgp-encrypted,38620,38620,0.0012\nCC-MAIN-2017-04,application/pgp-signature,17419,17412,0.0006\nCC-MAIN-2017-04,application/postscript,11978,11971,0.0004\nCC-MAIN-2017-04,application/rdf+xml,149683,149662,0.0048\nCC-MAIN-2017-04,application/rss+xml,5086423,5079921,0.1617\nCC-MAIN-2017-04,application/rtf,4487,4487,0.0001\nCC-MAIN-2017-04,application/save-to-disk,2,2,0.0000\nCC-MAIN-2017-04,application/text,7944,7944,0.0003\nCC-MAIN-2017-04,application/unknown,2341,2341,0.0001\nCC-MAIN-2017-04,application/vnd.android.package-archive,8045,7849,0.0003\nCC-MAIN-2017-04,application/vnd.google-earth.kml+xml,190801,190285,0.0061\nCC-MAIN-2017-04,application/vnd.google-earth.kmz,36379,36376,0.0012\nCC-MAIN-2017-04,application/vnd.ms-excel,51693,51162,0.0016\nCC-MAIN-2017-04,application/vnd.ms-powerpoint,34890,34856,0.0011\nCC-MAIN-2017-04,application/vnd.ms-word,6513,6508,0.0002\nCC-MAIN-2017-04,application/vnd.oasis.opendocument.text,2481,2477,0.0001\nCC-MAIN-2017-04,application/vnd.openxmlformats-officedocument.presentationml.presentation,5404,5360,0.0002\nCC-MAIN-2017-04,application/vnd.openxmlformats-officedocument.spreadsheetml.sheet,20949,20865,0.0007\nCC-MAIN-2017-04,application/vnd.openxmlformats-officedocument.wordprocessingml.document,28049,27800,0.0009\nCC-MAIN-2017-04,application/vnd.wap.xhtml+xml,43898,43799,0.0014\nCC-MAIN-2017-04,application/x-bibtex,17258,17253,0.0005\nCC-MAIN-2017-04,application/x-bittorrent,7915,7801,0.0003\nCC-MAIN-2017-04,application/x-debian-package,11701,11701,0.0004\nCC-MAIN-2017-04,application/x-download,9790,9790,0.0003\nCC-MAIN-2017-04,application/x-endnote-refer,2072
6,20725,0.0007\nCC-MAIN-2017-04,application/x-gzip,14757,14732,0.0005\nCC-MAIN-2017-04,application/x-httpd-php,39302,39264,0.0012\nCC-MAIN-2017-04,application/x-java-jnlp-file,6159,6159,0.0002\nCC-MAIN-2017-04,application/x-javascript,3795,3795,0.0001\nCC-MAIN-2017-04,application/x-json,1,1,0.0000\nCC-MAIN-2017-04,application/x-mobipocket-ebook,6825,6808,0.0002\nCC-MAIN-2017-04,application/x-msdownload,10759,10701,0.0003\nCC-MAIN-2017-04,application/x-netcdf,11845,11845,0.0004\nCC-MAIN-2017-04,application/x-research-info-systems,26752,26752,0.0009\nCC-MAIN-2017-04,application/x-shockwave-flash,38400,38171,0.0012\nCC-MAIN-2017-04,application/x-tar,7839,7828,0.0002\nCC-MAIN-2017-04,application/x-tex,13941,13941,0.0004\nCC-MAIN-2017-04,application/x-troff-man,12237,12236,0.0004\nCC-MAIN-2017-04,application/x-zip-compressed,25715,25621,0.0008\nCC-MAIN-2017-04,application/xhtml+xml,886222,883572,0.0282\nCC-MAIN-2017-04,application/xml,1263079,1261198,0.0401\nCC-MAIN-2017-04,application/zip,112005,111579,0.0036\nCC-MAIN-2017-04,audio/mpeg,115353,115127,0.0037\nCC-MAIN-2017-04,audio/x-mpegurl,42642,42623,0.0014\nCC-MAIN-2017-04,audio/x-scpls,6010,5993,0.0002\nCC-MAIN-2017-04,audio/x-wav,114951,114948,0.0037\nCC-MAIN-2017-04,binary/octet-stream,15961,15957,0.0005\nCC-MAIN-2017-04,image/gif,619132,618793,0.0197\nCC-MAIN-2017-04,image/jp2,28579,28579,0.0009\nCC-MAIN-2017-04,image/jpeg,11023155,11020515,0.3503\nCC-MAIN-2017-04,image/jpg,122195,122195,0.0039\nCC-MAIN-2017-04,image/pjpeg,45063,45032,0.0014\nCC-MAIN-2017-04,image/png,2979108,2978532,0.0947\nCC-MAIN-2017-04,image/svg+xml,13409,13408,0.0004\nCC-MAIN-2017-04,image/tiff,23463,23454,0.0007\nCC-MAIN-2017-04,image/vnd.djvu,10215,10213,0.0003\nCC-MAIN-2017-04,image/webp,34341,34341,0.0011\nCC-MAIN-2017-04,message/rfc822,16013,16012,0.0005\nCC-MAIN-2017-04,text/calendar,458471,457828,0.0146\nCC-MAIN-2017-04,text/css,6515,6484,0.0002\nCC-MAIN-2017-04,text/csv,66866,66826,0.0021\nCC-MAIN-2017-04,text/directory,4484,4484,0.0
001\nCC-MAIN-2017-04,text/enriched,6328,6328,0.0002\nCC-MAIN-2017-04,text/html,3102193897,3071914242,98.5920\nCC-MAIN-2017-04,text/javascript,6454,6453,0.0002\nCC-MAIN-2017-04,text/markdown,2,2,0.0000\nCC-MAIN-2017-04,text/pdf,38768,38768,0.0012\nCC-MAIN-2017-04,text/plain,2767756,2766029,0.0880\nCC-MAIN-2017-04,text/prs.lines.tag,64,64,0.0000\nCC-MAIN-2017-04,text/tab-separated-values,53272,53272,0.0017\nCC-MAIN-2017-04,text/turtle,32691,32691,0.0010\nCC-MAIN-2017-04,text/vcard,1841,1841,0.0001\nCC-MAIN-2017-04,text/x-bibtex,7315,7315,0.0002\nCC-MAIN-2017-04,text/x-c,97751,97663,0.0031\nCC-MAIN-2017-04,text/x-csrc,7620,7619,0.0002\nCC-MAIN-2017-04,text/x-diff,15666,15662,0.0005\nCC-MAIN-2017-04,text/x-patch,97009,97007,0.0031\nCC-MAIN-2017-04,text/x-perl,4210,4208,0.0001\nCC-MAIN-2017-04,text/x-vcalendar,35864,35849,0.0011\nCC-MAIN-2017-04,text/x-vcard,21434,21433,0.0007\nCC-MAIN-2017-04,text/xml,3606886,3601844,0.1146\nCC-MAIN-2017-04,unknown/unknown,113624,113592,0.0036\nCC-MAIN-2017-04,video/mp4,43238,43102,0.0014\nCC-MAIN-2017-04,video/webm,10217,10213,0.0003\nCC-MAIN-2017-04,video/x-ms-asf,196004,195975,0.0062\nCC-MAIN-2017-09,<other>,2248013,2066263,0.0729\nCC-MAIN-2017-09,application/atom+xml,1928781,1913774,0.0625\nCC-MAIN-2017-09,application/calendar,1873,1845,0.0001\nCC-MAIN-2017-09,application/download,25898,24945,0.0008\nCC-MAIN-2017-09,application/epub+zip,22138,21316,0.0007\nCC-MAIN-2017-09,application/force-download,21753,21514,0.0007\nCC-MAIN-2017-09,application/gpx+xml,328,326,0.0000\nCC-MAIN-2017-09,application/ics,2073,2073,0.0001\nCC-MAIN-2017-09,application/javascript,4678,4677,0.0002\nCC-MAIN-2017-09,application/json,201361,193629,0.0065\nCC-MAIN-2017-09,application/ld+json,8939,8938,0.0003\nCC-MAIN-2017-09,application/marc,26260,26260,0.0009\nCC-MAIN-2017-09,application/msword,80646,77852,0.0026\nCC-MAIN-2017-09,application/octet-stream,359141,350160,0.0116\nCC-MAIN-2017-09,application/octetstream,3354,3339,0.0001\nCC-MAIN-2017-09,application
/pdf,8247262,8104390,0.2674\nCC-MAIN-2017-09,application/pgp-encrypted,1405,1404,0.0000\nCC-MAIN-2017-09,application/pgp-signature,7341,7200,0.0002\nCC-MAIN-2017-09,application/postscript,10811,10727,0.0004\nCC-MAIN-2017-09,application/rdf+xml,60437,60223,0.0020\nCC-MAIN-2017-09,application/rss+xml,4645218,4421876,0.1506\nCC-MAIN-2017-09,application/rtf,1882,1874,0.0001\nCC-MAIN-2017-09,application/save-to-disk,5209,5209,0.0002\nCC-MAIN-2017-09,application/text,9339,9330,0.0003\nCC-MAIN-2017-09,application/unknown,2621,2614,0.0001\nCC-MAIN-2017-09,application/vnd.android.package-archive,6767,6720,0.0002\nCC-MAIN-2017-09,application/vnd.google-earth.kml+xml,61380,61176,0.0020\nCC-MAIN-2017-09,application/vnd.google-earth.kmz,8822,8693,0.0003\nCC-MAIN-2017-09,application/vnd.ms-excel,40254,38292,0.0013\nCC-MAIN-2017-09,application/vnd.ms-powerpoint,31808,25446,0.0010\nCC-MAIN-2017-09,application/vnd.ms-word,2813,2813,0.0001\nCC-MAIN-2017-09,application/vnd.oasis.opendocument.text,2312,2258,0.0001\nCC-MAIN-2017-09,application/vnd.openxmlformats-officedocument.presentationml.presentation,4003,3847,0.0001\nCC-MAIN-2017-09,application/vnd.openxmlformats-officedocument.spreadsheetml.sheet,6553,6011,0.0002\nCC-MAIN-2017-09,application/vnd.openxmlformats-officedocument.wordprocessingml.document,14222,13341,0.0005\nCC-MAIN-2017-09,application/vnd.wap.xhtml+xml,45329,45146,0.0015\nCC-MAIN-2017-09,application/x-bibtex,3830,3828,0.0001\nCC-MAIN-2017-09,application/x-bittorrent,4691,4691,0.0002\nCC-MAIN-2017-09,application/x-debian-package,5245,5181,0.0002\nCC-MAIN-2017-09,application/x-download,3722,3685,0.0001\nCC-MAIN-2017-09,application/x-endnote-refer,15003,14995,0.0005\nCC-MAIN-2017-09,application/x-gzip,8255,7946,0.0003\nCC-MAIN-2017-09,application/x-httpd-php,7132,7031,0.0002\nCC-MAIN-2017-09,application/x-java-jnlp-file,1141,1132,0.0000\nCC-MAIN-2017-09,application/x-javascript,2385,2383,0.0001\nCC-MAIN-2017-09,application/x-json,4,4,0.0000\nCC-MAIN-2017-09,application/x
-mobipocket-ebook,4505,3922,0.0001\nCC-MAIN-2017-09,application/x-msdownload,9307,9200,0.0003\nCC-MAIN-2017-09,application/x-netcdf,1486,1486,0.0000\nCC-MAIN-2017-09,application/x-research-info-systems,29619,29205,0.0010\nCC-MAIN-2017-09,application/x-shockwave-flash,21439,21232,0.0007\nCC-MAIN-2017-09,application/x-tar,8140,8092,0.0003\nCC-MAIN-2017-09,application/x-tex,3918,3905,0.0001\nCC-MAIN-2017-09,application/x-troff-man,5440,5366,0.0002\nCC-MAIN-2017-09,application/x-zip-compressed,10728,10405,0.0003\nCC-MAIN-2017-09,application/xhtml+xml,949526,913099,0.0308\nCC-MAIN-2017-09,application/xml,1104982,1081274,0.0358\nCC-MAIN-2017-09,application/zip,105297,104199,0.0034\nCC-MAIN-2017-09,audio/mpeg,94581,90644,0.0031\nCC-MAIN-2017-09,audio/x-mpegurl,32034,31963,0.0010\nCC-MAIN-2017-09,audio/x-scpls,5406,5355,0.0002\nCC-MAIN-2017-09,audio/x-wav,110032,109986,0.0036\nCC-MAIN-2017-09,binary/octet-stream,11954,11739,0.0004\nCC-MAIN-2017-09,image/gif,175147,174390,0.0057\nCC-MAIN-2017-09,image/jp2,28166,28146,0.0009\nCC-MAIN-2017-09,image/jpeg,2901208,2891208,0.0941\nCC-MAIN-2017-09,image/jpg,20449,20256,0.0007\nCC-MAIN-2017-09,image/pjpeg,9557,9486,0.0003\nCC-MAIN-2017-09,image/png,1417865,1415751,0.0460\nCC-MAIN-2017-09,image/svg+xml,3979,3965,0.0001\nCC-MAIN-2017-09,image/tiff,35518,34882,0.0012\nCC-MAIN-2017-09,image/vnd.djvu,8655,8527,0.0003\nCC-MAIN-2017-09,image/webp,8462,8462,0.0003\nCC-MAIN-2017-09,message/rfc822,2987,2958,0.0001\nCC-MAIN-2017-09,text/calendar,373488,360196,0.0121\nCC-MAIN-2017-09,text/css,3096,3072,0.0001\nCC-MAIN-2017-09,text/csv,31109,29304,0.0010\nCC-MAIN-2017-09,text/directory,3735,3548,0.0001\nCC-MAIN-2017-09,text/enriched,7696,7348,0.0002\nCC-MAIN-2017-09,text/html,3054287200,2898686647,99.0248\nCC-MAIN-2017-09,text/javascript,6664,6648,0.0002\nCC-MAIN-2017-09,text/markdown,4,4,0.0000\nCC-MAIN-2017-09,text/pdf,33660,33660,0.0011\nCC-MAIN-2017-09,text/plain,1153471,1135625,0.0374\nCC-MAIN-2017-09,text/prs.lines.tag,16,16,0.0000\nCC-MAI
N-2017-09,text/tab-separated-values,18156,16647,0.0006\nCC-MAIN-2017-09,text/turtle,10132,10127,0.0003\nCC-MAIN-2017-09,text/vcard,3376,2772,0.0001\nCC-MAIN-2017-09,text/x-bibtex,19367,19357,0.0006\nCC-MAIN-2017-09,text/x-c,8521,8494,0.0003\nCC-MAIN-2017-09,text/x-csrc,1359,1304,0.0000\nCC-MAIN-2017-09,text/x-diff,3588,3502,0.0001\nCC-MAIN-2017-09,text/x-patch,4115,3944,0.0001\nCC-MAIN-2017-09,text/x-perl,4131,4116,0.0001\nCC-MAIN-2017-09,text/x-vcalendar,9522,8998,0.0003\nCC-MAIN-2017-09,text/x-vcard,15310,13757,0.0005\nCC-MAIN-2017-09,text/xml,2711265,2647161,0.0879\nCC-MAIN-2017-09,unknown/unknown,96359,80107,0.0031\nCC-MAIN-2017-09,video/mp4,23581,23418,0.0008\nCC-MAIN-2017-09,video/webm,10136,9528,0.0003\nCC-MAIN-2017-09,video/x-ms-asf,204786,204482,0.0066\nCC-MAIN-2017-13,<other>,2531128,2494993,0.0824\nCC-MAIN-2017-13,application/atom+xml,4952509,4951451,0.1613\nCC-MAIN-2017-13,application/calendar,2468,2468,0.0001\nCC-MAIN-2017-13,application/download,35271,34814,0.0011\nCC-MAIN-2017-13,application/epub+zip,31551,31387,0.0010\nCC-MAIN-2017-13,application/force-download,53275,53256,0.0017\nCC-MAIN-2017-13,application/gpx+xml,2972,2972,0.0001\nCC-MAIN-2017-13,application/ics,2219,2219,0.0001\nCC-MAIN-2017-13,application/javascript,8007,8003,0.0003\nCC-MAIN-2017-13,application/json,160899,160553,0.0052\nCC-MAIN-2017-13,application/ld+json,7663,7663,0.0002\nCC-MAIN-2017-13,application/marc,23639,23639,0.0008\nCC-MAIN-2017-13,application/msword,86902,86054,0.0028\nCC-MAIN-2017-13,application/octet-stream,664027,662376,0.0216\nCC-MAIN-2017-13,application/octetstream,6273,6273,0.0002\nCC-MAIN-2017-13,application/pdf,21234794,21169133,0.6915\nCC-MAIN-2017-13,application/pgp-encrypted,576,576,0.0000\nCC-MAIN-2017-13,application/pgp-signature,17884,17876,0.0006\nCC-MAIN-2017-13,application/postscript,40847,40750,0.0013\nCC-MAIN-2017-13,application/rdf+xml,74874,74823,0.0024\nCC-MAIN-2017-13,application/rss+xml,4096726,4085058,0.1334\nCC-MAIN-2017-13,application/rtf,31
73,3159,0.0001\nCC-MAIN-2017-13,application/save-to-disk,71,71,0.0000\nCC-MAIN-2017-13,application/text,14023,13866,0.0005\nCC-MAIN-2017-13,application/unknown,8741,8738,0.0003\nCC-MAIN-2017-13,application/vnd.android.package-archive,9233,9171,0.0003\nCC-MAIN-2017-13,application/vnd.google-earth.kml+xml,57235,57226,0.0019\nCC-MAIN-2017-13,application/vnd.google-earth.kmz,16765,16757,0.0005\nCC-MAIN-2017-13,application/vnd.ms-excel,29139,28987,0.0009\nCC-MAIN-2017-13,application/vnd.ms-powerpoint,26299,26233,0.0009\nCC-MAIN-2017-13,application/vnd.ms-word,2699,2699,0.0001\nCC-MAIN-2017-13,application/vnd.oasis.opendocument.text,7344,7340,0.0002\nCC-MAIN-2017-13,application/vnd.openxmlformats-officedocument.presentationml.presentation,4987,4961,0.0002\nCC-MAIN-2017-13,application/vnd.openxmlformats-officedocument.spreadsheetml.sheet,8671,8645,0.0003\nCC-MAIN-2017-13,application/vnd.openxmlformats-officedocument.wordprocessingml.document,21019,20587,0.0007\nCC-MAIN-2017-13,application/vnd.wap.xhtml+xml,40251,40231,0.0013\nCC-MAIN-2017-13,application/x-bibtex,6684,6684,0.0002\nCC-MAIN-2017-13,application/x-bittorrent,3878,3876,0.0001\nCC-MAIN-2017-13,application/x-debian-package,7925,7907,0.0003\nCC-MAIN-2017-13,application/x-download,17239,17234,0.0006\nCC-MAIN-2017-13,application/x-endnote-refer,19878,19725,0.0006\nCC-MAIN-2017-13,application/x-gzip,11923,11811,0.0004\nCC-MAIN-2017-13,application/x-httpd-php,9460,9415,0.0003\nCC-MAIN-2017-13,application/x-java-jnlp-file,1936,1935,0.0001\nCC-MAIN-2017-13,application/x-javascript,3386,3343,0.0001\nCC-MAIN-2017-13,application/x-json,5,5,0.0000\nCC-MAIN-2017-13,application/x-mobipocket-ebook,6118,6039,0.0002\nCC-MAIN-2017-13,application/x-msdownload,9934,9838,0.0003\nCC-MAIN-2017-13,application/x-netcdf,2183,2181,0.0001\nCC-MAIN-2017-13,application/x-research-info-systems,52688,52103,0.0017\nCC-MAIN-2017-13,application/x-shockwave-flash,20623,20528,0.0007\nCC-MAIN-2017-13,application/x-tar,13013,12976,0.0004\nCC-MAIN-2017
-13,application/x-tex,6191,6189,0.0002\nCC-MAIN-2017-13,application/x-troff-man,3299,3295,0.0001\nCC-MAIN-2017-13,application/x-zip-compressed,13828,13777,0.0005\nCC-MAIN-2017-13,application/xhtml+xml,826122,822095,0.0269\nCC-MAIN-2017-13,application/xml,1342581,1334486,0.0437\nCC-MAIN-2017-13,application/zip,82535,80248,0.0027\nCC-MAIN-2017-13,audio/mpeg,115275,114061,0.0038\nCC-MAIN-2017-13,audio/x-mpegurl,47317,47291,0.0015\nCC-MAIN-2017-13,audio/x-scpls,5891,5831,0.0002\nCC-MAIN-2017-13,audio/x-wav,99157,99156,0.0032\nCC-MAIN-2017-13,binary/octet-stream,12817,12812,0.0004\nCC-MAIN-2017-13,image/gif,126191,125968,0.0041\nCC-MAIN-2017-13,image/jp2,31314,31314,0.0010\nCC-MAIN-2017-13,image/jpeg,3666642,3665276,0.1194\nCC-MAIN-2017-13,image/jpg,25240,25239,0.0008\nCC-MAIN-2017-13,image/pjpeg,8675,8639,0.0003\nCC-MAIN-2017-13,image/png,684633,684146,0.0223\nCC-MAIN-2017-13,image/svg+xml,2715,2714,0.0001\nCC-MAIN-2017-13,image/tiff,28320,28303,0.0009\nCC-MAIN-2017-13,image/vnd.djvu,18677,18660,0.0006\nCC-MAIN-2017-13,image/webp,1205,1205,0.0000\nCC-MAIN-2017-13,message/rfc822,6537,6509,0.0002\nCC-MAIN-2017-13,text/calendar,401881,401737,0.0131\nCC-MAIN-2017-13,text/css,4818,4813,0.0002\nCC-MAIN-2017-13,text/csv,14419,14338,0.0005\nCC-MAIN-2017-13,text/directory,4893,4879,0.0002\nCC-MAIN-2017-13,text/enriched,8092,8089,0.0003\nCC-MAIN-2017-13,text/html,3023852452,2989525620,98.4737\nCC-MAIN-2017-13,text/javascript,6652,6652,0.0002\nCC-MAIN-2017-13,text/markdown,71,71,0.0000\nCC-MAIN-2017-13,text/pdf,32559,32559,0.0011\nCC-MAIN-2017-13,text/plain,1746241,1743631,0.0569\nCC-MAIN-2017-13,text/prs.lines.tag,9425,9425,0.0003\nCC-MAIN-2017-13,text/tab-separated-values,3337,3253,0.0001\nCC-MAIN-2017-13,text/turtle,18184,18183,0.0006\nCC-MAIN-2017-13,text/vcard,5253,5253,0.0002\nCC-MAIN-2017-13,text/x-bibtex,10621,10567,0.0003\nCC-MAIN-2017-13,text/x-c,4261,4250,0.0001\nCC-MAIN-2017-13,text/x-csrc,3267,3265,0.0001\nCC-MAIN-2017-13,text/x-diff,18790,18787,0.0006\nCC-MAIN-2017-1
3,text/x-patch,1372,1370,0.0000\nCC-MAIN-2017-13,text/x-perl,7555,7524,0.0002\nCC-MAIN-2017-13,text/x-vcalendar,10296,10287,0.0003\nCC-MAIN-2017-13,text/x-vcard,25812,25787,0.0008\nCC-MAIN-2017-13,text/xml,2747382,2712387,0.0895\nCC-MAIN-2017-13,unknown/unknown,85009,84049,0.0028\nCC-MAIN-2017-13,video/mp4,25483,25394,0.0008\nCC-MAIN-2017-13,video/webm,10593,10575,0.0003\nCC-MAIN-2017-13,video/x-ms-asf,35669,35610,0.0012\nCC-MAIN-2017-17,<other>,2335712,2303795,0.0794\nCC-MAIN-2017-17,application/atom+xml,7358444,7357498,0.2500\nCC-MAIN-2017-17,application/calendar,2019,2014,0.0001\nCC-MAIN-2017-17,application/download,36186,36173,0.0012\nCC-MAIN-2017-17,application/epub+zip,41019,40990,0.0014\nCC-MAIN-2017-17,application/force-download,67104,67088,0.0023\nCC-MAIN-2017-17,application/gpx+xml,3734,3733,0.0001\nCC-MAIN-2017-17,application/ics,3152,3147,0.0001\nCC-MAIN-2017-17,application/javascript,14099,14095,0.0005\nCC-MAIN-2017-17,application/json,222160,221657,0.0075\nCC-MAIN-2017-17,application/ld+json,23459,23459,0.0008\nCC-MAIN-2017-17,application/marc,17622,17622,0.0006\nCC-MAIN-2017-17,application/msword,160577,160280,0.0055\nCC-MAIN-2017-17,application/octet-stream,870981,869584,0.0296\nCC-MAIN-2017-17,application/octetstream,15275,15273,0.0005\nCC-MAIN-2017-17,application/pdf,22496349,22459634,0.7644\nCC-MAIN-2017-17,application/pgp-encrypted,38097,38097,0.0013\nCC-MAIN-2017-17,application/pgp-signature,24303,24294,0.0008\nCC-MAIN-2017-17,application/postscript,45093,45077,0.0015\nCC-MAIN-2017-17,application/rdf+xml,139506,139485,0.0047\nCC-MAIN-2017-17,application/rss+xml,4560528,4548912,0.1550\nCC-MAIN-2017-17,application/rtf,5631,5627,0.0002\nCC-MAIN-2017-17,application/save-to-disk,3,3,0.0000\nCC-MAIN-2017-17,application/text,13247,13245,0.0005\nCC-MAIN-2017-17,application/unknown,7217,7217,0.0002\nCC-MAIN-2017-17,application/vnd.android.package-archive,9516,9481,0.0003\nCC-MAIN-2017-17,application/vnd.google-earth.kml+xml,170308,169623,0.0058\nCC-MAIN-
2017-17,application/vnd.google-earth.kmz,44885,44876,0.0015\nCC-MAIN-2017-17,application/vnd.ms-excel,63968,63877,0.0022\nCC-MAIN-2017-17,application/vnd.ms-powerpoint,35371,35352,0.0012\nCC-MAIN-2017-17,application/vnd.ms-word,6012,6011,0.0002\nCC-MAIN-2017-17,application/vnd.oasis.opendocument.text,8888,8864,0.0003\nCC-MAIN-2017-17,application/vnd.openxmlformats-officedocument.presentationml.presentation,6016,6000,0.0002\nCC-MAIN-2017-17,application/vnd.openxmlformats-officedocument.spreadsheetml.sheet,23331,23314,0.0008\nCC-MAIN-2017-17,application/vnd.openxmlformats-officedocument.wordprocessingml.document,34507,34322,0.0012\nCC-MAIN-2017-17,application/vnd.wap.xhtml+xml,32225,32210,0.0011\nCC-MAIN-2017-17,application/x-bibtex,21637,21635,0.0007\nCC-MAIN-2017-17,application/x-bittorrent,4069,4068,0.0001\nCC-MAIN-2017-17,application/x-debian-package,11926,11912,0.0004\nCC-MAIN-2017-17,application/x-download,12942,12929,0.0004\nCC-MAIN-2017-17,application/x-endnote-refer,24543,24543,0.0008\nCC-MAIN-2017-17,application/x-gzip,18552,18492,0.0006\nCC-MAIN-2017-17,application/x-httpd-php,17063,16995,0.0006\nCC-MAIN-2017-17,application/x-java-jnlp-file,7128,7127,0.0002\nCC-MAIN-2017-17,application/x-javascript,5047,5032,0.0002\nCC-MAIN-2017-17,application/x-json,2,2,0.0000\nCC-MAIN-2017-17,application/x-mobipocket-ebook,9646,9641,0.0003\nCC-MAIN-2017-17,application/x-msdownload,11592,11510,0.0004\nCC-MAIN-2017-17,application/x-netcdf,11876,11875,0.0004\nCC-MAIN-2017-17,application/x-research-info-systems,59023,59018,0.0020\nCC-MAIN-2017-17,application/x-shockwave-flash,38553,38494,0.0013\nCC-MAIN-2017-17,application/x-tar,11568,11506,0.0004\nCC-MAIN-2017-17,application/x-tex,15042,15041,0.0005\nCC-MAIN-2017-17,application/x-troff-man,13950,13733,0.0005\nCC-MAIN-2017-17,application/x-zip-compressed,23835,23787,0.0008\nCC-MAIN-2017-17,application/xhtml+xml,805613,802132,0.0274\nCC-MAIN-2017-17,application/xml,1538936,1535172,0.0523\nCC-MAIN-2017-17,application/zip,120666
,120404,0.0041\nCC-MAIN-2017-17,audio/mpeg,129977,129671,0.0044\nCC-MAIN-2017-17,audio/x-mpegurl,57112,57099,0.0019\nCC-MAIN-2017-17,audio/x-scpls,6711,6693,0.0002\nCC-MAIN-2017-17,audio/x-wav,75574,75571,0.0026\nCC-MAIN-2017-17,binary/octet-stream,15331,15326,0.0005\nCC-MAIN-2017-17,image/gif,236921,236480,0.0081\nCC-MAIN-2017-17,image/jp2,31419,31419,0.0011\nCC-MAIN-2017-17,image/jpeg,12090543,12087490,0.4108\nCC-MAIN-2017-17,image/jpg,126566,126564,0.0043\nCC-MAIN-2017-17,image/pjpeg,42027,41990,0.0014\nCC-MAIN-2017-17,image/png,2552442,2551739,0.0867\nCC-MAIN-2017-17,image/svg+xml,13604,13604,0.0005\nCC-MAIN-2017-17,image/tiff,26755,26629,0.0009\nCC-MAIN-2017-17,image/vnd.djvu,25524,25387,0.0009\nCC-MAIN-2017-17,image/webp,33687,33686,0.0011\nCC-MAIN-2017-17,message/rfc822,18004,18003,0.0006\nCC-MAIN-2017-17,text/calendar,469885,468872,0.0160\nCC-MAIN-2017-17,text/css,9018,9012,0.0003\nCC-MAIN-2017-17,text/csv,53630,53617,0.0018\nCC-MAIN-2017-17,text/directory,5431,5419,0.0002\nCC-MAIN-2017-17,text/enriched,7613,7613,0.0003\nCC-MAIN-2017-17,text/html,2877825462,2842745969,97.7877\nCC-MAIN-2017-17,text/javascript,7271,7269,0.0002\nCC-MAIN-2017-17,text/markdown,78,78,0.0000\nCC-MAIN-2017-17,text/pdf,26086,26086,0.0009\nCC-MAIN-2017-17,text/plain,3326011,3322968,0.1130\nCC-MAIN-2017-17,text/prs.lines.tag,5365,5365,0.0002\nCC-MAIN-2017-17,text/tab-separated-values,45117,45114,0.0015\nCC-MAIN-2017-17,text/turtle,29826,29825,0.0010\nCC-MAIN-2017-17,text/vcard,4436,4434,0.0002\nCC-MAIN-2017-17,text/x-bibtex,14181,14181,0.0005\nCC-MAIN-2017-17,text/x-c,104539,104228,0.0036\nCC-MAIN-2017-17,text/x-csrc,9416,9414,0.0003\nCC-MAIN-2017-17,text/x-diff,22979,22964,0.0008\nCC-MAIN-2017-17,text/x-patch,94844,94844,0.0032\nCC-MAIN-2017-17,text/x-perl,11763,11735,0.0004\nCC-MAIN-2017-17,text/x-vcalendar,36824,36806,0.0013\nCC-MAIN-2017-17,text/x-vcard,33311,33254,0.0011\nCC-MAIN-2017-17,text/xml,3402754,3372663,0.1156\nCC-MAIN-2017-17,unknown/unknown,82062,78770,0.0028\nCC-MAIN-2
017-17,video/mp4,35341,35289,0.0012\nCC-MAIN-2017-17,video/webm,11273,11271,0.0004\nCC-MAIN-2017-17,video/x-ms-asf,54016,53961,0.0018\nCC-MAIN-2017-22,<other>,1907658,1866513,0.0643\nCC-MAIN-2017-22,application/atom+xml,7511430,7509831,0.2531\nCC-MAIN-2017-22,application/calendar,2185,2179,0.0001\nCC-MAIN-2017-22,application/download,40000,39928,0.0013\nCC-MAIN-2017-22,application/epub+zip,23816,23658,0.0008\nCC-MAIN-2017-22,application/force-download,52647,52613,0.0018\nCC-MAIN-2017-22,application/gpx+xml,1874,1874,0.0001\nCC-MAIN-2017-22,application/ics,1814,1814,0.0001\nCC-MAIN-2017-22,application/javascript,14504,14495,0.0005\nCC-MAIN-2017-22,application/json,133482,133258,0.0045\nCC-MAIN-2017-22,application/ld+json,10865,10863,0.0004\nCC-MAIN-2017-22,application/marc,17095,17095,0.0006\nCC-MAIN-2017-22,application/msword,111014,110054,0.0037\nCC-MAIN-2017-22,application/octet-stream,514472,511792,0.0173\nCC-MAIN-2017-22,application/octetstream,5177,5175,0.0002\nCC-MAIN-2017-22,application/pdf,17764629,17713409,0.5987\nCC-MAIN-2017-22,application/pgp-encrypted,1540,1537,0.0001\nCC-MAIN-2017-22,application/pgp-signature,7550,7547,0.0003\nCC-MAIN-2017-22,application/postscript,27023,27007,0.0009\nCC-MAIN-2017-22,application/rdf+xml,66219,66140,0.0022\nCC-MAIN-2017-22,application/rss+xml,3986231,3963278,0.1343\nCC-MAIN-2017-22,application/rtf,3831,3810,0.0001\nCC-MAIN-2017-22,application/save-to-disk,5193,5193,0.0002\nCC-MAIN-2017-22,application/text,10428,10423,0.0004\nCC-MAIN-2017-22,application/unknown,5859,5856,0.0002\nCC-MAIN-2017-22,application/vnd.android.package-archive,19045,19012,0.0006\nCC-MAIN-2017-22,application/vnd.google-earth.kml+xml,51605,51112,0.0017\nCC-MAIN-2017-22,application/vnd.google-earth.kmz,10609,10597,0.0004\nCC-MAIN-2017-22,application/vnd.ms-excel,24833,24525,0.0008\nCC-MAIN-2017-22,application/vnd.ms-powerpoint,19773,19472,0.0007\nCC-MAIN-2017-22,application/vnd.ms-word,2398,2398,0.0001\nCC-MAIN-2017-22,application/vnd.oasis.opendocum
ent.text,7101,7087,0.0002\nCC-MAIN-2017-22,application/vnd.openxmlformats-officedocument.presentationml.presentation,4068,4059,0.0001\nCC-MAIN-2017-22,application/vnd.openxmlformats-officedocument.spreadsheetml.sheet,8529,8285,0.0003\nCC-MAIN-2017-22,application/vnd.openxmlformats-officedocument.wordprocessingml.document,22161,21859,0.0007\nCC-MAIN-2017-22,application/vnd.wap.xhtml+xml,28172,28142,0.0009\nCC-MAIN-2017-22,application/x-bibtex,6728,6704,0.0002\nCC-MAIN-2017-22,application/x-bittorrent,5173,5069,0.0002\nCC-MAIN-2017-22,application/x-debian-package,3809,3795,0.0001\nCC-MAIN-2017-22,application/x-download,16443,16439,0.0006\nCC-MAIN-2017-22,application/x-endnote-refer,16239,16235,0.0005\nCC-MAIN-2017-22,application/x-gzip,9770,9659,0.0003\nCC-MAIN-2017-22,application/x-httpd-php,9070,9032,0.0003\nCC-MAIN-2017-22,application/x-java-jnlp-file,1890,1885,0.0001\nCC-MAIN-2017-22,application/x-javascript,3006,3000,0.0001\nCC-MAIN-2017-22,application/x-json,1,1,0.0000\nCC-MAIN-2017-22,application/x-mobipocket-ebook,5046,5007,0.0002\nCC-MAIN-2017-22,application/x-msdownload,8725,8654,0.0003\nCC-MAIN-2017-22,application/x-netcdf,1515,1515,0.0001\nCC-MAIN-2017-22,application/x-research-info-systems,46936,46917,0.0016\nCC-MAIN-2017-22,application/x-shockwave-flash,20656,20594,0.0007\nCC-MAIN-2017-22,application/x-tar,7640,7616,0.0003\nCC-MAIN-2017-22,application/x-tex,4864,4854,0.0002\nCC-MAIN-2017-22,application/x-troff-man,3442,3441,0.0001\nCC-MAIN-2017-22,application/x-zip-compressed,11459,11434,0.0004\nCC-MAIN-2017-22,application/xhtml+xml,879917,861070,0.0297\nCC-MAIN-2017-22,application/xml,1355853,1350781,0.0457\nCC-MAIN-2017-22,application/zip,126970,126278,0.0043\nCC-MAIN-2017-22,audio/mpeg,112129,111436,0.0038\nCC-MAIN-2017-22,audio/x-mpegurl,45999,45992,0.0016\nCC-MAIN-2017-22,audio/x-scpls,6981,6942,0.0002\nCC-MAIN-2017-22,audio/x-wav,69420,69420,0.0023\nCC-MAIN-2017-22,binary/octet-stream,9120,8925,0.0003\nCC-MAIN-2017-22,image/gif,131989,131544,0.0044
\nCC-MAIN-2017-22,image/jp2,20536,20536,0.0007\nCC-MAIN-2017-22,image/jpeg,4617602,4614164,0.1556\nCC-MAIN-2017-22,image/jpg,37753,37739,0.0013\nCC-MAIN-2017-22,image/pjpeg,10106,10017,0.0003\nCC-MAIN-2017-22,image/png,1345322,1343617,0.0453\nCC-MAIN-2017-22,image/svg+xml,4278,4268,0.0001\nCC-MAIN-2017-22,image/tiff,34601,34169,0.0012\nCC-MAIN-2017-22,image/vnd.djvu,23536,23475,0.0008\nCC-MAIN-2017-22,image/webp,8189,8160,0.0003\nCC-MAIN-2017-22,message/rfc822,4364,4353,0.0001\nCC-MAIN-2017-22,text/calendar,338837,338283,0.0114\nCC-MAIN-2017-22,text/css,6416,6397,0.0002\nCC-MAIN-2017-22,text/csv,23625,23593,0.0008\nCC-MAIN-2017-22,text/directory,4634,4536,0.0002\nCC-MAIN-2017-22,text/enriched,7041,7028,0.0002\nCC-MAIN-2017-22,text/html,2921073486,2872905079,98.4423\nCC-MAIN-2017-22,text/javascript,6321,6314,0.0002\nCC-MAIN-2017-22,text/markdown,105,105,0.0000\nCC-MAIN-2017-22,text/pdf,21509,21509,0.0007\nCC-MAIN-2017-22,text/plain,1436916,1429801,0.0484\nCC-MAIN-2017-22,text/prs.lines.tag,1449,1449,0.0000\nCC-MAIN-2017-22,text/tab-separated-values,14612,14605,0.0005\nCC-MAIN-2017-22,text/turtle,14368,14366,0.0005\nCC-MAIN-2017-22,text/vcard,2854,2853,0.0001\nCC-MAIN-2017-22,text/x-bibtex,20357,20353,0.0007\nCC-MAIN-2017-22,text/x-c,5338,5198,0.0002\nCC-MAIN-2017-22,text/x-csrc,2047,1985,0.0001\nCC-MAIN-2017-22,text/x-diff,8150,8141,0.0003\nCC-MAIN-2017-22,text/x-patch,4009,3759,0.0001\nCC-MAIN-2017-22,text/x-perl,6346,6274,0.0002\nCC-MAIN-2017-22,text/x-vcalendar,16171,15962,0.0005\nCC-MAIN-2017-22,text/x-vcard,20357,20119,0.0007\nCC-MAIN-2017-22,text/xml,2665303,2645134,0.0898\nCC-MAIN-2017-22,unknown/unknown,88109,81444,0.0030\nCC-MAIN-2017-22,video/mp4,20478,20440,0.0007\nCC-MAIN-2017-22,video/webm,9034,9032,0.0003\nCC-MAIN-2017-22,video/x-ms-asf,23920,23821,0.0008\nCC-MAIN-2017-26,<other>,1716791,1682956,0.0542\nCC-MAIN-2017-26,application/atom+xml,11339720,11338820,0.3583\nCC-MAIN-2017-26,application/calendar,1416,1415,0.0000\nCC-MAIN-2017-26,application/downlo
ad,37682,37680,0.0012\nCC-MAIN-2017-26,application/epub+zip,22469,22418,0.0007\nCC-MAIN-2017-26,application/force-download,62253,62227,0.0020\nCC-MAIN-2017-26,application/gpx+xml,2420,2420,0.0001\nCC-MAIN-2017-26,application/ics,2365,2365,0.0001\nCC-MAIN-2017-26,application/javascript,21645,21635,0.0007\nCC-MAIN-2017-26,application/json,166457,166209,0.0053\nCC-MAIN-2017-26,application/ld+json,21531,21531,0.0007\nCC-MAIN-2017-26,application/marc,16210,16210,0.0005\nCC-MAIN-2017-26,application/msword,82197,81819,0.0026\nCC-MAIN-2017-26,application/octet-stream,572679,571444,0.0181\nCC-MAIN-2017-26,application/octetstream,5340,5333,0.0002\nCC-MAIN-2017-26,application/pdf,22479738,22444624,0.7102\nCC-MAIN-2017-26,application/pgp-encrypted,311,311,0.0000\nCC-MAIN-2017-26,application/pgp-signature,6867,6855,0.0002\nCC-MAIN-2017-26,application/postscript,25369,25349,0.0008\nCC-MAIN-2017-26,application/rdf+xml,82072,82041,0.0026\nCC-MAIN-2017-26,application/rss+xml,4464864,4455368,0.1411\nCC-MAIN-2017-26,application/rtf,4700,4700,0.0001\nCC-MAIN-2017-26,application/save-to-disk,58,58,0.0000\nCC-MAIN-2017-26,application/text,10199,10196,0.0003\nCC-MAIN-2017-26,application/unknown,6392,6389,0.0002\nCC-MAIN-2017-26,application/vnd.android.package-archive,32491,32444,0.0010\nCC-MAIN-2017-26,application/vnd.google-earth.kml+xml,52331,52272,0.0017\nCC-MAIN-2017-26,application/vnd.google-earth.kmz,12888,12884,0.0004\nCC-MAIN-2017-26,application/vnd.ms-excel,22572,22504,0.0007\nCC-MAIN-2017-26,application/vnd.ms-powerpoint,18191,18146,0.0006\nCC-MAIN-2017-26,application/vnd.ms-word,2269,2269,0.0001\nCC-MAIN-2017-26,application/vnd.oasis.opendocument.text,7577,7576,0.0002\nCC-MAIN-2017-26,application/vnd.openxmlformats-officedocument.presentationml.presentation,5274,5270,0.0002\nCC-MAIN-2017-26,application/vnd.openxmlformats-officedocument.spreadsheetml.sheet,9241,9209,0.0003\nCC-MAIN-2017-26,application/vnd.openxmlformats-officedocument.wordprocessingml.document,22786,22670,0.0007
\nCC-MAIN-2017-26,application/vnd.wap.xhtml+xml,29268,29249,0.0009\nCC-MAIN-2017-26,application/x-bibtex,4640,4639,0.0001\nCC-MAIN-2017-26,application/x-bittorrent,4213,4208,0.0001\nCC-MAIN-2017-26,application/x-debian-package,2744,2741,0.0001\nCC-MAIN-2017-26,application/x-download,17492,17489,0.0006\nCC-MAIN-2017-26,application/x-endnote-refer,14003,14002,0.0004\nCC-MAIN-2017-26,application/x-gzip,10907,10809,0.0003\nCC-MAIN-2017-26,application/x-httpd-php,16889,16791,0.0005\nCC-MAIN-2017-26,application/x-java-jnlp-file,2196,2195,0.0001\nCC-MAIN-2017-26,application/x-javascript,4629,4580,0.0001\nCC-MAIN-2017-26,application/x-json,2,2,0.0000\nCC-MAIN-2017-26,application/x-mobipocket-ebook,4363,4360,0.0001\nCC-MAIN-2017-26,application/x-msdownload,8606,8471,0.0003\nCC-MAIN-2017-26,application/x-netcdf,2058,2058,0.0001\nCC-MAIN-2017-26,application/x-research-info-systems,32345,32342,0.0010\nCC-MAIN-2017-26,application/x-shockwave-flash,22769,22707,0.0007\nCC-MAIN-2017-26,application/x-tar,9264,9139,0.0003\nCC-MAIN-2017-26,application/x-tex,1884,1881,0.0001\nCC-MAIN-2017-26,application/x-troff-man,2890,2887,0.0001\nCC-MAIN-2017-26,application/x-zip-compressed,11471,11451,0.0004\nCC-MAIN-2017-26,application/xhtml+xml,757077,753534,0.0239\nCC-MAIN-2017-26,application/xml,1417458,1414517,0.0448\nCC-MAIN-2017-26,application/zip,75395,75006,0.0024\nCC-MAIN-2017-26,audio/mpeg,116324,115642,0.0037\nCC-MAIN-2017-26,audio/x-mpegurl,42356,42333,0.0013\nCC-MAIN-2017-26,audio/x-scpls,7998,7967,0.0003\nCC-MAIN-2017-26,audio/x-wav,69468,69466,0.0022\nCC-MAIN-2017-26,binary/octet-stream,9708,9699,0.0003\nCC-MAIN-2017-26,image/gif,134359,134115,0.0042\nCC-MAIN-2017-26,image/jp2,24148,24148,0.0008\nCC-MAIN-2017-26,image/jpeg,4841559,4839682,0.1530\nCC-MAIN-2017-26,image/jpg,38692,38681,0.0012\nCC-MAIN-2017-26,image/pjpeg,8956,8902,0.0003\nCC-MAIN-2017-26,image/png,873688,873179,0.0276\nCC-MAIN-2017-26,image/svg+xml,3278,3274,0.0001\nCC-MAIN-2017-26,image/tiff,24570,24549,0.0008\nCC-MA
IN-2017-26,image/vnd.djvu,19393,19379,0.0006\nCC-MAIN-2017-26,image/webp,2627,2592,0.0001\nCC-MAIN-2017-26,message/rfc822,4787,4779,0.0002\nCC-MAIN-2017-26,text/calendar,347122,346829,0.0110\nCC-MAIN-2017-26,text/css,9022,9016,0.0003\nCC-MAIN-2017-26,text/csv,14173,14110,0.0004\nCC-MAIN-2017-26,text/directory,5596,5572,0.0002\nCC-MAIN-2017-26,text/enriched,5788,5783,0.0002\nCC-MAIN-2017-26,text/html,3110549133,3079671926,98.2729\nCC-MAIN-2017-26,text/javascript,8194,8192,0.0003\nCC-MAIN-2017-26,text/markdown,171,171,0.0000\nCC-MAIN-2017-26,text/pdf,24708,24708,0.0008\nCC-MAIN-2017-26,text/plain,1048492,1046508,0.0331\nCC-MAIN-2017-26,text/prs.lines.tag,292,292,0.0000\nCC-MAIN-2017-26,text/tab-separated-values,4948,4948,0.0002\nCC-MAIN-2017-26,text/turtle,22367,22366,0.0007\nCC-MAIN-2017-26,text/vcard,4578,4578,0.0001\nCC-MAIN-2017-26,text/x-bibtex,5633,5633,0.0002\nCC-MAIN-2017-26,text/x-c,4144,4129,0.0001\nCC-MAIN-2017-26,text/x-csrc,1786,1786,0.0001\nCC-MAIN-2017-26,text/x-diff,6576,6569,0.0002\nCC-MAIN-2017-26,text/x-patch,844,811,0.0000\nCC-MAIN-2017-26,text/x-perl,4219,4194,0.0001\nCC-MAIN-2017-26,text/x-vcalendar,16143,16142,0.0005\nCC-MAIN-2017-26,text/x-vcard,27572,27535,0.0009\nCC-MAIN-2017-26,text/xml,2991255,2956353,0.0945\nCC-MAIN-2017-26,unknown/unknown,42573,42152,0.0013\nCC-MAIN-2017-26,video/mp4,22777,22753,0.0007\nCC-MAIN-2017-26,video/webm,12104,12101,0.0004\nCC-MAIN-2017-26,video/x-ms-asf,22037,22005,0.0007\nCC-MAIN-2017-30,<other>,3216534,3156321,0.1112\nCC-MAIN-2017-30,application/atom+xml,8715582,8714209,0.3013\nCC-MAIN-2017-30,application/calendar,3090,3090,0.0001\nCC-MAIN-2017-30,application/download,38299,38277,0.0013\nCC-MAIN-2017-30,application/epub+zip,36071,35816,0.0012\nCC-MAIN-2017-30,application/force-download,55163,55053,0.0019\nCC-MAIN-2017-30,application/gpx+xml,2949,2949,0.0001\nCC-MAIN-2017-30,application/ics,2771,2771,0.0001\nCC-MAIN-2017-30,application/javascript,27978,27918,0.0010\nCC-MAIN-2017-30,application/json,287970,28779
3,0.0100\nCC-MAIN-2017-30,application/ld+json,8219,8219,0.0003\nCC-MAIN-2017-30,application/marc,12089,12089,0.0004\nCC-MAIN-2017-30,application/msword,178000,176484,0.0062\nCC-MAIN-2017-30,application/octet-stream,1278672,1277145,0.0442\nCC-MAIN-2017-30,application/octetstream,21113,21112,0.0007\nCC-MAIN-2017-30,application/pdf,21585409,21522638,0.7463\nCC-MAIN-2017-30,application/pgp-encrypted,69540,69536,0.0024\nCC-MAIN-2017-30,application/pgp-signature,21728,21724,0.0008\nCC-MAIN-2017-30,application/postscript,31861,31825,0.0011\nCC-MAIN-2017-30,application/rdf+xml,82728,82702,0.0029\nCC-MAIN-2017-30,application/rss+xml,3984902,3953217,0.1378\nCC-MAIN-2017-30,application/rtf,6052,6046,0.0002\nCC-MAIN-2017-30,application/save-to-disk,4,4,0.0000\nCC-MAIN-2017-30,application/text,18194,18192,0.0006\nCC-MAIN-2017-30,application/unknown,7109,7109,0.0002\nCC-MAIN-2017-30,application/vnd.android.package-archive,17439,17271,0.0006\nCC-MAIN-2017-30,application/vnd.google-earth.kml+xml,179857,179064,0.0062\nCC-MAIN-2017-30,application/vnd.google-earth.kmz,42060,42056,0.0015\nCC-MAIN-2017-30,application/vnd.ms-excel,57930,56913,0.0020\nCC-MAIN-2017-30,application/vnd.ms-powerpoint,25781,25708,0.0009\nCC-MAIN-2017-30,application/vnd.ms-word,12137,11387,0.0004\nCC-MAIN-2017-30,application/vnd.oasis.opendocument.text,9906,9894,0.0003\nCC-MAIN-2017-30,application/vnd.openxmlformats-officedocument.presentationml.presentation,5765,5727,0.0002\nCC-MAIN-2017-30,application/vnd.openxmlformats-officedocument.spreadsheetml.sheet,23365,23307,0.0008\nCC-MAIN-2017-30,application/vnd.openxmlformats-officedocument.wordprocessingml.document,40347,39662,0.0014\nCC-MAIN-2017-30,application/vnd.wap.xhtml+xml,19832,19761,0.0007\nCC-MAIN-2017-30,application/x-bibtex,21413,21369,0.0007\nCC-MAIN-2017-30,application/x-bittorrent,3964,3958,0.0001\nCC-MAIN-2017-30,application/x-debian-package,20949,20934,0.0007\nCC-MAIN-2017-30,application/x-download,17243,17232,0.0006\nCC-MAIN-2017-30,application/x
-endnote-refer,30605,30593,0.0011\nCC-MAIN-2017-30,application/x-gzip,16872,16765,0.0006\nCC-MAIN-2017-30,application/x-httpd-php,53272,53214,0.0018\nCC-MAIN-2017-30,application/x-java-jnlp-file,9743,9742,0.0003\nCC-MAIN-2017-30,application/x-javascript,20713,20710,0.0007\nCC-MAIN-2017-30,application/x-json,2,2,0.0000\nCC-MAIN-2017-30,application/x-mobipocket-ebook,8166,8011,0.0003\nCC-MAIN-2017-30,application/x-msdownload,12062,11861,0.0004\nCC-MAIN-2017-30,application/x-netcdf,18593,18593,0.0006\nCC-MAIN-2017-30,application/x-research-info-systems,53513,53483,0.0019\nCC-MAIN-2017-30,application/x-shockwave-flash,44851,44744,0.0016\nCC-MAIN-2017-30,application/x-tar,9329,9286,0.0003\nCC-MAIN-2017-30,application/x-tex,15821,15819,0.0005\nCC-MAIN-2017-30,application/x-troff-man,24060,24044,0.0008\nCC-MAIN-2017-30,application/x-zip-compressed,22817,22784,0.0008\nCC-MAIN-2017-30,application/xhtml+xml,639071,623784,0.0221\nCC-MAIN-2017-30,application/xml,1363657,1361206,0.0471\nCC-MAIN-2017-30,application/zip,116498,116243,0.0040\nCC-MAIN-2017-30,audio/mpeg,117061,116706,0.0040\nCC-MAIN-2017-30,audio/x-mpegurl,62254,61897,0.0022\nCC-MAIN-2017-30,audio/x-scpls,59946,59934,0.0021\nCC-MAIN-2017-30,audio/x-wav,51871,51871,0.0018\nCC-MAIN-2017-30,binary/octet-stream,14433,14433,0.0005\nCC-MAIN-2017-30,image/gif,1016303,1013346,0.0351\nCC-MAIN-2017-30,image/jp2,19484,19484,0.0007\nCC-MAIN-2017-30,image/jpeg,12998747,12986010,0.4494\nCC-MAIN-2017-30,image/jpg,171899,171898,0.0059\nCC-MAIN-2017-30,image/pjpeg,48176,48142,0.0017\nCC-MAIN-2017-30,image/png,3113364,3111967,0.1076\nCC-MAIN-2017-30,image/svg+xml,14783,14779,0.0005\nCC-MAIN-2017-30,image/tiff,23618,23575,0.0008\nCC-MAIN-2017-30,image/vnd.djvu,22333,22291,0.0008\nCC-MAIN-2017-30,image/webp,33620,33611,0.0012\nCC-MAIN-2017-30,message/rfc822,18460,18452,0.0006\nCC-MAIN-2017-30,text/calendar,505996,504306,0.0175\nCC-MAIN-2017-30,text/css,31587,31547,0.0011\nCC-MAIN-2017-30,text/csv,63781,63455,0.0022\nCC-MAIN-2017-30,tex
t/directory,4766,4761,0.0002\nCC-MAIN-2017-30,text/enriched,7809,7804,0.0003\nCC-MAIN-2017-30,text/html,2823340738,2776712554,97.6187\nCC-MAIN-2017-30,text/javascript,35048,35043,0.0012\nCC-MAIN-2017-30,text/markdown,122,122,0.0000\nCC-MAIN-2017-30,text/pdf,15774,15774,0.0005\nCC-MAIN-2017-30,text/plain,3867867,3863723,0.1337\nCC-MAIN-2017-30,text/prs.lines.tag,5226,5226,0.0002\nCC-MAIN-2017-30,text/tab-separated-values,51335,51331,0.0018\nCC-MAIN-2017-30,text/turtle,14961,14961,0.0005\nCC-MAIN-2017-30,text/vcard,4050,4049,0.0001\nCC-MAIN-2017-30,text/x-bibtex,10174,10164,0.0004\nCC-MAIN-2017-30,text/x-c,182525,182045,0.0063\nCC-MAIN-2017-30,text/x-csrc,20231,20231,0.0007\nCC-MAIN-2017-30,text/x-diff,21176,21159,0.0007\nCC-MAIN-2017-30,text/x-patch,103261,103261,0.0036\nCC-MAIN-2017-30,text/x-perl,22479,22402,0.0008\nCC-MAIN-2017-30,text/x-vcalendar,24992,24822,0.0009\nCC-MAIN-2017-30,text/x-vcard,31914,31843,0.0011\nCC-MAIN-2017-30,text/xml,3278250,3258647,0.1133\nCC-MAIN-2017-30,unknown/unknown,45850,45268,0.0016\nCC-MAIN-2017-30,video/mp4,30506,30475,0.0011\nCC-MAIN-2017-30,video/webm,7882,7865,0.0003\nCC-MAIN-2017-30,video/x-ms-asf,49340,49295,0.0017\nCC-MAIN-2017-34,<other>,2069244,2048684,0.0631\nCC-MAIN-2017-34,application/atom+xml,12042549,12041850,0.3671\nCC-MAIN-2017-34,application/calendar,1361,1361,0.0000\nCC-MAIN-2017-34,application/download,28688,28683,0.0009\nCC-MAIN-2017-34,application/epub+zip,32637,32416,0.0010\nCC-MAIN-2017-34,application/force-download,50518,50506,0.0015\nCC-MAIN-2017-34,application/gpx+xml,1777,1777,0.0001\nCC-MAIN-2017-34,application/ics,2289,2289,0.0001\nCC-MAIN-2017-34,application/javascript,24286,24267,0.0007\nCC-MAIN-2017-34,application/json,149864,149793,0.0046\nCC-MAIN-2017-34,application/ld+json,10214,10213,0.0003\nCC-MAIN-2017-34,application/marc,16144,16144,0.0005\nCC-MAIN-2017-34,application/msword,88900,88595,0.0027\nCC-MAIN-2017-34,application/octet-stream,455377,454829,0.0139\nCC-MAIN-2017-34,application/octetstrea
m,4557,4557,0.0001\nCC-MAIN-2017-34,application/pdf,18225203,18202615,0.5556\nCC-MAIN-2017-34,application/pgp-encrypted,641,641,0.0000\nCC-MAIN-2017-34,application/pgp-signature,4607,4366,0.0001\nCC-MAIN-2017-34,application/postscript,13762,13762,0.0004\nCC-MAIN-2017-34,application/rdf+xml,70719,70707,0.0022\nCC-MAIN-2017-34,application/rss+xml,4023461,4018943,0.1227\nCC-MAIN-2017-34,application/rtf,4810,4806,0.0001\nCC-MAIN-2017-34,application/text,2966,2966,0.0001\nCC-MAIN-2017-34,application/unknown,7427,7426,0.0002\nCC-MAIN-2017-34,application/vnd.android.package-archive,59932,59839,0.0018\nCC-MAIN-2017-34,application/vnd.google-earth.kml+xml,48708,48705,0.0015\nCC-MAIN-2017-34,application/vnd.google-earth.kmz,9639,9636,0.0003\nCC-MAIN-2017-34,application/vnd.ms-excel,25109,24188,0.0008\nCC-MAIN-2017-34,application/vnd.ms-powerpoint,18114,18107,0.0006\nCC-MAIN-2017-34,application/vnd.ms-word,2407,2405,0.0001\nCC-MAIN-2017-34,application/vnd.oasis.opendocument.text,5956,5955,0.0002\nCC-MAIN-2017-34,application/vnd.openxmlformats-officedocument.presentationml.presentation,4890,4879,0.0001\nCC-MAIN-2017-34,application/vnd.openxmlformats-officedocument.spreadsheetml.sheet,10655,10627,0.0003\nCC-MAIN-2017-34,application/vnd.openxmlformats-officedocument.wordprocessingml.document,23799,23672,0.0007\nCC-MAIN-2017-34,application/vnd.wap.xhtml+xml,29641,29624,0.0009\nCC-MAIN-2017-34,application/x-bibtex,3180,3168,0.0001\nCC-MAIN-2017-34,application/x-bittorrent,5220,5071,0.0002\nCC-MAIN-2017-34,application/x-debian-package,2803,2782,0.0001\nCC-MAIN-2017-34,application/x-download,17424,17393,0.0005\nCC-MAIN-2017-34,application/x-endnote-refer,4078,4067,0.0001\nCC-MAIN-2017-34,application/x-gzip,10259,10195,0.0003\nCC-MAIN-2017-34,application/x-httpd-php,10684,10641,0.0003\nCC-MAIN-2017-34,application/x-java-jnlp-file,1209,1209,0.0000\nCC-MAIN-2017-34,application/x-javascript,4315,4307,0.0001\nCC-MAIN-2017-34,application/x-json,1,1,0.0000\nCC-MAIN-2017-34,application/x-mob
ipocket-ebook,4222,4221,0.0001\nCC-MAIN-2017-34,application/x-msdownload,7678,7609,0.0002\nCC-MAIN-2017-34,application/x-netcdf,1116,1116,0.0000\nCC-MAIN-2017-34,application/x-research-info-systems,26114,26094,0.0008\nCC-MAIN-2017-34,application/x-shockwave-flash,15891,15793,0.0005\nCC-MAIN-2017-34,application/x-tar,7895,7873,0.0002\nCC-MAIN-2017-34,application/x-tex,1240,1239,0.0000\nCC-MAIN-2017-34,application/x-troff-man,2265,2265,0.0001\nCC-MAIN-2017-34,application/x-zip-compressed,8410,8400,0.0003\nCC-MAIN-2017-34,application/xhtml+xml,647091,640877,0.0197\nCC-MAIN-2017-34,application/xml,935779,933997,0.0285\nCC-MAIN-2017-34,application/zip,72982,72568,0.0022\nCC-MAIN-2017-34,audio/mpeg,112908,112585,0.0034\nCC-MAIN-2017-34,audio/x-mpegurl,31319,31299,0.0010\nCC-MAIN-2017-34,audio/x-scpls,5502,5439,0.0002\nCC-MAIN-2017-34,audio/x-wav,58687,58686,0.0018\nCC-MAIN-2017-34,binary/octet-stream,9866,9856,0.0003\nCC-MAIN-2017-34,image/gif,155084,154860,0.0047\nCC-MAIN-2017-34,image/jp2,30044,30044,0.0009\nCC-MAIN-2017-34,image/jpeg,5034113,5031185,0.1535\nCC-MAIN-2017-34,image/jpg,37735,37735,0.0012\nCC-MAIN-2017-34,image/pjpeg,11527,11521,0.0004\nCC-MAIN-2017-34,image/png,1026862,1025892,0.0313\nCC-MAIN-2017-34,image/svg+xml,3192,3175,0.0001\nCC-MAIN-2017-34,image/tiff,14841,14829,0.0005\nCC-MAIN-2017-34,image/vnd.djvu,15670,15635,0.0005\nCC-MAIN-2017-34,image/webp,3170,2694,0.0001\nCC-MAIN-2017-34,message/rfc822,3747,3746,0.0001\nCC-MAIN-2017-34,text/calendar,353128,352972,0.0108\nCC-MAIN-2017-34,text/css,10319,10286,0.0003\nCC-MAIN-2017-34,text/csv,8535,8469,0.0003\nCC-MAIN-2017-34,text/directory,4972,4971,0.0002\nCC-MAIN-2017-34,text/enriched,1386,1386,0.0000\nCC-MAIN-2017-34,text/html,3230122511,3206946818,98.4769\nCC-MAIN-2017-34,text/javascript,7179,7178,0.0002\nCC-MAIN-2017-34,text/markdown,165,165,0.0000\nCC-MAIN-2017-34,text/pdf,22043,22042,0.0007\nCC-MAIN-2017-34,text/plain,755739,754976,0.0230\nCC-MAIN-2017-34,text/prs.lines.tag,392,392,0.0000\nCC-MAIN-20
17-34,text/tab-separated-values,2687,2687,0.0001\nCC-MAIN-2017-34,text/turtle,10323,10323,0.0003\nCC-MAIN-2017-34,text/vcard,3308,3285,0.0001\nCC-MAIN-2017-34,text/x-bibtex,2428,2424,0.0001\nCC-MAIN-2017-34,text/x-c,4459,4455,0.0001\nCC-MAIN-2017-34,text/x-csrc,1230,1230,0.0000\nCC-MAIN-2017-34,text/x-diff,1772,1770,0.0001\nCC-MAIN-2017-34,text/x-patch,1164,1163,0.0000\nCC-MAIN-2017-34,text/x-perl,4806,4787,0.0001\nCC-MAIN-2017-34,text/x-vcalendar,11722,11722,0.0004\nCC-MAIN-2017-34,text/x-vcard,20666,20652,0.0006\nCC-MAIN-2017-34,text/xml,2711335,2697142,0.0827\nCC-MAIN-2017-34,unknown/unknown,56565,52510,0.0017\nCC-MAIN-2017-34,video/mp4,21225,21197,0.0006\nCC-MAIN-2017-34,video/webm,10710,10705,0.0003\nCC-MAIN-2017-34,video/x-ms-asf,15167,15083,0.0005\nCC-MAIN-2017-39,<other>,2325120,2239408,0.0771\nCC-MAIN-2017-39,application/atom+xml,6834366,6833470,0.2265\nCC-MAIN-2017-39,application/calendar,4245,4244,0.0001\nCC-MAIN-2017-39,application/download,64044,63966,0.0021\nCC-MAIN-2017-39,application/epub+zip,20744,20109,0.0007\nCC-MAIN-2017-39,application/force-download,98591,98528,0.0033\nCC-MAIN-2017-39,application/gpx+xml,2425,2425,0.0001\nCC-MAIN-2017-39,application/ics,2246,2246,0.0001\nCC-MAIN-2017-39,application/javascript,16709,16691,0.0006\nCC-MAIN-2017-39,application/json,180757,180476,0.0060\nCC-MAIN-2017-39,application/ld+json,11640,11640,0.0004\nCC-MAIN-2017-39,application/marc,13124,13120,0.0004\nCC-MAIN-2017-39,application/msword,146750,146062,0.0049\nCC-MAIN-2017-39,application/octet-stream,806309,804371,0.0267\nCC-MAIN-2017-39,application/octetstream,7541,7514,0.0002\nCC-MAIN-2017-39,application/pdf,24824876,24759274,0.8228\nCC-MAIN-2017-39,application/pgp-encrypted,877,877,0.0000\nCC-MAIN-2017-39,application/pgp-signature,17206,17201,0.0006\nCC-MAIN-2017-39,application/postscript,49371,49265,0.0016\nCC-MAIN-2017-39,application/rdf+xml,61518,61449,0.0020\nCC-MAIN-2017-39,application/rss+xml,3251717,3239723,0.1078\nCC-MAIN-2017-39,application/rtf,833
6,8320,0.0003\nCC-MAIN-2017-39,application/save-to-disk,2469,2469,0.0001\nCC-MAIN-2017-39,application/text,17416,17403,0.0006\nCC-MAIN-2017-39,application/unknown,9593,9593,0.0003\nCC-MAIN-2017-39,application/vnd.android.package-archive,34455,34342,0.0011\nCC-MAIN-2017-39,application/vnd.google-earth.kml+xml,91654,91501,0.0030\nCC-MAIN-2017-39,application/vnd.google-earth.kmz,13058,13047,0.0004\nCC-MAIN-2017-39,application/vnd.ms-excel,32799,32522,0.0011\nCC-MAIN-2017-39,application/vnd.ms-powerpoint,20480,20434,0.0007\nCC-MAIN-2017-39,application/vnd.ms-word,3369,3368,0.0001\nCC-MAIN-2017-39,application/vnd.oasis.opendocument.text,14066,14058,0.0005\nCC-MAIN-2017-39,application/vnd.openxmlformats-officedocument.presentationml.presentation,7838,7810,0.0003\nCC-MAIN-2017-39,application/vnd.openxmlformats-officedocument.spreadsheetml.sheet,13316,13130,0.0004\nCC-MAIN-2017-39,application/vnd.openxmlformats-officedocument.wordprocessingml.document,43876,43579,0.0015\nCC-MAIN-2017-39,application/vnd.wap.xhtml+xml,20375,20321,0.0007\nCC-MAIN-2017-39,application/x-bibtex,10750,10742,0.0004\nCC-MAIN-2017-39,application/x-bittorrent,7427,7423,0.0002\nCC-MAIN-2017-39,application/x-debian-package,688,659,0.0000\nCC-MAIN-2017-39,application/x-download,23861,23789,0.0008\nCC-MAIN-2017-39,application/x-endnote-refer,22829,22810,0.0008\nCC-MAIN-2017-39,application/x-gzip,14247,14185,0.0005\nCC-MAIN-2017-39,application/x-httpd-php,20138,20068,0.0007\nCC-MAIN-2017-39,application/x-java-jnlp-file,2107,2101,0.0001\nCC-MAIN-2017-39,application/x-javascript,3736,3728,0.0001\nCC-MAIN-2017-39,application/x-json,3,3,0.0000\nCC-MAIN-2017-39,application/x-mobipocket-ebook,4082,4072,0.0001\nCC-MAIN-2017-39,application/x-msdownload,8472,8364,0.0003\nCC-MAIN-2017-39,application/x-netcdf,4161,4161,0.0001\nCC-MAIN-2017-39,application/x-research-info-systems,56874,56864,0.0019\nCC-MAIN-2017-39,application/x-shockwave-flash,48611,48558,0.0016\nCC-MAIN-2017-39,application/x-tar,9909,9871,0.0003\nCC-
MAIN-2017-39,application/x-tex,9502,9467,0.0003\nCC-MAIN-2017-39,application/x-troff-man,7673,7670,0.0003\nCC-MAIN-2017-39,application/x-zip-compressed,11326,11267,0.0004\nCC-MAIN-2017-39,application/xhtml+xml,874417,865981,0.0290\nCC-MAIN-2017-39,application/xml,981892,979038,0.0325\nCC-MAIN-2017-39,application/zip,111483,110795,0.0037\nCC-MAIN-2017-39,audio/mpeg,108815,108263,0.0036\nCC-MAIN-2017-39,audio/x-mpegurl,47877,47814,0.0016\nCC-MAIN-2017-39,audio/x-scpls,5845,5826,0.0002\nCC-MAIN-2017-39,audio/x-wav,48495,48494,0.0016\nCC-MAIN-2017-39,binary/octet-stream,6356,6267,0.0002\nCC-MAIN-2017-39,image/gif,170708,169946,0.0057\nCC-MAIN-2017-39,image/jp2,4098,4098,0.0001\nCC-MAIN-2017-39,image/jpeg,5299640,5296599,0.1756\nCC-MAIN-2017-39,image/jpg,71673,71641,0.0024\nCC-MAIN-2017-39,image/pjpeg,19500,19489,0.0006\nCC-MAIN-2017-39,image/png,943608,942263,0.0313\nCC-MAIN-2017-39,image/svg+xml,4747,4688,0.0002\nCC-MAIN-2017-39,image/tiff,19490,19393,0.0006\nCC-MAIN-2017-39,image/vnd.djvu,24004,23909,0.0008\nCC-MAIN-2017-39,image/webp,6970,6830,0.0002\nCC-MAIN-2017-39,message/rfc822,5613,5596,0.0002\nCC-MAIN-2017-39,text/calendar,381556,381178,0.0126\nCC-MAIN-2017-39,text/css,7072,7070,0.0002\nCC-MAIN-2017-39,text/csv,16697,16642,0.0006\nCC-MAIN-2017-39,text/directory,6284,6266,0.0002\nCC-MAIN-2017-39,text/enriched,6573,6558,0.0002\nCC-MAIN-2017-39,text/html,2964333217,2929094025,98.2485\nCC-MAIN-2017-39,text/javascript,10680,10675,0.0004\nCC-MAIN-2017-39,text/markdown,353,351,0.0000\nCC-MAIN-2017-39,text/pdf,17767,17752,0.0006\nCC-MAIN-2017-39,text/plain,1375457,1372461,0.0456\nCC-MAIN-2017-39,text/prs.lines.tag,1413,1413,0.0000\nCC-MAIN-2017-39,text/tab-separated-values,8393,8393,0.0003\nCC-MAIN-2017-39,text/turtle,12952,12941,0.0004\nCC-MAIN-2017-39,text/vcard,5522,5520,0.0002\nCC-MAIN-2017-39,text/x-bibtex,19554,19479,0.0006\nCC-MAIN-2017-39,text/x-c,5852,5805,0.0002\nCC-MAIN-2017-39,text/x-csrc,3456,3446,0.0001\nCC-MAIN-2017-39,text/x-diff,8155,8154,0.0003\nCC-MA
IN-2017-39,text/x-patch,1741,1652,0.0001\nCC-MAIN-2017-39,text/x-perl,9762,9723,0.0003\nCC-MAIN-2017-39,text/x-vcalendar,15965,15896,0.0005\nCC-MAIN-2017-39,text/x-vcard,29057,28929,0.0010\nCC-MAIN-2017-39,text/xml,2700462,2693112,0.0895\nCC-MAIN-2017-39,unknown/unknown,49034,48560,0.0016\nCC-MAIN-2017-39,video/mp4,22414,22299,0.0007\nCC-MAIN-2017-39,video/webm,17643,17625,0.0006\nCC-MAIN-2017-39,video/x-ms-asf,18629,18521,0.0006\nCC-MAIN-2017-43,<other>,2381707,2286577,0.0652\nCC-MAIN-2017-43,application/atom+xml,7250118,7249363,0.1986\nCC-MAIN-2017-43,application/calendar,2164,2161,0.0001\nCC-MAIN-2017-43,application/download,38504,38484,0.0011\nCC-MAIN-2017-43,application/epub+zip,27939,27696,0.0008\nCC-MAIN-2017-43,application/force-download,75165,75143,0.0021\nCC-MAIN-2017-43,application/gpx+xml,2094,2094,0.0001\nCC-MAIN-2017-43,application/ics,2914,2914,0.0001\nCC-MAIN-2017-43,application/javascript,13477,13472,0.0004\nCC-MAIN-2017-43,application/json,191350,191121,0.0052\nCC-MAIN-2017-43,application/ld+json,13677,13677,0.0004\nCC-MAIN-2017-43,application/marc,16445,16445,0.0005\nCC-MAIN-2017-43,application/msword,95330,94813,0.0026\nCC-MAIN-2017-43,application/octet-stream,614569,613055,0.0168\nCC-MAIN-2017-43,application/octetstream,5106,5099,0.0001\nCC-MAIN-2017-43,application/pdf,16430181,16388691,0.4501\nCC-MAIN-2017-43,application/pgp-encrypted,1138,1132,0.0000\nCC-MAIN-2017-43,application/pgp-signature,5962,5947,0.0002\nCC-MAIN-2017-43,application/postscript,17640,17629,0.0005\nCC-MAIN-2017-43,application/rdf+xml,63244,63209,0.0017\nCC-MAIN-2017-43,application/rss+xml,3601487,3591140,0.0987\nCC-MAIN-2017-43,application/rtf,9540,9538,0.0003\nCC-MAIN-2017-43,application/save-to-disk,1870,1870,0.0001\nCC-MAIN-2017-43,application/text,8230,8229,0.0002\nCC-MAIN-2017-43,application/unknown,6231,6231,0.0002\nCC-MAIN-2017-43,application/vnd.android.package-archive,32089,31997,0.0009\nCC-MAIN-2017-43,application/vnd.google-earth.kml+xml,72219,71744,0.0020\nCC-MA
IN-2017-43,application/vnd.google-earth.kmz,7927,7923,0.0002\nCC-MAIN-2017-43,application/vnd.ms-excel,29773,29679,0.0008\nCC-MAIN-2017-43,application/vnd.ms-powerpoint,17456,17419,0.0005\nCC-MAIN-2017-43,application/vnd.ms-word,2682,2678,0.0001\nCC-MAIN-2017-43,application/vnd.oasis.opendocument.text,6623,6617,0.0002\nCC-MAIN-2017-43,application/vnd.openxmlformats-officedocument.presentationml.presentation,4646,4628,0.0001\nCC-MAIN-2017-43,application/vnd.openxmlformats-officedocument.spreadsheetml.sheet,15356,15295,0.0004\nCC-MAIN-2017-43,application/vnd.openxmlformats-officedocument.wordprocessingml.document,27497,27303,0.0008\nCC-MAIN-2017-43,application/vnd.wap.xhtml+xml,30896,30852,0.0008\nCC-MAIN-2017-43,application/x-bibtex,8670,8648,0.0002\nCC-MAIN-2017-43,application/x-bittorrent,5509,5354,0.0002\nCC-MAIN-2017-43,application/x-debian-package,585,560,0.0000\nCC-MAIN-2017-43,application/x-download,22728,22698,0.0006\nCC-MAIN-2017-43,application/x-endnote-refer,14605,14582,0.0004\nCC-MAIN-2017-43,application/x-gzip,10239,10166,0.0003\nCC-MAIN-2017-43,application/x-httpd-php,11557,11529,0.0003\nCC-MAIN-2017-43,application/x-java-jnlp-file,1362,1361,0.0000\nCC-MAIN-2017-43,application/x-javascript,5386,5354,0.0001\nCC-MAIN-2017-43,application/x-json,15,15,0.0000\nCC-MAIN-2017-43,application/x-mobipocket-ebook,3100,3092,0.0001\nCC-MAIN-2017-43,application/x-msdownload,8553,8493,0.0002\nCC-MAIN-2017-43,application/x-netcdf,838,838,0.0000\nCC-MAIN-2017-43,application/x-research-info-systems,53807,53785,0.0015\nCC-MAIN-2017-43,application/x-shockwave-flash,34024,33964,0.0009\nCC-MAIN-2017-43,application/x-tar,4128,4105,0.0001\nCC-MAIN-2017-43,application/x-tex,2719,2714,0.0001\nCC-MAIN-2017-43,application/x-troff-man,2284,2269,0.0001\nCC-MAIN-2017-43,application/x-zip-compressed,8762,8686,0.0002\nCC-MAIN-2017-43,application/xhtml+xml,1044138,1033282,0.0286\nCC-MAIN-2017-43,application/xml,1037824,1035598,0.0284\nCC-MAIN-2017-43,application/zip,87426,87139,0.0024\nC
C-MAIN-2017-43,audio/mpeg,104166,103648,0.0029\nCC-MAIN-2017-43,audio/x-mpegurl,39067,39047,0.0011\nCC-MAIN-2017-43,audio/x-scpls,6034,6000,0.0002\nCC-MAIN-2017-43,audio/x-wav,63192,63190,0.0017\nCC-MAIN-2017-43,binary/octet-stream,9138,9074,0.0003\nCC-MAIN-2017-43,image/gif,1352722,1350555,0.0371\nCC-MAIN-2017-43,image/jp2,2785,2785,0.0001\nCC-MAIN-2017-43,image/jpeg,93354344,91656676,2.5574\nCC-MAIN-2017-43,image/jpg,204533,204497,0.0056\nCC-MAIN-2017-43,image/pjpeg,19478,19432,0.0005\nCC-MAIN-2017-43,image/png,11207898,11190799,0.3070\nCC-MAIN-2017-43,image/svg+xml,83876,83659,0.0023\nCC-MAIN-2017-43,image/tiff,30228,30218,0.0008\nCC-MAIN-2017-43,image/vnd.djvu,7006,6970,0.0002\nCC-MAIN-2017-43,image/webp,7454,7329,0.0002\nCC-MAIN-2017-43,message/rfc822,4444,4438,0.0001\nCC-MAIN-2017-43,text/calendar,427655,427359,0.0117\nCC-MAIN-2017-43,text/css,6651,6580,0.0002\nCC-MAIN-2017-43,text/csv,16611,16603,0.0005\nCC-MAIN-2017-43,text/directory,5316,5313,0.0001\nCC-MAIN-2017-43,text/enriched,3180,3180,0.0001\nCC-MAIN-2017-43,text/html,3505651351,3469828773,96.0339\nCC-MAIN-2017-43,text/javascript,8714,8706,0.0002\nCC-MAIN-2017-43,text/markdown,242,242,0.0000\nCC-MAIN-2017-43,text/pdf,22117,22117,0.0006\nCC-MAIN-2017-43,text/plain,1106158,1102467,0.0303\nCC-MAIN-2017-43,text/prs.lines.tag,441,441,0.0000\nCC-MAIN-2017-43,text/tab-separated-values,9393,9393,0.0003\nCC-MAIN-2017-43,text/turtle,15115,15096,0.0004\nCC-MAIN-2017-43,text/vcard,3427,3423,0.0001\nCC-MAIN-2017-43,text/x-bibtex,17443,17423,0.0005\nCC-MAIN-2017-43,text/x-c,145421,145357,0.0040\nCC-MAIN-2017-43,text/x-csrc,1418,1393,0.0000\nCC-MAIN-2017-43,text/x-diff,7578,7573,0.0002\nCC-MAIN-2017-43,text/x-patch,2253,2181,0.0001\nCC-MAIN-2017-43,text/x-perl,28426,28347,0.0008\nCC-MAIN-2017-43,text/x-vcalendar,17148,17001,0.0005\nCC-MAIN-2017-43,text/x-vcard,20176,20051,0.0006\nCC-MAIN-2017-43,text/xml,2803364,2796161,0.0768\nCC-MAIN-2017-43,unknown/unknown,61054,59395,0.0017\nCC-MAIN-2017-43,video/mp4,16132,16063,
0.0004\nCC-MAIN-2017-43,video/webm,7798,7796,0.0002\nCC-MAIN-2017-43,video/x-ms-asf,37766,37747,0.0010\nCC-MAIN-2017-47,<other>,2045261,1978820,0.0638\nCC-MAIN-2017-47,application/atom+xml,6240146,6239407,0.1947\nCC-MAIN-2017-47,application/calendar,3942,3931,0.0001\nCC-MAIN-2017-47,application/download,67111,67104,0.0021\nCC-MAIN-2017-47,application/epub+zip,21466,21214,0.0007\nCC-MAIN-2017-47,application/force-download,108131,108109,0.0034\nCC-MAIN-2017-47,application/gpx+xml,1701,1701,0.0001\nCC-MAIN-2017-47,application/ics,2903,2903,0.0001\nCC-MAIN-2017-47,application/javascript,6927,6918,0.0002\nCC-MAIN-2017-47,application/json,190218,190077,0.0059\nCC-MAIN-2017-47,application/ld+json,24035,24035,0.0007\nCC-MAIN-2017-47,application/marc,13221,13221,0.0004\nCC-MAIN-2017-47,application/msword,125240,124778,0.0039\nCC-MAIN-2017-47,application/octet-stream,712940,712108,0.0222\nCC-MAIN-2017-47,application/octetstream,6048,6047,0.0002\nCC-MAIN-2017-47,application/pdf,15847375,15817683,0.4945\nCC-MAIN-2017-47,application/pgp-encrypted,547,544,0.0000\nCC-MAIN-2017-47,application/pgp-signature,5513,5511,0.0002\nCC-MAIN-2017-47,application/postscript,17167,17156,0.0005\nCC-MAIN-2017-47,application/rdf+xml,68710,68692,0.0021\nCC-MAIN-2017-47,application/rss+xml,3189829,3183308,0.0995\nCC-MAIN-2017-47,application/rtf,10902,10901,0.0003\nCC-MAIN-2017-47,application/save-to-disk,685,685,0.0000\nCC-MAIN-2017-47,application/text,17884,17882,0.0006\nCC-MAIN-2017-47,application/unknown,9201,9171,0.0003\nCC-MAIN-2017-47,application/vnd.android.package-archive,20028,19832,0.0006\nCC-MAIN-2017-47,application/vnd.google-earth.kml+xml,60097,60029,0.0019\nCC-MAIN-2017-47,application/vnd.google-earth.kmz,9382,9372,0.0003\nCC-MAIN-2017-47,application/vnd.ms-excel,28932,28862,0.0009\nCC-MAIN-2017-47,application/vnd.ms-powerpoint,22267,22241,0.0007\nCC-MAIN-2017-47,application/vnd.ms-word,3029,3029,0.0001\nCC-MAIN-2017-47,application/vnd.oasis.opendocument.text,6930,6928,0.0002\nCC-MAIN-
2017-47,application/vnd.openxmlformats-officedocument.presentationml.presentation,5708,5701,0.0002\nCC-MAIN-2017-47,application/vnd.openxmlformats-officedocument.spreadsheetml.sheet,11246,11192,0.0004\nCC-MAIN-2017-47,application/vnd.openxmlformats-officedocument.wordprocessingml.document,31550,31471,0.0010\nCC-MAIN-2017-47,application/vnd.wap.xhtml+xml,21823,21798,0.0007\nCC-MAIN-2017-47,application/x-bibtex,14933,14920,0.0005\nCC-MAIN-2017-47,application/x-bittorrent,8219,7983,0.0003\nCC-MAIN-2017-47,application/x-debian-package,407,407,0.0000\nCC-MAIN-2017-47,application/x-download,22679,22655,0.0007\nCC-MAIN-2017-47,application/x-endnote-refer,27714,27703,0.0009\nCC-MAIN-2017-47,application/x-gzip,9614,9564,0.0003\nCC-MAIN-2017-47,application/x-httpd-php,9380,9357,0.0003\nCC-MAIN-2017-47,application/x-java-jnlp-file,1654,1652,0.0001\nCC-MAIN-2017-47,application/x-javascript,4698,4673,0.0001\nCC-MAIN-2017-47,application/x-json,7,7,0.0000\nCC-MAIN-2017-47,application/x-mobipocket-ebook,3745,3738,0.0001\nCC-MAIN-2017-47,application/x-msdownload,7666,7595,0.0002\nCC-MAIN-2017-47,application/x-netcdf,965,965,0.0000\nCC-MAIN-2017-47,application/x-research-info-systems,48952,48934,0.0015\nCC-MAIN-2017-47,application/x-shockwave-flash,30404,30373,0.0009\nCC-MAIN-2017-47,application/x-tar,3691,3681,0.0001\nCC-MAIN-2017-47,application/x-tex,1573,1572,0.0000\nCC-MAIN-2017-47,application/x-troff-man,960,959,0.0000\nCC-MAIN-2017-47,application/x-zip-compressed,12058,11976,0.0004\nCC-MAIN-2017-47,application/xhtml+xml,922865,918580,0.0288\nCC-MAIN-2017-47,application/xml,1013003,1011649,0.0316\nCC-MAIN-2017-47,application/zip,81249,80599,0.0025\nCC-MAIN-2017-47,audio/mpeg,111070,110296,0.0035\nCC-MAIN-2017-47,audio/x-mpegurl,28309,28300,0.0009\nCC-MAIN-2017-47,audio/x-scpls,5664,5659,0.0002\nCC-MAIN-2017-47,audio/x-wav,35504,35502,0.0011\nCC-MAIN-2017-47,binary/octet-stream,17946,17941,0.0006\nCC-MAIN-2017-47,image/gif,644744,642773,0.0201\nCC-MAIN-2017-47,image/jp2,4770,4770
,0.0001\nCC-MAIN-2017-47,image/jpeg,52901803,51884174,1.6506\nCC-MAIN-2017-47,image/jpg,166110,166084,0.0052\nCC-MAIN-2017-47,image/pjpeg,16120,16073,0.0005\nCC-MAIN-2017-47,image/png,5477540,5461983,0.1709\nCC-MAIN-2017-47,image/svg+xml,72064,72038,0.0022\nCC-MAIN-2017-47,image/tiff,26836,26828,0.0008\nCC-MAIN-2017-47,image/vnd.djvu,8591,8591,0.0003\nCC-MAIN-2017-47,image/webp,11541,11488,0.0004\nCC-MAIN-2017-47,message/rfc822,3611,3609,0.0001\nCC-MAIN-2017-47,text/calendar,424088,423797,0.0132\nCC-MAIN-2017-47,text/css,5721,5713,0.0002\nCC-MAIN-2017-47,text/csv,16766,16747,0.0005\nCC-MAIN-2017-47,text/directory,5018,5018,0.0002\nCC-MAIN-2017-47,text/enriched,6537,6537,0.0002\nCC-MAIN-2017-47,text/html,3110219477,3082812426,97.0444\nCC-MAIN-2017-47,text/javascript,9740,9739,0.0003\nCC-MAIN-2017-47,text/markdown,435,435,0.0000\nCC-MAIN-2017-47,text/pdf,17533,17533,0.0005\nCC-MAIN-2017-47,text/plain,683433,681736,0.0213\nCC-MAIN-2017-47,text/prs.lines.tag,154,154,0.0000\nCC-MAIN-2017-47,text/tab-separated-values,5136,5136,0.0002\nCC-MAIN-2017-47,text/turtle,25250,25248,0.0008\nCC-MAIN-2017-47,text/vcard,4993,4988,0.0002\nCC-MAIN-2017-47,text/x-bibtex,6299,6293,0.0002\nCC-MAIN-2017-47,text/x-c,39739,39717,0.0012\nCC-MAIN-2017-47,text/x-csrc,1309,1308,0.0000\nCC-MAIN-2017-47,text/x-diff,3114,3114,0.0001\nCC-MAIN-2017-47,text/x-patch,849,807,0.0000\nCC-MAIN-2017-47,text/x-perl,5366,5351,0.0002\nCC-MAIN-2017-47,text/x-vcalendar,18971,18962,0.0006\nCC-MAIN-2017-47,text/x-vcard,24439,24411,0.0008\nCC-MAIN-2017-47,text/xml,2542840,2536277,0.0793\nCC-MAIN-2017-47,unknown/unknown,65711,63752,0.0021\nCC-MAIN-2017-47,video/mp4,17702,17639,0.0006\nCC-MAIN-2017-47,video/webm,62292,62237,0.0019\nCC-MAIN-2017-47,video/x-ms-asf,13907,13893,0.0004\nCC-MAIN-2017-51,<other>,1426768,1362312,0.0490\nCC-MAIN-2017-51,application/atom+xml,3062118,3061892,0.1051\nCC-MAIN-2017-51,application/calendar,1599,1599,0.0001\nCC-MAIN-2017-51,application/download,27032,27028,0.0009\nCC-MAIN-2017-51,ap
plication/epub+zip,19785,19726,0.0007\nCC-MAIN-2017-51,application/force-download,66045,66006,0.0023\nCC-MAIN-2017-51,application/gpx+xml,2066,2066,0.0001\nCC-MAIN-2017-51,application/ics,2249,2249,0.0001\nCC-MAIN-2017-51,application/javascript,5477,5477,0.0002\nCC-MAIN-2017-51,application/json,160032,159773,0.0055\nCC-MAIN-2017-51,application/ld+json,7717,7717,0.0003\nCC-MAIN-2017-51,application/marc,12017,12017,0.0004\nCC-MAIN-2017-51,application/msword,43532,43475,0.0015\nCC-MAIN-2017-51,application/octet-stream,395209,394854,0.0136\nCC-MAIN-2017-51,application/octetstream,3423,3423,0.0001\nCC-MAIN-2017-51,application/pdf,8278188,8267511,0.2841\nCC-MAIN-2017-51,application/pgp-encrypted,364,364,0.0000\nCC-MAIN-2017-51,application/pgp-signature,2828,2827,0.0001\nCC-MAIN-2017-51,application/postscript,3403,3403,0.0001\nCC-MAIN-2017-51,application/rdf+xml,35806,35801,0.0012\nCC-MAIN-2017-51,application/rss+xml,2434204,2431254,0.0835\nCC-MAIN-2017-51,application/rtf,3859,3857,0.0001\nCC-MAIN-2017-51,application/save-to-disk,199,199,0.0000\nCC-MAIN-2017-51,application/text,4844,4844,0.0002\nCC-MAIN-2017-51,application/unknown,3771,3770,0.0001\nCC-MAIN-2017-51,application/vnd.android.package-archive,23716,23654,0.0008\nCC-MAIN-2017-51,application/vnd.google-earth.kml+xml,84228,84204,0.0029\nCC-MAIN-2017-51,application/vnd.google-earth.kmz,4411,4407,0.0002\nCC-MAIN-2017-51,application/vnd.ms-excel,15280,15245,0.0005\nCC-MAIN-2017-51,application/vnd.ms-powerpoint,10523,10518,0.0004\nCC-MAIN-2017-51,application/vnd.ms-word,2060,2060,0.0001\nCC-MAIN-2017-51,application/vnd.oasis.opendocument.text,3141,3140,0.0001\nCC-MAIN-2017-51,application/vnd.openxmlformats-officedocument.presentationml.presentation,2351,2344,0.0001\nCC-MAIN-2017-51,application/vnd.openxmlformats-officedocument.spreadsheetml.sheet,8138,8109,0.0003\nCC-MAIN-2017-51,application/vnd.openxmlformats-officedocument.wordprocessingml.document,11893,11871,0.0004\nCC-MAIN-2017-51,application/vnd.wap.xhtml+xml,248
50,24832,0.0009\nCC-MAIN-2017-51,application/x-bibtex,7110,7110,0.0002\nCC-MAIN-2017-51,application/x-bittorrent,3916,3485,0.0001\nCC-MAIN-2017-51,application/x-debian-package,185,185,0.0000\nCC-MAIN-2017-51,application/x-download,16054,15770,0.0006\nCC-MAIN-2017-51,application/x-endnote-refer,9914,9914,0.0003\nCC-MAIN-2017-51,application/x-gzip,5307,5276,0.0002\nCC-MAIN-2017-51,application/x-httpd-php,11049,11006,0.0004\nCC-MAIN-2017-51,application/x-java-jnlp-file,914,914,0.0000\nCC-MAIN-2017-51,application/x-javascript,2924,2909,0.0001\nCC-MAIN-2017-51,application/x-json,1,1,0.0000\nCC-MAIN-2017-51,application/x-mobipocket-ebook,2172,2172,0.0001\nCC-MAIN-2017-51,application/x-msdownload,3380,3342,0.0001\nCC-MAIN-2017-51,application/x-netcdf,566,566,0.0000\nCC-MAIN-2017-51,application/x-research-info-systems,33737,33737,0.0012\nCC-MAIN-2017-51,application/x-shockwave-flash,20341,20326,0.0007\nCC-MAIN-2017-51,application/x-tar,1136,1136,0.0000\nCC-MAIN-2017-51,application/x-tex,832,831,0.0000\nCC-MAIN-2017-51,application/x-troff-man,490,490,0.0000\nCC-MAIN-2017-51,application/x-zip-compressed,3270,3257,0.0001\nCC-MAIN-2017-51,application/xhtml+xml,783056,780898,0.0269\nCC-MAIN-2017-51,application/xml,577130,575763,0.0198\nCC-MAIN-2017-51,application/zip,32866,32695,0.0011\nCC-MAIN-2017-51,audio/mpeg,61053,60399,0.0021\nCC-MAIN-2017-51,audio/x-mpegurl,14813,14790,0.0005\nCC-MAIN-2017-51,audio/x-scpls,3100,3079,0.0001\nCC-MAIN-2017-51,audio/x-wav,24148,24147,0.0008\nCC-MAIN-2017-51,binary/octet-stream,2908,2907,0.0001\nCC-MAIN-2017-51,image/gif,636279,631960,0.0218\nCC-MAIN-2017-51,image/jp2,3159,3158,0.0001\nCC-MAIN-2017-51,image/jpeg,53910534,52835590,1.8500\nCC-MAIN-2017-51,image/jpg,189545,189537,0.0065\nCC-MAIN-2017-51,image/pjpeg,9271,9267,0.0003\nCC-MAIN-2017-51,image/png,5734381,5714626,0.1968\nCC-MAIN-2017-51,image/svg+xml,87505,87478,0.0030\nCC-MAIN-2017-51,image/tiff,13217,13214,0.0005\nCC-MAIN-2017-51,image/vnd.djvu,3466,3466,0.0001\nCC-MAIN-2017-51,image
/webp,8154,8154,0.0003\nCC-MAIN-2017-51,message/rfc822,1900,1900,0.0001\nCC-MAIN-2017-51,text/calendar,352317,352212,0.0121\nCC-MAIN-2017-51,text/css,3023,3019,0.0001\nCC-MAIN-2017-51,text/csv,5578,5578,0.0002\nCC-MAIN-2017-51,text/directory,4620,4619,0.0002\nCC-MAIN-2017-51,text/enriched,1684,1684,0.0001\nCC-MAIN-2017-51,text/html,2832861215,2814569134,97.2154\nCC-MAIN-2017-51,text/javascript,7027,7018,0.0002\nCC-MAIN-2017-51,text/markdown,185,185,0.0000\nCC-MAIN-2017-51,text/pdf,13654,13654,0.0005\nCC-MAIN-2017-51,text/plain,324903,324040,0.0111\nCC-MAIN-2017-51,text/prs.lines.tag,29,29,0.0000\nCC-MAIN-2017-51,text/tab-separated-values,1421,1421,0.0000\nCC-MAIN-2017-51,text/turtle,8227,8227,0.0003\nCC-MAIN-2017-51,text/vcard,2502,2502,0.0001\nCC-MAIN-2017-51,text/x-bibtex,977,977,0.0000\nCC-MAIN-2017-51,text/x-c,4355,4352,0.0001\nCC-MAIN-2017-51,text/x-csrc,1883,1883,0.0001\nCC-MAIN-2017-51,text/x-diff,432,431,0.0000\nCC-MAIN-2017-51,text/x-patch,449,448,0.0000\nCC-MAIN-2017-51,text/x-perl,639,639,0.0000\nCC-MAIN-2017-51,text/x-vcalendar,7370,7365,0.0003\nCC-MAIN-2017-51,text/x-vcard,12071,12069,0.0004\nCC-MAIN-2017-51,text/xml,1886816,1884013,0.0647\nCC-MAIN-2017-51,unknown/unknown,34046,33039,0.0012\nCC-MAIN-2017-51,video/mp4,10861,10738,0.0004\nCC-MAIN-2017-51,video/webm,38227,38198,0.0013\nCC-MAIN-2017-51,video/x-ms-asf,7003,6999,0.0002\nCC-MAIN-2018-05,<other>,2864473,2805231,0.0827\nCC-MAIN-2018-05,application/atom+xml,5694601,5694037,0.1644\nCC-MAIN-2018-05,application/calendar,3303,3296,0.0001\nCC-MAIN-2018-05,application/download,64961,64574,0.0019\nCC-MAIN-2018-05,application/epub+zip,46634,45464,0.0013\nCC-MAIN-2018-05,application/force-download,127248,127172,0.0037\nCC-MAIN-2018-05,application/gpx+xml,5451,5451,0.0002\nCC-MAIN-2018-05,application/ics,3805,3805,0.0001\nCC-MAIN-2018-05,application/javascript,10632,10626,0.0003\nCC-MAIN-2018-05,application/json,236416,236019,0.0068\nCC-MAIN-2018-05,application/ld+json,14068,14068,0.0004\nCC-MAIN-2018-05,a
pplication/marc,9841,9841,0.0003\nCC-MAIN-2018-05,application/msword,205311,203524,0.0059\nCC-MAIN-2018-05,application/octet-stream,1258992,1256452,0.0363\nCC-MAIN-2018-05,application/octetstream,23095,23091,0.0007\nCC-MAIN-2018-05,application/pdf,29198955,29131460,0.8428\nCC-MAIN-2018-05,application/pgp-encrypted,36787,36784,0.0011\nCC-MAIN-2018-05,application/pgp-signature,27135,27132,0.0008\nCC-MAIN-2018-05,application/postscript,36254,36149,0.0010\nCC-MAIN-2018-05,application/rdf+xml,89451,89433,0.0026\nCC-MAIN-2018-05,application/rss+xml,3708254,3700573,0.1070\nCC-MAIN-2018-05,application/rtf,10315,10278,0.0003\nCC-MAIN-2018-05,application/save-to-disk,34,34,0.0000\nCC-MAIN-2018-05,application/text,14141,14141,0.0004\nCC-MAIN-2018-05,application/unknown,11455,11455,0.0003\nCC-MAIN-2018-05,application/vnd.android.package-archive,68742,68325,0.0020\nCC-MAIN-2018-05,application/vnd.google-earth.kml+xml,169267,169233,0.0049\nCC-MAIN-2018-05,application/vnd.google-earth.kmz,39696,39689,0.0011\nCC-MAIN-2018-05,application/vnd.ms-excel,73957,73833,0.0021\nCC-MAIN-2018-05,application/vnd.ms-powerpoint,26917,26841,0.0008\nCC-MAIN-2018-05,application/vnd.ms-word,7796,7794,0.0002\nCC-MAIN-2018-05,application/vnd.oasis.opendocument.text,15904,15845,0.0005\nCC-MAIN-2018-05,application/vnd.openxmlformats-officedocument.presentationml.presentation,8768,8738,0.0003\nCC-MAIN-2018-05,application/vnd.openxmlformats-officedocument.spreadsheetml.sheet,27757,27648,0.0008\nCC-MAIN-2018-05,application/vnd.openxmlformats-officedocument.wordprocessingml.document,56182,55734,0.0016\nCC-MAIN-2018-05,application/vnd.wap.xhtml+xml,19570,19387,0.0006\nCC-MAIN-2018-05,application/x-bibtex,23180,23176,0.0007\nCC-MAIN-2018-05,application/x-bittorrent,18182,16933,0.0005\nCC-MAIN-2018-05,application/x-debian-package,7944,7943,0.0002\nCC-MAIN-2018-05,application/x-download,27820,27753,0.0008\nCC-MAIN-2018-05,application/x-endnote-refer,27363,27359,0.0008\nCC-MAIN-2018-05,application/x-gzip,18798,1
8749,0.0005\nCC-MAIN-2018-05,application/x-httpd-php,38919,38828,0.0011\nCC-MAIN-2018-05,application/x-java-jnlp-file,4249,4245,0.0001\nCC-MAIN-2018-05,application/x-javascript,4840,4836,0.0001\nCC-MAIN-2018-05,application/x-json,7,7,0.0000\nCC-MAIN-2018-05,application/x-mobipocket-ebook,9476,9469,0.0003\nCC-MAIN-2018-05,application/x-msdownload,10197,10004,0.0003\nCC-MAIN-2018-05,application/x-netcdf,4510,4510,0.0001\nCC-MAIN-2018-05,application/x-research-info-systems,50008,50004,0.0014\nCC-MAIN-2018-05,application/x-shockwave-flash,35767,35696,0.0010\nCC-MAIN-2018-05,application/x-tar,7860,7856,0.0002\nCC-MAIN-2018-05,application/x-tex,10211,10201,0.0003\nCC-MAIN-2018-05,application/x-troff-man,12428,12419,0.0004\nCC-MAIN-2018-05,application/x-zip-compressed,26202,26140,0.0008\nCC-MAIN-2018-05,application/xhtml+xml,747172,742434,0.0216\nCC-MAIN-2018-05,application/xml,1189329,1187611,0.0343\nCC-MAIN-2018-05,application/zip,168177,154251,0.0049\nCC-MAIN-2018-05,audio/mpeg,162486,160450,0.0047\nCC-MAIN-2018-05,audio/x-mpegurl,77121,77088,0.0022\nCC-MAIN-2018-05,audio/x-scpls,8700,8675,0.0003\nCC-MAIN-2018-05,audio/x-wav,26436,26431,0.0008\nCC-MAIN-2018-05,binary/octet-stream,11142,11118,0.0003\nCC-MAIN-2018-05,image/gif,760190,758610,0.0219\nCC-MAIN-2018-05,image/jp2,3189,3189,0.0001\nCC-MAIN-2018-05,image/jpeg,60878281,60078272,1.7572\nCC-MAIN-2018-05,image/jpg,309841,309821,0.0089\nCC-MAIN-2018-05,image/pjpeg,49945,49912,0.0014\nCC-MAIN-2018-05,image/png,7252717,7243689,0.2093\nCC-MAIN-2018-05,image/svg+xml,89355,89271,0.0026\nCC-MAIN-2018-05,image/tiff,18264,18255,0.0005\nCC-MAIN-2018-05,image/vnd.djvu,19404,19398,0.0006\nCC-MAIN-2018-05,image/webp,25760,25760,0.0007\nCC-MAIN-2018-05,message/rfc822,13158,13150,0.0004\nCC-MAIN-2018-05,text/calendar,533931,533591,0.0154\nCC-MAIN-2018-05,text/css,6294,6285,0.0002\nCC-MAIN-2018-05,text/csv,46276,46251,0.0013\nCC-MAIN-2018-05,text/directory,6900,6893,0.0002\nCC-MAIN-2018-05,text/enriched,4045,4045,0.0001\nCC-MAIN-201
8-05,text/html,3341202641,3310679978,96.4401\nCC-MAIN-2018-05,text/javascript,10299,10291,0.0003\nCC-MAIN-2018-05,text/markdown,396,396,0.0000\nCC-MAIN-2018-05,text/pdf,16358,16358,0.0005\nCC-MAIN-2018-05,text/plain,2676011,2672717,0.0772\nCC-MAIN-2018-05,text/prs.lines.tag,7323,7323,0.0002\nCC-MAIN-2018-05,text/tab-separated-values,36575,36575,0.0011\nCC-MAIN-2018-05,text/turtle,15524,15509,0.0004\nCC-MAIN-2018-05,text/vcard,6497,6488,0.0002\nCC-MAIN-2018-05,text/x-bibtex,7757,7754,0.0002\nCC-MAIN-2018-05,text/x-c,8476,8472,0.0002\nCC-MAIN-2018-05,text/x-csrc,9864,9861,0.0003\nCC-MAIN-2018-05,text/x-diff,15816,15814,0.0005\nCC-MAIN-2018-05,text/x-patch,80590,80590,0.0023\nCC-MAIN-2018-05,text/x-perl,5791,5780,0.0002\nCC-MAIN-2018-05,text/x-vcalendar,28120,28102,0.0008\nCC-MAIN-2018-05,text/x-vcard,37091,37064,0.0011\nCC-MAIN-2018-05,text/xml,3220119,3209650,0.0929\nCC-MAIN-2018-05,unknown/unknown,43283,43219,0.0012\nCC-MAIN-2018-05,video/mp4,34334,34004,0.0010\nCC-MAIN-2018-05,video/webm,67575,67388,0.0020\nCC-MAIN-2018-05,video/x-ms-asf,44523,44511,0.0013\nCC-MAIN-2018-09,<other>,2522172,2404857,0.0723\nCC-MAIN-2018-09,application/atom+xml,6265656,6264609,0.1796\nCC-MAIN-2018-09,application/calendar,3797,3690,0.0001\nCC-MAIN-2018-09,application/download,57094,57051,0.0016\nCC-MAIN-2018-09,application/epub+zip,24798,24363,0.0007\nCC-MAIN-2018-09,application/force-download,109513,109325,0.0031\nCC-MAIN-2018-09,application/gpx+xml,2765,2765,0.0001\nCC-MAIN-2018-09,application/ics,3423,3420,0.0001\nCC-MAIN-2018-09,application/javascript,11305,11288,0.0003\nCC-MAIN-2018-09,application/json,222998,222777,0.0064\nCC-MAIN-2018-09,application/ld+json,18604,18604,0.0005\nCC-MAIN-2018-09,application/marc,13584,13584,0.0004\nCC-MAIN-2018-09,application/msword,130307,129914,0.0037\nCC-MAIN-2018-09,application/octet-stream,955465,952893,0.0274\nCC-MAIN-2018-09,application/octetstream,7686,7679,0.0002\nCC-MAIN-2018-09,application/pdf,21153171,21080085,0.6064\nCC-MAIN-2018-09,app
lication/pgp-encrypted,1679,1679,0.0000\nCC-MAIN-2018-09,application/pgp-signature,17343,17340,0.0005\nCC-MAIN-2018-09,application/postscript,15567,15552,0.0004\nCC-MAIN-2018-09,application/rdf+xml,86209,86178,0.0025\nCC-MAIN-2018-09,application/rss+xml,3629596,3619591,0.1040\nCC-MAIN-2018-09,application/rtf,11249,11230,0.0003\nCC-MAIN-2018-09,application/text,7915,7915,0.0002\nCC-MAIN-2018-09,application/unknown,9028,9015,0.0003\nCC-MAIN-2018-09,application/vnd.android.package-archive,47909,47616,0.0014\nCC-MAIN-2018-09,application/vnd.google-earth.kml+xml,74790,74758,0.0021\nCC-MAIN-2018-09,application/vnd.google-earth.kmz,11635,11617,0.0003\nCC-MAIN-2018-09,application/vnd.ms-excel,32090,31896,0.0009\nCC-MAIN-2018-09,application/vnd.ms-powerpoint,16884,16849,0.0005\nCC-MAIN-2018-09,application/vnd.ms-word,4639,4638,0.0001\nCC-MAIN-2018-09,application/vnd.oasis.opendocument.text,10582,10569,0.0003\nCC-MAIN-2018-09,application/vnd.openxmlformats-officedocument.presentationml.presentation,8876,8843,0.0003\nCC-MAIN-2018-09,application/vnd.openxmlformats-officedocument.spreadsheetml.sheet,19917,19665,0.0006\nCC-MAIN-2018-09,application/vnd.openxmlformats-officedocument.wordprocessingml.document,46547,46158,0.0013\nCC-MAIN-2018-09,application/vnd.wap.xhtml+xml,25785,25675,0.0007\nCC-MAIN-2018-09,application/x-bibtex,13636,13635,0.0004\nCC-MAIN-2018-09,application/x-bittorrent,9014,8724,0.0003\nCC-MAIN-2018-09,application/x-debian-package,358,358,0.0000\nCC-MAIN-2018-09,application/x-download,23398,23292,0.0007\nCC-MAIN-2018-09,application/x-endnote-refer,12951,12949,0.0004\nCC-MAIN-2018-09,application/x-gzip,10361,10330,0.0003\nCC-MAIN-2018-09,application/x-httpd-php,21468,21391,0.0006\nCC-MAIN-2018-09,application/x-java-jnlp-file,1876,1871,0.0001\nCC-MAIN-2018-09,application/x-javascript,4758,4746,0.0001\nCC-MAIN-2018-09,application/x-json,3,3,0.0000\nCC-MAIN-2018-09,application/x-mobipocket-ebook,3716,3678,0.0001\nCC-MAIN-2018-09,application/x-msdownload,6441,6255,0.
0002\nCC-MAIN-2018-09,application/x-netcdf,1456,1456,0.0000\nCC-MAIN-2018-09,application/x-research-info-systems,35815,35814,0.0010\nCC-MAIN-2018-09,application/x-shockwave-flash,15755,15663,0.0005\nCC-MAIN-2018-09,application/x-tar,10189,10186,0.0003\nCC-MAIN-2018-09,application/x-tex,3247,3246,0.0001\nCC-MAIN-2018-09,application/x-troff-man,2482,2482,0.0001\nCC-MAIN-2018-09,application/x-zip-compressed,8225,8129,0.0002\nCC-MAIN-2018-09,application/xhtml+xml,1133732,1123336,0.0325\nCC-MAIN-2018-09,application/xml,1056388,1054516,0.0303\nCC-MAIN-2018-09,application/zip,74846,73429,0.0021\nCC-MAIN-2018-09,audio/mpeg,123690,122406,0.0035\nCC-MAIN-2018-09,audio/x-mpegurl,40911,40881,0.0012\nCC-MAIN-2018-09,audio/x-scpls,5802,5778,0.0002\nCC-MAIN-2018-09,audio/x-wav,14392,14390,0.0004\nCC-MAIN-2018-09,binary/octet-stream,11337,11324,0.0003\nCC-MAIN-2018-09,image/gif,781397,777707,0.0224\nCC-MAIN-2018-09,image/jp2,2850,2849,0.0001\nCC-MAIN-2018-09,image/jpeg,63792488,62756839,1.8287\nCC-MAIN-2018-09,image/jpg,588412,588380,0.0169\nCC-MAIN-2018-09,image/pjpeg,27159,27091,0.0008\nCC-MAIN-2018-09,image/png,7529850,7501523,0.2159\nCC-MAIN-2018-09,image/svg+xml,90983,90865,0.0026\nCC-MAIN-2018-09,image/tiff,8622,8616,0.0002\nCC-MAIN-2018-09,image/vnd.djvu,8096,8090,0.0002\nCC-MAIN-2018-09,image/webp,11492,11491,0.0003\nCC-MAIN-2018-09,message/rfc822,4532,4531,0.0001\nCC-MAIN-2018-09,text/calendar,519762,519186,0.0149\nCC-MAIN-2018-09,text/css,6578,6571,0.0002\nCC-MAIN-2018-09,text/csv,13121,13110,0.0004\nCC-MAIN-2018-09,text/directory,6506,6506,0.0002\nCC-MAIN-2018-09,text/enriched,2345,2345,0.0001\nCC-MAIN-2018-09,text/html,3372339966,3342955157,96.6712\nCC-MAIN-2018-09,text/javascript,11474,11465,0.0003\nCC-MAIN-2018-09,text/markdown,304,304,0.0000\nCC-MAIN-2018-09,text/pdf,18303,18300,0.0005\nCC-MAIN-2018-09,text/plain,1097980,1096076,0.0315\nCC-MAIN-2018-09,text/prs.lines.tag,573,573,0.0000\nCC-MAIN-2018-09,text/tab-separated-values,4107,4106,0.0001\nCC-MAIN-2018-09,text/
turtle,20102,20075,0.0006\nCC-MAIN-2018-09,text/vcard,6032,6032,0.0002\nCC-MAIN-2018-09,text/x-bibtex,2991,2989,0.0001\nCC-MAIN-2018-09,text/x-c,2698,2696,0.0001\nCC-MAIN-2018-09,text/x-csrc,2240,2239,0.0001\nCC-MAIN-2018-09,text/x-diff,5653,5652,0.0002\nCC-MAIN-2018-09,text/x-patch,12926,12925,0.0004\nCC-MAIN-2018-09,text/x-perl,3419,3402,0.0001\nCC-MAIN-2018-09,text/x-vcalendar,17589,17583,0.0005\nCC-MAIN-2018-09,text/x-vcard,33752,33717,0.0010\nCC-MAIN-2018-09,text/xml,3132954,3121825,0.0898\nCC-MAIN-2018-09,unknown/unknown,44547,44483,0.0013\nCC-MAIN-2018-09,video/mp4,24034,23885,0.0007\nCC-MAIN-2018-09,video/webm,47631,47522,0.0014\nCC-MAIN-2018-09,video/x-ms-asf,13026,12990,0.0004\nCC-MAIN-2018-13,<other>,2509700,2312019,0.0776\nCC-MAIN-2018-13,application/atom+xml,11677596,11676293,0.3612\nCC-MAIN-2018-13,application/calendar,2916,2913,0.0001\nCC-MAIN-2018-13,application/download,43213,43187,0.0013\nCC-MAIN-2018-13,application/epub+zip,25621,25465,0.0008\nCC-MAIN-2018-13,application/force-download,101129,101055,0.0031\nCC-MAIN-2018-13,application/gpx+xml,2616,2615,0.0001\nCC-MAIN-2018-13,application/ics,3640,3640,0.0001\nCC-MAIN-2018-13,application/javascript,15646,15438,0.0005\nCC-MAIN-2018-13,application/json,224460,223466,0.0069\nCC-MAIN-2018-13,application/ld+json,6776,6776,0.0002\nCC-MAIN-2018-13,application/marc,9359,9359,0.0003\nCC-MAIN-2018-13,application/msword,103176,102718,0.0032\nCC-MAIN-2018-13,application/octet-stream,820503,818486,0.0254\nCC-MAIN-2018-13,application/octetstream,8102,8060,0.0003\nCC-MAIN-2018-13,application/pdf,16682020,16621176,0.5160\nCC-MAIN-2018-13,application/pgp-encrypted,1615,1614,0.0000\nCC-MAIN-2018-13,application/pgp-signature,10317,10316,0.0003\nCC-MAIN-2018-13,application/postscript,22739,22689,0.0007\nCC-MAIN-2018-13,application/rdf+xml,64845,64807,0.0020\nCC-MAIN-2018-13,application/rss+xml,2951798,2942070,0.0913\nCC-MAIN-2018-13,application/rtf,8492,8484,0.0003\nCC-MAIN-2018-13,application/text,8434,8434,0.0003\nC
C-MAIN-2018-13,application/unknown,7813,7806,0.0002\nCC-MAIN-2018-13,application/vnd.android.package-archive,40195,40076,0.0012\nCC-MAIN-2018-13,application/vnd.google-earth.kml+xml,59741,59659,0.0018\nCC-MAIN-2018-13,application/vnd.google-earth.kmz,7627,7605,0.0002\nCC-MAIN-2018-13,application/vnd.ms-excel,34186,33985,0.0011\nCC-MAIN-2018-13,application/vnd.ms-powerpoint,13566,13535,0.0004\nCC-MAIN-2018-13,application/vnd.ms-word,3647,3640,0.0001\nCC-MAIN-2018-13,application/vnd.oasis.opendocument.text,7262,7220,0.0002\nCC-MAIN-2018-13,application/vnd.openxmlformats-officedocument.presentationml.presentation,5638,5628,0.0002\nCC-MAIN-2018-13,application/vnd.openxmlformats-officedocument.spreadsheetml.sheet,13450,13340,0.0004\nCC-MAIN-2018-13,application/vnd.openxmlformats-officedocument.wordprocessingml.document,38568,38178,0.0012\nCC-MAIN-2018-13,application/vnd.wap.xhtml+xml,21056,21023,0.0007\nCC-MAIN-2018-13,application/x-bibtex,10049,10049,0.0003\nCC-MAIN-2018-13,application/x-bittorrent,9360,9068,0.0003\nCC-MAIN-2018-13,application/x-debian-package,693,693,0.0000\nCC-MAIN-2018-13,application/x-download,23432,23380,0.0007\nCC-MAIN-2018-13,application/x-endnote-refer,14967,14963,0.0005\nCC-MAIN-2018-13,application/x-gzip,11209,11179,0.0003\nCC-MAIN-2018-13,application/x-httpd-php,15807,15741,0.0005\nCC-MAIN-2018-13,application/x-java-jnlp-file,3768,3760,0.0001\nCC-MAIN-2018-13,application/x-javascript,6286,6235,0.0002\nCC-MAIN-2018-13,application/x-json,15,15,0.0000\nCC-MAIN-2018-13,application/x-mobipocket-ebook,3895,3866,0.0001\nCC-MAIN-2018-13,application/x-msdownload,8112,7970,0.0003\nCC-MAIN-2018-13,application/x-netcdf,548,546,0.0000\nCC-MAIN-2018-13,application/x-research-info-systems,30763,30754,0.0010\nCC-MAIN-2018-13,application/x-shockwave-flash,26300,25990,0.0008\nCC-MAIN-2018-13,application/x-tar,3291,3278,0.0001\nCC-MAIN-2018-13,application/x-tex,6391,6385,0.0002\nCC-MAIN-2018-13,application/x-troff-man,2441,2434,0.0001\nCC-MAIN-2018-13,applicati
on/x-zip-compressed,8334,8299,0.0003\nCC-MAIN-2018-13,application/xhtml+xml,1011991,999799,0.0313\nCC-MAIN-2018-13,application/xml,920908,919278,0.0285\nCC-MAIN-2018-13,application/zip,85158,81747,0.0026\nCC-MAIN-2018-13,audio/mpeg,113378,112376,0.0035\nCC-MAIN-2018-13,audio/x-mpegurl,50198,50149,0.0016\nCC-MAIN-2018-13,audio/x-scpls,7032,6984,0.0002\nCC-MAIN-2018-13,audio/x-wav,12825,12823,0.0004\nCC-MAIN-2018-13,binary/octet-stream,10044,10023,0.0003\nCC-MAIN-2018-13,image/gif,725633,718221,0.0224\nCC-MAIN-2018-13,image/jp2,33126,33061,0.0010\nCC-MAIN-2018-13,image/jpeg,65578372,62885192,2.0286\nCC-MAIN-2018-13,image/jpg,416226,416154,0.0129\nCC-MAIN-2018-13,image/pjpeg,23895,23010,0.0007\nCC-MAIN-2018-13,image/png,6832185,6788127,0.2113\nCC-MAIN-2018-13,image/svg+xml,65270,65111,0.0020\nCC-MAIN-2018-13,image/tiff,8722,8709,0.0003\nCC-MAIN-2018-13,image/vnd.djvu,8160,8159,0.0003\nCC-MAIN-2018-13,image/webp,7185,7183,0.0002\nCC-MAIN-2018-13,message/rfc822,4218,4217,0.0001\nCC-MAIN-2018-13,text/calendar,428724,428407,0.0133\nCC-MAIN-2018-13,text/css,8240,8228,0.0003\nCC-MAIN-2018-13,text/csv,20299,20191,0.0006\nCC-MAIN-2018-13,text/directory,5800,5799,0.0002\nCC-MAIN-2018-13,text/enriched,3394,3394,0.0001\nCC-MAIN-2018-13,text/html,3116608332,3085577352,96.4077\nCC-MAIN-2018-13,text/javascript,8827,8815,0.0003\nCC-MAIN-2018-13,text/markdown,431,431,0.0000\nCC-MAIN-2018-13,text/pdf,12351,12351,0.0004\nCC-MAIN-2018-13,text/plain,1010596,1007312,0.0313\nCC-MAIN-2018-13,text/prs.lines.tag,2536,2536,0.0001\nCC-MAIN-2018-13,text/tab-separated-values,8746,8746,0.0003\nCC-MAIN-2018-13,text/turtle,9048,9040,0.0003\nCC-MAIN-2018-13,text/vcard,4435,4407,0.0001\nCC-MAIN-2018-13,text/x-bibtex,4935,4843,0.0002\nCC-MAIN-2018-13,text/x-c,3548,3544,0.0001\nCC-MAIN-2018-13,text/x-csrc,2280,2279,0.0001\nCC-MAIN-2018-13,text/x-diff,10977,10961,0.0003\nCC-MAIN-2018-13,text/x-patch,3596,3594,0.0001\nCC-MAIN-2018-13,text/x-perl,6489,6473,0.0002\nCC-MAIN-2018-13,text/x-vcalendar,18685,1868
1,0.0006\nCC-MAIN-2018-13,text/x-vcard,23322,23284,0.0007\nCC-MAIN-2018-13,text/xml,2774625,2755923,0.0858\nCC-MAIN-2018-13,unknown/unknown,21570,21529,0.0007\nCC-MAIN-2018-13,video/mp4,25270,25135,0.0008\nCC-MAIN-2018-13,video/webm,32259,32217,0.0010\nCC-MAIN-2018-13,video/x-ms-asf,21054,21005,0.0007\nCC-MAIN-2018-17,<other>,2441738,2238559,0.0787\nCC-MAIN-2018-17,application/atom+xml,5210591,5209545,0.1680\nCC-MAIN-2018-17,application/calendar,2582,2572,0.0001\nCC-MAIN-2018-17,application/download,50431,50395,0.0016\nCC-MAIN-2018-17,application/epub+zip,12417,12292,0.0004\nCC-MAIN-2018-17,application/force-download,97542,97511,0.0031\nCC-MAIN-2018-17,application/gpx+xml,2089,2089,0.0001\nCC-MAIN-2018-17,application/ics,3933,3933,0.0001\nCC-MAIN-2018-17,application/javascript,10158,10138,0.0003\nCC-MAIN-2018-17,application/json,184247,184137,0.0059\nCC-MAIN-2018-17,application/ld+json,21227,21227,0.0007\nCC-MAIN-2018-17,application/marc,18336,18336,0.0006\nCC-MAIN-2018-17,application/msword,108942,108553,0.0035\nCC-MAIN-2018-17,application/octet-stream,741851,740666,0.0239\nCC-MAIN-2018-17,application/octetstream,7945,7821,0.0003\nCC-MAIN-2018-17,application/pdf,13838046,13805257,0.4462\nCC-MAIN-2018-17,application/pgp-encrypted,392,392,0.0000\nCC-MAIN-2018-17,application/pgp-signature,6567,6527,0.0002\nCC-MAIN-2018-17,application/postscript,15299,15291,0.0005\nCC-MAIN-2018-17,application/rdf+xml,62492,62481,0.0020\nCC-MAIN-2018-17,application/rss+xml,3142074,3136599,0.1013\nCC-MAIN-2018-17,application/rtf,7640,7638,0.0002\nCC-MAIN-2018-17,application/text,7091,7091,0.0002\nCC-MAIN-2018-17,application/unknown,7911,7883,0.0003\nCC-MAIN-2018-17,application/vnd.android.package-archive,44737,44611,0.0014\nCC-MAIN-2018-17,application/vnd.google-earth.kml+xml,38433,38409,0.0012\nCC-MAIN-2018-17,application/vnd.google-earth.kmz,6281,6277,0.0002\nCC-MAIN-2018-17,application/vnd.ms-excel,37638,37021,0.0012\nCC-MAIN-2018-17,application/vnd.ms-powerpoint,15610,15584,0.0005\nC
C-MAIN-2018-17,application/vnd.ms-word,3502,3502,0.0001\nCC-MAIN-2018-17,application/vnd.oasis.opendocument.text,6211,6209,0.0002\nCC-MAIN-2018-17,application/vnd.openxmlformats-officedocument.presentationml.presentation,6406,6397,0.0002\nCC-MAIN-2018-17,application/vnd.openxmlformats-officedocument.spreadsheetml.sheet,12623,12556,0.0004\nCC-MAIN-2018-17,application/vnd.openxmlformats-officedocument.wordprocessingml.document,39201,39024,0.0013\nCC-MAIN-2018-17,application/vnd.wap.xhtml+xml,33332,33298,0.0011\nCC-MAIN-2018-17,application/x-bibtex,9958,9957,0.0003\nCC-MAIN-2018-17,application/x-bittorrent,9149,9002,0.0003\nCC-MAIN-2018-17,application/x-debian-package,307,307,0.0000\nCC-MAIN-2018-17,application/x-download,24615,24476,0.0008\nCC-MAIN-2018-17,application/x-endnote-refer,11007,11007,0.0004\nCC-MAIN-2018-17,application/x-gzip,8778,8758,0.0003\nCC-MAIN-2018-17,application/x-httpd-php,11448,11392,0.0004\nCC-MAIN-2018-17,application/x-java-jnlp-file,2320,2316,0.0001\nCC-MAIN-2018-17,application/x-javascript,5356,5352,0.0002\nCC-MAIN-2018-17,application/x-json,12,12,0.0000\nCC-MAIN-2018-17,application/x-mobipocket-ebook,1961,1961,0.0001\nCC-MAIN-2018-17,application/x-msdownload,7374,7284,0.0002\nCC-MAIN-2018-17,application/x-netcdf,736,736,0.0000\nCC-MAIN-2018-17,application/x-research-info-systems,19841,19840,0.0006\nCC-MAIN-2018-17,application/x-shockwave-flash,23621,23480,0.0008\nCC-MAIN-2018-17,application/x-tar,2038,2034,0.0001\nCC-MAIN-2018-17,application/x-tex,3029,3029,0.0001\nCC-MAIN-2018-17,application/x-troff-man,745,727,0.0000\nCC-MAIN-2018-17,application/x-zip-compressed,6498,6482,0.0002\nCC-MAIN-2018-17,application/xhtml+xml,989338,981052,0.0319\nCC-MAIN-2018-17,application/xml,807739,806579,0.0260\nCC-MAIN-2018-17,application/zip,73134,72708,0.0024\nCC-MAIN-2018-17,audio/mpeg,107360,106612,0.0035\nCC-MAIN-2018-17,audio/x-mpegurl,25745,25717,0.0008\nCC-MAIN-2018-17,audio/x-scpls,6639,6598,0.0002\nCC-MAIN-2018-17,audio/x-wav,17344,17344,0.0006\nCC
-MAIN-2018-17,binary/octet-stream,6385,6357,0.0002\nCC-MAIN-2018-17,image/gif,225925,224709,0.0073\nCC-MAIN-2018-17,image/jp2,15385,15374,0.0005\nCC-MAIN-2018-17,image/jpeg,15591859,15197112,0.5027\nCC-MAIN-2018-17,image/jpg,113311,113308,0.0037\nCC-MAIN-2018-17,image/pjpeg,19851,19386,0.0006\nCC-MAIN-2018-17,image/png,1800323,1794453,0.0580\nCC-MAIN-2018-17,image/svg+xml,13500,13432,0.0004\nCC-MAIN-2018-17,image/tiff,8507,8505,0.0003\nCC-MAIN-2018-17,image/vnd.djvu,5474,5474,0.0002\nCC-MAIN-2018-17,image/webp,3091,3091,0.0001\nCC-MAIN-2018-17,message/rfc822,3648,3645,0.0001\nCC-MAIN-2018-17,text/calendar,474933,474553,0.0153\nCC-MAIN-2018-17,text/css,6174,6138,0.0002\nCC-MAIN-2018-17,text/csv,16777,16415,0.0005\nCC-MAIN-2018-17,text/directory,6654,6653,0.0002\nCC-MAIN-2018-17,text/enriched,2671,2671,0.0001\nCC-MAIN-2018-17,text/html,3050567020,3025679638,98.3624\nCC-MAIN-2018-17,text/javascript,8023,8020,0.0003\nCC-MAIN-2018-17,text/markdown,431,431,0.0000\nCC-MAIN-2018-17,text/pdf,26464,26464,0.0009\nCC-MAIN-2018-17,text/plain,833576,830073,0.0269\nCC-MAIN-2018-17,text/prs.lines.tag,686,686,0.0000\nCC-MAIN-2018-17,text/tab-separated-values,4755,4755,0.0002\nCC-MAIN-2018-17,text/turtle,20883,20876,0.0007\nCC-MAIN-2018-17,text/vcard,4600,4599,0.0001\nCC-MAIN-2018-17,text/x-bibtex,3747,3737,0.0001\nCC-MAIN-2018-17,text/x-c,2060,2060,0.0001\nCC-MAIN-2018-17,text/x-csrc,1252,1252,0.0000\nCC-MAIN-2018-17,text/x-diff,2726,2724,0.0001\nCC-MAIN-2018-17,text/x-patch,386,386,0.0000\nCC-MAIN-2018-17,text/x-perl,2014,1988,0.0001\nCC-MAIN-2018-17,text/x-vcalendar,11999,11998,0.0004\nCC-MAIN-2018-17,text/x-vcard,27713,27704,0.0009\nCC-MAIN-2018-17,text/xml,2995120,2989533,0.0966\nCC-MAIN-2018-17,unknown/unknown,40923,40892,0.0013\nCC-MAIN-2018-17,video/mp4,17315,17165,0.0006\nCC-MAIN-2018-17,video/webm,31566,31514,0.0010\nCC-MAIN-2018-17,video/x-ms-asf,14655,14584,0.0005\nCC-MAIN-2018-22,<other>,1575437,1567669,0.0565\nCC-MAIN-2018-22,application/atom+xml,4628490,4627323,0.1660\
nCC-MAIN-2018-22,application/calendar,2858,2842,0.0001\nCC-MAIN-2018-22,application/download,50139,50092,0.0018\nCC-MAIN-2018-22,application/epub+zip,14961,14901,0.0005\nCC-MAIN-2018-22,application/force-download,95844,95800,0.0034\nCC-MAIN-2018-22,application/gpx+xml,1232,1232,0.0000\nCC-MAIN-2018-22,application/ics,3966,3966,0.0001\nCC-MAIN-2018-22,application/javascript,13104,13086,0.0005\nCC-MAIN-2018-22,application/json,197585,197412,0.0071\nCC-MAIN-2018-22,application/ld+json,14057,14054,0.0005\nCC-MAIN-2018-22,application/marc,11076,11076,0.0004\nCC-MAIN-2018-22,application/msword,101824,101431,0.0037\nCC-MAIN-2018-22,application/octet-stream,790575,789324,0.0284\nCC-MAIN-2018-22,application/octetstream,5621,5620,0.0002\nCC-MAIN-2018-22,application/pdf,11460488,11424760,0.4110\nCC-MAIN-2018-22,application/pgp-encrypted,324,324,0.0000\nCC-MAIN-2018-22,application/pgp-signature,13821,13819,0.0005\nCC-MAIN-2018-22,application/postscript,9678,9664,0.0003\nCC-MAIN-2018-22,application/rdf+xml,58366,58342,0.0021\nCC-MAIN-2018-22,application/rss+xml,2263910,2258501,0.0812\nCC-MAIN-2018-22,application/rtf,11350,11342,0.0004\nCC-MAIN-2018-22,application/save-to-disk,11,11,0.0000\nCC-MAIN-2018-22,application/text,10370,10370,0.0004\nCC-MAIN-2018-22,application/unknown,8045,8032,0.0003\nCC-MAIN-2018-22,application/vnd.android.package-archive,19320,19059,0.0007\nCC-MAIN-2018-22,application/vnd.google-earth.kml+xml,46154,46125,0.0017\nCC-MAIN-2018-22,application/vnd.google-earth.kmz,6341,6336,0.0002\nCC-MAIN-2018-22,application/vnd.ms-excel,28945,28807,0.0010\nCC-MAIN-2018-22,application/vnd.ms-powerpoint,11986,11972,0.0004\nCC-MAIN-2018-22,application/vnd.ms-word,3377,3377,0.0001\nCC-MAIN-2018-22,application/vnd.oasis.opendocument.text,6542,6537,0.0002\nCC-MAIN-2018-22,application/vnd.openxmlformats-officedocument.presentationml.presentation,6231,6194,0.0002\nCC-MAIN-2018-22,application/vnd.openxmlformats-officedocument.spreadsheetml.sheet,14497,14404,0.0005\nCC-MAIN-2018
-22,application/vnd.openxmlformats-officedocument.wordprocessingml.document,39966,39757,0.0014\nCC-MAIN-2018-22,application/vnd.wap.xhtml+xml,21400,21377,0.0008\nCC-MAIN-2018-22,application/x-bibtex,10846,10846,0.0004\nCC-MAIN-2018-22,application/x-bittorrent,10949,10773,0.0004\nCC-MAIN-2018-22,application/x-debian-package,268,268,0.0000\nCC-MAIN-2018-22,application/x-download,18489,18423,0.0007\nCC-MAIN-2018-22,application/x-endnote-refer,16366,16366,0.0006\nCC-MAIN-2018-22,application/x-gzip,7492,7461,0.0003\nCC-MAIN-2018-22,application/x-httpd-php,7233,7159,0.0003\nCC-MAIN-2018-22,application/x-java-jnlp-file,1394,1392,0.0000\nCC-MAIN-2018-22,application/x-javascript,4750,4740,0.0002\nCC-MAIN-2018-22,application/x-json,4,4,0.0000\nCC-MAIN-2018-22,application/x-mobipocket-ebook,1513,1511,0.0001\nCC-MAIN-2018-22,application/x-msdownload,7315,7160,0.0003\nCC-MAIN-2018-22,application/x-netcdf,181,181,0.0000\nCC-MAIN-2018-22,application/x-research-info-systems,27468,27467,0.0010\nCC-MAIN-2018-22,application/x-shockwave-flash,20734,20701,0.0007\nCC-MAIN-2018-22,application/x-tar,2315,2315,0.0001\nCC-MAIN-2018-22,application/x-tex,1475,1475,0.0001\nCC-MAIN-2018-22,application/x-troff-man,1026,999,0.0000\nCC-MAIN-2018-22,application/x-zip-compressed,6730,6676,0.0002\nCC-MAIN-2018-22,application/xhtml+xml,902482,897360,0.0324\nCC-MAIN-2018-22,application/xml,658705,657250,0.0236\nCC-MAIN-2018-22,application/zip,70249,69672,0.0025\nCC-MAIN-2018-22,audio/mpeg,149544,148584,0.0054\nCC-MAIN-2018-22,audio/x-mpegurl,18009,17972,0.0006\nCC-MAIN-2018-22,audio/x-scpls,4632,4621,0.0002\nCC-MAIN-2018-22,audio/x-wav,11520,11518,0.0004\nCC-MAIN-2018-22,binary/octet-stream,6148,6142,0.0002\nCC-MAIN-2018-22,image/gif,264120,262358,0.0095\nCC-MAIN-2018-22,image/jp2,859,859,0.0000\nCC-MAIN-2018-22,image/jpeg,23888816,23660355,0.8567\nCC-MAIN-2018-22,image/jpg,424620,424448,0.0152\nCC-MAIN-2018-22,image/pjpeg,16209,16180,0.0006\nCC-MAIN-2018-22,image/png,2950856,2941428,0.1058\nCC-MAIN-201
8-22,image/svg+xml,34728,34708,0.0012\nCC-MAIN-2018-22,image/tiff,6692,6689,0.0002\nCC-MAIN-2018-22,image/vnd.djvu,2017,2016,0.0001\nCC-MAIN-2018-22,image/webp,5577,5577,0.0002\nCC-MAIN-2018-22,message/rfc822,3139,3138,0.0001\nCC-MAIN-2018-22,text/calendar,422043,421703,0.0151\nCC-MAIN-2018-22,text/css,7412,7407,0.0003\nCC-MAIN-2018-22,text/csv,11772,11748,0.0004\nCC-MAIN-2018-22,text/directory,5132,5130,0.0002\nCC-MAIN-2018-22,text/enriched,3308,3307,0.0001\nCC-MAIN-2018-22,text/html,2733744773,2706176906,98.0403\nCC-MAIN-2018-22,text/javascript,9955,9948,0.0004\nCC-MAIN-2018-22,text/markdown,376,375,0.0000\nCC-MAIN-2018-22,text/pdf,14678,14677,0.0005\nCC-MAIN-2018-22,text/plain,557467,554415,0.0200\nCC-MAIN-2018-22,text/prs.lines.tag,63,63,0.0000\nCC-MAIN-2018-22,text/tab-separated-values,3136,3136,0.0001\nCC-MAIN-2018-22,text/turtle,13713,13699,0.0005\nCC-MAIN-2018-22,text/vcard,4212,4208,0.0002\nCC-MAIN-2018-22,text/x-bibtex,2188,2187,0.0001\nCC-MAIN-2018-22,text/x-c,878,863,0.0000\nCC-MAIN-2018-22,text/x-csrc,983,981,0.0000\nCC-MAIN-2018-22,text/x-diff,2360,2360,0.0001\nCC-MAIN-2018-22,text/x-patch,891,890,0.0000\nCC-MAIN-2018-22,text/x-perl,2342,2300,0.0001\nCC-MAIN-2018-22,text/x-vcalendar,12371,12369,0.0004\nCC-MAIN-2018-22,text/x-vcard,20725,20687,0.0007\nCC-MAIN-2018-22,text/xml,2340521,2335762,0.0839\nCC-MAIN-2018-22,unknown/unknown,29569,29529,0.0011\nCC-MAIN-2018-22,video/mp4,23637,23547,0.0008\nCC-MAIN-2018-22,video/webm,32245,32198,0.0012\nCC-MAIN-2018-22,video/x-ms-asf,7896,7878,0.0003\nCC-MAIN-2018-26,<other>,1828093,1819559,0.0596\nCC-MAIN-2018-26,application/atom+xml,5341932,5340665,0.1740\nCC-MAIN-2018-26,application/calendar,3291,3289,0.0001\nCC-MAIN-2018-26,application/download,59280,59212,0.0019\nCC-MAIN-2018-26,application/epub+zip,24595,24325,0.0008\nCC-MAIN-2018-26,application/force-download,110796,110636,0.0036\nCC-MAIN-2018-26,application/gpx+xml,3131,3131,0.0001\nCC-MAIN-2018-26,application/ics,4602,4602,0.0001\nCC-MAIN-2018-26,applicati
on/javascript,9615,9606,0.0003\nCC-MAIN-2018-26,application/json,210903,210576,0.0069\nCC-MAIN-2018-26,application/ld+json,10526,10522,0.0003\nCC-MAIN-2018-26,application/marc,11141,11141,0.0004\nCC-MAIN-2018-26,application/msword,113215,112915,0.0037\nCC-MAIN-2018-26,application/octet-stream,855833,853710,0.0279\nCC-MAIN-2018-26,application/octetstream,11268,11178,0.0004\nCC-MAIN-2018-26,application/pdf,16784526,16749784,0.5468\nCC-MAIN-2018-26,application/pgp-encrypted,21930,21930,0.0007\nCC-MAIN-2018-26,application/pgp-signature,18339,18336,0.0006\nCC-MAIN-2018-26,application/postscript,20343,20322,0.0007\nCC-MAIN-2018-26,application/rdf+xml,82755,82733,0.0027\nCC-MAIN-2018-26,application/rss+xml,2714799,2708624,0.0884\nCC-MAIN-2018-26,application/rtf,10848,10836,0.0004\nCC-MAIN-2018-26,application/save-to-disk,2,2,0.0000\nCC-MAIN-2018-26,application/text,11772,11772,0.0004\nCC-MAIN-2018-26,application/unknown,7490,7480,0.0002\nCC-MAIN-2018-26,application/vnd.android.package-archive,16914,16765,0.0006\nCC-MAIN-2018-26,application/vnd.google-earth.kml+xml,70235,70188,0.0023\nCC-MAIN-2018-26,application/vnd.google-earth.kmz,20295,20278,0.0007\nCC-MAIN-2018-26,application/vnd.ms-excel,41364,41256,0.0013\nCC-MAIN-2018-26,application/vnd.ms-powerpoint,16793,16689,0.0005\nCC-MAIN-2018-26,application/vnd.ms-word,4374,4373,0.0001\nCC-MAIN-2018-26,application/vnd.oasis.opendocument.text,8975,8969,0.0003\nCC-MAIN-2018-26,application/vnd.openxmlformats-officedocument.presentationml.presentation,5218,5204,0.0002\nCC-MAIN-2018-26,application/vnd.openxmlformats-officedocument.spreadsheetml.sheet,21540,21371,0.0007\nCC-MAIN-2018-26,application/vnd.openxmlformats-officedocument.wordprocessingml.document,37907,37763,0.0012\nCC-MAIN-2018-26,application/vnd.wap.xhtml+xml,23526,23499,0.0008\nCC-MAIN-2018-26,application/x-bibtex,14797,14795,0.0005\nCC-MAIN-2018-26,application/x-bittorrent,12245,11981,0.0004\nCC-MAIN-2018-26,application/x-debian-package,4113,4113,0.0001\nCC-MAIN-2018-
26,application/x-download,21856,21546,0.0007\nCC-MAIN-2018-26,application/x-endnote-refer,21090,21090,0.0007\nCC-MAIN-2018-26,application/x-gzip,12762,12693,0.0004\nCC-MAIN-2018-26,application/x-httpd-php,10443,10368,0.0003\nCC-MAIN-2018-26,application/x-java-jnlp-file,2409,2408,0.0001\nCC-MAIN-2018-26,application/x-javascript,4598,4596,0.0001\nCC-MAIN-2018-26,application/x-json,23,23,0.0000\nCC-MAIN-2018-26,application/x-mobipocket-ebook,4694,4691,0.0002\nCC-MAIN-2018-26,application/x-msdownload,8554,8434,0.0003\nCC-MAIN-2018-26,application/x-netcdf,2240,2240,0.0001\nCC-MAIN-2018-26,application/x-research-info-systems,32674,32674,0.0011\nCC-MAIN-2018-26,application/x-shockwave-flash,26130,26083,0.0009\nCC-MAIN-2018-26,application/x-tar,5803,5799,0.0002\nCC-MAIN-2018-26,application/x-tex,4754,4754,0.0002\nCC-MAIN-2018-26,application/x-troff-man,3570,3539,0.0001\nCC-MAIN-2018-26,application/x-zip-compressed,13325,13297,0.0004\nCC-MAIN-2018-26,application/xhtml+xml,871264,867163,0.0284\nCC-MAIN-2018-26,application/xml,855232,853730,0.0279\nCC-MAIN-2018-26,application/zip,92733,92125,0.0030\nCC-MAIN-2018-26,audio/mpeg,114735,113907,0.0037\nCC-MAIN-2018-26,audio/x-mpegurl,38801,38788,0.0013\nCC-MAIN-2018-26,audio/x-scpls,5766,5756,0.0002\nCC-MAIN-2018-26,audio/x-wav,13510,13473,0.0004\nCC-MAIN-2018-26,binary/octet-stream,9766,9755,0.0003\nCC-MAIN-2018-26,image/gif,341003,339125,0.0111\nCC-MAIN-2018-26,image/jp2,518,518,0.0000\nCC-MAIN-2018-26,image/jpeg,28700658,28511324,0.9351\nCC-MAIN-2018-26,image/jpg,381833,381796,0.0124\nCC-MAIN-2018-26,image/pjpeg,35016,35008,0.0011\nCC-MAIN-2018-26,image/png,4022090,4007817,0.1310\nCC-MAIN-2018-26,image/svg+xml,47348,47315,0.0015\nCC-MAIN-2018-26,image/tiff,7241,7235,0.0002\nCC-MAIN-2018-26,image/vnd.djvu,8811,8810,0.0003\nCC-MAIN-2018-26,image/webp,10320,10320,0.0003\nCC-MAIN-2018-26,message/rfc822,8194,8193,0.0003\nCC-MAIN-2018-26,text/calendar,540390,539804,0.0176\nCC-MAIN-2018-26,text/css,6645,6633,0.0002\nCC-MAIN-2018-26,tex
t/csv,34176,34156,0.0011\nCC-MAIN-2018-26,text/directory,5158,5153,0.0002\nCC-MAIN-2018-26,text/enriched,3294,3294,0.0001\nCC-MAIN-2018-26,text/html,2999500027,2965621240,97.7222\nCC-MAIN-2018-26,text/javascript,7956,7946,0.0003\nCC-MAIN-2018-26,text/markdown,449,449,0.0000\nCC-MAIN-2018-26,text/pdf,14016,14016,0.0005\nCC-MAIN-2018-26,text/plain,1282409,1279425,0.0418\nCC-MAIN-2018-26,text/prs.lines.tag,5886,5886,0.0002\nCC-MAIN-2018-26,text/tab-separated-values,22053,22053,0.0007\nCC-MAIN-2018-26,text/turtle,10413,10394,0.0003\nCC-MAIN-2018-26,text/vcard,4732,4712,0.0002\nCC-MAIN-2018-26,text/x-bibtex,5721,5721,0.0002\nCC-MAIN-2018-26,text/x-c,3483,3472,0.0001\nCC-MAIN-2018-26,text/x-csrc,3026,3026,0.0001\nCC-MAIN-2018-26,text/x-diff,10106,10103,0.0003\nCC-MAIN-2018-26,text/x-patch,48237,48234,0.0016\nCC-MAIN-2018-26,text/x-perl,2611,2600,0.0001\nCC-MAIN-2018-26,text/x-vcalendar,20848,20844,0.0007\nCC-MAIN-2018-26,text/x-vcard,25163,25145,0.0008\nCC-MAIN-2018-26,text/xml,3456754,3450684,0.1126\nCC-MAIN-2018-26,unknown/unknown,10889,10875,0.0004\nCC-MAIN-2018-26,video/mp4,24746,24672,0.0008\nCC-MAIN-2018-26,video/webm,31116,31056,0.0010\nCC-MAIN-2018-26,video/x-ms-asf,24858,24847,0.0008\nCC-MAIN-2018-30,<other>,1928223,1913161,0.0591\nCC-MAIN-2018-30,application/atom+xml,6236567,6234125,0.1911\nCC-MAIN-2018-30,application/calendar,2480,2476,0.0001\nCC-MAIN-2018-30,application/download,44797,44733,0.0014\nCC-MAIN-2018-30,application/epub+zip,23751,23491,0.0007\nCC-MAIN-2018-30,application/force-download,101427,101330,0.0031\nCC-MAIN-2018-30,application/gpx+xml,2613,2610,0.0001\nCC-MAIN-2018-30,application/ics,3159,3157,0.0001\nCC-MAIN-2018-30,application/javascript,10870,10850,0.0003\nCC-MAIN-2018-30,application/json,167648,167456,0.0051\nCC-MAIN-2018-30,application/ld+json,843,843,0.0000\nCC-MAIN-2018-30,application/marc,857,857,0.0000\nCC-MAIN-2018-30,application/msword,128124,127733,0.0039\nCC-MAIN-2018-30,application/octet-stream,861901,859991,0.0264\nCC-MAIN-201
8-30,application/octetstream,8484,8436,0.0003\nCC-MAIN-2018-30,application/pdf,17314340,17257070,0.5305\nCC-MAIN-2018-30,application/pgp-encrypted,927,927,0.0000\nCC-MAIN-2018-30,application/pgp-signature,23911,23905,0.0007\nCC-MAIN-2018-30,application/postscript,19123,19081,0.0006\nCC-MAIN-2018-30,application/rdf+xml,46017,45837,0.0014\nCC-MAIN-2018-30,application/rss+xml,2278279,2270427,0.0698\nCC-MAIN-2018-30,application/rtf,12245,12224,0.0004\nCC-MAIN-2018-30,application/text,8283,8236,0.0003\nCC-MAIN-2018-30,application/unknown,7648,7634,0.0002\nCC-MAIN-2018-30,application/vnd.android.package-archive,20484,20151,0.0006\nCC-MAIN-2018-30,application/vnd.google-earth.kml+xml,57582,57570,0.0018\nCC-MAIN-2018-30,application/vnd.google-earth.kmz,10780,10753,0.0003\nCC-MAIN-2018-30,application/vnd.ms-excel,45197,45029,0.0014\nCC-MAIN-2018-30,application/vnd.ms-powerpoint,13601,13486,0.0004\nCC-MAIN-2018-30,application/vnd.ms-word,4102,4090,0.0001\nCC-MAIN-2018-30,application/vnd.oasis.opendocument.text,7960,7957,0.0002\nCC-MAIN-2018-30,application/vnd.openxmlformats-officedocument.presentationml.presentation,6969,6952,0.0002\nCC-MAIN-2018-30,application/vnd.openxmlformats-officedocument.spreadsheetml.sheet,20593,20418,0.0006\nCC-MAIN-2018-30,application/vnd.openxmlformats-officedocument.wordprocessingml.document,50190,49904,0.0015\nCC-MAIN-2018-30,application/vnd.wap.xhtml+xml,6976,6954,0.0002\nCC-MAIN-2018-30,application/x-bibtex,9177,9175,0.0003\nCC-MAIN-2018-30,application/x-bittorrent,15305,14968,0.0005\nCC-MAIN-2018-30,application/x-debian-package,2456,2453,0.0001\nCC-MAIN-2018-30,application/x-download,22916,22820,0.0007\nCC-MAIN-2018-30,application/x-endnote-refer,11320,11319,0.0003\nCC-MAIN-2018-30,application/x-gzip,21576,21488,0.0007\nCC-MAIN-2018-30,application/x-httpd-php,12662,12558,0.0004\nCC-MAIN-2018-30,application/x-java-jnlp-file,2488,2479,0.0001\nCC-MAIN-2018-30,application/x-javascript,5490,5474,0.0002\nCC-MAIN-2018-30,application/x-json,17,17,0.00
00\nCC-MAIN-2018-30,application/x-mobipocket-ebook,3589,3588,0.0001\nCC-MAIN-2018-30,application/x-msdownload,8884,8747,0.0003\nCC-MAIN-2018-30,application/x-netcdf,320,320,0.0000\nCC-MAIN-2018-30,application/x-research-info-systems,21420,21413,0.0007\nCC-MAIN-2018-30,application/x-shockwave-flash,87927,87433,0.0027\nCC-MAIN-2018-30,application/x-tar,4366,4357,0.0001\nCC-MAIN-2018-30,application/x-tex,1711,1711,0.0001\nCC-MAIN-2018-30,application/x-troff-man,1893,1882,0.0001\nCC-MAIN-2018-30,application/x-zip-compressed,10401,10352,0.0003\nCC-MAIN-2018-30,application/xhtml+xml,788250,782722,0.0242\nCC-MAIN-2018-30,application/xml,779286,777437,0.0239\nCC-MAIN-2018-30,application/zip,100607,99866,0.0031\nCC-MAIN-2018-30,audio/mpeg,207821,205985,0.0064\nCC-MAIN-2018-30,audio/x-mpegurl,41726,41677,0.0013\nCC-MAIN-2018-30,audio/x-scpls,6419,6373,0.0002\nCC-MAIN-2018-30,audio/x-wav,7981,7975,0.0002\nCC-MAIN-2018-30,binary/octet-stream,9046,9015,0.0003\nCC-MAIN-2018-30,image/gif,410977,408837,0.0126\nCC-MAIN-2018-30,image/jp2,379,379,0.0000\nCC-MAIN-2018-30,image/jpeg,26550210,25091997,0.8134\nCC-MAIN-2018-30,image/jpg,218221,218198,0.0067\nCC-MAIN-2018-30,image/pjpeg,20078,20034,0.0006\nCC-MAIN-2018-30,image/png,2605287,2594504,0.0798\nCC-MAIN-2018-30,image/svg+xml,58046,58015,0.0018\nCC-MAIN-2018-30,image/tiff,7537,7527,0.0002\nCC-MAIN-2018-30,image/vnd.djvu,4729,4729,0.0001\nCC-MAIN-2018-30,image/webp,3352,3352,0.0001\nCC-MAIN-2018-30,message/rfc822,5158,5143,0.0002\nCC-MAIN-2018-30,text/calendar,473092,472402,0.0145\nCC-MAIN-2018-30,text/css,9066,9057,0.0003\nCC-MAIN-2018-30,text/csv,15649,15639,0.0005\nCC-MAIN-2018-30,text/directory,5621,5620,0.0002\nCC-MAIN-2018-30,text/enriched,2343,2343,0.0001\nCC-MAIN-2018-30,text/html,3198781491,3152832803,98.0031\nCC-MAIN-2018-30,text/javascript,7648,7642,0.0002\nCC-MAIN-2018-30,text/markdown,441,441,0.0000\nCC-MAIN-2018-30,text/pdf,431,431,0.0000\nCC-MAIN-2018-30,text/plain,749900,747057,0.0230\nCC-MAIN-2018-30,text/prs.lines.
tag,731,731,0.0000\nCC-MAIN-2018-30,text/tab-separated-values,2170,2170,0.0001\nCC-MAIN-2018-30,text/turtle,1507,1495,0.0000\nCC-MAIN-2018-30,text/vcard,4993,4965,0.0002\nCC-MAIN-2018-30,text/x-bibtex,4293,4291,0.0001\nCC-MAIN-2018-30,text/x-c,3555,3554,0.0001\nCC-MAIN-2018-30,text/x-csrc,1686,1681,0.0001\nCC-MAIN-2018-30,text/x-diff,3199,3198,0.0001\nCC-MAIN-2018-30,text/x-patch,858,855,0.0000\nCC-MAIN-2018-30,text/x-perl,5251,5163,0.0002\nCC-MAIN-2018-30,text/x-vcalendar,12602,12601,0.0004\nCC-MAIN-2018-30,text/x-vcard,27219,27106,0.0008\nCC-MAIN-2018-30,text/xml,2183663,2176187,0.0669\nCC-MAIN-2018-30,unknown/unknown,6633,6623,0.0002\nCC-MAIN-2018-30,video/mp4,57797,57603,0.0018\nCC-MAIN-2018-30,video/webm,34212,34126,0.0010\nCC-MAIN-2018-30,video/x-ms-asf,16170,16137,0.0005\nCC-MAIN-2018-34,<other>,17910927,17762417,0.6667\nCC-MAIN-2018-34,application/atom+xml,2692566,2686632,0.1002\nCC-MAIN-2018-34,application/calendar,2438,2421,0.0001\nCC-MAIN-2018-34,application/download,40912,40875,0.0015\nCC-MAIN-2018-34,application/epub+zip,12971,12847,0.0005\nCC-MAIN-2018-34,application/force-download,84869,84809,0.0032\nCC-MAIN-2018-34,application/gpx+xml,1529,1528,0.0001\nCC-MAIN-2018-34,application/ics,4219,4219,0.0002\nCC-MAIN-2018-34,application/javascript,24322,24255,0.0009\nCC-MAIN-2018-34,application/json,158123,157627,0.0059\nCC-MAIN-2018-34,application/ld+json,3937,3937,0.0001\nCC-MAIN-2018-34,application/marc,1111,1111,0.0000\nCC-MAIN-2018-34,application/msword,934589,934039,0.0348\nCC-MAIN-2018-34,application/octet-stream,832973,830940,0.0310\nCC-MAIN-2018-34,application/octetstream,5406,5400,0.0002\nCC-MAIN-2018-34,application/pdf,12239157,12206017,0.4556\nCC-MAIN-2018-34,application/pgp-encrypted,297,296,0.0000\nCC-MAIN-2018-34,application/pgp-signature,5883,5881,0.0002\nCC-MAIN-2018-34,application/postscript,21160,21142,0.0008\nCC-MAIN-2018-34,application/rdf+xml,51627,51428,0.0019\nCC-MAIN-2018-34,application/rss+xml,1816149,1809206,0.0676\nCC-MAIN-2018-34
,application/rtf,55120,55088,0.0021\nCC-MAIN-2018-34,application/text,9047,9047,0.0003\nCC-MAIN-2018-34,application/unknown,5793,5793,0.0002\nCC-MAIN-2018-34,application/vnd.android.package-archive,10972,10869,0.0004\nCC-MAIN-2018-34,application/vnd.google-earth.kml+xml,43331,43240,0.0016\nCC-MAIN-2018-34,application/vnd.google-earth.kmz,7583,7581,0.0003\nCC-MAIN-2018-34,application/vnd.ms-excel,219980,219661,0.0082\nCC-MAIN-2018-34,application/vnd.ms-powerpoint,123462,123404,0.0046\nCC-MAIN-2018-34,application/vnd.ms-word,4341,4340,0.0002\nCC-MAIN-2018-34,application/vnd.oasis.opendocument.text,5642,5641,0.0002\nCC-MAIN-2018-34,application/vnd.openxmlformats-officedocument.presentationml.presentation,59566,59544,0.0022\nCC-MAIN-2018-34,application/vnd.openxmlformats-officedocument.spreadsheetml.sheet,106942,106800,0.0040\nCC-MAIN-2018-34,application/vnd.openxmlformats-officedocument.wordprocessingml.document,378103,377835,0.0141\nCC-MAIN-2018-34,application/vnd.wap.xhtml+xml,6776,6736,0.0003\nCC-MAIN-2018-34,application/x-bibtex,12117,12115,0.0005\nCC-MAIN-2018-34,application/x-bittorrent,27405,27177,0.0010\nCC-MAIN-2018-34,application/x-debian-package,16974,15774,0.0006\nCC-MAIN-2018-34,application/x-download,19721,19621,0.0007\nCC-MAIN-2018-34,application/x-endnote-refer,14616,14613,0.0005\nCC-MAIN-2018-34,application/x-gzip,148344,148169,0.0055\nCC-MAIN-2018-34,application/x-httpd-php,9045,8968,0.0003\nCC-MAIN-2018-34,application/x-java-jnlp-file,1468,1467,0.0001\nCC-MAIN-2018-34,application/x-javascript,9021,9018,0.0003\nCC-MAIN-2018-34,application/x-json,26,26,0.0000\nCC-MAIN-2018-34,application/x-mobipocket-ebook,2323,2319,0.0001\nCC-MAIN-2018-34,application/x-msdownload,54731,54263,0.0020\nCC-MAIN-2018-34,application/x-netcdf,317,317,0.0000\nCC-MAIN-2018-34,application/x-research-info-systems,28020,28008,0.0010\nCC-MAIN-2018-34,application/x-shockwave-flash,145221,144760,0.0054\nCC-MAIN-2018-34,application/x-tar,20224,20199,0.0008\nCC-MAIN-2018-34,applicatio
n/x-tex,999,999,0.0000\nCC-MAIN-2018-34,application/x-troff-man,1481,1480,0.0001\nCC-MAIN-2018-34,application/x-zip-compressed,102527,102420,0.0038\nCC-MAIN-2018-34,application/xhtml+xml,586475,581893,0.0218\nCC-MAIN-2018-34,application/xml,779522,777743,0.0290\nCC-MAIN-2018-34,application/zip,803790,802097,0.0299\nCC-MAIN-2018-34,audio/mpeg,2309365,2301287,0.0860\nCC-MAIN-2018-34,audio/x-mpegurl,23817,23792,0.0009\nCC-MAIN-2018-34,audio/x-scpls,3876,3851,0.0001\nCC-MAIN-2018-34,audio/x-wav,60726,60667,0.0023\nCC-MAIN-2018-34,binary/octet-stream,17481,17417,0.0007\nCC-MAIN-2018-34,image/gif,1118123,1115652,0.0416\nCC-MAIN-2018-34,image/jp2,330,330,0.0000\nCC-MAIN-2018-34,image/jpeg,86217475,84427074,3.2095\nCC-MAIN-2018-34,image/jpg,244890,244845,0.0091\nCC-MAIN-2018-34,image/pjpeg,22427,22424,0.0008\nCC-MAIN-2018-34,image/png,5973085,5956651,0.2224\nCC-MAIN-2018-34,image/svg+xml,77816,77549,0.0029\nCC-MAIN-2018-34,image/tiff,37884,37840,0.0014\nCC-MAIN-2018-34,image/vnd.djvu,3601,3598,0.0001\nCC-MAIN-2018-34,image/webp,10960,10960,0.0004\nCC-MAIN-2018-34,message/rfc822,2995,2995,0.0001\nCC-MAIN-2018-34,text/calendar,415352,414763,0.0155\nCC-MAIN-2018-34,text/css,21197,21186,0.0008\nCC-MAIN-2018-34,text/csv,27644,27584,0.0010\nCC-MAIN-2018-34,text/directory,4607,4575,0.0002\nCC-MAIN-2018-34,text/enriched,2728,2728,0.0001\nCC-MAIN-2018-34,text/html,2545480195,2513071893,94.7570\nCC-MAIN-2018-34,text/javascript,7771,7763,0.0003\nCC-MAIN-2018-34,text/markdown,329,329,0.0000\nCC-MAIN-2018-34,text/pdf,391,391,0.0000\nCC-MAIN-2018-34,text/plain,573361,572236,0.0213\nCC-MAIN-2018-34,text/prs.lines.tag,641,641,0.0000\nCC-MAIN-2018-34,text/tab-separated-values,1756,1756,0.0001\nCC-MAIN-2018-34,text/turtle,2350,2340,0.0001\nCC-MAIN-2018-34,text/vcard,3896,3843,0.0001\nCC-MAIN-2018-34,text/x-bibtex,3089,3080,0.0001\nCC-MAIN-2018-34,text/x-c,3168,3167,0.0001\nCC-MAIN-2018-34,text/x-csrc,1295,1294,0.0000\nCC-MAIN-2018-34,text/x-diff,1912,1911,0.0001\nCC-MAIN-2018-34,text/x-patch
,621,621,0.0000\nCC-MAIN-2018-34,text/x-perl,2481,2439,0.0001\nCC-MAIN-2018-34,text/x-vcalendar,13980,13978,0.0005\nCC-MAIN-2018-34,text/x-vcard,20728,20665,0.0008\nCC-MAIN-2018-34,text/xml,2311017,2300059,0.0860\nCC-MAIN-2018-34,unknown/unknown,4586,4553,0.0002\nCC-MAIN-2018-34,video/mp4,591579,591025,0.0220\nCC-MAIN-2018-34,video/webm,24992,24941,0.0009\nCC-MAIN-2018-34,video/x-ms-asf,10651,10547,0.0004\nCC-MAIN-2018-39,<other>,18552980,18472643,0.6530\nCC-MAIN-2018-39,application/atom+xml,2704694,2703808,0.0952\nCC-MAIN-2018-39,application/calendar,2456,2435,0.0001\nCC-MAIN-2018-39,application/download,24061,24053,0.0008\nCC-MAIN-2018-39,application/epub+zip,16162,16025,0.0006\nCC-MAIN-2018-39,application/force-download,46807,46788,0.0016\nCC-MAIN-2018-39,application/gpx+xml,1568,1568,0.0001\nCC-MAIN-2018-39,application/ics,3865,3865,0.0001\nCC-MAIN-2018-39,application/javascript,8492,8469,0.0003\nCC-MAIN-2018-39,application/json,226745,226499,0.0080\nCC-MAIN-2018-39,application/ld+json,3178,3178,0.0001\nCC-MAIN-2018-39,application/marc,983,983,0.0000\nCC-MAIN-2018-39,application/msword,66290,66191,0.0023\nCC-MAIN-2018-39,application/octet-stream,407023,405142,0.0143\nCC-MAIN-2018-39,application/octetstream,2728,2728,0.0001\nCC-MAIN-2018-39,application/pdf,4032668,4016958,0.1419\nCC-MAIN-2018-39,application/pgp-encrypted,88,88,0.0000\nCC-MAIN-2018-39,application/pgp-signature,4305,4304,0.0002\nCC-MAIN-2018-39,application/postscript,8782,8764,0.0003\nCC-MAIN-2018-39,application/rdf+xml,58990,58885,0.0021\nCC-MAIN-2018-39,application/rss+xml,1894377,1888769,0.0667\nCC-MAIN-2018-39,application/rtf,11350,11349,0.0004\nCC-MAIN-2018-39,application/text,9013,9009,0.0003\nCC-MAIN-2018-39,application/unknown,2552,2552,0.0001\nCC-MAIN-2018-39,application/vnd.android.package-archive,11176,11044,0.0004\nCC-MAIN-2018-39,application/vnd.google-earth.kml+xml,37789,37772,0.0013\nCC-MAIN-2018-39,application/vnd.google-earth.kmz,5703,5700,0.0002\nCC-MAIN-2018-39,application/vnd.ms
-excel,24259,24187,0.0009\nCC-MAIN-2018-39,application/vnd.ms-powerpoint,5374,5345,0.0002\nCC-MAIN-2018-39,application/vnd.ms-word,3906,3906,0.0001\nCC-MAIN-2018-39,application/vnd.oasis.opendocument.text,5866,5861,0.0002\nCC-MAIN-2018-39,application/vnd.openxmlformats-officedocument.presentationml.presentation,6271,6259,0.0002\nCC-MAIN-2018-39,application/vnd.openxmlformats-officedocument.spreadsheetml.sheet,16147,16078,0.0006\nCC-MAIN-2018-39,application/vnd.openxmlformats-officedocument.wordprocessingml.document,50104,50007,0.0018\nCC-MAIN-2018-39,application/vnd.wap.xhtml+xml,5675,5660,0.0002\nCC-MAIN-2018-39,application/x-bibtex,11371,11363,0.0004\nCC-MAIN-2018-39,application/x-bittorrent,14982,14790,0.0005\nCC-MAIN-2018-39,application/x-debian-package,1424,1423,0.0001\nCC-MAIN-2018-39,application/x-download,6339,6307,0.0002\nCC-MAIN-2018-39,application/x-endnote-refer,14713,14705,0.0005\nCC-MAIN-2018-39,application/x-gzip,15293,15272,0.0005\nCC-MAIN-2018-39,application/x-httpd-php,14798,14723,0.0005\nCC-MAIN-2018-39,application/x-java-jnlp-file,1504,1502,0.0001\nCC-MAIN-2018-39,application/x-javascript,14773,14644,0.0005\nCC-MAIN-2018-39,application/x-json,46,46,0.0000\nCC-MAIN-2018-39,application/x-mobipocket-ebook,2267,2263,0.0001\nCC-MAIN-2018-39,application/x-msdownload,5910,5828,0.0002\nCC-MAIN-2018-39,application/x-netcdf,848,848,0.0000\nCC-MAIN-2018-39,application/x-research-info-systems,22018,22016,0.0008\nCC-MAIN-2018-39,application/x-shockwave-flash,42262,42071,0.0015\nCC-MAIN-2018-39,application/x-tar,2602,2598,0.0001\nCC-MAIN-2018-39,application/x-tex,798,798,0.0000\nCC-MAIN-2018-39,application/x-troff-man,540,538,0.0000\nCC-MAIN-2018-39,application/x-zip-compressed,6803,6791,0.0002\nCC-MAIN-2018-39,application/xhtml+xml,725517,721770,0.0255\nCC-MAIN-2018-39,application/xml,633301,631390,0.0223\nCC-MAIN-2018-39,application/zip,60248,60001,0.0021\nCC-MAIN-2018-39,audio/mpeg,116310,115429,0.0041\nCC-MAIN-2018-39,audio/x-mpegurl,26198,26170,0.0009\nCC
-MAIN-2018-39,audio/x-scpls,4925,4916,0.0002\nCC-MAIN-2018-39,audio/x-wav,6853,6852,0.0002\nCC-MAIN-2018-39,binary/octet-stream,6080,6061,0.0002\nCC-MAIN-2018-39,image/gif,151229,145238,0.0053\nCC-MAIN-2018-39,image/jp2,301,301,0.0000\nCC-MAIN-2018-39,image/jpeg,6110858,6091496,0.2151\nCC-MAIN-2018-39,image/jpg,39343,39339,0.0014\nCC-MAIN-2018-39,image/pjpeg,3017,3015,0.0001\nCC-MAIN-2018-39,image/png,577369,566476,0.0203\nCC-MAIN-2018-39,image/svg+xml,48526,48495,0.0017\nCC-MAIN-2018-39,image/tiff,4686,4679,0.0002\nCC-MAIN-2018-39,image/vnd.djvu,3876,3874,0.0001\nCC-MAIN-2018-39,image/webp,8063,8063,0.0003\nCC-MAIN-2018-39,message/rfc822,3629,3629,0.0001\nCC-MAIN-2018-39,text/calendar,455456,455107,0.0160\nCC-MAIN-2018-39,text/css,7470,7461,0.0003\nCC-MAIN-2018-39,text/csv,11941,11921,0.0004\nCC-MAIN-2018-39,text/directory,5092,5090,0.0002\nCC-MAIN-2018-39,text/enriched,2514,2510,0.0001\nCC-MAIN-2018-39,text/html,2801205816,2769400290,98.5925\nCC-MAIN-2018-39,text/javascript,9748,9703,0.0003\nCC-MAIN-2018-39,text/markdown,417,417,0.0000\nCC-MAIN-2018-39,text/pdf,33,33,0.0000\nCC-MAIN-2018-39,text/plain,535377,534027,0.0188\nCC-MAIN-2018-39,text/prs.lines.tag,523,523,0.0000\nCC-MAIN-2018-39,text/tab-separated-values,3951,3951,0.0001\nCC-MAIN-2018-39,text/turtle,2107,2077,0.0001\nCC-MAIN-2018-39,text/vcard,3975,3965,0.0001\nCC-MAIN-2018-39,text/x-bibtex,3019,3016,0.0001\nCC-MAIN-2018-39,text/x-c,2041,2040,0.0001\nCC-MAIN-2018-39,text/x-csrc,1454,1454,0.0001\nCC-MAIN-2018-39,text/x-diff,2167,2167,0.0001\nCC-MAIN-2018-39,text/x-patch,381,381,0.0000\nCC-MAIN-2018-39,text/x-perl,1597,1577,0.0001\nCC-MAIN-2018-39,text/x-vcalendar,12400,12393,0.0004\nCC-MAIN-2018-39,text/x-vcard,23542,23492,0.0008\nCC-MAIN-2018-39,text/xml,1843160,1836471,0.0649\nCC-MAIN-2018-39,unknown/unknown,6101,6093,0.0002\nCC-MAIN-2018-39,video/mp4,43692,43150,0.0015\nCC-MAIN-2018-39,video/webm,29571,29486,0.0010\nCC-MAIN-2018-39,video/x-ms-asf,9237,9222,0.0003\nCC-MAIN-2018-43,<other>,19827384,19711
452,0.6518\nCC-MAIN-2018-43,application/atom+xml,2534181,2532983,0.0833\nCC-MAIN-2018-43,application/calendar,2477,2473,0.0001\nCC-MAIN-2018-43,application/download,43277,43258,0.0014\nCC-MAIN-2018-43,application/epub+zip,19335,19081,0.0006\nCC-MAIN-2018-43,application/force-download,86881,86792,0.0029\nCC-MAIN-2018-43,application/gpx+xml,3661,3660,0.0001\nCC-MAIN-2018-43,application/ics,3883,3882,0.0001\nCC-MAIN-2018-43,application/javascript,9783,9778,0.0003\nCC-MAIN-2018-43,application/json,302408,288338,0.0099\nCC-MAIN-2018-43,application/ld+json,4780,4779,0.0002\nCC-MAIN-2018-43,application/marc,1246,1246,0.0000\nCC-MAIN-2018-43,application/msword,146471,146012,0.0048\nCC-MAIN-2018-43,application/octet-stream,861638,859589,0.0283\nCC-MAIN-2018-43,application/octetstream,7057,7054,0.0002\nCC-MAIN-2018-43,application/pdf,24444899,24387079,0.8036\nCC-MAIN-2018-43,application/pgp-encrypted,320,320,0.0000\nCC-MAIN-2018-43,application/pgp-signature,14340,14337,0.0005\nCC-MAIN-2018-43,application/postscript,21319,21292,0.0007\nCC-MAIN-2018-43,application/rdf+xml,50600,50310,0.0017\nCC-MAIN-2018-43,application/rss+xml,2192093,2183392,0.0721\nCC-MAIN-2018-43,application/rtf,22187,22162,0.0007\nCC-MAIN-2018-43,application/save-to-disk,2,2,0.0000\nCC-MAIN-2018-43,application/text,7628,7622,0.0003\nCC-MAIN-2018-43,application/unknown,7808,7807,0.0003\nCC-MAIN-2018-43,application/vnd.android.package-archive,25143,24833,0.0008\nCC-MAIN-2018-43,application/vnd.google-earth.kml+xml,30344,30287,0.0010\nCC-MAIN-2018-43,application/vnd.google-earth.kmz,9205,9192,0.0003\nCC-MAIN-2018-43,application/vnd.ms-excel,47284,47119,0.0016\nCC-MAIN-2018-43,application/vnd.ms-powerpoint,12919,12897,0.0004\nCC-MAIN-2018-43,application/vnd.ms-word,5109,5104,0.0002\nCC-MAIN-2018-43,application/vnd.oasis.opendocument.text,12220,12193,0.0004\nCC-MAIN-2018-43,application/vnd.openxmlformats-officedocument.presentationml.presentation,15338,15315,0.0005\nCC-MAIN-2018-43,application/vnd.openxmlformats
-officedocument.spreadsheetml.sheet,39260,39076,0.0013\nCC-MAIN-2018-43,application/vnd.openxmlformats-officedocument.wordprocessingml.document,115238,115084,0.0038\nCC-MAIN-2018-43,application/vnd.wap.xhtml+xml,8798,8762,0.0003\nCC-MAIN-2018-43,application/x-bibtex,11419,11405,0.0004\nCC-MAIN-2018-43,application/x-bittorrent,16499,16155,0.0005\nCC-MAIN-2018-43,application/x-debian-package,4875,4863,0.0002\nCC-MAIN-2018-43,application/x-download,22338,22223,0.0007\nCC-MAIN-2018-43,application/x-endnote-refer,14593,14591,0.0005\nCC-MAIN-2018-43,application/x-gzip,29839,29806,0.0010\nCC-MAIN-2018-43,application/x-httpd-php,22512,22389,0.0007\nCC-MAIN-2018-43,application/x-java-jnlp-file,1780,1773,0.0001\nCC-MAIN-2018-43,application/x-javascript,4726,4714,0.0002\nCC-MAIN-2018-43,application/x-json,33,33,0.0000\nCC-MAIN-2018-43,application/x-mobipocket-ebook,3574,3564,0.0001\nCC-MAIN-2018-43,application/x-msdownload,11708,11540,0.0004\nCC-MAIN-2018-43,application/x-netcdf,1136,1134,0.0000\nCC-MAIN-2018-43,application/x-research-info-systems,25799,25792,0.0008\nCC-MAIN-2018-43,application/x-shockwave-flash,48206,47955,0.0016\nCC-MAIN-2018-43,application/x-tar,5674,5668,0.0002\nCC-MAIN-2018-43,application/x-tex,1886,1885,0.0001\nCC-MAIN-2018-43,application/x-troff-man,2217,2213,0.0001\nCC-MAIN-2018-43,application/x-zip-compressed,10386,10334,0.0003\nCC-MAIN-2018-43,application/xhtml+xml,638157,633876,0.0210\nCC-MAIN-2018-43,application/xml,847450,845932,0.0279\nCC-MAIN-2018-43,application/zip,105862,105314,0.0035\nCC-MAIN-2018-43,audio/mpeg,151108,149796,0.0050\nCC-MAIN-2018-43,audio/x-mpegurl,34759,34720,0.0011\nCC-MAIN-2018-43,audio/x-scpls,4237,4212,0.0001\nCC-MAIN-2018-43,audio/x-wav,11668,11666,0.0004\nCC-MAIN-2018-43,binary/octet-stream,10938,10906,0.0004\nCC-MAIN-2018-43,image/gif,158120,156377,0.0052\nCC-MAIN-2018-43,image/jp2,693,675,0.0000\nCC-MAIN-2018-43,image/jpeg,7224156,7211943,0.2375\nCC-MAIN-2018-43,image/jpg,62968,62961,0.0021\nCC-MAIN-2018-43,image/pjpe
g,5368,5367,0.0002\nCC-MAIN-2018-43,image/png,623367,620054,0.0205\nCC-MAIN-2018-43,image/svg+xml,87477,87412,0.0029\nCC-MAIN-2018-43,image/tiff,11124,11118,0.0004\nCC-MAIN-2018-43,image/vnd.djvu,8508,8506,0.0003\nCC-MAIN-2018-43,image/webp,23925,23925,0.0008\nCC-MAIN-2018-43,message/rfc822,5943,5943,0.0002\nCC-MAIN-2018-43,text/calendar,533944,533634,0.0176\nCC-MAIN-2018-43,text/css,8572,8567,0.0003\nCC-MAIN-2018-43,text/csv,15629,15619,0.0005\nCC-MAIN-2018-43,text/directory,5791,5749,0.0002\nCC-MAIN-2018-43,text/enriched,2228,2226,0.0001\nCC-MAIN-2018-43,text/html,2976516273,2944221329,97.8543\nCC-MAIN-2018-43,text/javascript,9082,9020,0.0003\nCC-MAIN-2018-43,text/markdown,388,387,0.0000\nCC-MAIN-2018-43,text/pdf,277,277,0.0000\nCC-MAIN-2018-43,text/plain,801394,800037,0.0263\nCC-MAIN-2018-43,text/prs.lines.tag,799,799,0.0000\nCC-MAIN-2018-43,text/tab-separated-values,2679,2679,0.0001\nCC-MAIN-2018-43,text/turtle,2250,2233,0.0001\nCC-MAIN-2018-43,text/vcard,4670,4665,0.0002\nCC-MAIN-2018-43,text/x-bibtex,4710,4685,0.0002\nCC-MAIN-2018-43,text/x-c,3983,3977,0.0001\nCC-MAIN-2018-43,text/x-csrc,2797,2797,0.0001\nCC-MAIN-2018-43,text/x-diff,5536,5535,0.0002\nCC-MAIN-2018-43,text/x-patch,350,345,0.0000\nCC-MAIN-2018-43,text/x-perl,3303,3249,0.0001\nCC-MAIN-2018-43,text/x-vcalendar,12684,12681,0.0004\nCC-MAIN-2018-43,text/x-vcard,23376,23249,0.0008\nCC-MAIN-2018-43,text/xml,2493066,2484085,0.0820\nCC-MAIN-2018-43,unknown/unknown,6320,6302,0.0002\nCC-MAIN-2018-43,video/mp4,59722,59577,0.0020\nCC-MAIN-2018-43,video/webm,60243,60152,0.0020\nCC-MAIN-2018-43,video/x-ms-asf,12913,12901,0.0004\nCC-MAIN-2018-47,<other>,16298623,16202538,0.6158\nCC-MAIN-2018-47,application/atom+xml,2507678,2505771,0.0948\nCC-MAIN-2018-47,application/calendar,2004,1999,0.0001\nCC-MAIN-2018-47,application/download,43558,43545,0.0016\nCC-MAIN-2018-47,application/epub+zip,20352,20235,0.0008\nCC-MAIN-2018-47,application/force-download,91220,91149,0.0034\nCC-MAIN-2018-47,application/gpx+xml,4844,4842,
0.0002\nCC-MAIN-2018-47,application/ics,3760,3760,0.0001\nCC-MAIN-2018-47,application/javascript,12946,12933,0.0005\nCC-MAIN-2018-47,application/json,246509,246177,0.0093\nCC-MAIN-2018-47,application/ld+json,8013,8011,0.0003\nCC-MAIN-2018-47,application/marc,899,893,0.0000\nCC-MAIN-2018-47,application/msword,289341,288888,0.0109\nCC-MAIN-2018-47,application/octet-stream,1211290,1209310,0.0458\nCC-MAIN-2018-47,application/octetstream,5768,5763,0.0002\nCC-MAIN-2018-47,application/pdf,25177149,25108155,0.9513\nCC-MAIN-2018-47,application/pgp-encrypted,561,561,0.0000\nCC-MAIN-2018-47,application/pgp-signature,55244,55241,0.0021\nCC-MAIN-2018-47,application/postscript,29364,29325,0.0011\nCC-MAIN-2018-47,application/rdf+xml,60406,60207,0.0023\nCC-MAIN-2018-47,application/rss+xml,1882909,1874957,0.0711\nCC-MAIN-2018-47,application/rtf,13811,13803,0.0005\nCC-MAIN-2018-47,application/text,8275,8274,0.0003\nCC-MAIN-2018-47,application/unknown,8356,8354,0.0003\nCC-MAIN-2018-47,application/vnd.android.package-archive,45486,45310,0.0017\nCC-MAIN-2018-47,application/vnd.google-earth.kml+xml,43847,43825,0.0017\nCC-MAIN-2018-47,application/vnd.google-earth.kmz,12763,12730,0.0005\nCC-MAIN-2018-47,application/vnd.ms-excel,86839,86595,0.0033\nCC-MAIN-2018-47,application/vnd.ms-powerpoint,27948,27935,0.0011\nCC-MAIN-2018-47,application/vnd.ms-word,3853,3849,0.0001\nCC-MAIN-2018-47,application/vnd.oasis.opendocument.text,11715,11697,0.0004\nCC-MAIN-2018-47,application/vnd.openxmlformats-officedocument.presentationml.presentation,7981,7940,0.0003\nCC-MAIN-2018-47,application/vnd.openxmlformats-officedocument.spreadsheetml.sheet,27390,27101,0.0010\nCC-MAIN-2018-47,application/vnd.openxmlformats-officedocument.wordprocessingml.document,58383,58178,0.0022\nCC-MAIN-2018-47,application/vnd.wap.xhtml+xml,3608,3579,0.0001\nCC-MAIN-2018-47,application/x-bibtex,9795,9794,0.0004\nCC-MAIN-2018-47,application/x-bittorrent,13825,13502,0.0005\nCC-MAIN-2018-47,application/x-debian-package,3828,3213,0.0
001\nCC-MAIN-2018-47,application/x-download,24636,24576,0.0009\nCC-MAIN-2018-47,application/x-endnote-refer,14844,14843,0.0006\nCC-MAIN-2018-47,application/x-gzip,23127,23053,0.0009\nCC-MAIN-2018-47,application/x-httpd-php,20237,20128,0.0008\nCC-MAIN-2018-47,application/x-java-jnlp-file,2362,2359,0.0001\nCC-MAIN-2018-47,application/x-javascript,5636,5602,0.0002\nCC-MAIN-2018-47,application/x-json,33,33,0.0000\nCC-MAIN-2018-47,application/x-mobipocket-ebook,4568,4560,0.0002\nCC-MAIN-2018-47,application/x-msdownload,9164,8914,0.0003\nCC-MAIN-2018-47,application/x-netcdf,1620,1620,0.0001\nCC-MAIN-2018-47,application/x-research-info-systems,27194,27190,0.0010\nCC-MAIN-2018-47,application/x-shockwave-flash,55755,55479,0.0021\nCC-MAIN-2018-47,application/x-tar,7241,7183,0.0003\nCC-MAIN-2018-47,application/x-tex,1770,1769,0.0001\nCC-MAIN-2018-47,application/x-troff-man,3161,3148,0.0001\nCC-MAIN-2018-47,application/x-zip-compressed,19297,19263,0.0007\nCC-MAIN-2018-47,application/xhtml+xml,449841,445085,0.0170\nCC-MAIN-2018-47,application/xml,697793,695814,0.0264\nCC-MAIN-2018-47,application/zip,230816,230136,0.0087\nCC-MAIN-2018-47,audio/mpeg,170899,168940,0.0065\nCC-MAIN-2018-47,audio/x-mpegurl,49410,49350,0.0019\nCC-MAIN-2018-47,audio/x-scpls,5290,5252,0.0002\nCC-MAIN-2018-47,audio/x-wav,6948,6946,0.0003\nCC-MAIN-2018-47,binary/octet-stream,11827,11788,0.0004\nCC-MAIN-2018-47,image/gif,175329,173749,0.0066\nCC-MAIN-2018-47,image/jp2,1255,1255,0.0000\nCC-MAIN-2018-47,image/jpeg,8054062,8041133,0.3043\nCC-MAIN-2018-47,image/jpg,74888,74883,0.0028\nCC-MAIN-2018-47,image/pjpeg,7324,7324,0.0003\nCC-MAIN-2018-47,image/png,840123,836420,0.0317\nCC-MAIN-2018-47,image/svg+xml,62905,62288,0.0024\nCC-MAIN-2018-47,image/tiff,11427,11415,0.0004\nCC-MAIN-2018-47,image/vnd.djvu,15930,15923,0.0006\nCC-MAIN-2018-47,image/webp,11432,11432,0.0004\nCC-MAIN-2018-47,message/rfc822,9385,9385,0.0004\nCC-MAIN-2018-47,text/calendar,360918,360742,0.0136\nCC-MAIN-2018-47,text/css,10484,10478,0.0004\
nCC-MAIN-2018-47,text/csv,13319,13118,0.0005\nCC-MAIN-2018-47,text/directory,4552,4552,0.0002\nCC-MAIN-2018-47,text/enriched,2029,2029,0.0001\nCC-MAIN-2018-47,text/html,2583363556,2550795227,97.6118\nCC-MAIN-2018-47,text/javascript,6868,6810,0.0003\nCC-MAIN-2018-47,text/markdown,635,628,0.0000\nCC-MAIN-2018-47,text/pdf,349,348,0.0000\nCC-MAIN-2018-47,text/plain,1178732,1176185,0.0445\nCC-MAIN-2018-47,text/prs.lines.tag,3322,3322,0.0001\nCC-MAIN-2018-47,text/tab-separated-values,2529,2528,0.0001\nCC-MAIN-2018-47,text/turtle,3516,3502,0.0001\nCC-MAIN-2018-47,text/vcard,6577,6568,0.0002\nCC-MAIN-2018-47,text/x-bibtex,6098,6088,0.0002\nCC-MAIN-2018-47,text/x-c,4100,4094,0.0002\nCC-MAIN-2018-47,text/x-csrc,2289,2289,0.0001\nCC-MAIN-2018-47,text/x-diff,5972,5969,0.0002\nCC-MAIN-2018-47,text/x-patch,397,395,0.0000\nCC-MAIN-2018-47,text/x-perl,6685,6629,0.0003\nCC-MAIN-2018-47,text/x-vcalendar,9187,9187,0.0003\nCC-MAIN-2018-47,text/x-vcard,25952,25822,0.0010\nCC-MAIN-2018-47,text/xml,1934864,1923537,0.0731\nCC-MAIN-2018-47,unknown/unknown,5935,5914,0.0002\nCC-MAIN-2018-47,video/mp4,60580,60445,0.0023\nCC-MAIN-2018-47,video/webm,73944,73854,0.0028\nCC-MAIN-2018-47,video/x-ms-asf,27485,27293,0.0010\nCC-MAIN-2018-51,<other>,17463149,17355197,0.5519\nCC-MAIN-2018-51,application/atom+xml,2586524,2584909,0.0817\nCC-MAIN-2018-51,application/calendar,4505,4492,0.0001\nCC-MAIN-2018-51,application/download,45403,45364,0.0014\nCC-MAIN-2018-51,application/epub+zip,26230,26139,0.0008\nCC-MAIN-2018-51,application/force-download,103648,103369,0.0033\nCC-MAIN-2018-51,application/gpx+xml,6532,6528,0.0002\nCC-MAIN-2018-51,application/ics,5738,5737,0.0002\nCC-MAIN-2018-51,application/javascript,9397,9377,0.0003\nCC-MAIN-2018-51,application/json,296628,296304,0.0094\nCC-MAIN-2018-51,application/ld+json,3914,3894,0.0001\nCC-MAIN-2018-51,application/marc,888,887,0.0000\nCC-MAIN-2018-51,application/msword,133072,132687,0.0042\nCC-MAIN-2018-51,application/octet-stream,1036927,1033669,0.0328\nCC-MA
IN-2018-51,application/octetstream,10458,10443,0.0003\nCC-MAIN-2018-51,application/pdf,36064773,35882972,1.1398\nCC-MAIN-2018-51,application/pgp-encrypted,406,405,0.0000\nCC-MAIN-2018-51,application/pgp-signature,15954,15927,0.0005\nCC-MAIN-2018-51,application/postscript,31636,31592,0.0010\nCC-MAIN-2018-51,application/rdf+xml,53443,53384,0.0017\nCC-MAIN-2018-51,application/rss+xml,2515799,2505524,0.0795\nCC-MAIN-2018-51,application/rtf,15502,15464,0.0005\nCC-MAIN-2018-51,application/save-to-disk,76,76,0.0000\nCC-MAIN-2018-51,application/text,9132,9114,0.0003\nCC-MAIN-2018-51,application/unknown,9097,9083,0.0003\nCC-MAIN-2018-51,application/vnd.android.package-archive,33448,32513,0.0011\nCC-MAIN-2018-51,application/vnd.google-earth.kml+xml,47232,46945,0.0015\nCC-MAIN-2018-51,application/vnd.google-earth.kmz,12011,11921,0.0004\nCC-MAIN-2018-51,application/vnd.ms-excel,44767,44531,0.0014\nCC-MAIN-2018-51,application/vnd.ms-powerpoint,13712,13676,0.0004\nCC-MAIN-2018-51,application/vnd.ms-word,4338,4333,0.0001\nCC-MAIN-2018-51,application/vnd.oasis.opendocument.text,16107,16075,0.0005\nCC-MAIN-2018-51,application/vnd.openxmlformats-officedocument.presentationml.presentation,8767,8743,0.0003\nCC-MAIN-2018-51,application/vnd.openxmlformats-officedocument.spreadsheetml.sheet,26908,26814,0.0009\nCC-MAIN-2018-51,application/vnd.openxmlformats-officedocument.wordprocessingml.document,71705,71394,0.0023\nCC-MAIN-2018-51,application/vnd.wap.xhtml+xml,5892,5841,0.0002\nCC-MAIN-2018-51,application/x-bibtex,10094,10091,0.0003\nCC-MAIN-2018-51,application/x-bittorrent,12248,11743,0.0004\nCC-MAIN-2018-51,application/x-debian-package,1390,1374,0.0000\nCC-MAIN-2018-51,application/x-download,19009,18921,0.0006\nCC-MAIN-2018-51,application/x-endnote-refer,13781,13773,0.0004\nCC-MAIN-2018-51,application/x-gzip,22609,22406,0.0007\nCC-MAIN-2018-51,application/x-httpd-php,21382,21239,0.0007\nCC-MAIN-2018-51,application/x-java-jnlp-file,2669,2657,0.0001\nCC-MAIN-2018-51,application/x-javascr
ipt,5098,5079,0.0002\nCC-MAIN-2018-51,application/x-json,30,30,0.0000\nCC-MAIN-2018-51,application/x-mobipocket-ebook,6112,6104,0.0002\nCC-MAIN-2018-51,application/x-msdownload,10055,9918,0.0003\nCC-MAIN-2018-51,application/x-netcdf,1064,1064,0.0000\nCC-MAIN-2018-51,application/x-research-info-systems,26053,26046,0.0008\nCC-MAIN-2018-51,application/x-shockwave-flash,47912,47707,0.0015\nCC-MAIN-2018-51,application/x-tar,5711,5670,0.0002\nCC-MAIN-2018-51,application/x-tex,3258,3250,0.0001\nCC-MAIN-2018-51,application/x-troff-man,3529,3516,0.0001\nCC-MAIN-2018-51,application/x-zip-compressed,16887,16787,0.0005\nCC-MAIN-2018-51,application/xhtml+xml,657263,652207,0.0208\nCC-MAIN-2018-51,application/xml,830271,827871,0.0262\nCC-MAIN-2018-51,application/zip,110594,109585,0.0035\nCC-MAIN-2018-51,audio/mpeg,175792,172813,0.0056\nCC-MAIN-2018-51,audio/x-mpegurl,42810,42757,0.0014\nCC-MAIN-2018-51,audio/x-scpls,6399,6367,0.0002\nCC-MAIN-2018-51,audio/x-wav,9139,9106,0.0003\nCC-MAIN-2018-51,binary/octet-stream,17567,17476,0.0006\nCC-MAIN-2018-51,image/gif,139654,138309,0.0044\nCC-MAIN-2018-51,image/jp2,953,953,0.0000\nCC-MAIN-2018-51,image/jpeg,8643584,8627506,0.2732\nCC-MAIN-2018-51,image/jpg,75159,75118,0.0024\nCC-MAIN-2018-51,image/pjpeg,9441,9440,0.0003\nCC-MAIN-2018-51,image/png,730264,727206,0.0231\nCC-MAIN-2018-51,image/svg+xml,42680,42640,0.0013\nCC-MAIN-2018-51,image/tiff,8283,8266,0.0003\nCC-MAIN-2018-51,image/vnd.djvu,12933,12860,0.0004\nCC-MAIN-2018-51,image/webp,14997,14997,0.0005\nCC-MAIN-2018-51,message/rfc822,5609,5604,0.0002\nCC-MAIN-2018-51,text/calendar,656510,655726,0.0207\nCC-MAIN-2018-51,text/css,8031,8024,0.0003\nCC-MAIN-2018-51,text/csv,15736,15646,0.0005\nCC-MAIN-2018-51,text/directory,10299,10256,0.0003\nCC-MAIN-2018-51,text/enriched,3071,3062,0.0001\nCC-MAIN-2018-51,text/html,3087226861,3050274826,97.5659\nCC-MAIN-2018-51,text/javascript,8460,8375,0.0003\nCC-MAIN-2018-51,text/markdown,809,808,0.0000\nCC-MAIN-2018-51,text/pdf,410,409,0.0000\nCC-MAIN-2
018-51,text/plain,1004183,1001406,0.0317\nCC-MAIN-2018-51,text/prs.lines.tag,829,829,0.0000\nCC-MAIN-2018-51,text/tab-separated-values,3476,3476,0.0001\nCC-MAIN-2018-51,text/turtle,3046,3021,0.0001\nCC-MAIN-2018-51,text/vcard,19712,19623,0.0006\nCC-MAIN-2018-51,text/x-bibtex,10793,10703,0.0003\nCC-MAIN-2018-51,text/x-c,3882,3840,0.0001\nCC-MAIN-2018-51,text/x-csrc,2504,2503,0.0001\nCC-MAIN-2018-51,text/x-diff,6312,6303,0.0002\nCC-MAIN-2018-51,text/x-patch,370,369,0.0000\nCC-MAIN-2018-51,text/x-perl,2921,2920,0.0001\nCC-MAIN-2018-51,text/x-vcalendar,16426,16425,0.0005\nCC-MAIN-2018-51,text/x-vcard,61634,61397,0.0019\nCC-MAIN-2018-51,text/xml,2502236,2489923,0.0791\nCC-MAIN-2018-51,unknown/unknown,3792,3774,0.0001\nCC-MAIN-2018-51,video/mp4,55535,55423,0.0018\nCC-MAIN-2018-51,video/webm,103576,103258,0.0033\nCC-MAIN-2018-51,video/x-ms-asf,20220,20127,0.0006\nCC-MAIN-2019-04,<other>,14656778,14576068,0.5072\nCC-MAIN-2019-04,application/atom+xml,2796216,2794841,0.0968\nCC-MAIN-2019-04,application/calendar,4355,4354,0.0002\nCC-MAIN-2019-04,application/download,46964,46940,0.0016\nCC-MAIN-2019-04,application/epub+zip,24662,24559,0.0009\nCC-MAIN-2019-04,application/force-download,107464,107329,0.0037\nCC-MAIN-2019-04,application/gpx+xml,5671,5653,0.0002\nCC-MAIN-2019-04,application/ics,4792,4792,0.0002\nCC-MAIN-2019-04,application/javascript,9365,9349,0.0003\nCC-MAIN-2019-04,application/json,226465,226038,0.0078\nCC-MAIN-2019-04,application/ld+json,4751,4749,0.0002\nCC-MAIN-2019-04,application/marc,998,998,0.0000\nCC-MAIN-2019-04,application/msword,158369,157923,0.0055\nCC-MAIN-2019-04,application/octet-stream,1208827,1206651,0.0418\nCC-MAIN-2019-04,application/octetstream,10402,10379,0.0004\nCC-MAIN-2019-04,application/pdf,26441488,26354325,0.9150\nCC-MAIN-2019-04,application/pgp-encrypted,561,561,0.0000\nCC-MAIN-2019-04,application/pgp-signature,48768,48761,0.0017\nCC-MAIN-2019-04,application/postscript,18739,18668,0.0006\nCC-MAIN-2019-04,application/rdf+xml,38280,38236,
0.0013\nCC-MAIN-2019-04,application/rss+xml,2097326,2089850,0.0726\nCC-MAIN-2019-04,application/rtf,18803,18783,0.0007\nCC-MAIN-2019-04,application/save-to-disk,68,68,0.0000\nCC-MAIN-2019-04,application/text,13957,13945,0.0005\nCC-MAIN-2019-04,application/unknown,11232,11230,0.0004\nCC-MAIN-2019-04,application/vnd.android.package-archive,31393,31220,0.0011\nCC-MAIN-2019-04,application/vnd.google-earth.kml+xml,31754,31697,0.0011\nCC-MAIN-2019-04,application/vnd.google-earth.kmz,9686,9682,0.0003\nCC-MAIN-2019-04,application/vnd.ms-excel,48388,48197,0.0017\nCC-MAIN-2019-04,application/vnd.ms-powerpoint,19868,19701,0.0007\nCC-MAIN-2019-04,application/vnd.ms-word,7415,7414,0.0003\nCC-MAIN-2019-04,application/vnd.oasis.opendocument.text,13774,13744,0.0005\nCC-MAIN-2019-04,application/vnd.openxmlformats-officedocument.presentationml.presentation,13750,13718,0.0005\nCC-MAIN-2019-04,application/vnd.openxmlformats-officedocument.spreadsheetml.sheet,39046,38922,0.0014\nCC-MAIN-2019-04,application/vnd.openxmlformats-officedocument.wordprocessingml.document,93435,93022,0.0032\nCC-MAIN-2019-04,application/vnd.wap.xhtml+xml,4344,4318,0.0002\nCC-MAIN-2019-04,application/x-bibtex,17069,17034,0.0006\nCC-MAIN-2019-04,application/x-bittorrent,11665,11179,0.0004\nCC-MAIN-2019-04,application/x-debian-package,3368,3367,0.0001\nCC-MAIN-2019-04,application/x-download,29748,29680,0.0010\nCC-MAIN-2019-04,application/x-endnote-refer,20206,20172,0.0007\nCC-MAIN-2019-04,application/x-gzip,44593,44535,0.0015\nCC-MAIN-2019-04,application/x-httpd-php,9426,9344,0.0003\nCC-MAIN-2019-04,application/x-java-jnlp-file,1529,1527,0.0001\nCC-MAIN-2019-04,application/x-javascript,5654,5644,0.0002\nCC-MAIN-2019-04,application/x-json,411,411,0.0000\nCC-MAIN-2019-04,application/x-mobipocket-ebook,3867,3863,0.0001\nCC-MAIN-2019-04,application/x-msdownload,13094,12972,0.0005\nCC-MAIN-2019-04,application/x-netcdf,1585,1585,0.0001\nCC-MAIN-2019-04,application/x-research-info-systems,38388,38354,0.0013\nCC-MAIN-2019
-04,application/x-shockwave-flash,104557,104414,0.0036\nCC-MAIN-2019-04,application/x-tar,8058,8026,0.0003\nCC-MAIN-2019-04,application/x-tex,2988,2964,0.0001\nCC-MAIN-2019-04,application/x-troff-man,3139,3139,0.0001\nCC-MAIN-2019-04,application/x-zip-compressed,23564,23503,0.0008\nCC-MAIN-2019-04,application/xhtml+xml,566013,562509,0.0196\nCC-MAIN-2019-04,application/xml,666243,664641,0.0231\nCC-MAIN-2019-04,application/zip,160935,159973,0.0056\nCC-MAIN-2019-04,audio/mpeg,336167,330830,0.0116\nCC-MAIN-2019-04,audio/x-mpegurl,27873,27848,0.0010\nCC-MAIN-2019-04,audio/x-scpls,4292,4286,0.0001\nCC-MAIN-2019-04,audio/x-wav,11043,11042,0.0004\nCC-MAIN-2019-04,binary/octet-stream,18148,18047,0.0006\nCC-MAIN-2019-04,image/gif,193872,192929,0.0067\nCC-MAIN-2019-04,image/jp2,459,455,0.0000\nCC-MAIN-2019-04,image/jpeg,7388724,7377391,0.2557\nCC-MAIN-2019-04,image/jpg,93463,89566,0.0032\nCC-MAIN-2019-04,image/pjpeg,12502,12494,0.0004\nCC-MAIN-2019-04,image/png,891033,888072,0.0308\nCC-MAIN-2019-04,image/svg+xml,24492,24434,0.0008\nCC-MAIN-2019-04,image/tiff,16432,16408,0.0006\nCC-MAIN-2019-04,image/vnd.djvu,8762,8732,0.0003\nCC-MAIN-2019-04,image/webp,10948,10948,0.0004\nCC-MAIN-2019-04,message/rfc822,6336,6336,0.0002\nCC-MAIN-2019-04,text/calendar,741811,741276,0.0257\nCC-MAIN-2019-04,text/css,9146,9140,0.0003\nCC-MAIN-2019-04,text/csv,20496,20471,0.0007\nCC-MAIN-2019-04,text/directory,6637,6624,0.0002\nCC-MAIN-2019-04,text/enriched,4353,4342,0.0002\nCC-MAIN-2019-04,text/html,2826569957,2799465113,97.8144\nCC-MAIN-2019-04,text/javascript,7754,7708,0.0003\nCC-MAIN-2019-04,text/markdown,777,777,0.0000\nCC-MAIN-2019-04,text/pdf,1279,1279,0.0000\nCC-MAIN-2019-04,text/plain,852644,850576,0.0295\nCC-MAIN-2019-04,text/prs.lines.tag,2187,2187,0.0001\nCC-MAIN-2019-04,text/tab-separated-values,2998,2998,0.0001\nCC-MAIN-2019-04,text/turtle,3613,3601,0.0001\nCC-MAIN-2019-04,text/vcard,17680,17668,0.0006\nCC-MAIN-2019-04,text/x-bibtex,5473,5473,0.0002\nCC-MAIN-2019-04,text/x-c,2515,2515,
0.0001\nCC-MAIN-2019-04,text/x-csrc,2523,2522,0.0001\nCC-MAIN-2019-04,text/x-diff,9919,9919,0.0003\nCC-MAIN-2019-04,text/x-patch,837,837,0.0000\nCC-MAIN-2019-04,text/x-perl,782,781,0.0000\nCC-MAIN-2019-04,text/x-vcalendar,20001,20001,0.0007\nCC-MAIN-2019-04,text/x-vcard,45133,44970,0.0016\nCC-MAIN-2019-04,text/xml,2139662,2130422,0.0740\nCC-MAIN-2019-04,unknown/unknown,2705,2703,0.0001\nCC-MAIN-2019-04,video/mp4,135398,135020,0.0047\nCC-MAIN-2019-04,video/webm,60408,60311,0.0021\nCC-MAIN-2019-04,video/x-ms-asf,11154,11139,0.0004\nCC-MAIN-2019-09,<other>,12599352,12523196,0.4324\nCC-MAIN-2019-09,application/atom+xml,2858057,2856687,0.0981\nCC-MAIN-2019-09,application/calendar,6685,6673,0.0002\nCC-MAIN-2019-09,application/download,51672,51623,0.0018\nCC-MAIN-2019-09,application/epub+zip,37883,37783,0.0013\nCC-MAIN-2019-09,application/force-download,115846,114871,0.0040\nCC-MAIN-2019-09,application/gpx+xml,6161,6161,0.0002\nCC-MAIN-2019-09,application/ics,6862,6860,0.0002\nCC-MAIN-2019-09,application/javascript,14340,14328,0.0005\nCC-MAIN-2019-09,application/json,376410,375930,0.0129\nCC-MAIN-2019-09,application/ld+json,7956,7955,0.0003\nCC-MAIN-2019-09,application/marc,2784,2783,0.0001\nCC-MAIN-2019-09,application/msword,242594,242036,0.0083\nCC-MAIN-2019-09,application/octet-stream,1458583,1455089,0.0501\nCC-MAIN-2019-09,application/octetstream,8836,8823,0.0003\nCC-MAIN-2019-09,application/pdf,30891058,30772751,1.0602\nCC-MAIN-2019-09,application/pgp-encrypted,485,485,0.0000\nCC-MAIN-2019-09,application/pgp-signature,26742,26733,0.0009\nCC-MAIN-2019-09,application/postscript,27128,27071,0.0009\nCC-MAIN-2019-09,application/rdf+xml,41450,41397,0.0014\nCC-MAIN-2019-09,application/rss+xml,2438310,2430591,0.0837\nCC-MAIN-2019-09,application/rtf,27340,27315,0.0009\nCC-MAIN-2019-09,application/save-to-disk,74,74,0.0000\nCC-MAIN-2019-09,application/text,28415,28410,0.0010\nCC-MAIN-2019-09,application/unknown,9658,9656,0.0003\nCC-MAIN-2019-09,application/vnd.android.package-a
rchive,28208,28007,0.0010\nCC-MAIN-2019-09,application/vnd.google-earth.kml+xml,55527,55488,0.0019\nCC-MAIN-2019-09,application/vnd.google-earth.kmz,14407,14396,0.0005\nCC-MAIN-2019-09,application/vnd.ms-excel,84626,84445,0.0029\nCC-MAIN-2019-09,application/vnd.ms-powerpoint,27789,27639,0.0010\nCC-MAIN-2019-09,application/vnd.ms-word,9118,9118,0.0003\nCC-MAIN-2019-09,application/vnd.oasis.opendocument.text,15692,15659,0.0005\nCC-MAIN-2019-09,application/vnd.openxmlformats-officedocument.presentationml.presentation,19078,18861,0.0007\nCC-MAIN-2019-09,application/vnd.openxmlformats-officedocument.spreadsheetml.sheet,52320,52191,0.0018\nCC-MAIN-2019-09,application/vnd.openxmlformats-officedocument.wordprocessingml.document,134166,133775,0.0046\nCC-MAIN-2019-09,application/vnd.wap.xhtml+xml,4155,4101,0.0001\nCC-MAIN-2019-09,application/x-bibtex,30020,30001,0.0010\nCC-MAIN-2019-09,application/x-bittorrent,11242,10912,0.0004\nCC-MAIN-2019-09,application/x-debian-package,9821,9819,0.0003\nCC-MAIN-2019-09,application/x-download,29096,29067,0.0010\nCC-MAIN-2019-09,application/x-endnote-refer,36150,36141,0.0012\nCC-MAIN-2019-09,application/x-gzip,94540,94503,0.0032\nCC-MAIN-2019-09,application/x-httpd-php,22211,22090,0.0008\nCC-MAIN-2019-09,application/x-java-jnlp-file,3167,3160,0.0001\nCC-MAIN-2019-09,application/x-javascript,12793,12788,0.0004\nCC-MAIN-2019-09,application/x-json,664,664,0.0000\nCC-MAIN-2019-09,application/x-mobipocket-ebook,6586,6580,0.0002\nCC-MAIN-2019-09,application/x-msdownload,15604,15431,0.0005\nCC-MAIN-2019-09,application/x-netcdf,1347,1347,0.0000\nCC-MAIN-2019-09,application/x-research-info-systems,68172,68158,0.0023\nCC-MAIN-2019-09,application/x-shockwave-flash,120502,120380,0.0041\nCC-MAIN-2019-09,application/x-tar,10103,10089,0.0003\nCC-MAIN-2019-09,application/x-tex,2182,2181,0.0001\nCC-MAIN-2019-09,application/x-troff-man,7273,7267,0.0002\nCC-MAIN-2019-09,application/x-zip-compressed,37996,37831,0.0013\nCC-MAIN-2019-09,application/xhtml+xml,48
9601,484669,0.0168\nCC-MAIN-2019-09,application/xml,1163225,1161047,0.0399\nCC-MAIN-2019-09,application/zip,240185,239521,0.0082\nCC-MAIN-2019-09,audio/mpeg,503541,493467,0.0173\nCC-MAIN-2019-09,audio/x-mpegurl,50691,50657,0.0017\nCC-MAIN-2019-09,audio/x-scpls,6461,6451,0.0002\nCC-MAIN-2019-09,audio/x-wav,15710,15669,0.0005\nCC-MAIN-2019-09,binary/octet-stream,31920,31720,0.0011\nCC-MAIN-2019-09,image/gif,255523,254446,0.0088\nCC-MAIN-2019-09,image/jp2,1690,1689,0.0001\nCC-MAIN-2019-09,image/jpeg,14130815,14111665,0.4850\nCC-MAIN-2019-09,image/jpg,108101,105564,0.0037\nCC-MAIN-2019-09,image/pjpeg,11588,11588,0.0004\nCC-MAIN-2019-09,image/png,1536508,1532712,0.0527\nCC-MAIN-2019-09,image/svg+xml,38390,38278,0.0013\nCC-MAIN-2019-09,image/tiff,18124,18085,0.0006\nCC-MAIN-2019-09,image/vnd.djvu,16137,16135,0.0006\nCC-MAIN-2019-09,image/webp,10309,10309,0.0004\nCC-MAIN-2019-09,message/rfc822,5826,5825,0.0002\nCC-MAIN-2019-09,text/calendar,837080,836295,0.0287\nCC-MAIN-2019-09,text/css,12786,12784,0.0004\nCC-MAIN-2019-09,text/csv,42956,42886,0.0015\nCC-MAIN-2019-09,text/directory,10248,10216,0.0004\nCC-MAIN-2019-09,text/enriched,9276,9271,0.0003\nCC-MAIN-2019-09,text/html,2837790995,2809151925,97.3936\nCC-MAIN-2019-09,text/javascript,10154,10149,0.0003\nCC-MAIN-2019-09,text/markdown,1094,1090,0.0000\nCC-MAIN-2019-09,text/pdf,397,397,0.0000\nCC-MAIN-2019-09,text/plain,1175236,1173527,0.0403\nCC-MAIN-2019-09,text/prs.lines.tag,2838,2838,0.0001\nCC-MAIN-2019-09,text/tab-separated-values,6502,6498,0.0002\nCC-MAIN-2019-09,text/turtle,8090,8066,0.0003\nCC-MAIN-2019-09,text/vcard,20341,20239,0.0007\nCC-MAIN-2019-09,text/x-bibtex,11131,11131,0.0004\nCC-MAIN-2019-09,text/x-c,3800,3797,0.0001\nCC-MAIN-2019-09,text/x-csrc,3092,3090,0.0001\nCC-MAIN-2019-09,text/x-diff,9391,9379,0.0003\nCC-MAIN-2019-09,text/x-patch,1400,1397,0.0000\nCC-MAIN-2019-09,text/x-perl,1882,1882,0.0001\nCC-MAIN-2019-09,text/x-vcalendar,21863,21860,0.0008\nCC-MAIN-2019-09,text/x-vcard,57100,56825,0.0020\nCC-MAI
N-2019-09,text/xml,2478059,2467436,0.0850\nCC-MAIN-2019-09,unknown/unknown,9997,9991,0.0003\nCC-MAIN-2019-09,video/mp4,199136,198771,0.0068\nCC-MAIN-2019-09,video/webm,106030,105752,0.0036\nCC-MAIN-2019-09,video/x-ms-asf,18967,18936,0.0007\nCC-MAIN-2019-13,<other>,32102116,31805557,1.2493\nCC-MAIN-2019-13,application/atom+xml,2685179,2683393,0.1045\nCC-MAIN-2019-13,application/calendar,5753,5743,0.0002\nCC-MAIN-2019-13,application/download,32701,32696,0.0013\nCC-MAIN-2019-13,application/epub+zip,34348,34230,0.0013\nCC-MAIN-2019-13,application/force-download,79026,78947,0.0031\nCC-MAIN-2019-13,application/gpx+xml,5088,5087,0.0002\nCC-MAIN-2019-13,application/ics,5875,5875,0.0002\nCC-MAIN-2019-13,application/javascript,15747,15734,0.0006\nCC-MAIN-2019-13,application/json,296914,296530,0.0116\nCC-MAIN-2019-13,application/ld+json,7265,7265,0.0003\nCC-MAIN-2019-13,application/marc,2616,2616,0.0001\nCC-MAIN-2019-13,application/msword,203278,202985,0.0079\nCC-MAIN-2019-13,application/octet-stream,1001197,998650,0.0390\nCC-MAIN-2019-13,application/octetstream,6367,6337,0.0002\nCC-MAIN-2019-13,application/pdf,12012949,11972765,0.4675\nCC-MAIN-2019-13,application/pgp-encrypted,371,371,0.0000\nCC-MAIN-2019-13,application/pgp-signature,21791,21785,0.0008\nCC-MAIN-2019-13,application/postscript,31734,31697,0.0012\nCC-MAIN-2019-13,application/rdf+xml,44282,44220,0.0017\nCC-MAIN-2019-13,application/rss+xml,1898826,1891459,0.0739\nCC-MAIN-2019-13,application/rtf,40867,40845,0.0016\nCC-MAIN-2019-13,application/save-to-disk,2,2,0.0000\nCC-MAIN-2019-13,application/text,40294,40277,0.0016\nCC-MAIN-2019-13,application/unknown,7762,7761,0.0003\nCC-MAIN-2019-13,application/vnd.android.package-archive,22071,21935,0.0009\nCC-MAIN-2019-13,application/vnd.google-earth.kml+xml,56062,55884,0.0022\nCC-MAIN-2019-13,application/vnd.google-earth.kmz,14545,14539,0.0006\nCC-MAIN-2019-13,application/vnd.ms-excel,62355,62243,0.0024\nCC-MAIN-2019-13,application/vnd.ms-powerpoint,24577,24548,0.0010\nCC-M
AIN-2019-13,application/vnd.ms-word,10949,10936,0.0004\nCC-MAIN-2019-13,application/vnd.oasis.opendocument.text,16302,16278,0.0006\nCC-MAIN-2019-13,application/vnd.openxmlformats-officedocument.presentationml.presentation,35401,35278,0.0014\nCC-MAIN-2019-13,application/vnd.openxmlformats-officedocument.spreadsheetml.sheet,79397,79157,0.0031\nCC-MAIN-2019-13,application/vnd.openxmlformats-officedocument.wordprocessingml.document,228382,228082,0.0089\nCC-MAIN-2019-13,application/vnd.wap.xhtml+xml,2908,2874,0.0001\nCC-MAIN-2019-13,application/x-bibtex,32150,32136,0.0013\nCC-MAIN-2019-13,application/x-bittorrent,16728,15674,0.0007\nCC-MAIN-2019-13,application/x-debian-package,6184,6179,0.0002\nCC-MAIN-2019-13,application/x-download,12194,12092,0.0005\nCC-MAIN-2019-13,application/x-endnote-refer,50804,50780,0.0020\nCC-MAIN-2019-13,application/x-gzip,124151,123839,0.0048\nCC-MAIN-2019-13,application/x-httpd-php,17244,17065,0.0007\nCC-MAIN-2019-13,application/x-java-jnlp-file,2627,2624,0.0001\nCC-MAIN-2019-13,application/x-javascript,6650,6632,0.0003\nCC-MAIN-2019-13,application/x-json,581,581,0.0000\nCC-MAIN-2019-13,application/x-mobipocket-ebook,6328,6318,0.0002\nCC-MAIN-2019-13,application/x-msdownload,13774,13583,0.0005\nCC-MAIN-2019-13,application/x-netcdf,3859,3859,0.0002\nCC-MAIN-2019-13,application/x-research-info-systems,73122,73106,0.0028\nCC-MAIN-2019-13,application/x-shockwave-flash,155600,155458,0.0061\nCC-MAIN-2019-13,application/x-tar,29357,29349,0.0011\nCC-MAIN-2019-13,application/x-tex,4632,4631,0.0002\nCC-MAIN-2019-13,application/x-troff-man,6852,6812,0.0003\nCC-MAIN-2019-13,application/x-zip-compressed,42732,42624,0.0017\nCC-MAIN-2019-13,application/xhtml+xml,475042,470175,0.0185\nCC-MAIN-2019-13,application/xml,721573,719826,0.0281\nCC-MAIN-2019-13,application/zip,228486,227772,0.0089\nCC-MAIN-2019-13,audio/mpeg,530722,520685,0.0207\nCC-MAIN-2019-13,audio/x-mpegurl,52571,52511,0.0020\nCC-MAIN-2019-13,audio/x-scpls,5701,5677,0.0002\nCC-MAIN-2019-13,audio
/x-wav,30521,30502,0.0012\nCC-MAIN-2019-13,binary/octet-stream,18591,18547,0.0007\nCC-MAIN-2019-13,image/gif,335730,334882,0.0131\nCC-MAIN-2019-13,image/jp2,2446,2439,0.0001\nCC-MAIN-2019-13,image/jpeg,14054129,14037145,0.5469\nCC-MAIN-2019-13,image/jpg,100891,99519,0.0039\nCC-MAIN-2019-13,image/pjpeg,8693,8692,0.0003\nCC-MAIN-2019-13,image/png,1617191,1613686,0.0629\nCC-MAIN-2019-13,image/svg+xml,50725,50582,0.0020\nCC-MAIN-2019-13,image/tiff,24578,24565,0.0010\nCC-MAIN-2019-13,image/vnd.djvu,20471,20451,0.0008\nCC-MAIN-2019-13,image/webp,15489,15489,0.0006\nCC-MAIN-2019-13,message/rfc822,5420,5416,0.0002\nCC-MAIN-2019-13,text/calendar,824496,823826,0.0321\nCC-MAIN-2019-13,text/css,16050,16035,0.0006\nCC-MAIN-2019-13,text/csv,46817,46793,0.0018\nCC-MAIN-2019-13,text/directory,7663,7661,0.0003\nCC-MAIN-2019-13,text/enriched,12451,12437,0.0005\nCC-MAIN-2019-13,text/html,2494986814,2468797458,97.0932\nCC-MAIN-2019-13,text/javascript,9523,9515,0.0004\nCC-MAIN-2019-13,text/markdown,1034,1034,0.0000\nCC-MAIN-2019-13,text/pdf,138,138,0.0000\nCC-MAIN-2019-13,text/plain,1235461,1233301,0.0481\nCC-MAIN-2019-13,text/prs.lines.tag,1513,1513,0.0001\nCC-MAIN-2019-13,text/tab-separated-values,9096,9096,0.0004\nCC-MAIN-2019-13,text/turtle,10273,10267,0.0004\nCC-MAIN-2019-13,text/vcard,14708,14677,0.0006\nCC-MAIN-2019-13,text/x-bibtex,8057,8054,0.0003\nCC-MAIN-2019-13,text/x-c,5709,5705,0.0002\nCC-MAIN-2019-13,text/x-csrc,3790,3789,0.0001\nCC-MAIN-2019-13,text/x-diff,8018,8006,0.0003\nCC-MAIN-2019-13,text/x-patch,2113,2113,0.0001\nCC-MAIN-2019-13,text/x-perl,1826,1821,0.0001\nCC-MAIN-2019-13,text/x-vcalendar,22059,22049,0.0009\nCC-MAIN-2019-13,text/x-vcard,47203,47046,0.0018\nCC-MAIN-2019-13,text/xml,2119144,2112100,0.0825\nCC-MAIN-2019-13,unknown/unknown,10476,10458,0.0004\nCC-MAIN-2019-13,video/mp4,172337,172045,0.0067\nCC-MAIN-2019-13,video/webm,46634,46607,0.0018\nCC-MAIN-2019-13,video/x-ms-asf,18606,18578,0.0007\nCC-MAIN-2019-18,<other>,34283160,34004174,1.3725\nCC-MAIN-2019-1
8,application/atom+xml,2623437,2622163,0.1050\nCC-MAIN-2019-18,application/calendar,6373,6370,0.0003\nCC-MAIN-2019-18,application/download,27617,27597,0.0011\nCC-MAIN-2019-18,application/epub+zip,31038,30934,0.0012\nCC-MAIN-2019-18,application/force-download,67461,67311,0.0027\nCC-MAIN-2019-18,application/gpx+xml,5006,5002,0.0002\nCC-MAIN-2019-18,application/ics,10748,10748,0.0004\nCC-MAIN-2019-18,application/javascript,12486,12470,0.0005\nCC-MAIN-2019-18,application/json,368187,367691,0.0147\nCC-MAIN-2019-18,application/ld+json,7429,7428,0.0003\nCC-MAIN-2019-18,application/marc,4186,4186,0.0002\nCC-MAIN-2019-18,application/msword,77013,76785,0.0031\nCC-MAIN-2019-18,application/octet-stream,953919,952592,0.0382\nCC-MAIN-2019-18,application/octetstream,4390,4390,0.0002\nCC-MAIN-2019-18,application/pdf,12701150,12666511,0.5085\nCC-MAIN-2019-18,application/pgp-encrypted,911,911,0.0000\nCC-MAIN-2019-18,application/pgp-signature,39618,39604,0.0016\nCC-MAIN-2019-18,application/postscript,28913,28893,0.0012\nCC-MAIN-2019-18,application/rdf+xml,66433,66366,0.0027\nCC-MAIN-2019-18,application/rss+xml,2150745,2144176,0.0861\nCC-MAIN-2019-18,application/rtf,38804,38799,0.0016\nCC-MAIN-2019-18,application/text,58399,58396,0.0023\nCC-MAIN-2019-18,application/unknown,5707,5705,0.0002\nCC-MAIN-2019-18,application/vnd.android.package-archive,20124,20048,0.0008\nCC-MAIN-2019-18,application/vnd.google-earth.kml+xml,44080,44070,0.0018\nCC-MAIN-2019-18,application/vnd.google-earth.kmz,9541,9525,0.0004\nCC-MAIN-2019-18,application/vnd.ms-excel,30440,30388,0.0012\nCC-MAIN-2019-18,application/vnd.ms-powerpoint,15899,15881,0.0006\nCC-MAIN-2019-18,application/vnd.ms-word,13040,13040,0.0005\nCC-MAIN-2019-18,application/vnd.oasis.opendocument.text,12882,12857,0.0005\nCC-MAIN-2019-18,application/vnd.openxmlformats-officedocument.presentationml.presentation,36287,36249,0.0015\nCC-MAIN-2019-18,application/vnd.openxmlformats-officedocument.spreadsheetml.sheet,74989,74919,0.0030\nCC-MAIN-2019-18,a
pplication/vnd.openxmlformats-officedocument.wordprocessingml.document,236177,236007,0.0095\nCC-MAIN-2019-18,application/vnd.wap.xhtml+xml,2366,2307,0.0001\nCC-MAIN-2019-18,application/x-bibtex,49020,48989,0.0020\nCC-MAIN-2019-18,application/x-bittorrent,14208,13378,0.0006\nCC-MAIN-2019-18,application/x-debian-package,8091,8090,0.0003\nCC-MAIN-2019-18,application/x-download,9801,9792,0.0004\nCC-MAIN-2019-18,application/x-endnote-refer,75157,75123,0.0030\nCC-MAIN-2019-18,application/x-gzip,18863,18841,0.0008\nCC-MAIN-2019-18,application/x-httpd-php,16792,16702,0.0007\nCC-MAIN-2019-18,application/x-java-jnlp-file,2136,2130,0.0001\nCC-MAIN-2019-18,application/x-javascript,5985,5984,0.0002\nCC-MAIN-2019-18,application/x-json,522,522,0.0000\nCC-MAIN-2019-18,application/x-mobipocket-ebook,6133,6114,0.0002\nCC-MAIN-2019-18,application/x-msdownload,7837,7746,0.0003\nCC-MAIN-2019-18,application/x-netcdf,11093,11093,0.0004\nCC-MAIN-2019-18,application/x-research-info-systems,114700,114648,0.0046\nCC-MAIN-2019-18,application/x-shockwave-flash,31088,30949,0.0012\nCC-MAIN-2019-18,application/x-tar,15057,14992,0.0006\nCC-MAIN-2019-18,application/x-tex,3151,3148,0.0001\nCC-MAIN-2019-18,application/x-troff-man,7741,7739,0.0003\nCC-MAIN-2019-18,application/x-zip-compressed,11858,11796,0.0005\nCC-MAIN-2019-18,application/xhtml+xml,619414,614153,0.0248\nCC-MAIN-2019-18,application/xml,883340,881416,0.0354\nCC-MAIN-2019-18,application/zip,77181,76329,0.0031\nCC-MAIN-2019-18,audio/mpeg,85545,84859,0.0034\nCC-MAIN-2019-18,audio/x-mpegurl,39369,39277,0.0016\nCC-MAIN-2019-18,audio/x-scpls,5411,5399,0.0002\nCC-MAIN-2019-18,audio/x-wav,36034,36031,0.0014\nCC-MAIN-2019-18,binary/octet-stream,15913,15887,0.0006\nCC-MAIN-2019-18,image/gif,65943,65438,0.0026\nCC-MAIN-2019-18,image/jp2,2561,2561,0.0001\nCC-MAIN-2019-18,image/jpeg,3304597,3290299,0.1323\nCC-MAIN-2019-18,image/jpg,38070,36746,0.0015\nCC-MAIN-2019-18,image/pjpeg,5848,5847,0.0002\nCC-MAIN-2019-18,image/png,598315,595613,0.0240\nCC-MA
IN-2019-18,image/svg+xml,12511,12455,0.0005\nCC-MAIN-2019-18,image/tiff,7155,7144,0.0003\nCC-MAIN-2019-18,image/vnd.djvu,11407,11406,0.0005\nCC-MAIN-2019-18,image/webp,15882,15868,0.0006\nCC-MAIN-2019-18,message/rfc822,3526,3516,0.0001\nCC-MAIN-2019-18,text/calendar,810140,809435,0.0324\nCC-MAIN-2019-18,text/css,11123,11123,0.0004\nCC-MAIN-2019-18,text/csv,48260,48228,0.0019\nCC-MAIN-2019-18,text/directory,7405,7402,0.0003\nCC-MAIN-2019-18,text/enriched,21447,21447,0.0009\nCC-MAIN-2019-18,text/html,2433040981,2407675509,97.4066\nCC-MAIN-2019-18,text/javascript,8227,8206,0.0003\nCC-MAIN-2019-18,text/markdown,1085,1085,0.0000\nCC-MAIN-2019-18,text/pdf,93,93,0.0000\nCC-MAIN-2019-18,text/plain,1159711,1158211,0.0464\nCC-MAIN-2019-18,text/prs.lines.tag,2700,2700,0.0001\nCC-MAIN-2019-18,text/tab-separated-values,10329,10323,0.0004\nCC-MAIN-2019-18,text/turtle,9055,9055,0.0004\nCC-MAIN-2019-18,text/vcard,14681,14673,0.0006\nCC-MAIN-2019-18,text/x-bibtex,8423,8406,0.0003\nCC-MAIN-2019-18,text/x-c,4112,4111,0.0002\nCC-MAIN-2019-18,text/x-csrc,10446,10444,0.0004\nCC-MAIN-2019-18,text/x-diff,6548,6544,0.0003\nCC-MAIN-2019-18,text/x-patch,3900,3881,0.0002\nCC-MAIN-2019-18,text/x-perl,1778,1778,0.0001\nCC-MAIN-2019-18,text/x-vcalendar,18304,18293,0.0007\nCC-MAIN-2019-18,text/x-vcard,33745,33701,0.0014\nCC-MAIN-2019-18,text/xml,2228552,2221258,0.0892\nCC-MAIN-2019-18,unknown/unknown,11039,11037,0.0004\nCC-MAIN-2019-18,video/mp4,25528,25399,0.0010\nCC-MAIN-2019-18,video/webm,2208,2203,0.0001\nCC-MAIN-2019-18,video/x-ms-asf,12577,12560,0.0005\nCC-MAIN-2019-22,<other>,37932490,37620383,1.4155\nCC-MAIN-2019-22,application/atom+xml,4191887,4190633,0.1564\nCC-MAIN-2019-22,application/calendar,6909,6908,0.0003\nCC-MAIN-2019-22,application/download,40773,40740,0.0015\nCC-MAIN-2019-22,application/epub+zip,42682,42464,0.0016\nCC-MAIN-2019-22,application/force-download,87078,87011,0.0032\nCC-MAIN-2019-22,application/gpx+xml,7226,7221,0.0003\nCC-MAIN-2019-22,application/ics,10510,10508,0.000
4\nCC-MAIN-2019-22,application/javascript,11776,11741,0.0004\nCC-MAIN-2019-22,application/json,443183,442486,0.0165\nCC-MAIN-2019-22,application/ld+json,8522,8519,0.0003\nCC-MAIN-2019-22,application/marc,5162,5162,0.0002\nCC-MAIN-2019-22,application/msword,106140,105709,0.0040\nCC-MAIN-2019-22,application/octet-stream,1149705,1148119,0.0429\nCC-MAIN-2019-22,application/octetstream,8850,8847,0.0003\nCC-MAIN-2019-22,application/pdf,18943219,18888213,0.7069\nCC-MAIN-2019-22,application/pgp-encrypted,1729,1728,0.0001\nCC-MAIN-2019-22,application/pgp-signature,21855,21853,0.0008\nCC-MAIN-2019-22,application/postscript,19770,19756,0.0007\nCC-MAIN-2019-22,application/rdf+xml,56363,56264,0.0021\nCC-MAIN-2019-22,application/rss+xml,2262020,2255482,0.0844\nCC-MAIN-2019-22,application/rtf,19870,19838,0.0007\nCC-MAIN-2019-22,application/save-to-disk,209,209,0.0000\nCC-MAIN-2019-22,application/text,47260,47195,0.0018\nCC-MAIN-2019-22,application/unknown,8144,8140,0.0003\nCC-MAIN-2019-22,application/vnd.android.package-archive,33134,32873,0.0012\nCC-MAIN-2019-22,application/vnd.google-earth.kml+xml,47207,47173,0.0018\nCC-MAIN-2019-22,application/vnd.google-earth.kmz,10454,10452,0.0004\nCC-MAIN-2019-22,application/vnd.ms-excel,41627,41573,0.0016\nCC-MAIN-2019-22,application/vnd.ms-powerpoint,23779,23683,0.0009\nCC-MAIN-2019-22,application/vnd.ms-word,15017,15016,0.0006\nCC-MAIN-2019-22,application/vnd.oasis.opendocument.text,15358,15337,0.0006\nCC-MAIN-2019-22,application/vnd.openxmlformats-officedocument.presentationml.presentation,11318,11304,0.0004\nCC-MAIN-2019-22,application/vnd.openxmlformats-officedocument.spreadsheetml.sheet,34777,34698,0.0013\nCC-MAIN-2019-22,application/vnd.openxmlformats-officedocument.wordprocessingml.document,78843,78568,0.0029\nCC-MAIN-2019-22,application/vnd.wap.xhtml+xml,2573,2508,0.0001\nCC-MAIN-2019-22,application/x-bibtex,46748,46653,0.0017\nCC-MAIN-2019-22,application/x-bittorrent,12027,11176,0.0004\nCC-MAIN-2019-22,application/x-debian-package
,1655,1653,0.0001\nCC-MAIN-2019-22,application/x-download,20136,20059,0.0008\nCC-MAIN-2019-22,application/x-endnote-refer,66135,65933,0.0025\nCC-MAIN-2019-22,application/x-gzip,15578,15551,0.0006\nCC-MAIN-2019-22,application/x-httpd-php,17267,17041,0.0006\nCC-MAIN-2019-22,application/x-java-jnlp-file,4667,4663,0.0002\nCC-MAIN-2019-22,application/x-javascript,8696,8691,0.0003\nCC-MAIN-2019-22,application/x-json,489,489,0.0000\nCC-MAIN-2019-22,application/x-mobipocket-ebook,6226,6226,0.0002\nCC-MAIN-2019-22,application/x-msdownload,10554,10431,0.0004\nCC-MAIN-2019-22,application/x-netcdf,4846,4846,0.0002\nCC-MAIN-2019-22,application/x-research-info-systems,119481,119194,0.0045\nCC-MAIN-2019-22,application/x-shockwave-flash,24712,24569,0.0009\nCC-MAIN-2019-22,application/x-tar,7147,7126,0.0003\nCC-MAIN-2019-22,application/x-tex,2380,2380,0.0001\nCC-MAIN-2019-22,application/x-troff-man,6465,6461,0.0002\nCC-MAIN-2019-22,application/x-zip-compressed,12722,12598,0.0005\nCC-MAIN-2019-22,application/xhtml+xml,658306,652921,0.0246\nCC-MAIN-2019-22,application/xml,781880,780162,0.0292\nCC-MAIN-2019-22,application/zip,93883,93200,0.0035\nCC-MAIN-2019-22,audio/mpeg,128494,126320,0.0048\nCC-MAIN-2019-22,audio/x-mpegurl,36260,36231,0.0014\nCC-MAIN-2019-22,audio/x-scpls,4636,4630,0.0002\nCC-MAIN-2019-22,audio/x-wav,13523,13516,0.0005\nCC-MAIN-2019-22,binary/octet-stream,17974,17833,0.0007\nCC-MAIN-2019-22,image/gif,86949,85566,0.0032\nCC-MAIN-2019-22,image/jp2,4942,4942,0.0002\nCC-MAIN-2019-22,image/jpeg,3908040,3894490,0.1458\nCC-MAIN-2019-22,image/jpg,69152,67936,0.0026\nCC-MAIN-2019-22,image/pjpeg,9888,9888,0.0004\nCC-MAIN-2019-22,image/png,658929,653717,0.0246\nCC-MAIN-2019-22,image/svg+xml,11604,11588,0.0004\nCC-MAIN-2019-22,image/tiff,6653,6649,0.0002\nCC-MAIN-2019-22,image/vnd.djvu,13945,13945,0.0005\nCC-MAIN-2019-22,image/webp,20959,20957,0.0008\nCC-MAIN-2019-22,message/rfc822,6400,6400,0.0002\nCC-MAIN-2019-22,text/calendar,954450,953713,0.0356\nCC-MAIN-2019-22,text/css,724
1,7239,0.0003\nCC-MAIN-2019-22,text/csv,41112,41098,0.0015\nCC-MAIN-2019-22,text/directory,8063,8061,0.0003\nCC-MAIN-2019-22,text/enriched,18035,17983,0.0007\nCC-MAIN-2019-22,text/html,2602473306,2575782529,97.1164\nCC-MAIN-2019-22,text/javascript,12675,12651,0.0005\nCC-MAIN-2019-22,text/markdown,1197,1196,0.0000\nCC-MAIN-2019-22,text/pdf,157,157,0.0000\nCC-MAIN-2019-22,text/plain,1116168,1114070,0.0417\nCC-MAIN-2019-22,text/prs.lines.tag,4367,4367,0.0002\nCC-MAIN-2019-22,text/tab-separated-values,15600,15600,0.0006\nCC-MAIN-2019-22,text/turtle,10006,10005,0.0004\nCC-MAIN-2019-22,text/vcard,16389,16382,0.0006\nCC-MAIN-2019-22,text/x-bibtex,6595,6581,0.0002\nCC-MAIN-2019-22,text/x-c,3071,3070,0.0001\nCC-MAIN-2019-22,text/x-csrc,9585,9580,0.0004\nCC-MAIN-2019-22,text/x-diff,9939,9933,0.0004\nCC-MAIN-2019-22,text/x-patch,5389,5337,0.0002\nCC-MAIN-2019-22,text/x-perl,1171,1171,0.0000\nCC-MAIN-2019-22,text/x-vcalendar,22092,21983,0.0008\nCC-MAIN-2019-22,text/x-vcard,43892,43848,0.0016\nCC-MAIN-2019-22,text/xml,2237703,2230711,0.0835\nCC-MAIN-2019-22,unknown/unknown,10158,10157,0.0004\nCC-MAIN-2019-22,video/mp4,35668,35383,0.0013\nCC-MAIN-2019-22,video/webm,2714,2698,0.0001\nCC-MAIN-2019-22,video/x-ms-asf,11740,11726,0.0004\nCC-MAIN-2019-26,<other>,31849602,31601273,1.2277\nCC-MAIN-2019-26,application/atom+xml,3534486,3533965,0.1362\nCC-MAIN-2019-26,application/calendar,4556,4550,0.0002\nCC-MAIN-2019-26,application/download,40156,40151,0.0015\nCC-MAIN-2019-26,application/epub+zip,29231,29149,0.0011\nCC-MAIN-2019-26,application/force-download,79748,79460,0.0031\nCC-MAIN-2019-26,application/gpx+xml,5661,5643,0.0002\nCC-MAIN-2019-26,application/ics,15187,15187,0.0006\nCC-MAIN-2019-26,application/javascript,6770,6717,0.0003\nCC-MAIN-2019-26,application/json,512160,511554,0.0197\nCC-MAIN-2019-26,application/ld+json,7100,7100,0.0003\nCC-MAIN-2019-26,application/marc,6732,6732,0.0003\nCC-MAIN-2019-26,application/msword,77007,76646,0.0030\nCC-MAIN-2019-26,application/octet-stream
,1082184,1080297,0.0417\nCC-MAIN-2019-26,application/octetstream,10741,10652,0.0004\nCC-MAIN-2019-26,application/pdf,15666863,15625933,0.6039\nCC-MAIN-2019-26,application/pgp-encrypted,2167,2167,0.0001\nCC-MAIN-2019-26,application/pgp-signature,22003,22003,0.0008\nCC-MAIN-2019-26,application/postscript,17539,17531,0.0007\nCC-MAIN-2019-26,application/rdf+xml,67955,67921,0.0026\nCC-MAIN-2019-26,application/rss+xml,2248261,2243514,0.0867\nCC-MAIN-2019-26,application/rtf,17120,17087,0.0007\nCC-MAIN-2019-26,application/save-to-disk,231,231,0.0000\nCC-MAIN-2019-26,application/text,44490,44482,0.0017\nCC-MAIN-2019-26,application/unknown,7178,7174,0.0003\nCC-MAIN-2019-26,application/vnd.android.package-archive,16892,16802,0.0007\nCC-MAIN-2019-26,application/vnd.google-earth.kml+xml,36801,36781,0.0014\nCC-MAIN-2019-26,application/vnd.google-earth.kmz,10023,10016,0.0004\nCC-MAIN-2019-26,application/vnd.ms-excel,32672,32612,0.0013\nCC-MAIN-2019-26,application/vnd.ms-powerpoint,19748,19733,0.0008\nCC-MAIN-2019-26,application/vnd.ms-word,14899,14895,0.0006\nCC-MAIN-2019-26,application/vnd.oasis.opendocument.text,12244,12232,0.0005\nCC-MAIN-2019-26,application/vnd.openxmlformats-officedocument.presentationml.presentation,5538,5529,0.0002\nCC-MAIN-2019-26,application/vnd.openxmlformats-officedocument.spreadsheetml.sheet,23536,23481,0.0009\nCC-MAIN-2019-26,application/vnd.openxmlformats-officedocument.wordprocessingml.document,48574,48462,0.0019\nCC-MAIN-2019-26,application/vnd.wap.xhtml+xml,1827,1814,0.0001\nCC-MAIN-2019-26,application/x-bibtex,36405,36375,0.0014\nCC-MAIN-2019-26,application/x-bittorrent,8568,8019,0.0003\nCC-MAIN-2019-26,application/x-debian-package,1204,1204,0.0000\nCC-MAIN-2019-26,application/x-download,22268,22166,0.0009\nCC-MAIN-2019-26,application/x-endnote-refer,61221,61179,0.0024\nCC-MAIN-2019-26,application/x-gzip,20941,20931,0.0008\nCC-MAIN-2019-26,application/x-httpd-php,11979,11923,0.0005\nCC-MAIN-2019-26,application/x-java-jnlp-file,2798,2796,0.0001\nC
C-MAIN-2019-26,application/x-javascript,7957,7955,0.0003\nCC-MAIN-2019-26,application/x-json,1205,1205,0.0000\nCC-MAIN-2019-26,application/x-mobipocket-ebook,3777,3776,0.0001\nCC-MAIN-2019-26,application/x-msdownload,7436,7345,0.0003\nCC-MAIN-2019-26,application/x-netcdf,2424,2424,0.0001\nCC-MAIN-2019-26,application/x-research-info-systems,122464,122360,0.0047\nCC-MAIN-2019-26,application/x-shockwave-flash,22830,22711,0.0009\nCC-MAIN-2019-26,application/x-tar,9114,9106,0.0004\nCC-MAIN-2019-26,application/x-tex,2477,2477,0.0001\nCC-MAIN-2019-26,application/x-troff-man,10976,10973,0.0004\nCC-MAIN-2019-26,application/x-zip-compressed,16109,16007,0.0006\nCC-MAIN-2019-26,application/xhtml+xml,792128,782712,0.0305\nCC-MAIN-2019-26,application/xml,747680,746537,0.0288\nCC-MAIN-2019-26,application/zip,81310,80509,0.0031\nCC-MAIN-2019-26,audio/mpeg,90578,89851,0.0035\nCC-MAIN-2019-26,audio/x-mpegurl,24612,24556,0.0009\nCC-MAIN-2019-26,audio/x-scpls,3666,3664,0.0001\nCC-MAIN-2019-26,audio/x-wav,9011,9011,0.0003\nCC-MAIN-2019-26,binary/octet-stream,16797,16570,0.0006\nCC-MAIN-2019-26,image/gif,74672,74183,0.0029\nCC-MAIN-2019-26,image/jp2,5896,5896,0.0002\nCC-MAIN-2019-26,image/jpeg,3503545,3493652,0.1350\nCC-MAIN-2019-26,image/jpg,66485,65194,0.0026\nCC-MAIN-2019-26,image/pjpeg,10364,10361,0.0004\nCC-MAIN-2019-26,image/png,561140,557223,0.0216\nCC-MAIN-2019-26,image/svg+xml,12780,12743,0.0005\nCC-MAIN-2019-26,image/tiff,8994,8989,0.0003\nCC-MAIN-2019-26,image/vnd.djvu,13451,13346,0.0005\nCC-MAIN-2019-26,image/webp,9864,9864,0.0004\nCC-MAIN-2019-26,message/rfc822,7137,7137,0.0003\nCC-MAIN-2019-26,text/calendar,1010844,1010134,0.0390\nCC-MAIN-2019-26,text/css,4983,4981,0.0002\nCC-MAIN-2019-26,text/csv,44068,44064,0.0017\nCC-MAIN-2019-26,text/directory,8054,8052,0.0003\nCC-MAIN-2019-26,text/enriched,18413,18408,0.0007\nCC-MAIN-2019-26,text/html,2527655390,2505012014,97.4326\nCC-MAIN-2019-26,text/javascript,10940,10936,0.0004\nCC-MAIN-2019-26,text/markdown,1264,1264,0.0000\nCC-MA
IN-2019-26,text/pdf,141,141,0.0000\nCC-MAIN-2019-26,text/plain,1049501,1048538,0.0405\nCC-MAIN-2019-26,text/prs.lines.tag,2480,2480,0.0001\nCC-MAIN-2019-26,text/tab-separated-values,12949,12949,0.0005\nCC-MAIN-2019-26,text/turtle,11432,11432,0.0004\nCC-MAIN-2019-26,text/vcard,17259,17235,0.0007\nCC-MAIN-2019-26,text/x-bibtex,6249,6249,0.0002\nCC-MAIN-2019-26,text/x-c,8545,8545,0.0003\nCC-MAIN-2019-26,text/x-csrc,12863,12863,0.0005\nCC-MAIN-2019-26,text/x-diff,11024,11017,0.0004\nCC-MAIN-2019-26,text/x-patch,6252,6248,0.0002\nCC-MAIN-2019-26,text/x-perl,1122,1122,0.0000\nCC-MAIN-2019-26,text/x-vcalendar,19491,19476,0.0008\nCC-MAIN-2019-26,text/x-vcard,43370,43329,0.0017\nCC-MAIN-2019-26,text/xml,2265528,2259756,0.0873\nCC-MAIN-2019-26,unknown/unknown,11744,11725,0.0005\nCC-MAIN-2019-26,video/mp4,27579,27413,0.0011\nCC-MAIN-2019-26,video/webm,1547,1544,0.0001\nCC-MAIN-2019-26,video/x-ms-asf,7940,7938,0.0003\nCC-MAIN-2019-30,<other>,39646323,39362326,1.5279\nCC-MAIN-2019-30,application/atom+xml,4105365,4104740,0.1582\nCC-MAIN-2019-30,application/calendar,5619,5616,0.0002\nCC-MAIN-2019-30,application/download,37328,37321,0.0014\nCC-MAIN-2019-30,application/epub+zip,33180,33093,0.0013\nCC-MAIN-2019-30,application/force-download,84288,83997,0.0032\nCC-MAIN-2019-30,application/gpx+xml,5009,5003,0.0002\nCC-MAIN-2019-30,application/ics,16441,16440,0.0006\nCC-MAIN-2019-30,application/javascript,11158,11151,0.0004\nCC-MAIN-2019-30,application/json,556712,556128,0.0215\nCC-MAIN-2019-30,application/ld+json,9604,9601,0.0004\nCC-MAIN-2019-30,application/marc,7470,7470,0.0003\nCC-MAIN-2019-30,application/msword,78129,77840,0.0030\nCC-MAIN-2019-30,application/octet-stream,1105032,1103788,0.0426\nCC-MAIN-2019-30,application/octetstream,4915,4910,0.0002\nCC-MAIN-2019-30,application/pdf,3155725,3135150,0.1216\nCC-MAIN-2019-30,application/pgp-encrypted,1544,1544,0.0001\nCC-MAIN-2019-30,application/pgp-signature,18140,18138,0.0007\nCC-MAIN-2019-30,application/postscript,4953,4952,0.0002\
nCC-MAIN-2019-30,application/rdf+xml,58512,58488,0.0023\nCC-MAIN-2019-30,application/rss+xml,2235292,2230898,0.0861\nCC-MAIN-2019-30,application/rtf,16573,16561,0.0006\nCC-MAIN-2019-30,application/save-to-disk,132,132,0.0000\nCC-MAIN-2019-30,application/text,73379,73113,0.0028\nCC-MAIN-2019-30,application/unknown,5792,5792,0.0002\nCC-MAIN-2019-30,application/vnd.android.package-archive,22509,22339,0.0009\nCC-MAIN-2019-30,application/vnd.google-earth.kml+xml,33433,33417,0.0013\nCC-MAIN-2019-30,application/vnd.google-earth.kmz,5177,5118,0.0002\nCC-MAIN-2019-30,application/vnd.ms-excel,30186,30121,0.0012\nCC-MAIN-2019-30,application/vnd.ms-powerpoint,23762,23735,0.0009\nCC-MAIN-2019-30,application/vnd.ms-word,17501,17501,0.0007\nCC-MAIN-2019-30,application/vnd.oasis.opendocument.text,12674,12662,0.0005\nCC-MAIN-2019-30,application/vnd.openxmlformats-officedocument.presentationml.presentation,6147,6132,0.0002\nCC-MAIN-2019-30,application/vnd.openxmlformats-officedocument.spreadsheetml.sheet,28846,28760,0.0011\nCC-MAIN-2019-30,application/vnd.openxmlformats-officedocument.wordprocessingml.document,53111,52909,0.0020\nCC-MAIN-2019-30,application/vnd.wap.xhtml+xml,1637,1627,0.0001\nCC-MAIN-2019-30,application/x-bibtex,45244,45196,0.0017\nCC-MAIN-2019-30,application/x-bittorrent,7180,6783,0.0003\nCC-MAIN-2019-30,application/x-debian-package,1575,1574,0.0001\nCC-MAIN-2019-30,application/x-download,22525,22518,0.0009\nCC-MAIN-2019-30,application/x-endnote-refer,87804,87503,0.0034\nCC-MAIN-2019-30,application/x-gzip,23969,23958,0.0009\nCC-MAIN-2019-30,application/x-httpd-php,12497,12290,0.0005\nCC-MAIN-2019-30,application/x-java-jnlp-file,6740,6738,0.0003\nCC-MAIN-2019-30,application/x-javascript,9340,9332,0.0004\nCC-MAIN-2019-30,application/x-json,891,891,0.0000\nCC-MAIN-2019-30,application/x-mobipocket-ebook,4017,4017,0.0002\nCC-MAIN-2019-30,application/x-msdownload,11757,11661,0.0005\nCC-MAIN-2019-30,application/x-netcdf,8131,8131,0.0003\nCC-MAIN-2019-30,application/x-resea
rch-info-systems,130922,130875,0.0050\nCC-MAIN-2019-30,application/x-shockwave-flash,23894,23732,0.0009\nCC-MAIN-2019-30,application/x-tar,5901,5892,0.0002\nCC-MAIN-2019-30,application/x-tex,3535,3535,0.0001\nCC-MAIN-2019-30,application/x-troff-man,8991,8990,0.0003\nCC-MAIN-2019-30,application/x-zip-compressed,15983,15909,0.0006\nCC-MAIN-2019-30,application/xhtml+xml,946841,939853,0.0365\nCC-MAIN-2019-30,application/xml,814880,812430,0.0314\nCC-MAIN-2019-30,application/zip,103308,102389,0.0040\nCC-MAIN-2019-30,audio/mpeg,114368,111782,0.0044\nCC-MAIN-2019-30,audio/x-mpegurl,26143,26052,0.0010\nCC-MAIN-2019-30,audio/x-scpls,3402,3397,0.0001\nCC-MAIN-2019-30,audio/x-wav,11184,11180,0.0004\nCC-MAIN-2019-30,binary/octet-stream,12831,12666,0.0005\nCC-MAIN-2019-30,image/gif,68634,68062,0.0026\nCC-MAIN-2019-30,image/jp2,5958,5958,0.0002\nCC-MAIN-2019-30,image/jpeg,3320364,3313208,0.1280\nCC-MAIN-2019-30,image/jpg,79180,77778,0.0031\nCC-MAIN-2019-30,image/pjpeg,10393,10374,0.0004\nCC-MAIN-2019-30,image/png,482326,478923,0.0186\nCC-MAIN-2019-30,image/svg+xml,7990,7959,0.0003\nCC-MAIN-2019-30,image/tiff,12149,12147,0.0005\nCC-MAIN-2019-30,image/vnd.djvu,10204,10130,0.0004\nCC-MAIN-2019-30,image/webp,19361,19361,0.0007\nCC-MAIN-2019-30,message/rfc822,8358,8355,0.0003\nCC-MAIN-2019-30,text/calendar,1037339,1036429,0.0400\nCC-MAIN-2019-30,text/css,5596,5593,0.0002\nCC-MAIN-2019-30,text/csv,55273,55236,0.0021\nCC-MAIN-2019-30,text/directory,8611,8609,0.0003\nCC-MAIN-2019-30,text/enriched,28531,28308,0.0011\nCC-MAIN-2019-30,text/html,2531715286,2508172788,97.5689\nCC-MAIN-2019-30,text/javascript,14522,14517,0.0006\nCC-MAIN-2019-30,text/markdown,788,788,0.0000\nCC-MAIN-2019-30,text/pdf,305,305,0.0000\nCC-MAIN-2019-30,text/plain,1348812,1347970,0.0520\nCC-MAIN-2019-30,text/prs.lines.tag,3882,3882,0.0001\nCC-MAIN-2019-30,text/tab-separated-values,14417,14417,0.0006\nCC-MAIN-2019-30,text/turtle,12434,12434,0.0005\nCC-MAIN-2019-30,text/vcard,21061,21005,0.0008\nCC-MAIN-2019-30,text/x-b
ibtex,5729,5728,0.0002\nCC-MAIN-2019-30,text/x-c,4952,4952,0.0002\nCC-MAIN-2019-30,text/x-csrc,14246,14245,0.0005\nCC-MAIN-2019-30,text/x-diff,5245,5233,0.0002\nCC-MAIN-2019-30,text/x-patch,5830,5802,0.0002\nCC-MAIN-2019-30,text/x-perl,691,690,0.0000\nCC-MAIN-2019-30,text/x-vcalendar,19392,19386,0.0007\nCC-MAIN-2019-30,text/x-vcard,45112,45056,0.0017\nCC-MAIN-2019-30,text/xml,2371112,2366316,0.0914\nCC-MAIN-2019-30,unknown/unknown,14595,14577,0.0006\nCC-MAIN-2019-30,video/mp4,34159,33961,0.0013\nCC-MAIN-2019-30,video/webm,2295,2293,0.0001\nCC-MAIN-2019-30,video/x-ms-asf,7792,7791,0.0003\nCC-MAIN-2019-35,<other>,44278022,43823177,1.4985\nCC-MAIN-2019-35,application/atom+xml,3997591,3996859,0.1353\nCC-MAIN-2019-35,application/calendar,6606,6606,0.0002\nCC-MAIN-2019-35,application/download,42697,42682,0.0014\nCC-MAIN-2019-35,application/epub+zip,33760,33647,0.0011\nCC-MAIN-2019-35,application/force-download,97142,96881,0.0033\nCC-MAIN-2019-35,application/gpx+xml,6811,6809,0.0002\nCC-MAIN-2019-35,application/ics,15300,15293,0.0005\nCC-MAIN-2019-35,application/javascript,14588,14585,0.0005\nCC-MAIN-2019-35,application/json,582303,581826,0.0197\nCC-MAIN-2019-35,application/ld+json,10365,10364,0.0004\nCC-MAIN-2019-35,application/marc,8372,8372,0.0003\nCC-MAIN-2019-35,application/msword,101778,101392,0.0034\nCC-MAIN-2019-35,application/octet-stream,1229747,1228009,0.0416\nCC-MAIN-2019-35,application/octetstream,7086,7084,0.0002\nCC-MAIN-2019-35,application/pdf,3897669,3867743,0.1319\nCC-MAIN-2019-35,application/pgp-encrypted,1928,1928,0.0001\nCC-MAIN-2019-35,application/pgp-signature,38007,38003,0.0013\nCC-MAIN-2019-35,application/postscript,5682,5679,0.0002\nCC-MAIN-2019-35,application/rdf+xml,62778,62762,0.0021\nCC-MAIN-2019-35,application/rss+xml,2579076,2573126,0.0873\nCC-MAIN-2019-35,application/rtf,24730,24718,0.0008\nCC-MAIN-2019-35,application/save-to-disk,349,349,0.0000\nCC-MAIN-2019-35,application/text,73303,73174,0.0025\nCC-MAIN-2019-35,application/unknown,8558,8
558,0.0003\nCC-MAIN-2019-35,application/vnd.android.package-archive,25471,25282,0.0009\nCC-MAIN-2019-35,application/vnd.google-earth.kml+xml,51402,51384,0.0017\nCC-MAIN-2019-35,application/vnd.google-earth.kmz,13091,13086,0.0004\nCC-MAIN-2019-35,application/vnd.ms-excel,38107,38013,0.0013\nCC-MAIN-2019-35,application/vnd.ms-powerpoint,23990,23968,0.0008\nCC-MAIN-2019-35,application/vnd.ms-word,19876,19874,0.0007\nCC-MAIN-2019-35,application/vnd.oasis.opendocument.text,16223,16202,0.0005\nCC-MAIN-2019-35,application/vnd.openxmlformats-officedocument.presentationml.presentation,6581,6562,0.0002\nCC-MAIN-2019-35,application/vnd.openxmlformats-officedocument.spreadsheetml.sheet,32855,32761,0.0011\nCC-MAIN-2019-35,application/vnd.openxmlformats-officedocument.wordprocessingml.document,61075,60807,0.0021\nCC-MAIN-2019-35,application/vnd.wap.xhtml+xml,1936,1902,0.0001\nCC-MAIN-2019-35,application/x-bibtex,49040,48961,0.0017\nCC-MAIN-2019-35,application/x-bittorrent,11394,10868,0.0004\nCC-MAIN-2019-35,application/x-debian-package,2383,2383,0.0001\nCC-MAIN-2019-35,application/x-download,35337,35307,0.0012\nCC-MAIN-2019-35,application/x-endnote-refer,88947,88796,0.0030\nCC-MAIN-2019-35,application/x-gzip,27457,27427,0.0009\nCC-MAIN-2019-35,application/x-httpd-php,16835,16597,0.0006\nCC-MAIN-2019-35,application/x-java-jnlp-file,5438,5432,0.0002\nCC-MAIN-2019-35,application/x-javascript,14379,14375,0.0005\nCC-MAIN-2019-35,application/x-json,514,514,0.0000\nCC-MAIN-2019-35,application/x-mobipocket-ebook,3114,3113,0.0001\nCC-MAIN-2019-35,application/x-msdownload,9540,9434,0.0003\nCC-MAIN-2019-35,application/x-netcdf,4830,4830,0.0002\nCC-MAIN-2019-35,application/x-research-info-systems,152299,152230,0.0052\nCC-MAIN-2019-35,application/x-shockwave-flash,17563,17477,0.0006\nCC-MAIN-2019-35,application/x-tar,4202,4199,0.0001\nCC-MAIN-2019-35,application/x-tex,1903,1903,0.0001\nCC-MAIN-2019-35,application/x-troff-man,6608,6590,0.0002\nCC-MAIN-2019-35,application/x-zip-compressed,17251
,17182,0.0006\nCC-MAIN-2019-35,application/xhtml+xml,1131443,1124627,0.0383\nCC-MAIN-2019-35,application/xml,934469,933047,0.0316\nCC-MAIN-2019-35,application/zip,100489,99656,0.0034\nCC-MAIN-2019-35,audio/mpeg,104009,101952,0.0035\nCC-MAIN-2019-35,audio/x-mpegurl,32655,32641,0.0011\nCC-MAIN-2019-35,audio/x-scpls,3934,3931,0.0001\nCC-MAIN-2019-35,audio/x-wav,10293,10292,0.0003\nCC-MAIN-2019-35,binary/octet-stream,24609,24552,0.0008\nCC-MAIN-2019-35,image/gif,73605,72956,0.0025\nCC-MAIN-2019-35,image/jp2,8893,8885,0.0003\nCC-MAIN-2019-35,image/jpeg,3770941,3762682,0.1276\nCC-MAIN-2019-35,image/jpg,80250,79012,0.0027\nCC-MAIN-2019-35,image/pjpeg,10958,10956,0.0004\nCC-MAIN-2019-35,image/png,570256,567349,0.0193\nCC-MAIN-2019-35,image/svg+xml,14883,14865,0.0005\nCC-MAIN-2019-35,image/tiff,9621,9617,0.0003\nCC-MAIN-2019-35,image/vnd.djvu,8970,8969,0.0003\nCC-MAIN-2019-35,image/webp,18563,18563,0.0006\nCC-MAIN-2019-35,message/rfc822,10606,10602,0.0004\nCC-MAIN-2019-35,text/calendar,1246197,1245330,0.0422\nCC-MAIN-2019-35,text/css,6070,6069,0.0002\nCC-MAIN-2019-35,text/csv,61699,61660,0.0021\nCC-MAIN-2019-35,text/directory,8818,8812,0.0003\nCC-MAIN-2019-35,text/enriched,27679,27583,0.0009\nCC-MAIN-2019-35,text/html,2884262141,2857796267,97.6116\nCC-MAIN-2019-35,text/javascript,12764,12759,0.0004\nCC-MAIN-2019-35,text/markdown,1123,1123,0.0000\nCC-MAIN-2019-35,text/pdf,743,743,0.0000\nCC-MAIN-2019-35,text/plain,1662607,1661479,0.0563\nCC-MAIN-2019-35,text/prs.lines.tag,3840,3840,0.0001\nCC-MAIN-2019-35,text/tab-separated-values,16278,16278,0.0006\nCC-MAIN-2019-35,text/turtle,12342,12341,0.0004\nCC-MAIN-2019-35,text/vcard,22541,22525,0.0008\nCC-MAIN-2019-35,text/x-bibtex,6920,6919,0.0002\nCC-MAIN-2019-35,text/x-c,2504,2496,0.0001\nCC-MAIN-2019-35,text/x-csrc,21630,21629,0.0007\nCC-MAIN-2019-35,text/x-diff,15603,15576,0.0005\nCC-MAIN-2019-35,text/x-patch,6875,6826,0.0002\nCC-MAIN-2019-35,text/x-perl,1892,1892,0.0001\nCC-MAIN-2019-35,text/x-vcalendar,22756,22752,0.0008\nCC-MA
IN-2019-35,text/x-vcard,61319,61269,0.0021\nCC-MAIN-2019-35,text/xml,2488240,2478867,0.0842\nCC-MAIN-2019-35,unknown/unknown,12667,12659,0.0004\nCC-MAIN-2019-35,video/mp4,36296,36121,0.0012\nCC-MAIN-2019-35,video/webm,1763,1760,0.0001\nCC-MAIN-2019-35,video/x-ms-asf,9422,9415,0.0003\nCC-MAIN-2019-39,<other>,38209814,37967708,1.4920\nCC-MAIN-2019-39,application/atom+xml,3776231,3775633,0.1474\nCC-MAIN-2019-39,application/calendar,5953,5953,0.0002\nCC-MAIN-2019-39,application/download,57359,57355,0.0022\nCC-MAIN-2019-39,application/epub+zip,37770,37560,0.0015\nCC-MAIN-2019-39,application/force-download,139370,139008,0.0054\nCC-MAIN-2019-39,application/gpx+xml,6057,6051,0.0002\nCC-MAIN-2019-39,application/ics,13635,13635,0.0005\nCC-MAIN-2019-39,application/javascript,18905,18899,0.0007\nCC-MAIN-2019-39,application/json,624244,623395,0.0244\nCC-MAIN-2019-39,application/ld+json,11409,11409,0.0004\nCC-MAIN-2019-39,application/marc,9760,9746,0.0004\nCC-MAIN-2019-39,application/msword,100039,99440,0.0039\nCC-MAIN-2019-39,application/octet-stream,1354049,1351871,0.0529\nCC-MAIN-2019-39,application/octetstream,9457,9420,0.0004\nCC-MAIN-2019-39,application/pdf,24899169,24821534,0.9722\nCC-MAIN-2019-39,application/pgp-encrypted,1602,1602,0.0001\nCC-MAIN-2019-39,application/pgp-signature,38128,38128,0.0015\nCC-MAIN-2019-39,application/postscript,22334,22317,0.0009\nCC-MAIN-2019-39,application/rdf+xml,76795,76783,0.0030\nCC-MAIN-2019-39,application/rss+xml,2189634,2185344,0.0855\nCC-MAIN-2019-39,application/rtf,26846,26835,0.0010\nCC-MAIN-2019-39,application/save-to-disk,360,360,0.0000\nCC-MAIN-2019-39,application/text,83520,83338,0.0033\nCC-MAIN-2019-39,application/unknown,9535,9530,0.0004\nCC-MAIN-2019-39,application/vnd.android.package-archive,25639,25415,0.0010\nCC-MAIN-2019-39,application/vnd.google-earth.kml+xml,44024,43945,0.0017\nCC-MAIN-2019-39,application/vnd.google-earth.kmz,6806,6795,0.0003\nCC-MAIN-2019-39,application/vnd.ms-excel,44290,44209,0.0017\nCC-MAIN-2019-39,
application/vnd.ms-powerpoint,19778,19749,0.0008\nCC-MAIN-2019-39,application/vnd.ms-word,18338,18329,0.0007\nCC-MAIN-2019-39,application/vnd.oasis.opendocument.text,20306,20279,0.0008\nCC-MAIN-2019-39,application/vnd.openxmlformats-officedocument.presentationml.presentation,6932,6914,0.0003\nCC-MAIN-2019-39,application/vnd.openxmlformats-officedocument.spreadsheetml.sheet,32469,32349,0.0013\nCC-MAIN-2019-39,application/vnd.openxmlformats-officedocument.wordprocessingml.document,63950,63641,0.0025\nCC-MAIN-2019-39,application/vnd.wap.xhtml+xml,2026,1944,0.0001\nCC-MAIN-2019-39,application/x-bibtex,52020,51941,0.0020\nCC-MAIN-2019-39,application/x-bittorrent,11123,10616,0.0004\nCC-MAIN-2019-39,application/x-debian-package,1193,1193,0.0000\nCC-MAIN-2019-39,application/x-download,36109,36089,0.0014\nCC-MAIN-2019-39,application/x-endnote-refer,98433,98237,0.0038\nCC-MAIN-2019-39,application/x-gzip,31884,31862,0.0012\nCC-MAIN-2019-39,application/x-httpd-php,15172,15113,0.0006\nCC-MAIN-2019-39,application/x-java-jnlp-file,6139,6134,0.0002\nCC-MAIN-2019-39,application/x-javascript,8455,8453,0.0003\nCC-MAIN-2019-39,application/x-json,334,334,0.0000\nCC-MAIN-2019-39,application/x-mobipocket-ebook,2887,2887,0.0001\nCC-MAIN-2019-39,application/x-msdownload,12978,12840,0.0005\nCC-MAIN-2019-39,application/x-netcdf,2788,2788,0.0001\nCC-MAIN-2019-39,application/x-research-info-systems,150973,150846,0.0059\nCC-MAIN-2019-39,application/x-shockwave-flash,19594,19492,0.0008\nCC-MAIN-2019-39,application/x-tar,9591,9578,0.0004\nCC-MAIN-2019-39,application/x-tex,3025,3023,0.0001\nCC-MAIN-2019-39,application/x-troff-man,12749,12739,0.0005\nCC-MAIN-2019-39,application/x-zip-compressed,18216,18101,0.0007\nCC-MAIN-2019-39,application/xhtml+xml,1133280,1126343,0.0443\nCC-MAIN-2019-39,application/xml,823318,821869,0.0321\nCC-MAIN-2019-39,application/zip,121503,120725,0.0047\nCC-MAIN-2019-39,audio/mpeg,119773,116332,0.0047\nCC-MAIN-2019-39,audio/x-mpegurl,25297,25263,0.0010\nCC-MAIN-2019-39,aud
io/x-scpls,2831,2829,0.0001\nCC-MAIN-2019-39,audio/x-wav,14835,14804,0.0006\nCC-MAIN-2019-39,binary/octet-stream,26744,26614,0.0010\nCC-MAIN-2019-39,image/gif,76513,75882,0.0030\nCC-MAIN-2019-39,image/jp2,8298,8297,0.0003\nCC-MAIN-2019-39,image/jpeg,4009282,4000375,0.1565\nCC-MAIN-2019-39,image/jpg,74257,73232,0.0029\nCC-MAIN-2019-39,image/pjpeg,14950,14950,0.0006\nCC-MAIN-2019-39,image/png,624142,621277,0.0244\nCC-MAIN-2019-39,image/svg+xml,12010,11999,0.0005\nCC-MAIN-2019-39,image/tiff,13208,13205,0.0005\nCC-MAIN-2019-39,image/vnd.djvu,6958,6958,0.0003\nCC-MAIN-2019-39,image/webp,17322,17322,0.0007\nCC-MAIN-2019-39,message/rfc822,12175,12174,0.0005\nCC-MAIN-2019-39,text/calendar,1086381,1085708,0.0424\nCC-MAIN-2019-39,text/css,6028,6027,0.0002\nCC-MAIN-2019-39,text/csv,60559,60530,0.0024\nCC-MAIN-2019-39,text/directory,11501,11498,0.0004\nCC-MAIN-2019-39,text/enriched,31462,31386,0.0012\nCC-MAIN-2019-39,text/html,2476345244,2454374451,96.6921\nCC-MAIN-2019-39,text/javascript,11536,11533,0.0005\nCC-MAIN-2019-39,text/markdown,828,828,0.0000\nCC-MAIN-2019-39,text/pdf,1510,1510,0.0001\nCC-MAIN-2019-39,text/plain,1483597,1482556,0.0579\nCC-MAIN-2019-39,text/prs.lines.tag,2892,2892,0.0001\nCC-MAIN-2019-39,text/tab-separated-values,14110,14110,0.0006\nCC-MAIN-2019-39,text/turtle,14703,14703,0.0006\nCC-MAIN-2019-39,text/vcard,21320,21295,0.0008\nCC-MAIN-2019-39,text/x-bibtex,6730,6729,0.0003\nCC-MAIN-2019-39,text/x-c,3758,3756,0.0001\nCC-MAIN-2019-39,text/x-csrc,21173,21173,0.0008\nCC-MAIN-2019-39,text/x-diff,8018,8007,0.0003\nCC-MAIN-2019-39,text/x-patch,7721,7703,0.0003\nCC-MAIN-2019-39,text/x-perl,3249,3249,0.0001\nCC-MAIN-2019-39,text/x-vcalendar,22100,22100,0.0009\nCC-MAIN-2019-39,text/x-vcard,59646,59593,0.0023\nCC-MAIN-2019-39,text/xml,2136162,2130138,0.0834\nCC-MAIN-2019-39,unknown/unknown,16912,16903,0.0007\nCC-MAIN-2019-39,video/mp4,38053,37873,0.0015\nCC-MAIN-2019-39,video/webm,2003,1994,0.0001\nCC-MAIN-2019-39,video/x-ms-asf,8824,8819,0.0003\nCC-MAIN-2019-43,<
other>,38053275,37753143,1.2604\nCC-MAIN-2019-43,application/atom+xml,3217018,3216327,0.1066\nCC-MAIN-2019-43,application/calendar,5302,5301,0.0002\nCC-MAIN-2019-43,application/download,51836,51827,0.0017\nCC-MAIN-2019-43,application/epub+zip,31127,31005,0.0010\nCC-MAIN-2019-43,application/force-download,132406,132216,0.0044\nCC-MAIN-2019-43,application/gpx+xml,5663,5663,0.0002\nCC-MAIN-2019-43,application/ics,11440,11439,0.0004\nCC-MAIN-2019-43,application/javascript,13124,13122,0.0004\nCC-MAIN-2019-43,application/json,688530,687570,0.0228\nCC-MAIN-2019-43,application/ld+json,16652,16652,0.0006\nCC-MAIN-2019-43,application/marc,14945,14943,0.0005\nCC-MAIN-2019-43,application/msword,78613,78228,0.0026\nCC-MAIN-2019-43,application/octet-stream,1239858,1238101,0.0411\nCC-MAIN-2019-43,application/octetstream,6292,6286,0.0002\nCC-MAIN-2019-43,application/pdf,11363786,11317186,0.3764\nCC-MAIN-2019-43,application/pgp-encrypted,2391,2391,0.0001\nCC-MAIN-2019-43,application/pgp-signature,26185,26181,0.0009\nCC-MAIN-2019-43,application/postscript,19671,19660,0.0007\nCC-MAIN-2019-43,application/rdf+xml,95889,95880,0.0032\nCC-MAIN-2019-43,application/rss+xml,2242848,2237841,0.0743\nCC-MAIN-2019-43,application/rtf,38173,38164,0.0013\nCC-MAIN-2019-43,application/save-to-disk,236,236,0.0000\nCC-MAIN-2019-43,application/text,97640,97575,0.0032\nCC-MAIN-2019-43,application/unknown,7305,7299,0.0002\nCC-MAIN-2019-43,application/vnd.android.package-archive,31793,31562,0.0011\nCC-MAIN-2019-43,application/vnd.google-earth.kml+xml,45948,45927,0.0015\nCC-MAIN-2019-43,application/vnd.google-earth.kmz,8552,8546,0.0003\nCC-MAIN-2019-43,application/vnd.ms-excel,37517,37424,0.0012\nCC-MAIN-2019-43,application/vnd.ms-powerpoint,34590,34468,0.0011\nCC-MAIN-2019-43,application/vnd.ms-word,20857,20844,0.0007\nCC-MAIN-2019-43,application/vnd.oasis.opendocument.text,17896,17886,0.0006\nCC-MAIN-2019-43,application/vnd.openxmlformats-officedocument.presentationml.presentation,6139,6115,0.0002\nCC-MAIN
-2019-43,application/vnd.openxmlformats-officedocument.spreadsheetml.sheet,30864,30760,0.0010\nCC-MAIN-2019-43,application/vnd.openxmlformats-officedocument.wordprocessingml.document,67575,67308,0.0022\nCC-MAIN-2019-43,application/vnd.wap.xhtml+xml,2525,2416,0.0001\nCC-MAIN-2019-43,application/x-bibtex,67423,67283,0.0022\nCC-MAIN-2019-43,application/x-bittorrent,14215,13515,0.0005\nCC-MAIN-2019-43,application/x-debian-package,2976,2976,0.0001\nCC-MAIN-2019-43,application/x-download,34287,34091,0.0011\nCC-MAIN-2019-43,application/x-endnote-refer,126828,126691,0.0042\nCC-MAIN-2019-43,application/x-gzip,31816,31718,0.0011\nCC-MAIN-2019-43,application/x-httpd-php,19208,19173,0.0006\nCC-MAIN-2019-43,application/x-java-jnlp-file,4357,4350,0.0001\nCC-MAIN-2019-43,application/x-javascript,14707,14703,0.0005\nCC-MAIN-2019-43,application/x-json,213,213,0.0000\nCC-MAIN-2019-43,application/x-mobipocket-ebook,3376,3375,0.0001\nCC-MAIN-2019-43,application/x-msdownload,8754,8563,0.0003\nCC-MAIN-2019-43,application/x-netcdf,9052,9052,0.0003\nCC-MAIN-2019-43,application/x-research-info-systems,223393,222873,0.0074\nCC-MAIN-2019-43,application/x-shockwave-flash,19200,19132,0.0006\nCC-MAIN-2019-43,application/x-tar,4445,4441,0.0001\nCC-MAIN-2019-43,application/x-tex,1381,1379,0.0000\nCC-MAIN-2019-43,application/x-troff-man,17170,17166,0.0006\nCC-MAIN-2019-43,application/x-zip-compressed,14649,14546,0.0005\nCC-MAIN-2019-43,application/xhtml+xml,1576151,1572752,0.0522\nCC-MAIN-2019-43,application/xml,900010,898786,0.0298\nCC-MAIN-2019-43,application/zip,92521,91894,0.0031\nCC-MAIN-2019-43,audio/mpeg,97023,93477,0.0032\nCC-MAIN-2019-43,audio/x-mpegurl,28776,28752,0.0010\nCC-MAIN-2019-43,audio/x-scpls,2886,2885,0.0001\nCC-MAIN-2019-43,audio/x-wav,20833,20831,0.0007\nCC-MAIN-2019-43,binary/octet-stream,16474,16403,0.0005\nCC-MAIN-2019-43,image/gif,77485,76809,0.0026\nCC-MAIN-2019-43,image/jp2,6140,6139,0.0002\nCC-MAIN-2019-43,image/jpeg,3512057,3506758,0.1163\nCC-MAIN-2019-43,image/jpg,694
29,67131,0.0023\nCC-MAIN-2019-43,image/pjpeg,10820,10819,0.0004\nCC-MAIN-2019-43,image/png,548148,545863,0.0182\nCC-MAIN-2019-43,image/svg+xml,10944,10912,0.0004\nCC-MAIN-2019-43,image/tiff,10682,10681,0.0004\nCC-MAIN-2019-43,image/vnd.djvu,7726,7724,0.0003\nCC-MAIN-2019-43,image/webp,29135,29117,0.0010\nCC-MAIN-2019-43,message/rfc822,11387,11382,0.0004\nCC-MAIN-2019-43,text/calendar,1025407,1024812,0.0340\nCC-MAIN-2019-43,text/css,7700,7695,0.0003\nCC-MAIN-2019-43,text/csv,93722,93709,0.0031\nCC-MAIN-2019-43,text/directory,7720,7719,0.0003\nCC-MAIN-2019-43,text/enriched,39081,39067,0.0013\nCC-MAIN-2019-43,text/html,2947958725,2922909341,97.6457\nCC-MAIN-2019-43,text/javascript,12694,12692,0.0004\nCC-MAIN-2019-43,text/markdown,754,754,0.0000\nCC-MAIN-2019-43,text/pdf,641,639,0.0000\nCC-MAIN-2019-43,text/plain,1817478,1816150,0.0602\nCC-MAIN-2019-43,text/prs.lines.tag,5227,5226,0.0002\nCC-MAIN-2019-43,text/tab-separated-values,17152,17151,0.0006\nCC-MAIN-2019-43,text/turtle,24513,24513,0.0008\nCC-MAIN-2019-43,text/vcard,23350,23338,0.0008\nCC-MAIN-2019-43,text/x-bibtex,7725,7725,0.0003\nCC-MAIN-2019-43,text/x-c,2451,2451,0.0001\nCC-MAIN-2019-43,text/x-csrc,39402,39402,0.0013\nCC-MAIN-2019-43,text/x-diff,5405,5382,0.0002\nCC-MAIN-2019-43,text/x-patch,12380,12354,0.0004\nCC-MAIN-2019-43,text/x-perl,3906,3906,0.0001\nCC-MAIN-2019-43,text/x-vcalendar,18965,18963,0.0006\nCC-MAIN-2019-43,text/x-vcard,59747,59649,0.0020\nCC-MAIN-2019-43,text/xml,2382823,2377089,0.0789\nCC-MAIN-2019-43,unknown/unknown,18465,18460,0.0006\nCC-MAIN-2019-43,video/mp4,30371,30194,0.0010\nCC-MAIN-2019-43,video/webm,1859,1850,0.0001\nCC-MAIN-2019-43,video/x-ms-asf,8328,8320,0.0003\nCC-MAIN-2019-47,<other>,20055095,19876530,0.7742\nCC-MAIN-2019-47,application/atom+xml,3153106,3152383,0.1217\nCC-MAIN-2019-47,application/calendar,4875,4875,0.0002\nCC-MAIN-2019-47,application/download,50292,50281,0.0019\nCC-MAIN-2019-47,application/epub+zip,47663,47605,0.0018\nCC-MAIN-2019-47,application/force-download
,131554,131480,0.0051\nCC-MAIN-2019-47,application/gpx+xml,6127,6127,0.0002\nCC-MAIN-2019-47,application/ics,8227,8225,0.0003\nCC-MAIN-2019-47,application/javascript,8961,8955,0.0003\nCC-MAIN-2019-47,application/json,588109,587619,0.0227\nCC-MAIN-2019-47,application/ld+json,8412,8412,0.0003\nCC-MAIN-2019-47,application/marc,11649,11647,0.0004\nCC-MAIN-2019-47,application/msword,83066,82668,0.0032\nCC-MAIN-2019-47,application/octet-stream,1180463,1178241,0.0456\nCC-MAIN-2019-47,application/octetstream,6926,6922,0.0003\nCC-MAIN-2019-47,application/pdf,11737202,11694983,0.4531\nCC-MAIN-2019-47,application/pgp-encrypted,3364,3363,0.0001\nCC-MAIN-2019-47,application/pgp-signature,33288,33285,0.0013\nCC-MAIN-2019-47,application/postscript,15638,15631,0.0006\nCC-MAIN-2019-47,application/rdf+xml,68543,68533,0.0026\nCC-MAIN-2019-47,application/rss+xml,1908969,1904353,0.0737\nCC-MAIN-2019-47,application/rtf,27370,27345,0.0011\nCC-MAIN-2019-47,application/save-to-disk,79,79,0.0000\nCC-MAIN-2019-47,application/text,75663,75629,0.0029\nCC-MAIN-2019-47,application/unknown,8217,8216,0.0003\nCC-MAIN-2019-47,application/vnd.android.package-archive,29218,28953,0.0011\nCC-MAIN-2019-47,application/vnd.google-earth.kml+xml,41374,41309,0.0016\nCC-MAIN-2019-47,application/vnd.google-earth.kmz,8460,8456,0.0003\nCC-MAIN-2019-47,application/vnd.ms-excel,33887,33837,0.0013\nCC-MAIN-2019-47,application/vnd.ms-powerpoint,40213,40201,0.0016\nCC-MAIN-2019-47,application/vnd.ms-word,17111,17101,0.0007\nCC-MAIN-2019-47,application/vnd.oasis.opendocument.text,18454,18432,0.0007\nCC-MAIN-2019-47,application/vnd.openxmlformats-officedocument.presentationml.presentation,5833,5819,0.0002\nCC-MAIN-2019-47,application/vnd.openxmlformats-officedocument.spreadsheetml.sheet,30404,30336,0.0012\nCC-MAIN-2019-47,application/vnd.openxmlformats-officedocument.wordprocessingml.document,60739,60497,0.0023\nCC-MAIN-2019-47,application/vnd.wap.xhtml+xml,2773,2668,0.0001\nCC-MAIN-2019-47,application/x-bibtex,47788,477
60,0.0018\nCC-MAIN-2019-47,application/x-bittorrent,6859,6419,0.0003\nCC-MAIN-2019-47,application/x-debian-package,4354,4354,0.0002\nCC-MAIN-2019-47,application/x-download,29144,29038,0.0011\nCC-MAIN-2019-47,application/x-endnote-refer,92013,91978,0.0036\nCC-MAIN-2019-47,application/x-gzip,23030,23014,0.0009\nCC-MAIN-2019-47,application/x-httpd-php,17631,17595,0.0007\nCC-MAIN-2019-47,application/x-java-jnlp-file,7339,7336,0.0003\nCC-MAIN-2019-47,application/x-javascript,8617,8610,0.0003\nCC-MAIN-2019-47,application/x-json,406,406,0.0000\nCC-MAIN-2019-47,application/x-mobipocket-ebook,6374,6374,0.0002\nCC-MAIN-2019-47,application/x-msdownload,7871,7694,0.0003\nCC-MAIN-2019-47,application/x-netcdf,4587,4587,0.0002\nCC-MAIN-2019-47,application/x-research-info-systems,162693,162527,0.0063\nCC-MAIN-2019-47,application/x-shockwave-flash,13604,13537,0.0005\nCC-MAIN-2019-47,application/x-tar,4577,4563,0.0002\nCC-MAIN-2019-47,application/x-tex,2151,2150,0.0001\nCC-MAIN-2019-47,application/x-troff-man,7834,7813,0.0003\nCC-MAIN-2019-47,application/x-zip-compressed,18665,18538,0.0007\nCC-MAIN-2019-47,application/xhtml+xml,1039520,1036711,0.0401\nCC-MAIN-2019-47,application/xml,687746,686540,0.0265\nCC-MAIN-2019-47,application/zip,103727,102908,0.0040\nCC-MAIN-2019-47,audio/mpeg,114163,110028,0.0044\nCC-MAIN-2019-47,audio/x-mpegurl,22266,22249,0.0009\nCC-MAIN-2019-47,audio/x-scpls,2816,2816,0.0001\nCC-MAIN-2019-47,audio/x-wav,19827,19670,0.0008\nCC-MAIN-2019-47,binary/octet-stream,41246,41179,0.0016\nCC-MAIN-2019-47,image/gif,69083,68450,0.0027\nCC-MAIN-2019-47,image/jp2,5765,5739,0.0002\nCC-MAIN-2019-47,image/jpeg,3651941,3643555,0.1410\nCC-MAIN-2019-47,image/jpg,69849,69238,0.0027\nCC-MAIN-2019-47,image/pjpeg,12414,12412,0.0005\nCC-MAIN-2019-47,image/png,567928,565097,0.0219\nCC-MAIN-2019-47,image/svg+xml,14952,14935,0.0006\nCC-MAIN-2019-47,image/tiff,9595,9592,0.0004\nCC-MAIN-2019-47,image/vnd.djvu,7241,7240,0.0003\nCC-MAIN-2019-47,image/webp,18071,18062,0.0007\nCC-MAIN-2019-
47,message/rfc822,10649,10645,0.0004\nCC-MAIN-2019-47,text/calendar,923437,922896,0.0356\nCC-MAIN-2019-47,text/css,11169,11167,0.0004\nCC-MAIN-2019-47,text/csv,72587,72574,0.0028\nCC-MAIN-2019-47,text/directory,10942,10894,0.0004\nCC-MAIN-2019-47,text/enriched,33705,33676,0.0013\nCC-MAIN-2019-47,text/html,2539342397,2516612522,98.0216\nCC-MAIN-2019-47,text/javascript,12308,12304,0.0005\nCC-MAIN-2019-47,text/markdown,1625,1625,0.0001\nCC-MAIN-2019-47,text/pdf,357,356,0.0000\nCC-MAIN-2019-47,text/plain,1387515,1386583,0.0536\nCC-MAIN-2019-47,text/prs.lines.tag,4581,4568,0.0002\nCC-MAIN-2019-47,text/tab-separated-values,15590,15586,0.0006\nCC-MAIN-2019-47,text/turtle,17557,17556,0.0007\nCC-MAIN-2019-47,text/vcard,24567,24522,0.0009\nCC-MAIN-2019-47,text/x-bibtex,5776,5775,0.0002\nCC-MAIN-2019-47,text/x-c,2116,2114,0.0001\nCC-MAIN-2019-47,text/x-csrc,20809,20808,0.0008\nCC-MAIN-2019-47,text/x-diff,6588,6583,0.0003\nCC-MAIN-2019-47,text/x-patch,9708,9697,0.0004\nCC-MAIN-2019-47,text/x-perl,2630,2630,0.0001\nCC-MAIN-2019-47,text/x-vcalendar,16702,16695,0.0006\nCC-MAIN-2019-47,text/x-vcard,50505,50471,0.0019\nCC-MAIN-2019-47,text/xml,2120635,2114910,0.0819\nCC-MAIN-2019-47,unknown/unknown,14722,14718,0.0006\nCC-MAIN-2019-47,video/mp4,35378,35287,0.0014\nCC-MAIN-2019-47,video/webm,1920,1914,0.0001\nCC-MAIN-2019-47,video/x-ms-asf,3687,3684,0.0001\nCC-MAIN-2019-51,<other>,16004603,15834273,0.6475\nCC-MAIN-2019-51,application/atom+xml,3175743,3175400,0.1285\nCC-MAIN-2019-51,application/calendar,5098,5098,0.0002\nCC-MAIN-2019-51,application/download,63423,63417,0.0026\nCC-MAIN-2019-51,application/epub+zip,35155,35047,0.0014\nCC-MAIN-2019-51,application/force-download,112776,112756,0.0046\nCC-MAIN-2019-51,application/gpx+xml,6488,6486,0.0003\nCC-MAIN-2019-51,application/ics,10151,10149,0.0004\nCC-MAIN-2019-51,application/javascript,8570,8562,0.0003\nCC-MAIN-2019-51,application/json,566783,566581,0.0229\nCC-MAIN-2019-51,application/ld+json,8845,8845,0.0004\nCC-MAIN-2019-51,applic
ation/marc,11780,11777,0.0005\nCC-MAIN-2019-51,application/msword,72546,72277,0.0029\nCC-MAIN-2019-51,application/octet-stream,1122645,1120759,0.0454\nCC-MAIN-2019-51,application/octetstream,4638,4637,0.0002\nCC-MAIN-2019-51,application/pdf,2995223,2974168,0.1212\nCC-MAIN-2019-51,application/pgp-encrypted,934,934,0.0000\nCC-MAIN-2019-51,application/pgp-signature,22770,22770,0.0009\nCC-MAIN-2019-51,application/postscript,5735,5731,0.0002\nCC-MAIN-2019-51,application/rdf+xml,68585,68554,0.0028\nCC-MAIN-2019-51,application/rss+xml,1925020,1920069,0.0779\nCC-MAIN-2019-51,application/rtf,25491,25466,0.0010\nCC-MAIN-2019-51,application/save-to-disk,186,186,0.0000\nCC-MAIN-2019-51,application/text,74322,74294,0.0030\nCC-MAIN-2019-51,application/unknown,6164,6164,0.0002\nCC-MAIN-2019-51,application/vnd.android.package-archive,30320,30048,0.0012\nCC-MAIN-2019-51,application/vnd.google-earth.kml+xml,41760,41664,0.0017\nCC-MAIN-2019-51,application/vnd.google-earth.kmz,7445,7440,0.0003\nCC-MAIN-2019-51,application/vnd.ms-excel,34880,34814,0.0014\nCC-MAIN-2019-51,application/vnd.ms-powerpoint,21272,21262,0.0009\nCC-MAIN-2019-51,application/vnd.ms-word,18490,18478,0.0007\nCC-MAIN-2019-51,application/vnd.oasis.opendocument.text,16666,16655,0.0007\nCC-MAIN-2019-51,application/vnd.openxmlformats-officedocument.presentationml.presentation,6338,6310,0.0003\nCC-MAIN-2019-51,application/vnd.openxmlformats-officedocument.spreadsheetml.sheet,30907,30812,0.0013\nCC-MAIN-2019-51,application/vnd.openxmlformats-officedocument.wordprocessingml.document,57515,57290,0.0023\nCC-MAIN-2019-51,application/vnd.wap.xhtml+xml,2558,2473,0.0001\nCC-MAIN-2019-51,application/x-bibtex,48433,48429,0.0020\nCC-MAIN-2019-51,application/x-bittorrent,8085,7719,0.0003\nCC-MAIN-2019-51,application/x-debian-package,951,951,0.0000\nCC-MAIN-2019-51,application/x-download,32356,32165,0.0013\nCC-MAIN-2019-51,application/x-endnote-refer,91773,91751,0.0037\nCC-MAIN-2019-51,application/x-gzip,23355,23320,0.0009\nCC-MAIN-20
19-51,application/x-httpd-php,13636,13603,0.0006\nCC-MAIN-2019-51,application/x-java-jnlp-file,7635,7633,0.0003\nCC-MAIN-2019-51,application/x-javascript,13872,13869,0.0006\nCC-MAIN-2019-51,application/x-json,156,156,0.0000\nCC-MAIN-2019-51,application/x-mobipocket-ebook,3805,3750,0.0002\nCC-MAIN-2019-51,application/x-msdownload,8138,7984,0.0003\nCC-MAIN-2019-51,application/x-netcdf,3809,3809,0.0002\nCC-MAIN-2019-51,application/x-research-info-systems,170613,170497,0.0069\nCC-MAIN-2019-51,application/x-shockwave-flash,15300,15236,0.0006\nCC-MAIN-2019-51,application/x-tar,5728,5725,0.0002\nCC-MAIN-2019-51,application/x-tex,1369,1369,0.0001\nCC-MAIN-2019-51,application/x-troff-man,14186,14169,0.0006\nCC-MAIN-2019-51,application/x-zip-compressed,16687,16595,0.0007\nCC-MAIN-2019-51,application/xhtml+xml,1114689,1112297,0.0451\nCC-MAIN-2019-51,application/xml,721152,719856,0.0292\nCC-MAIN-2019-51,application/zip,98022,97305,0.0040\nCC-MAIN-2019-51,audio/mpeg,104910,100647,0.0042\nCC-MAIN-2019-51,audio/x-mpegurl,26283,26274,0.0011\nCC-MAIN-2019-51,audio/x-scpls,3564,3564,0.0001\nCC-MAIN-2019-51,audio/x-wav,17272,16791,0.0007\nCC-MAIN-2019-51,binary/octet-stream,14500,14490,0.0006\nCC-MAIN-2019-51,image/gif,67382,66787,0.0027\nCC-MAIN-2019-51,image/jp2,4018,4018,0.0002\nCC-MAIN-2019-51,image/jpeg,3160649,3152828,0.1279\nCC-MAIN-2019-51,image/jpg,66219,65315,0.0027\nCC-MAIN-2019-51,image/pjpeg,16585,16585,0.0007\nCC-MAIN-2019-51,image/png,470267,467659,0.0190\nCC-MAIN-2019-51,image/svg+xml,10854,10842,0.0004\nCC-MAIN-2019-51,image/tiff,8990,8984,0.0004\nCC-MAIN-2019-51,image/vnd.djvu,7517,7514,0.0003\nCC-MAIN-2019-51,image/webp,16761,16761,0.0007\nCC-MAIN-2019-51,message/rfc822,13197,13197,0.0005\nCC-MAIN-2019-51,text/calendar,1042976,1042300,0.0422\nCC-MAIN-2019-51,text/css,8544,8540,0.0003\nCC-MAIN-2019-51,text/csv,70202,70196,0.0028\nCC-MAIN-2019-51,text/directory,10072,10056,0.0004\nCC-MAIN-2019-51,text/enriched,28883,28871,0.0012\nCC-MAIN-2019-51,text/html,2433894960,2
413626083,98.4623\nCC-MAIN-2019-51,text/javascript,15050,15046,0.0006\nCC-MAIN-2019-51,text/markdown,1392,1392,0.0001\nCC-MAIN-2019-51,text/pdf,106,106,0.0000\nCC-MAIN-2019-51,text/plain,1269880,1269015,0.0514\nCC-MAIN-2019-51,text/prs.lines.tag,7440,7440,0.0003\nCC-MAIN-2019-51,text/tab-separated-values,16623,16620,0.0007\nCC-MAIN-2019-51,text/turtle,21389,21387,0.0009\nCC-MAIN-2019-51,text/vcard,25946,25911,0.0010\nCC-MAIN-2019-51,text/x-bibtex,6375,6375,0.0003\nCC-MAIN-2019-51,text/x-c,2400,2400,0.0001\nCC-MAIN-2019-51,text/x-csrc,20572,20571,0.0008\nCC-MAIN-2019-51,text/x-diff,6604,6599,0.0003\nCC-MAIN-2019-51,text/x-patch,9310,9285,0.0004\nCC-MAIN-2019-51,text/x-perl,3924,3924,0.0002\nCC-MAIN-2019-51,text/x-vcalendar,17879,17877,0.0007\nCC-MAIN-2019-51,text/x-vcard,53763,53701,0.0022\nCC-MAIN-2019-51,text/xml,2289316,2284762,0.0926\nCC-MAIN-2019-51,unknown/unknown,15757,15747,0.0006\nCC-MAIN-2019-51,video/mp4,34749,34474,0.0014\nCC-MAIN-2019-51,video/webm,1374,1370,0.0001\nCC-MAIN-2019-51,video/x-ms-asf,4936,4931,0.0002\nCC-MAIN-2020-05,<other>,22493312,22266295,0.7253\nCC-MAIN-2020-05,application/atom+xml,3821692,3821116,0.1232\nCC-MAIN-2020-05,application/calendar,5648,5647,0.0002\nCC-MAIN-2020-05,application/download,64238,64218,0.0021\nCC-MAIN-2020-05,application/epub+zip,32321,32294,0.0010\nCC-MAIN-2020-05,application/force-download,137989,137977,0.0044\nCC-MAIN-2020-05,application/gpx+xml,6539,6535,0.0002\nCC-MAIN-2020-05,application/ics,12676,12674,0.0004\nCC-MAIN-2020-05,application/javascript,11720,11716,0.0004\nCC-MAIN-2020-05,application/json,585288,584936,0.0189\nCC-MAIN-2020-05,application/ld+json,9395,9395,0.0003\nCC-MAIN-2020-05,application/marc,13051,13048,0.0004\nCC-MAIN-2020-05,application/msword,60760,60516,0.0020\nCC-MAIN-2020-05,application/octet-stream,1091019,1089714,0.0352\nCC-MAIN-2020-05,application/octetstream,4543,4541,0.0001\nCC-MAIN-2020-05,application/pdf,2457200,2438702,0.0792\nCC-MAIN-2020-05,application/pgp-encrypted,809,809,0.
0000\nCC-MAIN-2020-05,application/pgp-signature,28975,28975,0.0009\nCC-MAIN-2020-05,application/postscript,3502,3499,0.0001\nCC-MAIN-2020-05,application/rdf+xml,71471,71436,0.0023\nCC-MAIN-2020-05,application/rss+xml,2250033,2244551,0.0726\nCC-MAIN-2020-05,application/rtf,29096,29064,0.0009\nCC-MAIN-2020-05,application/save-to-disk,31,31,0.0000\nCC-MAIN-2020-05,application/text,84079,84059,0.0027\nCC-MAIN-2020-05,application/unknown,7796,7796,0.0003\nCC-MAIN-2020-05,application/vnd.android.package-archive,23704,23418,0.0008\nCC-MAIN-2020-05,application/vnd.google-earth.kml+xml,48663,48626,0.0016\nCC-MAIN-2020-05,application/vnd.google-earth.kmz,9656,9654,0.0003\nCC-MAIN-2020-05,application/vnd.ms-excel,33478,33408,0.0011\nCC-MAIN-2020-05,application/vnd.ms-powerpoint,21646,21639,0.0007\nCC-MAIN-2020-05,application/vnd.ms-word,18167,18153,0.0006\nCC-MAIN-2020-05,application/vnd.oasis.opendocument.text,20114,20095,0.0006\nCC-MAIN-2020-05,application/vnd.openxmlformats-officedocument.presentationml.presentation,6172,6163,0.0002\nCC-MAIN-2020-05,application/vnd.openxmlformats-officedocument.spreadsheetml.sheet,30631,30558,0.0010\nCC-MAIN-2020-05,application/vnd.openxmlformats-officedocument.wordprocessingml.document,56912,56674,0.0018\nCC-MAIN-2020-05,application/vnd.wap.xhtml+xml,2779,2767,0.0001\nCC-MAIN-2020-05,application/x-bibtex,51508,51503,0.0017\nCC-MAIN-2020-05,application/x-bittorrent,8404,8200,0.0003\nCC-MAIN-2020-05,application/x-debian-package,1676,1676,0.0001\nCC-MAIN-2020-05,application/x-download,32151,31963,0.0010\nCC-MAIN-2020-05,application/x-endnote-refer,99460,99443,0.0032\nCC-MAIN-2020-05,application/x-gzip,23266,23231,0.0008\nCC-MAIN-2020-05,application/x-httpd-php,17935,17877,0.0006\nCC-MAIN-2020-05,application/x-java-jnlp-file,8373,8369,0.0003\nCC-MAIN-2020-05,application/x-javascript,11810,11709,0.0004\nCC-MAIN-2020-05,application/x-json,262,262,0.0000\nCC-MAIN-2020-05,application/x-mobipocket-ebook,3965,3963,0.0001\nCC-MAIN-2020-05,application
/x-msdownload,7755,7629,0.0003\nCC-MAIN-2020-05,application/x-netcdf,1371,1371,0.0000\nCC-MAIN-2020-05,application/x-research-info-systems,177134,177004,0.0057\nCC-MAIN-2020-05,application/x-shockwave-flash,15076,15020,0.0005\nCC-MAIN-2020-05,application/x-tar,5463,5460,0.0002\nCC-MAIN-2020-05,application/x-tex,2415,2415,0.0001\nCC-MAIN-2020-05,application/x-troff-man,9324,9320,0.0003\nCC-MAIN-2020-05,application/x-zip-compressed,16378,16323,0.0005\nCC-MAIN-2020-05,application/xhtml+xml,1158918,1156621,0.0374\nCC-MAIN-2020-05,application/xml,900437,898333,0.0290\nCC-MAIN-2020-05,application/zip,109584,108506,0.0035\nCC-MAIN-2020-05,audio/mpeg,89921,87143,0.0029\nCC-MAIN-2020-05,audio/x-mpegurl,31811,31794,0.0010\nCC-MAIN-2020-05,audio/x-scpls,3869,3865,0.0001\nCC-MAIN-2020-05,audio/x-wav,18071,18041,0.0006\nCC-MAIN-2020-05,binary/octet-stream,18302,18290,0.0006\nCC-MAIN-2020-05,image/gif,74255,73686,0.0024\nCC-MAIN-2020-05,image/jp2,6281,6281,0.0002\nCC-MAIN-2020-05,image/jpeg,2986202,2979118,0.0963\nCC-MAIN-2020-05,image/jpg,61062,60856,0.0020\nCC-MAIN-2020-05,image/pjpeg,17973,17972,0.0006\nCC-MAIN-2020-05,image/png,441391,438826,0.0142\nCC-MAIN-2020-05,image/svg+xml,7836,7830,0.0003\nCC-MAIN-2020-05,image/tiff,9732,9726,0.0003\nCC-MAIN-2020-05,image/vnd.djvu,10441,10441,0.0003\nCC-MAIN-2020-05,image/webp,16051,16040,0.0005\nCC-MAIN-2020-05,message/rfc822,12847,12847,0.0004\nCC-MAIN-2020-05,text/calendar,1059332,1058622,0.0342\nCC-MAIN-2020-05,text/css,8136,8135,0.0003\nCC-MAIN-2020-05,text/csv,79647,79623,0.0026\nCC-MAIN-2020-05,text/directory,12846,12819,0.0004\nCC-MAIN-2020-05,text/enriched,30171,30165,0.0010\nCC-MAIN-2020-05,text/html,3054621555,3027152235,98.5013\nCC-MAIN-2020-05,text/javascript,18181,18179,0.0006\nCC-MAIN-2020-05,text/markdown,2061,2061,0.0001\nCC-MAIN-2020-05,text/pdf,216,216,0.0000\nCC-MAIN-2020-05,text/plain,2231572,2230701,0.0720\nCC-MAIN-2020-05,text/prs.lines.tag,5055,5055,0.0002\nCC-MAIN-2020-05,text/tab-separated-values,15004,15004,0
.0005\nCC-MAIN-2020-05,text/turtle,24560,24559,0.0008\nCC-MAIN-2020-05,text/vcard,28854,28613,0.0009\nCC-MAIN-2020-05,text/x-bibtex,13590,13581,0.0004\nCC-MAIN-2020-05,text/x-c,3978,3977,0.0001\nCC-MAIN-2020-05,text/x-csrc,21081,21079,0.0007\nCC-MAIN-2020-05,text/x-diff,7199,7197,0.0002\nCC-MAIN-2020-05,text/x-patch,12463,12452,0.0004\nCC-MAIN-2020-05,text/x-perl,4593,4593,0.0001\nCC-MAIN-2020-05,text/x-vcalendar,16861,16860,0.0005\nCC-MAIN-2020-05,text/x-vcard,64206,64142,0.0021\nCC-MAIN-2020-05,text/xml,2730201,2724084,0.0880\nCC-MAIN-2020-05,unknown/unknown,17270,17267,0.0006\nCC-MAIN-2020-05,video/mp4,31157,31038,0.0010\nCC-MAIN-2020-05,video/webm,2116,2110,0.0001\nCC-MAIN-2020-05,video/x-ms-asf,11453,11441,0.0004\nCC-MAIN-2020-10,<other>,22193465,21977321,0.8439\nCC-MAIN-2020-10,application/atom+xml,3591315,3590843,0.1366\nCC-MAIN-2020-10,application/calendar,7800,7800,0.0003\nCC-MAIN-2020-10,application/download,84155,84099,0.0032\nCC-MAIN-2020-10,application/epub+zip,47327,47123,0.0018\nCC-MAIN-2020-10,application/force-download,177642,177562,0.0068\nCC-MAIN-2020-10,application/gpx+xml,9807,9803,0.0004\nCC-MAIN-2020-10,application/ics,15499,15485,0.0006\nCC-MAIN-2020-10,application/javascript,14589,14576,0.0006\nCC-MAIN-2020-10,application/json,594056,593712,0.0226\nCC-MAIN-2020-10,application/ld+json,12263,12263,0.0005\nCC-MAIN-2020-10,application/marc,14055,14048,0.0005\nCC-MAIN-2020-10,application/msword,90553,90136,0.0034\nCC-MAIN-2020-10,application/octet-stream,1255936,1253783,0.0478\nCC-MAIN-2020-10,application/octetstream,6454,6451,0.0002\nCC-MAIN-2020-10,application/pdf,3422652,3391765,0.1301\nCC-MAIN-2020-10,application/pgp-encrypted,1265,1265,0.0000\nCC-MAIN-2020-10,application/pgp-signature,34077,34072,0.0013\nCC-MAIN-2020-10,application/postscript,6200,6180,0.0002\nCC-MAIN-2020-10,application/rdf+xml,80580,80558,0.0031\nCC-MAIN-2020-10,application/rss+xml,2219358,2214497,0.0844\nCC-MAIN-2020-10,application/rtf,37811,37777,0.0014\nCC-MAIN-2020-10,
application/save-to-disk,268,268,0.0000\nCC-MAIN-2020-10,application/text,75759,75698,0.0029\nCC-MAIN-2020-10,application/unknown,8773,8769,0.0003\nCC-MAIN-2020-10,application/vnd.android.package-archive,40074,39763,0.0015\nCC-MAIN-2020-10,application/vnd.google-earth.kml+xml,49266,49250,0.0019\nCC-MAIN-2020-10,application/vnd.google-earth.kmz,13203,13202,0.0005\nCC-MAIN-2020-10,application/vnd.ms-excel,46488,46370,0.0018\nCC-MAIN-2020-10,application/vnd.ms-powerpoint,23079,23053,0.0009\nCC-MAIN-2020-10,application/vnd.ms-word,19092,19087,0.0007\nCC-MAIN-2020-10,application/vnd.oasis.opendocument.text,25794,25776,0.0010\nCC-MAIN-2020-10,application/vnd.openxmlformats-officedocument.presentationml.presentation,9439,9402,0.0004\nCC-MAIN-2020-10,application/vnd.openxmlformats-officedocument.spreadsheetml.sheet,36718,36567,0.0014\nCC-MAIN-2020-10,application/vnd.openxmlformats-officedocument.wordprocessingml.document,79713,79476,0.0030\nCC-MAIN-2020-10,application/vnd.wap.xhtml+xml,2693,2591,0.0001\nCC-MAIN-2020-10,application/x-bibtex,61125,61115,0.0023\nCC-MAIN-2020-10,application/x-bittorrent,12928,12675,0.0005\nCC-MAIN-2020-10,application/x-debian-package,2432,2431,0.0001\nCC-MAIN-2020-10,application/x-download,38722,38243,0.0015\nCC-MAIN-2020-10,application/x-endnote-refer,99219,99183,0.0038\nCC-MAIN-2020-10,application/x-gzip,27295,27243,0.0010\nCC-MAIN-2020-10,application/x-httpd-php,20058,20025,0.0008\nCC-MAIN-2020-10,application/x-java-jnlp-file,6345,6345,0.0002\nCC-MAIN-2020-10,application/x-javascript,15059,14986,0.0006\nCC-MAIN-2020-10,application/x-json,162,162,0.0000\nCC-MAIN-2020-10,application/x-mobipocket-ebook,3920,3901,0.0001\nCC-MAIN-2020-10,application/x-msdownload,10401,10306,0.0004\nCC-MAIN-2020-10,application/x-netcdf,7371,7371,0.0003\nCC-MAIN-2020-10,application/x-research-info-systems,187539,187427,0.0071\nCC-MAIN-2020-10,application/x-shockwave-flash,15991,15929,0.0006\nCC-MAIN-2020-10,application/x-tar,10770,10767,0.0004\nCC-MAIN-2020-10,appl
ication/x-tex,3647,3644,0.0001\nCC-MAIN-2020-10,application/x-troff-man,6518,6483,0.0002\nCC-MAIN-2020-10,application/x-zip-compressed,22693,22527,0.0009\nCC-MAIN-2020-10,application/xhtml+xml,1195965,1193691,0.0455\nCC-MAIN-2020-10,application/xml,895052,893074,0.0340\nCC-MAIN-2020-10,application/zip,125164,123821,0.0048\nCC-MAIN-2020-10,audio/mpeg,139469,135707,0.0053\nCC-MAIN-2020-10,audio/x-mpegurl,40545,40362,0.0015\nCC-MAIN-2020-10,audio/x-scpls,4470,4464,0.0002\nCC-MAIN-2020-10,audio/x-wav,14345,14032,0.0005\nCC-MAIN-2020-10,binary/octet-stream,19505,19470,0.0007\nCC-MAIN-2020-10,image/gif,83620,83112,0.0032\nCC-MAIN-2020-10,image/jp2,5670,5670,0.0002\nCC-MAIN-2020-10,image/jpeg,3828843,3819965,0.1456\nCC-MAIN-2020-10,image/jpg,83997,83364,0.0032\nCC-MAIN-2020-10,image/pjpeg,13864,13863,0.0005\nCC-MAIN-2020-10,image/png,545026,542387,0.0207\nCC-MAIN-2020-10,image/svg+xml,11375,11357,0.0004\nCC-MAIN-2020-10,image/tiff,8763,8717,0.0003\nCC-MAIN-2020-10,image/vnd.djvu,15709,15701,0.0006\nCC-MAIN-2020-10,image/webp,22514,22505,0.0009\nCC-MAIN-2020-10,message/rfc822,17986,17984,0.0007\nCC-MAIN-2020-10,text/calendar,1271579,1270642,0.0483\nCC-MAIN-2020-10,text/css,7717,7714,0.0003\nCC-MAIN-2020-10,text/csv,93826,93789,0.0036\nCC-MAIN-2020-10,text/directory,13489,13476,0.0005\nCC-MAIN-2020-10,text/enriched,26406,26330,0.0010\nCC-MAIN-2020-10,text/html,2581303355,2559829230,98.1498\nCC-MAIN-2020-10,text/javascript,12975,12966,0.0005\nCC-MAIN-2020-10,text/markdown,1663,1663,0.0001\nCC-MAIN-2020-10,text/pdf,223,223,0.0000\nCC-MAIN-2020-10,text/plain,1985122,1983754,0.0755\nCC-MAIN-2020-10,text/prs.lines.tag,2208,2207,0.0001\nCC-MAIN-2020-10,text/tab-separated-values,18954,18949,0.0007\nCC-MAIN-2020-10,text/turtle,26399,26386,0.0010\nCC-MAIN-2020-10,text/vcard,32401,32356,0.0012\nCC-MAIN-2020-10,text/x-bibtex,11926,11835,0.0005\nCC-MAIN-2020-10,text/x-c,3357,3356,0.0001\nCC-MAIN-2020-10,text/x-csrc,25279,25279,0.0010\nCC-MAIN-2020-10,text/x-diff,9348,9302,0.0004\nCC-MAI
N-2020-10,text/x-patch,14409,14356,0.0005\nCC-MAIN-2020-10,text/x-perl,4627,4627,0.0002\nCC-MAIN-2020-10,text/x-vcalendar,25075,25069,0.0010\nCC-MAIN-2020-10,text/x-vcard,78379,78322,0.0030\nCC-MAIN-2020-10,text/xml,2958805,2953695,0.1125\nCC-MAIN-2020-10,unknown/unknown,14855,14827,0.0006\nCC-MAIN-2020-10,video/mp4,36316,36170,0.0014\nCC-MAIN-2020-10,video/webm,1739,1735,0.0001\nCC-MAIN-2020-10,video/x-ms-asf,11735,11722,0.0004\nCC-MAIN-2020-16,<other>,24278193,24053735,0.8412\nCC-MAIN-2020-16,application/atom+xml,2646984,2646462,0.0917\nCC-MAIN-2020-16,application/calendar,4730,4730,0.0002\nCC-MAIN-2020-16,application/download,66626,66609,0.0023\nCC-MAIN-2020-16,application/epub+zip,38704,38605,0.0013\nCC-MAIN-2020-16,application/force-download,122488,122441,0.0042\nCC-MAIN-2020-16,application/gpx+xml,6162,6158,0.0002\nCC-MAIN-2020-16,application/ics,8545,8543,0.0003\nCC-MAIN-2020-16,application/javascript,10329,10304,0.0004\nCC-MAIN-2020-16,application/json,478359,478132,0.0166\nCC-MAIN-2020-16,application/ld+json,10080,10080,0.0003\nCC-MAIN-2020-16,application/marc,12101,12101,0.0004\nCC-MAIN-2020-16,application/msword,77215,77011,0.0027\nCC-MAIN-2020-16,application/octet-stream,1049958,1048689,0.0364\nCC-MAIN-2020-16,application/octetstream,5778,5769,0.0002\nCC-MAIN-2020-16,application/pdf,20913093,20874257,0.7246\nCC-MAIN-2020-16,application/pgp-encrypted,756,756,0.0000\nCC-MAIN-2020-16,application/pgp-signature,37330,37330,0.0013\nCC-MAIN-2020-16,application/postscript,4575,4571,0.0002\nCC-MAIN-2020-16,application/rdf+xml,63612,63585,0.0022\nCC-MAIN-2020-16,application/rss+xml,2068628,2064013,0.0717\nCC-MAIN-2020-16,application/rtf,32701,32684,0.0011\nCC-MAIN-2020-16,application/save-to-disk,397,397,0.0000\nCC-MAIN-2020-16,application/text,62435,62430,0.0022\nCC-MAIN-2020-16,application/unknown,7712,7708,0.0003\nCC-MAIN-2020-16,application/vnd.android.package-archive,29624,29417,0.0010\nCC-MAIN-2020-16,application/vnd.google-earth.kml+xml,37504,37446,0.0013\n
CC-MAIN-2020-16,application/vnd.google-earth.kmz,8543,8543,0.0003\nCC-MAIN-2020-16,application/vnd.ms-excel,39168,39117,0.0014\nCC-MAIN-2020-16,application/vnd.ms-powerpoint,21643,21629,0.0007\nCC-MAIN-2020-16,application/vnd.ms-word,15184,15182,0.0005\nCC-MAIN-2020-16,application/vnd.oasis.opendocument.text,21689,21684,0.0008\nCC-MAIN-2020-16,application/vnd.openxmlformats-officedocument.presentationml.presentation,5669,5654,0.0002\nCC-MAIN-2020-16,application/vnd.openxmlformats-officedocument.spreadsheetml.sheet,27547,27418,0.0010\nCC-MAIN-2020-16,application/vnd.openxmlformats-officedocument.wordprocessingml.document,58791,58582,0.0020\nCC-MAIN-2020-16,application/vnd.wap.xhtml+xml,3359,3246,0.0001\nCC-MAIN-2020-16,application/x-bibtex,42888,42878,0.0015\nCC-MAIN-2020-16,application/x-bittorrent,8504,8226,0.0003\nCC-MAIN-2020-16,application/x-debian-package,9073,9073,0.0003\nCC-MAIN-2020-16,application/x-download,35642,34481,0.0012\nCC-MAIN-2020-16,application/x-endnote-refer,78593,78568,0.0027\nCC-MAIN-2020-16,application/x-gzip,24710,24669,0.0009\nCC-MAIN-2020-16,application/x-httpd-php,13112,13042,0.0005\nCC-MAIN-2020-16,application/x-java-jnlp-file,3246,3244,0.0001\nCC-MAIN-2020-16,application/x-javascript,6646,6560,0.0002\nCC-MAIN-2020-16,application/x-json,20,20,0.0000\nCC-MAIN-2020-16,application/x-mobipocket-ebook,3329,3329,0.0001\nCC-MAIN-2020-16,application/x-msdownload,8680,8594,0.0003\nCC-MAIN-2020-16,application/x-netcdf,4096,4051,0.0001\nCC-MAIN-2020-16,application/x-research-info-systems,151914,151901,0.0053\nCC-MAIN-2020-16,application/x-shockwave-flash,9641,9598,0.0003\nCC-MAIN-2020-16,application/x-tar,7033,7030,0.0002\nCC-MAIN-2020-16,application/x-tex,2358,2358,0.0001\nCC-MAIN-2020-16,application/x-troff-man,8968,8960,0.0003\nCC-MAIN-2020-16,application/x-zip-compressed,16353,16238,0.0006\nCC-MAIN-2020-16,application/xhtml+xml,1036405,1034330,0.0359\nCC-MAIN-2020-16,application/xml,843372,841411,0.0292\nCC-MAIN-2020-16,application/zip,107285,1
06467,0.0037\nCC-MAIN-2020-16,audio/mpeg,124918,121958,0.0043\nCC-MAIN-2020-16,audio/x-mpegurl,23756,23714,0.0008\nCC-MAIN-2020-16,audio/x-scpls,3723,3719,0.0001\nCC-MAIN-2020-16,audio/x-wav,10139,10082,0.0004\nCC-MAIN-2020-16,binary/octet-stream,20021,20001,0.0007\nCC-MAIN-2020-16,image/gif,68452,68089,0.0024\nCC-MAIN-2020-16,image/jp2,1688,1688,0.0001\nCC-MAIN-2020-16,image/jpeg,3494310,3488074,0.1211\nCC-MAIN-2020-16,image/jpg,75494,74705,0.0026\nCC-MAIN-2020-16,image/pjpeg,10650,10650,0.0004\nCC-MAIN-2020-16,image/png,570405,568062,0.0198\nCC-MAIN-2020-16,image/svg+xml,11425,11382,0.0004\nCC-MAIN-2020-16,image/tiff,6259,6254,0.0002\nCC-MAIN-2020-16,image/vnd.djvu,9570,9568,0.0003\nCC-MAIN-2020-16,image/webp,19577,19574,0.0007\nCC-MAIN-2020-16,message/rfc822,11027,11027,0.0004\nCC-MAIN-2020-16,text/calendar,898424,897994,0.0311\nCC-MAIN-2020-16,text/css,7925,7886,0.0003\nCC-MAIN-2020-16,text/csv,77660,77647,0.0027\nCC-MAIN-2020-16,text/directory,11587,11583,0.0004\nCC-MAIN-2020-16,text/enriched,20324,20310,0.0007\nCC-MAIN-2020-16,text/html,2821680034,2797850686,97.7633\nCC-MAIN-2020-16,text/javascript,14644,14558,0.0005\nCC-MAIN-2020-16,text/markdown,1573,1573,0.0001\nCC-MAIN-2020-16,text/pdf,409,409,0.0000\nCC-MAIN-2020-16,text/plain,1482663,1481844,0.0514\nCC-MAIN-2020-16,text/prs.lines.tag,3447,3447,0.0001\nCC-MAIN-2020-16,text/tab-separated-values,10981,10981,0.0004\nCC-MAIN-2020-16,text/turtle,25414,25412,0.0009\nCC-MAIN-2020-16,text/vcard,22176,22145,0.0008\nCC-MAIN-2020-16,text/x-bibtex,8524,8521,0.0003\nCC-MAIN-2020-16,text/x-c,2453,2452,0.0001\nCC-MAIN-2020-16,text/x-csrc,20328,20328,0.0007\nCC-MAIN-2020-16,text/x-diff,4777,4769,0.0002\nCC-MAIN-2020-16,text/x-patch,12063,12043,0.0004\nCC-MAIN-2020-16,text/x-perl,4599,4599,0.0002\nCC-MAIN-2020-16,text/x-vcalendar,17175,17173,0.0006\nCC-MAIN-2020-16,text/x-vcard,49719,49694,0.0017\nCC-MAIN-2020-16,text/xml,2641405,2636378,0.0915\nCC-MAIN-2020-16,unknown/unknown,16000,15993,0.0006\nCC-MAIN-2020-16,video/mp4
,34704,34613,0.0012\nCC-MAIN-2020-16,video/webm,1801,1800,0.0001\nCC-MAIN-2020-16,video/x-ms-asf,5934,5932,0.0002\nCC-MAIN-2020-24,<other>,28692455,28369816,1.0384\nCC-MAIN-2020-24,application/atom+xml,4340378,4339552,0.1571\nCC-MAIN-2020-24,application/calendar,6163,6160,0.0002\nCC-MAIN-2020-24,application/download,86870,86838,0.0031\nCC-MAIN-2020-24,application/epub+zip,36475,36173,0.0013\nCC-MAIN-2020-24,application/force-download,161683,161523,0.0059\nCC-MAIN-2020-24,application/gpx+xml,7005,7001,0.0003\nCC-MAIN-2020-24,application/ics,13455,13444,0.0005\nCC-MAIN-2020-24,application/javascript,36562,36556,0.0013\nCC-MAIN-2020-24,application/json,568669,568103,0.0206\nCC-MAIN-2020-24,application/ld+json,14966,14966,0.0005\nCC-MAIN-2020-24,application/marc,12758,12757,0.0005\nCC-MAIN-2020-24,application/msword,77845,77605,0.0028\nCC-MAIN-2020-24,application/octet-stream,1104942,1103226,0.0400\nCC-MAIN-2020-24,application/octetstream,5567,5559,0.0002\nCC-MAIN-2020-24,application/pdf,3204225,3181664,0.1160\nCC-MAIN-2020-24,application/pgp-encrypted,1227,1227,0.0000\nCC-MAIN-2020-24,application/pgp-signature,25817,25817,0.0009\nCC-MAIN-2020-24,application/postscript,6116,6115,0.0002\nCC-MAIN-2020-24,application/rdf+xml,73675,73645,0.0027\nCC-MAIN-2020-24,application/rss+xml,2276486,2269539,0.0824\nCC-MAIN-2020-24,application/rtf,36212,36175,0.0013\nCC-MAIN-2020-24,application/save-to-disk,197,197,0.0000\nCC-MAIN-2020-24,application/text,76638,76618,0.0028\nCC-MAIN-2020-24,application/unknown,11852,11834,0.0004\nCC-MAIN-2020-24,application/vnd.android.package-archive,28005,25494,0.0010\nCC-MAIN-2020-24,application/vnd.google-earth.kml+xml,48096,48081,0.0017\nCC-MAIN-2020-24,application/vnd.google-earth.kmz,10083,10073,0.0004\nCC-MAIN-2020-24,application/vnd.ms-excel,42371,42310,0.0015\nCC-MAIN-2020-24,application/vnd.ms-powerpoint,24990,24977,0.0009\nCC-MAIN-2020-24,application/vnd.ms-word,22056,22038,0.0008\nCC-MAIN-2020-24,application/vnd.oasis.opendocument.text,246
99,24689,0.0009\nCC-MAIN-2020-24,application/vnd.openxmlformats-officedocument.presentationml.presentation,6678,6663,0.0002\nCC-MAIN-2020-24,application/vnd.openxmlformats-officedocument.spreadsheetml.sheet,38631,38529,0.0014\nCC-MAIN-2020-24,application/vnd.openxmlformats-officedocument.wordprocessingml.document,72705,72459,0.0026\nCC-MAIN-2020-24,application/vnd.wap.xhtml+xml,3281,3186,0.0001\nCC-MAIN-2020-24,application/x-bibtex,54854,54840,0.0020\nCC-MAIN-2020-24,application/x-bittorrent,11298,11089,0.0004\nCC-MAIN-2020-24,application/x-debian-package,2164,2164,0.0001\nCC-MAIN-2020-24,application/x-download,34231,34205,0.0012\nCC-MAIN-2020-24,application/x-endnote-refer,94978,94972,0.0034\nCC-MAIN-2020-24,application/x-gzip,20866,20854,0.0008\nCC-MAIN-2020-24,application/x-httpd-php,19092,19037,0.0007\nCC-MAIN-2020-24,application/x-java-jnlp-file,8379,8379,0.0003\nCC-MAIN-2020-24,application/x-javascript,13540,13425,0.0005\nCC-MAIN-2020-24,application/x-json,77,77,0.0000\nCC-MAIN-2020-24,application/x-mobipocket-ebook,2963,2961,0.0001\nCC-MAIN-2020-24,application/x-msdownload,9238,9086,0.0003\nCC-MAIN-2020-24,application/x-netcdf,3497,3497,0.0001\nCC-MAIN-2020-24,application/x-research-info-systems,166683,166638,0.0060\nCC-MAIN-2020-24,application/x-shockwave-flash,9215,9164,0.0003\nCC-MAIN-2020-24,application/x-tar,4802,4792,0.0002\nCC-MAIN-2020-24,application/x-tex,2633,2633,0.0001\nCC-MAIN-2020-24,application/x-troff-man,3141,3128,0.0001\nCC-MAIN-2020-24,application/x-zip-compressed,18015,17942,0.0007\nCC-MAIN-2020-24,application/xhtml+xml,1104546,1103064,0.0400\nCC-MAIN-2020-24,application/xml,834716,833214,0.0302\nCC-MAIN-2020-24,application/zip,93763,93390,0.0034\nCC-MAIN-2020-24,audio/mpeg,114107,110512,0.0041\nCC-MAIN-2020-24,audio/x-mpegurl,27975,27946,0.0010\nCC-MAIN-2020-24,audio/x-scpls,3963,3961,0.0001\nCC-MAIN-2020-24,audio/x-wav,6132,5924,0.0002\nCC-MAIN-2020-24,binary/octet-stream,15463,15427,0.0006\nCC-MAIN-2020-24,image/gif,60853,60397,0.0022\n
CC-MAIN-2020-24,image/jp2,634,634,0.0000\nCC-MAIN-2020-24,image/jpeg,3172651,3162643,0.1148\nCC-MAIN-2020-24,image/jpg,59204,59165,0.0021\nCC-MAIN-2020-24,image/pjpeg,14213,14211,0.0005\nCC-MAIN-2020-24,image/png,478028,475412,0.0173\nCC-MAIN-2020-24,image/svg+xml,10719,10710,0.0004\nCC-MAIN-2020-24,image/tiff,9091,9088,0.0003\nCC-MAIN-2020-24,image/vnd.djvu,6121,6119,0.0002\nCC-MAIN-2020-24,image/webp,32137,32133,0.0012\nCC-MAIN-2020-24,message/rfc822,16639,16639,0.0006\nCC-MAIN-2020-24,text/calendar,1305485,1304255,0.0472\nCC-MAIN-2020-24,text/css,5792,5790,0.0002\nCC-MAIN-2020-24,text/csv,93540,93523,0.0034\nCC-MAIN-2020-24,text/directory,10469,10465,0.0004\nCC-MAIN-2020-24,text/enriched,27710,27701,0.0010\nCC-MAIN-2020-24,text/html,2709764484,2686165256,98.0659\nCC-MAIN-2020-24,text/javascript,12944,12924,0.0005\nCC-MAIN-2020-24,text/markdown,1454,1453,0.0001\nCC-MAIN-2020-24,text/pdf,190,175,0.0000\nCC-MAIN-2020-24,text/plain,1348670,1347751,0.0488\nCC-MAIN-2020-24,text/prs.lines.tag,2776,2776,0.0001\nCC-MAIN-2020-24,text/tab-separated-values,19227,19220,0.0007\nCC-MAIN-2020-24,text/turtle,27839,27827,0.0010\nCC-MAIN-2020-24,text/vcard,29289,29272,0.0011\nCC-MAIN-2020-24,text/x-bibtex,6876,6872,0.0002\nCC-MAIN-2020-24,text/x-c,2120,2120,0.0001\nCC-MAIN-2020-24,text/x-csrc,15391,15391,0.0006\nCC-MAIN-2020-24,text/x-diff,5065,5063,0.0002\nCC-MAIN-2020-24,text/x-patch,11413,11410,0.0004\nCC-MAIN-2020-24,text/x-perl,3888,3888,0.0001\nCC-MAIN-2020-24,text/x-vcalendar,24428,24423,0.0009\nCC-MAIN-2020-24,text/x-vcard,64347,64294,0.0023\nCC-MAIN-2020-24,text/xml,2628694,2621326,0.0951\nCC-MAIN-2020-24,unknown/unknown,13908,13903,0.0005\nCC-MAIN-2020-24,video/mp4,32904,32796,0.0012\nCC-MAIN-2020-24,video/webm,2092,2089,0.0001\nCC-MAIN-2020-24,video/x-ms-asf,5313,5311,0.0002\nCC-MAIN-2020-29,<other>,6429954,6419574,0.2045\nCC-MAIN-2020-29,application/atom+xml,3902095,3900874,0.1241\nCC-MAIN-2020-29,application/calendar,6644,6642,0.0002\nCC-MAIN-2020-29,application/downlo
ad,86063,86055,0.0027\nCC-MAIN-2020-29,application/epub+zip,35185,35091,0.0011\nCC-MAIN-2020-29,application/force-download,174060,174030,0.0055\nCC-MAIN-2020-29,application/gpx+xml,7567,7564,0.0002\nCC-MAIN-2020-29,application/ics,11069,11067,0.0004\nCC-MAIN-2020-29,application/javascript,28839,28835,0.0009\nCC-MAIN-2020-29,application/json,587286,586748,0.0187\nCC-MAIN-2020-29,application/ld+json,12640,12640,0.0004\nCC-MAIN-2020-29,application/marc,13650,13650,0.0004\nCC-MAIN-2020-29,application/msword,95564,95350,0.0030\nCC-MAIN-2020-29,application/octet-stream,1222188,1220260,0.0389\nCC-MAIN-2020-29,application/octetstream,4466,4464,0.0001\nCC-MAIN-2020-29,application/pdf,2829788,2807394,0.0900\nCC-MAIN-2020-29,application/pgp-encrypted,750,750,0.0000\nCC-MAIN-2020-29,application/pgp-signature,34403,34399,0.0011\nCC-MAIN-2020-29,application/postscript,6632,6630,0.0002\nCC-MAIN-2020-29,application/rdf+xml,77783,77736,0.0025\nCC-MAIN-2020-29,application/rss+xml,2429594,2421598,0.0773\nCC-MAIN-2020-29,application/rtf,38522,38451,0.0012\nCC-MAIN-2020-29,application/save-to-disk,79,79,0.0000\nCC-MAIN-2020-29,application/text,76785,76770,0.0024\nCC-MAIN-2020-29,application/unknown,8549,8549,0.0003\nCC-MAIN-2020-29,application/vnd.android.package-archive,44683,41860,0.0014\nCC-MAIN-2020-29,application/vnd.google-earth.kml+xml,57527,57506,0.0018\nCC-MAIN-2020-29,application/vnd.google-earth.kmz,7871,7870,0.0003\nCC-MAIN-2020-29,application/vnd.ms-excel,42390,42277,0.0013\nCC-MAIN-2020-29,application/vnd.ms-powerpoint,21192,21182,0.0007\nCC-MAIN-2020-29,application/vnd.ms-word,22102,22071,0.0007\nCC-MAIN-2020-29,application/vnd.oasis.opendocument.text,27147,27126,0.0009\nCC-MAIN-2020-29,application/vnd.openxmlformats-officedocument.presentationml.presentation,6484,6425,0.0002\nCC-MAIN-2020-29,application/vnd.openxmlformats-officedocument.spreadsheetml.sheet,35658,35572,0.0011\nCC-MAIN-2020-29,application/vnd.openxmlformats-officedocument.wordprocessingml.document,77695,77
490,0.0025\nCC-MAIN-2020-29,application/vnd.wap.xhtml+xml,4583,4482,0.0001\nCC-MAIN-2020-29,application/x-bibtex,57249,57235,0.0018\nCC-MAIN-2020-29,application/x-bittorrent,11188,11036,0.0004\nCC-MAIN-2020-29,application/x-debian-package,1374,1372,0.0000\nCC-MAIN-2020-29,application/x-download,36845,36766,0.0012\nCC-MAIN-2020-29,application/x-endnote-refer,96964,96941,0.0031\nCC-MAIN-2020-29,application/x-gzip,19001,18991,0.0006\nCC-MAIN-2020-29,application/x-httpd-php,16861,16806,0.0005\nCC-MAIN-2020-29,application/x-java-jnlp-file,8607,8605,0.0003\nCC-MAIN-2020-29,application/x-javascript,13288,13178,0.0004\nCC-MAIN-2020-29,application/x-json,52,52,0.0000\nCC-MAIN-2020-29,application/x-mobipocket-ebook,3475,3472,0.0001\nCC-MAIN-2020-29,application/x-msdownload,9470,9391,0.0003\nCC-MAIN-2020-29,application/x-netcdf,5699,5699,0.0002\nCC-MAIN-2020-29,application/x-research-info-systems,184501,184455,0.0059\nCC-MAIN-2020-29,application/x-shockwave-flash,7393,7373,0.0002\nCC-MAIN-2020-29,application/x-tar,5131,5125,0.0002\nCC-MAIN-2020-29,application/x-tex,2830,2830,0.0001\nCC-MAIN-2020-29,application/x-troff-man,12987,12975,0.0004\nCC-MAIN-2020-29,application/x-zip-compressed,15454,15356,0.0005\nCC-MAIN-2020-29,application/xhtml+xml,1228604,1226877,0.0391\nCC-MAIN-2020-29,application/xml,891479,888950,0.0283\nCC-MAIN-2020-29,application/zip,95249,94785,0.0030\nCC-MAIN-2020-29,audio/mpeg,110297,107923,0.0035\nCC-MAIN-2020-29,audio/x-mpegurl,23125,23056,0.0007\nCC-MAIN-2020-29,audio/x-scpls,3739,3730,0.0001\nCC-MAIN-2020-29,audio/x-wav,3694,3523,0.0001\nCC-MAIN-2020-29,binary/octet-stream,14187,14152,0.0005\nCC-MAIN-2020-29,image/gif,65642,65139,0.0021\nCC-MAIN-2020-29,image/jp2,753,753,0.0000\nCC-MAIN-2020-29,image/jpeg,3779991,3769115,0.1202\nCC-MAIN-2020-29,image/jpg,64805,64299,0.0021\nCC-MAIN-2020-29,image/pjpeg,9935,9932,0.0003\nCC-MAIN-2020-29,image/png,592333,589202,0.0188\nCC-MAIN-2020-29,image/svg+xml,10873,10839,0.0003\nCC-MAIN-2020-29,image/tiff,10040,10033
,0.0003\nCC-MAIN-2020-29,image/vnd.djvu,4845,4844,0.0002\nCC-MAIN-2020-29,image/webp,32639,32635,0.0010\nCC-MAIN-2020-29,message/rfc822,20517,20517,0.0007\nCC-MAIN-2020-29,text/calendar,1351072,1349388,0.0430\nCC-MAIN-2020-29,text/css,8299,8293,0.0003\nCC-MAIN-2020-29,text/csv,93227,93087,0.0030\nCC-MAIN-2020-29,text/directory,15879,15859,0.0005\nCC-MAIN-2020-29,text/enriched,30391,30376,0.0010\nCC-MAIN-2020-29,text/html,3112675142,3083160510,98.9806\nCC-MAIN-2020-29,text/javascript,10540,10538,0.0003\nCC-MAIN-2020-29,text/markdown,1704,1704,0.0001\nCC-MAIN-2020-29,text/pdf,81,81,0.0000\nCC-MAIN-2020-29,text/plain,1527424,1526101,0.0486\nCC-MAIN-2020-29,text/prs.lines.tag,3303,3303,0.0001\nCC-MAIN-2020-29,text/tab-separated-values,16711,16710,0.0005\nCC-MAIN-2020-29,text/turtle,26865,26859,0.0009\nCC-MAIN-2020-29,text/vcard,29210,29167,0.0009\nCC-MAIN-2020-29,text/x-bibtex,8389,8389,0.0003\nCC-MAIN-2020-29,text/x-c,2311,2311,0.0001\nCC-MAIN-2020-29,text/x-csrc,14929,14929,0.0005\nCC-MAIN-2020-29,text/x-diff,5407,5400,0.0002\nCC-MAIN-2020-29,text/x-patch,12172,12163,0.0004\nCC-MAIN-2020-29,text/x-perl,6639,6639,0.0002\nCC-MAIN-2020-29,text/x-vcalendar,23090,23075,0.0007\nCC-MAIN-2020-29,text/x-vcard,65765,65634,0.0021\nCC-MAIN-2020-29,text/xml,2812872,2804197,0.0894\nCC-MAIN-2020-29,unknown/unknown,12030,12030,0.0004\nCC-MAIN-2020-29,video/mp4,34447,34361,0.0011\nCC-MAIN-2020-29,video/webm,2079,2077,0.0001\nCC-MAIN-2020-29,video/x-ms-asf,4839,4834,0.0002\nCC-MAIN-2020-34,<other>,3565330,3560503,0.1455\nCC-MAIN-2020-34,application/atom+xml,3580126,3579429,0.1461\nCC-MAIN-2020-34,application/calendar,7547,7547,0.0003\nCC-MAIN-2020-34,application/download,89464,89433,0.0037\nCC-MAIN-2020-34,application/epub+zip,42016,41958,0.0017\nCC-MAIN-2020-34,application/force-download,205427,205124,0.0084\nCC-MAIN-2020-34,application/gpx+xml,9742,9739,0.0004\nCC-MAIN-2020-34,application/ics,11993,11993,0.0005\nCC-MAIN-2020-34,application/javascript,25729,25724,0.0011\nCC-MAIN-2020-
34,application/json,638399,638050,0.0261\nCC-MAIN-2020-34,application/ld+json,13793,13793,0.0006\nCC-MAIN-2020-34,application/marc,14748,14736,0.0006\nCC-MAIN-2020-34,application/msword,89260,88914,0.0036\nCC-MAIN-2020-34,application/octet-stream,1327046,1324314,0.0542\nCC-MAIN-2020-34,application/octetstream,4695,4683,0.0002\nCC-MAIN-2020-34,application/pdf,3406041,3381634,0.1390\nCC-MAIN-2020-34,application/pgp-encrypted,690,690,0.0000\nCC-MAIN-2020-34,application/pgp-signature,33363,33355,0.0014\nCC-MAIN-2020-34,application/postscript,7465,7465,0.0003\nCC-MAIN-2020-34,application/rdf+xml,99391,99368,0.0041\nCC-MAIN-2020-34,application/rss+xml,2097569,2092917,0.0856\nCC-MAIN-2020-34,application/rtf,34037,33962,0.0014\nCC-MAIN-2020-34,application/save-to-disk,58,58,0.0000\nCC-MAIN-2020-34,application/text,82894,82864,0.0034\nCC-MAIN-2020-34,application/unknown,8776,8775,0.0004\nCC-MAIN-2020-34,application/vnd.android.package-archive,44451,43559,0.0018\nCC-MAIN-2020-34,application/vnd.google-earth.kml+xml,45546,45438,0.0019\nCC-MAIN-2020-34,application/vnd.google-earth.kmz,7649,7647,0.0003\nCC-MAIN-2020-34,application/vnd.ms-excel,65620,65523,0.0027\nCC-MAIN-2020-34,application/vnd.ms-powerpoint,21950,21938,0.0009\nCC-MAIN-2020-34,application/vnd.ms-word,21120,21091,0.0009\nCC-MAIN-2020-34,application/vnd.oasis.opendocument.text,73091,73065,0.0030\nCC-MAIN-2020-34,application/vnd.openxmlformats-officedocument.presentationml.presentation,7405,7378,0.0003\nCC-MAIN-2020-34,application/vnd.openxmlformats-officedocument.spreadsheetml.sheet,40493,40416,0.0017\nCC-MAIN-2020-34,application/vnd.openxmlformats-officedocument.wordprocessingml.document,126246,126065,0.0052\nCC-MAIN-2020-34,application/vnd.wap.xhtml+xml,4263,4150,0.0002\nCC-MAIN-2020-34,application/x-bibtex,72086,72084,0.0029\nCC-MAIN-2020-34,application/x-bittorrent,9721,9533,0.0004\nCC-MAIN-2020-34,application/x-debian-package,4419,4418,0.0002\nCC-MAIN-2020-34,application/x-download,33688,33674,0.0014\nCC-MAIN
-2020-34,application/x-endnote-refer,114654,114628,0.0047\nCC-MAIN-2020-34,application/x-gzip,25655,25638,0.0010\nCC-MAIN-2020-34,application/x-httpd-php,19004,18974,0.0008\nCC-MAIN-2020-34,application/x-java-jnlp-file,10706,10705,0.0004\nCC-MAIN-2020-34,application/x-javascript,13874,13769,0.0006\nCC-MAIN-2020-34,application/x-json,249,249,0.0000\nCC-MAIN-2020-34,application/x-mobipocket-ebook,3874,3874,0.0002\nCC-MAIN-2020-34,application/x-msdownload,10580,10514,0.0004\nCC-MAIN-2020-34,application/x-netcdf,4017,4017,0.0002\nCC-MAIN-2020-34,application/x-research-info-systems,225846,225717,0.0092\nCC-MAIN-2020-34,application/x-shockwave-flash,12340,12287,0.0005\nCC-MAIN-2020-34,application/x-tar,9189,9179,0.0004\nCC-MAIN-2020-34,application/x-tex,3251,3251,0.0001\nCC-MAIN-2020-34,application/x-troff-man,14372,14349,0.0006\nCC-MAIN-2020-34,application/x-zip-compressed,17843,17645,0.0007\nCC-MAIN-2020-34,application/xhtml+xml,1226554,1225012,0.0501\nCC-MAIN-2020-34,application/xml,833761,831818,0.0340\nCC-MAIN-2020-34,application/zip,116856,116318,0.0048\nCC-MAIN-2020-34,audio/mpeg,121102,118922,0.0049\nCC-MAIN-2020-34,audio/x-mpegurl,19091,19025,0.0008\nCC-MAIN-2020-34,audio/x-scpls,3385,3375,0.0001\nCC-MAIN-2020-34,audio/x-wav,4561,4501,0.0002\nCC-MAIN-2020-34,binary/octet-stream,21171,21099,0.0009\nCC-MAIN-2020-34,image/gif,78971,78483,0.0032\nCC-MAIN-2020-34,image/jp2,510,510,0.0000\nCC-MAIN-2020-34,image/jpeg,3575698,3567688,0.1460\nCC-MAIN-2020-34,image/jpg,67889,67445,0.0028\nCC-MAIN-2020-34,image/pjpeg,10132,10130,0.0004\nCC-MAIN-2020-34,image/png,510230,507280,0.0208\nCC-MAIN-2020-34,image/svg+xml,13487,13475,0.0006\nCC-MAIN-2020-34,image/tiff,11628,11615,0.0005\nCC-MAIN-2020-34,image/vnd.djvu,10449,10446,0.0004\nCC-MAIN-2020-34,image/webp,37034,37010,0.0015\nCC-MAIN-2020-34,message/rfc822,12545,12545,0.0005\nCC-MAIN-2020-34,text/calendar,1155932,1154723,0.0472\nCC-MAIN-2020-34,text/css,9190,9172,0.0004\nCC-MAIN-2020-34,text/csv,117429,117412,0.0048\nCC-MAIN
-2020-34,text/directory,9963,9963,0.0004\nCC-MAIN-2020-34,text/enriched,31960,31954,0.0013\nCC-MAIN-2020-34,text/html,2421023660,2400659821,98.8240\nCC-MAIN-2020-34,text/javascript,10384,10380,0.0004\nCC-MAIN-2020-34,text/markdown,1837,1837,0.0001\nCC-MAIN-2020-34,text/pdf,78,78,0.0000\nCC-MAIN-2020-34,text/plain,1606187,1604364,0.0656\nCC-MAIN-2020-34,text/prs.lines.tag,2483,2483,0.0001\nCC-MAIN-2020-34,text/tab-separated-values,22693,22693,0.0009\nCC-MAIN-2020-34,text/turtle,31890,31888,0.0013\nCC-MAIN-2020-34,text/vcard,28755,28714,0.0012\nCC-MAIN-2020-34,text/x-bibtex,11013,10963,0.0004\nCC-MAIN-2020-34,text/x-c,1570,1570,0.0001\nCC-MAIN-2020-34,text/x-csrc,19331,19331,0.0008\nCC-MAIN-2020-34,text/x-diff,9169,9165,0.0004\nCC-MAIN-2020-34,text/x-patch,16454,16453,0.0007\nCC-MAIN-2020-34,text/x-perl,2600,2600,0.0001\nCC-MAIN-2020-34,text/x-vcalendar,20594,20594,0.0008\nCC-MAIN-2020-34,text/x-vcard,67571,67471,0.0028\nCC-MAIN-2020-34,text/xml,2443202,2438276,0.0997\nCC-MAIN-2020-34,unknown/unknown,9775,9772,0.0004\nCC-MAIN-2020-34,video/mp4,37705,37513,0.0015\nCC-MAIN-2020-34,video/webm,2543,2488,0.0001\nCC-MAIN-2020-34,video/x-ms-asf,6416,6384,0.0003\nCC-MAIN-2020-40,<other>,3382210,3376896,0.0974\nCC-MAIN-2020-40,application/atom+xml,2344754,2344000,0.0675\nCC-MAIN-2020-40,application/calendar,6710,6710,0.0002\nCC-MAIN-2020-40,application/download,87633,87614,0.0025\nCC-MAIN-2020-40,application/epub+zip,35464,35424,0.0010\nCC-MAIN-2020-40,application/force-download,170623,170455,0.0049\nCC-MAIN-2020-40,application/gpx+xml,8159,8159,0.0002\nCC-MAIN-2020-40,application/ics,8686,8685,0.0003\nCC-MAIN-2020-40,application/javascript,18693,18689,0.0005\nCC-MAIN-2020-40,application/json,597696,596800,0.0172\nCC-MAIN-2020-40,application/ld+json,11804,11803,0.0003\nCC-MAIN-2020-40,application/marc,12760,12756,0.0004\nCC-MAIN-2020-40,application/msword,96291,96099,0.0028\nCC-MAIN-2020-40,application/octet-stream,1291560,1289549,0.0372\nCC-MAIN-2020-40,application/octetstrea
m,7097,7094,0.0002\nCC-MAIN-2020-40,application/pdf,34531405,34444176,0.9941\nCC-MAIN-2020-40,application/pgp-encrypted,848,847,0.0000\nCC-MAIN-2020-40,application/pgp-signature,32499,32496,0.0009\nCC-MAIN-2020-40,application/postscript,4997,4991,0.0001\nCC-MAIN-2020-40,application/rdf+xml,81389,81366,0.0023\nCC-MAIN-2020-40,application/rss+xml,2076733,2071433,0.0598\nCC-MAIN-2020-40,application/rtf,36922,36828,0.0011\nCC-MAIN-2020-40,application/save-to-disk,245,245,0.0000\nCC-MAIN-2020-40,application/text,70281,70270,0.0020\nCC-MAIN-2020-40,application/unknown,9653,9650,0.0003\nCC-MAIN-2020-40,application/vnd.android.package-archive,29686,29480,0.0009\nCC-MAIN-2020-40,application/vnd.google-earth.kml+xml,45775,45772,0.0013\nCC-MAIN-2020-40,application/vnd.google-earth.kmz,17800,17797,0.0005\nCC-MAIN-2020-40,application/vnd.ms-excel,62523,62450,0.0018\nCC-MAIN-2020-40,application/vnd.ms-powerpoint,26141,26128,0.0008\nCC-MAIN-2020-40,application/vnd.ms-word,17920,17903,0.0005\nCC-MAIN-2020-40,application/vnd.oasis.opendocument.text,57260,57226,0.0016\nCC-MAIN-2020-40,application/vnd.openxmlformats-officedocument.presentationml.presentation,6619,6609,0.0002\nCC-MAIN-2020-40,application/vnd.openxmlformats-officedocument.spreadsheetml.sheet,34955,34869,0.0010\nCC-MAIN-2020-40,application/vnd.openxmlformats-officedocument.wordprocessingml.document,105784,105558,0.0030\nCC-MAIN-2020-40,application/vnd.wap.xhtml+xml,3710,3675,0.0001\nCC-MAIN-2020-40,application/x-bibtex,59553,59537,0.0017\nCC-MAIN-2020-40,application/x-bittorrent,8140,7923,0.0002\nCC-MAIN-2020-40,application/x-debian-package,5078,5064,0.0001\nCC-MAIN-2020-40,application/x-download,38525,38483,0.0011\nCC-MAIN-2020-40,application/x-endnote-refer,97400,97372,0.0028\nCC-MAIN-2020-40,application/x-gzip,25748,25626,0.0007\nCC-MAIN-2020-40,application/x-httpd-php,19014,18947,0.0005\nCC-MAIN-2020-40,application/x-java-jnlp-file,11360,11358,0.0003\nCC-MAIN-2020-40,application/x-javascript,12572,12472,0.0004\nCC-MA
IN-2020-40,application/x-json,288,288,0.0000\nCC-MAIN-2020-40,application/x-mobipocket-ebook,3194,3193,0.0001\nCC-MAIN-2020-40,application/x-msdownload,9166,9115,0.0003\nCC-MAIN-2020-40,application/x-netcdf,10245,10245,0.0003\nCC-MAIN-2020-40,application/x-research-info-systems,207534,207439,0.0060\nCC-MAIN-2020-40,application/x-shockwave-flash,10074,10039,0.0003\nCC-MAIN-2020-40,application/x-tar,8036,8032,0.0002\nCC-MAIN-2020-40,application/x-tex,3095,3095,0.0001\nCC-MAIN-2020-40,application/x-troff-man,14257,14253,0.0004\nCC-MAIN-2020-40,application/x-zip-compressed,16920,16709,0.0005\nCC-MAIN-2020-40,application/xhtml+xml,1253342,1251376,0.0361\nCC-MAIN-2020-40,application/xml,855158,853719,0.0246\nCC-MAIN-2020-40,application/zip,106001,105537,0.0031\nCC-MAIN-2020-40,audio/mpeg,112759,111157,0.0032\nCC-MAIN-2020-40,audio/x-mpegurl,19424,19409,0.0006\nCC-MAIN-2020-40,audio/x-scpls,3090,3069,0.0001\nCC-MAIN-2020-40,audio/x-wav,4731,4707,0.0001\nCC-MAIN-2020-40,binary/octet-stream,22587,22505,0.0007\nCC-MAIN-2020-40,image/gif,104865,104090,0.0030\nCC-MAIN-2020-40,image/jp2,544,544,0.0000\nCC-MAIN-2020-40,image/jpeg,6847784,6821639,0.1971\nCC-MAIN-2020-40,image/jpg,63917,62208,0.0018\nCC-MAIN-2020-40,image/pjpeg,9377,9375,0.0003\nCC-MAIN-2020-40,image/png,1505366,1499681,0.0433\nCC-MAIN-2020-40,image/svg+xml,29019,28974,0.0008\nCC-MAIN-2020-40,image/tiff,13386,13377,0.0004\nCC-MAIN-2020-40,image/vnd.djvu,5348,5327,0.0002\nCC-MAIN-2020-40,image/webp,34430,34423,0.0010\nCC-MAIN-2020-40,message/rfc822,12307,12307,0.0004\nCC-MAIN-2020-40,text/calendar,1068483,1067535,0.0308\nCC-MAIN-2020-40,text/css,9297,9293,0.0003\nCC-MAIN-2020-40,text/csv,104531,104518,0.0030\nCC-MAIN-2020-40,text/directory,12546,12542,0.0004\nCC-MAIN-2020-40,text/enriched,26780,26779,0.0008\nCC-MAIN-2020-40,text/html,3411063542,3384193843,98.2005\nCC-MAIN-2020-40,text/javascript,10246,10242,0.0003\nCC-MAIN-2020-40,text/markdown,1786,1785,0.0001\nCC-MAIN-2020-40,text/pdf,186,186,0.0000\nCC-MAIN-2020-
40,text/plain,1552643,1550269,0.0447\nCC-MAIN-2020-40,text/prs.lines.tag,5331,5331,0.0002\nCC-MAIN-2020-40,text/tab-separated-values,19214,19214,0.0006\nCC-MAIN-2020-40,text/turtle,29097,29094,0.0008\nCC-MAIN-2020-40,text/vcard,26724,26587,0.0008\nCC-MAIN-2020-40,text/x-bibtex,11973,11928,0.0003\nCC-MAIN-2020-40,text/x-c,2245,2244,0.0001\nCC-MAIN-2020-40,text/x-csrc,14269,14269,0.0004\nCC-MAIN-2020-40,text/x-diff,6952,6937,0.0002\nCC-MAIN-2020-40,text/x-patch,16245,16230,0.0005\nCC-MAIN-2020-40,text/x-perl,1859,1859,0.0001\nCC-MAIN-2020-40,text/x-vcalendar,19425,19423,0.0006\nCC-MAIN-2020-40,text/x-vcard,59305,59260,0.0017\nCC-MAIN-2020-40,text/xml,2522646,2517950,0.0726\nCC-MAIN-2020-40,unknown/unknown,11521,11520,0.0003\nCC-MAIN-2020-40,video/mp4,70180,70020,0.0020\nCC-MAIN-2020-40,video/webm,2690,2682,0.0001\nCC-MAIN-2020-40,video/x-ms-asf,4571,4556,0.0001\nCC-MAIN-2020-45,<other>,2532886,2524367,0.0927\nCC-MAIN-2020-45,application/atom+xml,2278471,2278104,0.0834\nCC-MAIN-2020-45,application/calendar,6373,6373,0.0002\nCC-MAIN-2020-45,application/download,83936,83880,0.0031\nCC-MAIN-2020-45,application/epub+zip,42326,42304,0.0015\nCC-MAIN-2020-45,application/force-download,124029,123980,0.0045\nCC-MAIN-2020-45,application/gpx+xml,7657,7655,0.0003\nCC-MAIN-2020-45,application/ics,9563,9563,0.0004\nCC-MAIN-2020-45,application/javascript,10678,10672,0.0004\nCC-MAIN-2020-45,application/json,587771,587155,0.0215\nCC-MAIN-2020-45,application/ld+json,21083,21083,0.0008\nCC-MAIN-2020-45,application/marc,10491,10491,0.0004\nCC-MAIN-2020-45,application/msword,75241,75102,0.0028\nCC-MAIN-2020-45,application/octet-stream,1175091,1173646,0.0430\nCC-MAIN-2020-45,application/octetstream,7936,7934,0.0003\nCC-MAIN-2020-45,application/pdf,22818018,22751468,0.8355\nCC-MAIN-2020-45,application/pgp-encrypted,1071,1071,0.0000\nCC-MAIN-2020-45,application/pgp-signature,34116,34115,0.0012\nCC-MAIN-2020-45,application/postscript,5436,5422,0.0002\nCC-MAIN-2020-45,application/rdf+xml,85488,
85476,0.0031\nCC-MAIN-2020-45,application/rss+xml,1880250,1877952,0.0688\nCC-MAIN-2020-45,application/rtf,34231,34217,0.0013\nCC-MAIN-2020-45,application/save-to-disk,650,650,0.0000\nCC-MAIN-2020-45,application/text,75033,75031,0.0027\nCC-MAIN-2020-45,application/unknown,7714,7714,0.0003\nCC-MAIN-2020-45,application/vnd.android.package-archive,16727,16634,0.0006\nCC-MAIN-2020-45,application/vnd.google-earth.kml+xml,38975,38975,0.0014\nCC-MAIN-2020-45,application/vnd.google-earth.kmz,7302,7302,0.0003\nCC-MAIN-2020-45,application/vnd.ms-excel,56151,56078,0.0021\nCC-MAIN-2020-45,application/vnd.ms-powerpoint,27853,27835,0.0010\nCC-MAIN-2020-45,application/vnd.ms-word,15074,15071,0.0006\nCC-MAIN-2020-45,application/vnd.oasis.opendocument.text,30750,30673,0.0011\nCC-MAIN-2020-45,application/vnd.openxmlformats-officedocument.presentationml.presentation,6997,6981,0.0003\nCC-MAIN-2020-45,application/vnd.openxmlformats-officedocument.spreadsheetml.sheet,34689,34621,0.0013\nCC-MAIN-2020-45,application/vnd.openxmlformats-officedocument.wordprocessingml.document,72398,72237,0.0027\nCC-MAIN-2020-45,application/vnd.wap.xhtml+xml,2508,2487,0.0001\nCC-MAIN-2020-45,application/x-bibtex,64561,64557,0.0024\nCC-MAIN-2020-45,application/x-bittorrent,5953,5711,0.0002\nCC-MAIN-2020-45,application/x-debian-package,2462,2462,0.0001\nCC-MAIN-2020-45,application/x-download,37418,37101,0.0014\nCC-MAIN-2020-45,application/x-endnote-refer,112447,112440,0.0041\nCC-MAIN-2020-45,application/x-gzip,31438,31358,0.0012\nCC-MAIN-2020-45,application/x-httpd-php,22568,22534,0.0008\nCC-MAIN-2020-45,application/x-java-jnlp-file,5443,5440,0.0002\nCC-MAIN-2020-45,application/x-javascript,10217,10117,0.0004\nCC-MAIN-2020-45,application/x-json,137,137,0.0000\nCC-MAIN-2020-45,application/x-mobipocket-ebook,6568,6567,0.0002\nCC-MAIN-2020-45,application/x-msdownload,13081,12719,0.0005\nCC-MAIN-2020-45,application/x-netcdf,3869,3869,0.0001\nCC-MAIN-2020-45,application/x-research-info-systems,212738,212709,0.0078\n
CC-MAIN-2020-45,application/x-shockwave-flash,11705,11655,0.0004\nCC-MAIN-2020-45,application/x-tar,7248,7229,0.0003\nCC-MAIN-2020-45,application/x-tex,2712,2712,0.0001\nCC-MAIN-2020-45,application/x-troff-man,8899,8829,0.0003\nCC-MAIN-2020-45,application/x-zip-compressed,22185,22027,0.0008\nCC-MAIN-2020-45,application/xhtml+xml,1426415,1420105,0.0522\nCC-MAIN-2020-45,application/xml,810367,809553,0.0297\nCC-MAIN-2020-45,application/zip,119795,118200,0.0044\nCC-MAIN-2020-45,audio/mpeg,138160,135535,0.0051\nCC-MAIN-2020-45,audio/x-mpegurl,14663,14638,0.0005\nCC-MAIN-2020-45,audio/x-scpls,2996,2977,0.0001\nCC-MAIN-2020-45,audio/x-wav,5195,5120,0.0002\nCC-MAIN-2020-45,binary/octet-stream,21024,20933,0.0008\nCC-MAIN-2020-45,image/gif,92782,92148,0.0034\nCC-MAIN-2020-45,image/jp2,1200,1200,0.0000\nCC-MAIN-2020-45,image/jpeg,5414807,5394639,0.1983\nCC-MAIN-2020-45,image/jpg,81528,80474,0.0030\nCC-MAIN-2020-45,image/pjpeg,13916,13914,0.0005\nCC-MAIN-2020-45,image/png,970390,965870,0.0355\nCC-MAIN-2020-45,image/svg+xml,19898,19814,0.0007\nCC-MAIN-2020-45,image/tiff,14711,14699,0.0005\nCC-MAIN-2020-45,image/vnd.djvu,5516,5516,0.0002\nCC-MAIN-2020-45,image/webp,3380,3379,0.0001\nCC-MAIN-2020-45,message/rfc822,11427,11422,0.0004\nCC-MAIN-2020-45,text/calendar,874945,874642,0.0320\nCC-MAIN-2020-45,text/css,9528,9466,0.0003\nCC-MAIN-2020-45,text/csv,97642,97640,0.0036\nCC-MAIN-2020-45,text/directory,10377,10376,0.0004\nCC-MAIN-2020-45,text/enriched,29437,29437,0.0011\nCC-MAIN-2020-45,text/html,2683965967,2662859453,98.2755\nCC-MAIN-2020-45,text/javascript,11155,11151,0.0004\nCC-MAIN-2020-45,text/markdown,1672,1672,0.0001\nCC-MAIN-2020-45,text/pdf,153,153,0.0000\nCC-MAIN-2020-45,text/plain,1438572,1437598,0.0527\nCC-MAIN-2020-45,text/prs.lines.tag,7497,7497,0.0003\nCC-MAIN-2020-45,text/tab-separated-values,15986,15986,0.0006\nCC-MAIN-2020-45,text/turtle,29594,29594,0.0011\nCC-MAIN-2020-45,text/vcard,23481,23476,0.0009\nCC-MAIN-2020-45,text/x-bibtex,10252,10131,0.0004\nCC-MAIN-202
0-45,text/x-c,2188,2187,0.0001\nCC-MAIN-2020-45,text/x-csrc,23443,23443,0.0009\nCC-MAIN-2020-45,text/x-diff,7848,7848,0.0003\nCC-MAIN-2020-45,text/x-patch,12852,12849,0.0005\nCC-MAIN-2020-45,text/x-perl,1974,1974,0.0001\nCC-MAIN-2020-45,text/x-vcalendar,17845,17844,0.0007\nCC-MAIN-2020-45,text/x-vcard,56767,56733,0.0021\nCC-MAIN-2020-45,text/xml,2366646,2362320,0.0867\nCC-MAIN-2020-45,unknown/unknown,13646,13645,0.0005\nCC-MAIN-2020-45,video/mp4,52723,52630,0.0019\nCC-MAIN-2020-45,video/webm,2743,2737,0.0001\nCC-MAIN-2020-45,video/x-ms-asf,3528,3489,0.0001\nCC-MAIN-2020-50,<other>,2289930,2280616,0.0867\nCC-MAIN-2020-50,application/atom+xml,1523121,1522698,0.0576\nCC-MAIN-2020-50,application/calendar,7764,7764,0.0003\nCC-MAIN-2020-50,application/download,73099,73034,0.0028\nCC-MAIN-2020-50,application/epub+zip,43745,43711,0.0017\nCC-MAIN-2020-50,application/force-download,105063,105035,0.0040\nCC-MAIN-2020-50,application/gpx+xml,7139,7135,0.0003\nCC-MAIN-2020-50,application/ics,9678,9678,0.0004\nCC-MAIN-2020-50,application/javascript,8353,8345,0.0003\nCC-MAIN-2020-50,application/json,564730,564300,0.0214\nCC-MAIN-2020-50,application/ld+json,19057,19057,0.0007\nCC-MAIN-2020-50,application/marc,14322,14322,0.0005\nCC-MAIN-2020-50,application/msword,64531,64420,0.0024\nCC-MAIN-2020-50,application/octet-stream,1052384,1051072,0.0398\nCC-MAIN-2020-50,application/octetstream,7932,7931,0.0003\nCC-MAIN-2020-50,application/pdf,17905640,17854466,0.6776\nCC-MAIN-2020-50,application/pgp-encrypted,1179,1179,0.0000\nCC-MAIN-2020-50,application/pgp-signature,26580,26580,0.0010\nCC-MAIN-2020-50,application/postscript,4378,4375,0.0002\nCC-MAIN-2020-50,application/rdf+xml,85765,85752,0.0032\nCC-MAIN-2020-50,application/rss+xml,1607517,1604883,0.0608\nCC-MAIN-2020-50,application/rtf,30710,30703,0.0012\nCC-MAIN-2020-50,application/save-to-disk,60,60,0.0000\nCC-MAIN-2020-50,application/text,70506,70500,0.0027\nCC-MAIN-2020-50,application/unknown,7197,7197,0.0003\nCC-MAIN-2020-50,applica
tion/vnd.android.package-archive,18392,18278,0.0007\nCC-MAIN-2020-50,application/vnd.google-earth.kml+xml,55719,55715,0.0021\nCC-MAIN-2020-50,application/vnd.google-earth.kmz,7708,7706,0.0003\nCC-MAIN-2020-50,application/vnd.ms-excel,56243,56146,0.0021\nCC-MAIN-2020-50,application/vnd.ms-powerpoint,26859,26854,0.0010\nCC-MAIN-2020-50,application/vnd.ms-word,13469,13469,0.0005\nCC-MAIN-2020-50,application/vnd.oasis.opendocument.text,23675,23672,0.0009\nCC-MAIN-2020-50,application/vnd.openxmlformats-officedocument.presentationml.presentation,5807,5635,0.0002\nCC-MAIN-2020-50,application/vnd.openxmlformats-officedocument.spreadsheetml.sheet,32505,32481,0.0012\nCC-MAIN-2020-50,application/vnd.openxmlformats-officedocument.wordprocessingml.document,60325,60041,0.0023\nCC-MAIN-2020-50,application/vnd.wap.xhtml+xml,2112,2048,0.0001\nCC-MAIN-2020-50,application/x-bibtex,60831,60821,0.0023\nCC-MAIN-2020-50,application/x-bittorrent,6519,6336,0.0002\nCC-MAIN-2020-50,application/x-debian-package,1286,1286,0.0000\nCC-MAIN-2020-50,application/x-download,32571,31806,0.0012\nCC-MAIN-2020-50,application/x-endnote-refer,104305,104291,0.0039\nCC-MAIN-2020-50,application/x-gzip,27921,27912,0.0011\nCC-MAIN-2020-50,application/x-httpd-php,13806,13781,0.0005\nCC-MAIN-2020-50,application/x-java-jnlp-file,8469,8468,0.0003\nCC-MAIN-2020-50,application/x-javascript,6816,6717,0.0003\nCC-MAIN-2020-50,application/x-json,46,46,0.0000\nCC-MAIN-2020-50,application/x-mobipocket-ebook,3820,3819,0.0001\nCC-MAIN-2020-50,application/x-msdownload,12315,12248,0.0005\nCC-MAIN-2020-50,application/x-netcdf,2300,2300,0.0001\nCC-MAIN-2020-50,application/x-research-info-systems,200436,200411,0.0076\nCC-MAIN-2020-50,application/x-shockwave-flash,8829,8806,0.0003\nCC-MAIN-2020-50,application/x-tar,7566,7558,0.0003\nCC-MAIN-2020-50,application/x-tex,2345,2345,0.0001\nCC-MAIN-2020-50,application/x-troff-man,12410,12407,0.0005\nCC-MAIN-2020-50,application/x-zip-compressed,20159,20063,0.0008\nCC-MAIN-2020-50,applicat
ion/xhtml+xml,1452760,1450526,0.0550\nCC-MAIN-2020-50,application/xml,781248,780400,0.0296\nCC-MAIN-2020-50,application/zip,117063,116538,0.0044\nCC-MAIN-2020-50,audio/mpeg,115813,113588,0.0044\nCC-MAIN-2020-50,audio/x-mpegurl,14349,14344,0.0005\nCC-MAIN-2020-50,audio/x-scpls,2684,2678,0.0001\nCC-MAIN-2020-50,audio/x-wav,3381,3371,0.0001\nCC-MAIN-2020-50,binary/octet-stream,18737,18622,0.0007\nCC-MAIN-2020-50,image/gif,78204,77619,0.0030\nCC-MAIN-2020-50,image/jp2,842,842,0.0000\nCC-MAIN-2020-50,image/jpeg,4201153,4181984,0.1590\nCC-MAIN-2020-50,image/jpg,72534,71073,0.0027\nCC-MAIN-2020-50,image/pjpeg,15655,15654,0.0006\nCC-MAIN-2020-50,image/png,744965,739813,0.0282\nCC-MAIN-2020-50,image/svg+xml,17906,17837,0.0007\nCC-MAIN-2020-50,image/tiff,13749,13738,0.0005\nCC-MAIN-2020-50,image/vnd.djvu,6705,6703,0.0003\nCC-MAIN-2020-50,image/webp,2585,2583,0.0001\nCC-MAIN-2020-50,message/rfc822,10155,10154,0.0004\nCC-MAIN-2020-50,text/calendar,701945,701747,0.0266\nCC-MAIN-2020-50,text/css,9781,9654,0.0004\nCC-MAIN-2020-50,text/csv,108637,108626,0.0041\nCC-MAIN-2020-50,text/directory,6957,6957,0.0003\nCC-MAIN-2020-50,text/enriched,25589,25585,0.0010\nCC-MAIN-2020-50,text/html,2603929576,2584592781,98.5414\nCC-MAIN-2020-50,text/javascript,12034,12025,0.0005\nCC-MAIN-2020-50,text/markdown,2369,2369,0.0001\nCC-MAIN-2020-50,text/pdf,100,100,0.0000\nCC-MAIN-2020-50,text/plain,1372013,1371337,0.0519\nCC-MAIN-2020-50,text/prs.lines.tag,5414,5414,0.0002\nCC-MAIN-2020-50,text/tab-separated-values,15264,15264,0.0006\nCC-MAIN-2020-50,text/turtle,32225,32224,0.0012\nCC-MAIN-2020-50,text/vcard,24122,24119,0.0009\nCC-MAIN-2020-50,text/x-bibtex,11226,11224,0.0004\nCC-MAIN-2020-50,text/x-c,3753,3751,0.0001\nCC-MAIN-2020-50,text/x-csrc,28401,28401,0.0011\nCC-MAIN-2020-50,text/x-diff,6532,6531,0.0002\nCC-MAIN-2020-50,text/x-patch,13905,13902,0.0005\nCC-MAIN-2020-50,text/x-perl,1618,1618,0.0001\nCC-MAIN-2020-50,text/x-vcalendar,15664,15664,0.0006\nCC-MAIN-2020-50,text/x-vcard,47432,47310,0.00
18\nCC-MAIN-2020-50,text/xml,1995858,1992626,0.0755\nCC-MAIN-2020-50,unknown/unknown,13213,13211,0.0005\nCC-MAIN-2020-50,video/mp4,45922,45807,0.0017\nCC-MAIN-2020-50,video/webm,2622,2609,0.0001\nCC-MAIN-2020-50,video/x-ms-asf,2897,2879,0.0001\nCC-MAIN-2021-04,<other>,2662664,2656369,0.0783\nCC-MAIN-2021-04,application/atom+xml,2133151,2132549,0.0627\nCC-MAIN-2021-04,application/calendar,6932,6932,0.0002\nCC-MAIN-2021-04,application/download,74811,74772,0.0022\nCC-MAIN-2021-04,application/epub+zip,40704,40650,0.0012\nCC-MAIN-2021-04,application/force-download,115874,115838,0.0034\nCC-MAIN-2021-04,application/gpx+xml,8332,8332,0.0002\nCC-MAIN-2021-04,application/ics,12131,12128,0.0004\nCC-MAIN-2021-04,application/javascript,9745,9739,0.0003\nCC-MAIN-2021-04,application/json,608751,608459,0.0179\nCC-MAIN-2021-04,application/ld+json,23121,23121,0.0007\nCC-MAIN-2021-04,application/marc,12997,12997,0.0004\nCC-MAIN-2021-04,application/msword,65579,65416,0.0019\nCC-MAIN-2021-04,application/octet-stream,1108215,1106937,0.0326\nCC-MAIN-2021-04,application/octetstream,6637,6632,0.0002\nCC-MAIN-2021-04,application/pdf,26434840,26371530,0.7772\nCC-MAIN-2021-04,application/pgp-encrypted,1570,1570,0.0000\nCC-MAIN-2021-04,application/pgp-signature,39969,39968,0.0012\nCC-MAIN-2021-04,application/postscript,5461,5461,0.0002\nCC-MAIN-2021-04,application/rdf+xml,86709,86695,0.0025\nCC-MAIN-2021-04,application/rss+xml,1919632,1915378,0.0564\nCC-MAIN-2021-04,application/rtf,33320,33280,0.0010\nCC-MAIN-2021-04,application/save-to-disk,9,9,0.0000\nCC-MAIN-2021-04,application/text,70436,70431,0.0021\nCC-MAIN-2021-04,application/unknown,10400,10399,0.0003\nCC-MAIN-2021-04,application/vnd.android.package-archive,17707,17524,0.0005\nCC-MAIN-2021-04,application/vnd.google-earth.kml+xml,39801,39788,0.0012\nCC-MAIN-2021-04,application/vnd.google-earth.kmz,7176,7176,0.0002\nCC-MAIN-2021-04,application/vnd.ms-excel,61266,61154,0.0018\nCC-MAIN-2021-04,application/vnd.ms-powerpoint,25350,25321,0.000
7\nCC-MAIN-2021-04,application/vnd.ms-word,15507,15505,0.0005\nCC-MAIN-2021-04,application/vnd.oasis.opendocument.text,21174,21155,0.0006\nCC-MAIN-2021-04,application/vnd.openxmlformats-officedocument.presentationml.presentation,5867,5860,0.0002\nCC-MAIN-2021-04,application/vnd.openxmlformats-officedocument.spreadsheetml.sheet,36963,36916,0.0011\nCC-MAIN-2021-04,application/vnd.openxmlformats-officedocument.wordprocessingml.document,63642,63372,0.0019\nCC-MAIN-2021-04,application/vnd.wap.xhtml+xml,2399,2334,0.0001\nCC-MAIN-2021-04,application/x-bibtex,60262,60252,0.0018\nCC-MAIN-2021-04,application/x-bittorrent,6056,5848,0.0002\nCC-MAIN-2021-04,application/x-debian-package,3100,3100,0.0001\nCC-MAIN-2021-04,application/x-download,38922,38372,0.0011\nCC-MAIN-2021-04,application/x-endnote-refer,106562,106556,0.0031\nCC-MAIN-2021-04,application/x-gzip,23171,23168,0.0007\nCC-MAIN-2021-04,application/x-httpd-php,11595,11543,0.0003\nCC-MAIN-2021-04,application/x-java-jnlp-file,9976,9975,0.0003\nCC-MAIN-2021-04,application/x-javascript,16918,16838,0.0005\nCC-MAIN-2021-04,application/x-json,232,232,0.0000\nCC-MAIN-2021-04,application/x-mobipocket-ebook,5240,5238,0.0002\nCC-MAIN-2021-04,application/x-msdownload,7586,7531,0.0002\nCC-MAIN-2021-04,application/x-netcdf,2448,2448,0.0001\nCC-MAIN-2021-04,application/x-research-info-systems,194124,194109,0.0057\nCC-MAIN-2021-04,application/x-shockwave-flash,7633,7594,0.0002\nCC-MAIN-2021-04,application/x-tar,7798,7782,0.0002\nCC-MAIN-2021-04,application/x-tex,2461,2461,0.0001\nCC-MAIN-2021-04,application/x-troff-man,9876,9871,0.0003\nCC-MAIN-2021-04,application/x-zip-compressed,18446,18330,0.0005\nCC-MAIN-2021-04,application/xhtml+xml,1459891,1457513,0.0429\nCC-MAIN-2021-04,application/xml,888496,887412,0.0261\nCC-MAIN-2021-04,application/zip,111856,111304,0.0033\nCC-MAIN-2021-04,audio/mpeg,133900,130121,0.0039\nCC-MAIN-2021-04,audio/x-mpegurl,26436,26423,0.0008\nCC-MAIN-2021-04,audio/x-scpls,3925,3919,0.0001\nCC-MAIN-2021-04,audio/
x-wav,3620,3575,0.0001\nCC-MAIN-2021-04,binary/octet-stream,16468,16361,0.0005\nCC-MAIN-2021-04,image/gif,179319,178897,0.0053\nCC-MAIN-2021-04,image/jp2,482,482,0.0000\nCC-MAIN-2021-04,image/jpeg,4556908,4540673,0.1340\nCC-MAIN-2021-04,image/jpg,62453,61977,0.0018\nCC-MAIN-2021-04,image/pjpeg,10004,10003,0.0003\nCC-MAIN-2021-04,image/png,856735,852237,0.0252\nCC-MAIN-2021-04,image/svg+xml,18410,18208,0.0005\nCC-MAIN-2021-04,image/tiff,12703,12697,0.0004\nCC-MAIN-2021-04,image/vnd.djvu,6895,6890,0.0002\nCC-MAIN-2021-04,image/webp,5953,5949,0.0002\nCC-MAIN-2021-04,message/rfc822,10808,10807,0.0003\nCC-MAIN-2021-04,text/calendar,800378,799841,0.0235\nCC-MAIN-2021-04,text/css,9136,9096,0.0003\nCC-MAIN-2021-04,text/csv,114175,114164,0.0034\nCC-MAIN-2021-04,text/directory,10671,10667,0.0003\nCC-MAIN-2021-04,text/enriched,25692,25689,0.0008\nCC-MAIN-2021-04,text/html,3351540618,3324638709,98.5374\nCC-MAIN-2021-04,text/javascript,11868,11854,0.0003\nCC-MAIN-2021-04,text/markdown,2334,2332,0.0001\nCC-MAIN-2021-04,text/pdf,171,171,0.0000\nCC-MAIN-2021-04,text/plain,1456865,1456139,0.0428\nCC-MAIN-2021-04,text/prs.lines.tag,5948,5948,0.0002\nCC-MAIN-2021-04,text/tab-separated-values,13231,13231,0.0004\nCC-MAIN-2021-04,text/turtle,32615,32615,0.0010\nCC-MAIN-2021-04,text/vcard,28397,28357,0.0008\nCC-MAIN-2021-04,text/x-bibtex,9415,9412,0.0003\nCC-MAIN-2021-04,text/x-c,2069,2066,0.0001\nCC-MAIN-2021-04,text/x-csrc,22821,22821,0.0007\nCC-MAIN-2021-04,text/x-diff,4783,4779,0.0001\nCC-MAIN-2021-04,text/x-patch,16905,16902,0.0005\nCC-MAIN-2021-04,text/x-perl,2628,2628,0.0001\nCC-MAIN-2021-04,text/x-vcalendar,15559,15555,0.0005\nCC-MAIN-2021-04,text/x-vcard,55638,55581,0.0016\nCC-MAIN-2021-04,text/xml,2341852,2335974,0.0689\nCC-MAIN-2021-04,unknown/unknown,14224,14222,0.0004\nCC-MAIN-2021-04,video/mp4,55531,55298,0.0016\nCC-MAIN-2021-04,video/webm,2534,2527,0.0001\nCC-MAIN-2021-04,video/x-ms-asf,3839,3831,0.0001\nCC-MAIN-2021-10,<other>,1964343,1960494,0.0718\nCC-MAIN-2021-10,applic
ation/atom+xml,2093029,2092352,0.0765\nCC-MAIN-2021-10,application/calendar,7422,7419,0.0003\nCC-MAIN-2021-10,application/download,76844,76831,0.0028\nCC-MAIN-2021-10,application/epub+zip,37933,37914,0.0014\nCC-MAIN-2021-10,application/force-download,107542,107520,0.0039\nCC-MAIN-2021-10,application/gpx+xml,9167,9167,0.0003\nCC-MAIN-2021-10,application/ics,11668,11668,0.0004\nCC-MAIN-2021-10,application/javascript,11026,11019,0.0004\nCC-MAIN-2021-10,application/json,486183,486007,0.0178\nCC-MAIN-2021-10,application/ld+json,19832,19832,0.0007\nCC-MAIN-2021-10,application/marc,9886,9886,0.0004\nCC-MAIN-2021-10,application/msword,71670,71292,0.0026\nCC-MAIN-2021-10,application/octet-stream,998894,997406,0.0365\nCC-MAIN-2021-10,application/octetstream,5866,5860,0.0002\nCC-MAIN-2021-10,application/pdf,15908062,15862598,0.5813\nCC-MAIN-2021-10,application/pgp-encrypted,1268,1268,0.0000\nCC-MAIN-2021-10,application/pgp-signature,20173,20171,0.0007\nCC-MAIN-2021-10,application/postscript,4345,4341,0.0002\nCC-MAIN-2021-10,application/rdf+xml,75199,75190,0.0027\nCC-MAIN-2021-10,application/rss+xml,1755397,1753412,0.0641\nCC-MAIN-2021-10,application/rtf,36822,36810,0.0013\nCC-MAIN-2021-10,application/save-to-disk,44,44,0.0000\nCC-MAIN-2021-10,application/text,65121,65121,0.0024\nCC-MAIN-2021-10,application/unknown,8032,8031,0.0003\nCC-MAIN-2021-10,application/vnd.android.package-archive,14335,14237,0.0005\nCC-MAIN-2021-10,application/vnd.google-earth.kml+xml,30270,30257,0.0011\nCC-MAIN-2021-10,application/vnd.google-earth.kmz,5123,5119,0.0002\nCC-MAIN-2021-10,application/vnd.ms-excel,63463,63385,0.0023\nCC-MAIN-2021-10,application/vnd.ms-powerpoint,26105,26086,0.0010\nCC-MAIN-2021-10,application/vnd.ms-word,13935,13935,0.0005\nCC-MAIN-2021-10,application/vnd.oasis.opendocument.text,23725,23696,0.0009\nCC-MAIN-2021-10,application/vnd.openxmlformats-officedocument.presentationml.presentation,6644,6625,0.0002\nCC-MAIN-2021-10,application/vnd.openxmlformats-officedocument.spreadsh
eetml.sheet,32583,32536,0.0012\nCC-MAIN-2021-10,application/vnd.openxmlformats-officedocument.wordprocessingml.document,70277,69292,0.0026\nCC-MAIN-2021-10,application/vnd.wap.xhtml+xml,2724,2648,0.0001\nCC-MAIN-2021-10,application/x-bibtex,54309,54308,0.0020\nCC-MAIN-2021-10,application/x-bittorrent,5493,5285,0.0002\nCC-MAIN-2021-10,application/x-debian-package,1229,1227,0.0000\nCC-MAIN-2021-10,application/x-download,35644,34920,0.0013\nCC-MAIN-2021-10,application/x-endnote-refer,95265,95265,0.0035\nCC-MAIN-2021-10,application/x-gzip,25300,25289,0.0009\nCC-MAIN-2021-10,application/x-httpd-php,14223,14161,0.0005\nCC-MAIN-2021-10,application/x-java-jnlp-file,7011,7009,0.0003\nCC-MAIN-2021-10,application/x-javascript,10762,10689,0.0004\nCC-MAIN-2021-10,application/x-json,19,19,0.0000\nCC-MAIN-2021-10,application/x-mobipocket-ebook,4819,4814,0.0002\nCC-MAIN-2021-10,application/x-msdownload,8288,8240,0.0003\nCC-MAIN-2021-10,application/x-netcdf,2368,2368,0.0001\nCC-MAIN-2021-10,application/x-research-info-systems,181455,181433,0.0066\nCC-MAIN-2021-10,application/x-shockwave-flash,9225,9197,0.0003\nCC-MAIN-2021-10,application/x-tar,8771,8765,0.0003\nCC-MAIN-2021-10,application/x-tex,3555,3555,0.0001\nCC-MAIN-2021-10,application/x-troff-man,7374,7372,0.0003\nCC-MAIN-2021-10,application/x-zip-compressed,20927,20782,0.0008\nCC-MAIN-2021-10,application/xhtml+xml,1367485,1365313,0.0500\nCC-MAIN-2021-10,application/xml,859554,858849,0.0314\nCC-MAIN-2021-10,application/zip,120099,119294,0.0044\nCC-MAIN-2021-10,audio/mpeg,106821,104560,0.0039\nCC-MAIN-2021-10,audio/x-mpegurl,17673,17661,0.0006\nCC-MAIN-2021-10,audio/x-scpls,3034,3023,0.0001\nCC-MAIN-2021-10,audio/x-wav,3121,3117,0.0001\nCC-MAIN-2021-10,binary/octet-stream,19607,19180,0.0007\nCC-MAIN-2021-10,image/gif,124628,124255,0.0046\nCC-MAIN-2021-10,image/jp2,578,578,0.0000\nCC-MAIN-2021-10,image/jpeg,3471008,3460985,0.1268\nCC-MAIN-2021-10,image/jpg,67108,66585,0.0025\nCC-MAIN-2021-10,image/pjpeg,10612,10610,0.0004\nCC-MAI
N-2021-10,image/png,582392,579951,0.0213\nCC-MAIN-2021-10,image/svg+xml,14151,14133,0.0005\nCC-MAIN-2021-10,image/tiff,10395,10390,0.0004\nCC-MAIN-2021-10,image/vnd.djvu,16267,16266,0.0006\nCC-MAIN-2021-10,image/webp,4369,4364,0.0002\nCC-MAIN-2021-10,message/rfc822,12250,12250,0.0004\nCC-MAIN-2021-10,text/calendar,752144,751993,0.0275\nCC-MAIN-2021-10,text/css,6895,6894,0.0003\nCC-MAIN-2021-10,text/csv,103940,103933,0.0038\nCC-MAIN-2021-10,text/directory,8257,8257,0.0003\nCC-MAIN-2021-10,text/enriched,26557,26557,0.0010\nCC-MAIN-2021-10,text/html,2700846285,2681749723,98.6881\nCC-MAIN-2021-10,text/javascript,9517,9514,0.0003\nCC-MAIN-2021-10,text/markdown,2977,2977,0.0001\nCC-MAIN-2021-10,text/pdf,63,63,0.0000\nCC-MAIN-2021-10,text/plain,1368400,1367789,0.0500\nCC-MAIN-2021-10,text/prs.lines.tag,2423,2423,0.0001\nCC-MAIN-2021-10,text/tab-separated-values,14389,14389,0.0005\nCC-MAIN-2021-10,text/turtle,29219,29219,0.0011\nCC-MAIN-2021-10,text/vcard,25300,25292,0.0009\nCC-MAIN-2021-10,text/x-bibtex,11572,11535,0.0004\nCC-MAIN-2021-10,text/x-c,1500,1500,0.0001\nCC-MAIN-2021-10,text/x-csrc,20614,20614,0.0008\nCC-MAIN-2021-10,text/x-diff,4638,4638,0.0002\nCC-MAIN-2021-10,text/x-patch,12660,12660,0.0005\nCC-MAIN-2021-10,text/x-perl,2129,2129,0.0001\nCC-MAIN-2021-10,text/x-vcalendar,17111,17111,0.0006\nCC-MAIN-2021-10,text/x-vcard,52857,52763,0.0019\nCC-MAIN-2021-10,text/xml,1982252,1979179,0.0724\nCC-MAIN-2021-10,unknown/unknown,12131,12127,0.0004\nCC-MAIN-2021-10,video/mp4,47319,47181,0.0017\nCC-MAIN-2021-10,video/webm,2926,2920,0.0001\nCC-MAIN-2021-10,video/x-ms-asf,3667,3662,0.0001\nCC-MAIN-2021-17,<other>,2022426,2018694,0.0645\nCC-MAIN-2021-17,application/atom+xml,2200843,2200451,0.0702\nCC-MAIN-2021-17,application/calendar,6704,6702,0.0002\nCC-MAIN-2021-17,application/download,79698,79694,0.0025\nCC-MAIN-2021-17,application/epub+zip,39301,39236,0.0013\nCC-MAIN-2021-17,application/force-download,123578,123540,0.0039\nCC-MAIN-2021-17,application/gpx+xml,13574,13572,0.
0004\nCC-MAIN-2021-17,application/ics,12925,12925,0.0004\nCC-MAIN-2021-17,application/javascript,10279,10275,0.0003\nCC-MAIN-2021-17,application/json,514967,514817,0.0164\nCC-MAIN-2021-17,application/ld+json,20661,20661,0.0007\nCC-MAIN-2021-17,application/marc,12993,12993,0.0004\nCC-MAIN-2021-17,application/msword,81808,81697,0.0026\nCC-MAIN-2021-17,application/octet-stream,1133879,1132540,0.0362\nCC-MAIN-2021-17,application/octetstream,5794,5792,0.0002\nCC-MAIN-2021-17,application/pdf,14343981,14305181,0.4576\nCC-MAIN-2021-17,application/pgp-encrypted,856,856,0.0000\nCC-MAIN-2021-17,application/pgp-signature,24378,24376,0.0008\nCC-MAIN-2021-17,application/postscript,4451,4449,0.0001\nCC-MAIN-2021-17,application/rdf+xml,82825,82820,0.0026\nCC-MAIN-2021-17,application/rss+xml,1959403,1956884,0.0625\nCC-MAIN-2021-17,application/rtf,31942,31936,0.0010\nCC-MAIN-2021-17,application/save-to-disk,97,97,0.0000\nCC-MAIN-2021-17,application/text,65366,65366,0.0021\nCC-MAIN-2021-17,application/unknown,8638,8638,0.0003\nCC-MAIN-2021-17,application/vnd.android.package-archive,16427,16342,0.0005\nCC-MAIN-2021-17,application/vnd.google-earth.kml+xml,35986,35981,0.0011\nCC-MAIN-2021-17,application/vnd.google-earth.kmz,9560,9558,0.0003\nCC-MAIN-2021-17,application/vnd.ms-excel,64566,64507,0.0021\nCC-MAIN-2021-17,application/vnd.ms-powerpoint,28910,28899,0.0009\nCC-MAIN-2021-17,application/vnd.ms-word,11657,11657,0.0004\nCC-MAIN-2021-17,application/vnd.oasis.opendocument.text,26229,26221,0.0008\nCC-MAIN-2021-17,application/vnd.openxmlformats-officedocument.presentationml.presentation,6950,6933,0.0002\nCC-MAIN-2021-17,application/vnd.openxmlformats-officedocument.spreadsheetml.sheet,33642,33595,0.0011\nCC-MAIN-2021-17,application/vnd.openxmlformats-officedocument.wordprocessingml.document,72387,72154,0.0023\nCC-MAIN-2021-17,application/vnd.wap.xhtml+xml,2386,2364,0.0001\nCC-MAIN-2021-17,application/x-bibtex,69061,69056,0.0022\nCC-MAIN-2021-17,application/x-bittorrent,5935,5716,0.0002\
nCC-MAIN-2021-17,application/x-debian-package,2223,2222,0.0001\nCC-MAIN-2021-17,application/x-download,42615,41288,0.0014\nCC-MAIN-2021-17,application/x-endnote-refer,98522,98522,0.0031\nCC-MAIN-2021-17,application/x-gzip,24103,24064,0.0008\nCC-MAIN-2021-17,application/x-httpd-php,10451,10375,0.0003\nCC-MAIN-2021-17,application/x-java-jnlp-file,5289,5288,0.0002\nCC-MAIN-2021-17,application/x-javascript,11534,11433,0.0004\nCC-MAIN-2021-17,application/x-json,137,137,0.0000\nCC-MAIN-2021-17,application/x-mobipocket-ebook,6788,6788,0.0002\nCC-MAIN-2021-17,application/x-msdownload,9854,9779,0.0003\nCC-MAIN-2021-17,application/x-netcdf,20391,20391,0.0007\nCC-MAIN-2021-17,application/x-research-info-systems,186766,186735,0.0060\nCC-MAIN-2021-17,application/x-shockwave-flash,10018,9983,0.0003\nCC-MAIN-2021-17,application/x-tar,10338,10332,0.0003\nCC-MAIN-2021-17,application/x-tex,2878,2878,0.0001\nCC-MAIN-2021-17,application/x-troff-man,6892,6890,0.0002\nCC-MAIN-2021-17,application/x-zip-compressed,17268,17146,0.0006\nCC-MAIN-2021-17,application/xhtml+xml,1469387,1467237,0.0469\nCC-MAIN-2021-17,application/xml,884856,883417,0.0282\nCC-MAIN-2021-17,application/zip,123822,122926,0.0040\nCC-MAIN-2021-17,audio/mpeg,111887,110669,0.0036\nCC-MAIN-2021-17,audio/x-mpegurl,19301,19284,0.0006\nCC-MAIN-2021-17,audio/x-scpls,3880,3876,0.0001\nCC-MAIN-2021-17,audio/x-wav,2997,2957,0.0001\nCC-MAIN-2021-17,binary/octet-stream,21251,21074,0.0007\nCC-MAIN-2021-17,image/gif,142483,142132,0.0045\nCC-MAIN-2021-17,image/jp2,435,435,0.0000\nCC-MAIN-2021-17,image/jpeg,5125682,5116706,0.1635\nCC-MAIN-2021-17,image/jpg,74116,73156,0.0024\nCC-MAIN-2021-17,image/pjpeg,13295,13293,0.0004\nCC-MAIN-2021-17,image/png,1040823,1037669,0.0332\nCC-MAIN-2021-17,image/svg+xml,24255,24214,0.0008\nCC-MAIN-2021-17,image/tiff,11382,11378,0.0004\nCC-MAIN-2021-17,image/vnd.djvu,10371,10370,0.0003\nCC-MAIN-2021-17,image/webp,3642,3638,0.0001\nCC-MAIN-2021-17,message/rfc822,10429,10428,0.0003\nCC-MAIN-2021-17,text/cal
endar,773157,772866,0.0247\nCC-MAIN-2021-17,text/css,7404,7402,0.0002\nCC-MAIN-2021-17,text/csv,118869,118861,0.0038\nCC-MAIN-2021-17,text/directory,9224,9213,0.0003\nCC-MAIN-2021-17,text/enriched,25480,25480,0.0008\nCC-MAIN-2021-17,text/html,3096779513,3078743587,98.7990\nCC-MAIN-2021-17,text/javascript,7838,7811,0.0003\nCC-MAIN-2021-17,text/markdown,2458,2458,0.0001\nCC-MAIN-2021-17,text/pdf,635,635,0.0000\nCC-MAIN-2021-17,text/plain,1456414,1455657,0.0465\nCC-MAIN-2021-17,text/prs.lines.tag,2971,2971,0.0001\nCC-MAIN-2021-17,text/tab-separated-values,12860,12860,0.0004\nCC-MAIN-2021-17,text/turtle,34812,34811,0.0011\nCC-MAIN-2021-17,text/vcard,26854,26819,0.0009\nCC-MAIN-2021-17,text/x-bibtex,10593,10593,0.0003\nCC-MAIN-2021-17,text/x-c,2360,2357,0.0001\nCC-MAIN-2021-17,text/x-csrc,21330,21329,0.0007\nCC-MAIN-2021-17,text/x-diff,4537,4537,0.0001\nCC-MAIN-2021-17,text/x-patch,15633,15631,0.0005\nCC-MAIN-2021-17,text/x-perl,2198,2198,0.0001\nCC-MAIN-2021-17,text/x-vcalendar,13566,13566,0.0004\nCC-MAIN-2021-17,text/x-vcard,60073,60050,0.0019\nCC-MAIN-2021-17,text/xml,2201047,2197400,0.0702\nCC-MAIN-2021-17,unknown/unknown,14393,14393,0.0005\nCC-MAIN-2021-17,video/mp4,67787,67534,0.0022\nCC-MAIN-2021-17,video/webm,2821,2816,0.0001\nCC-MAIN-2021-17,video/x-ms-asf,4555,4549,0.0001\nCC-MAIN-2021-21,<other>,2012354,2007082,0.0765\nCC-MAIN-2021-21,application/atom+xml,1906746,1906491,0.0724\nCC-MAIN-2021-21,application/calendar,6406,6403,0.0002\nCC-MAIN-2021-21,application/download,58903,58889,0.0022\nCC-MAIN-2021-21,application/epub+zip,35336,35326,0.0013\nCC-MAIN-2021-21,application/force-download,106961,106941,0.0041\nCC-MAIN-2021-21,application/gpx+xml,10620,10618,0.0004\nCC-MAIN-2021-21,application/ics,7407,7407,0.0003\nCC-MAIN-2021-21,application/javascript,13015,13012,0.0005\nCC-MAIN-2021-21,application/json,517718,517448,0.0197\nCC-MAIN-2021-21,application/ld+json,21370,21367,0.0008\nCC-MAIN-2021-21,application/marc,9277,9277,0.0004\nCC-MAIN-2021-21,application/msw
ord,73004,72835,0.0028\nCC-MAIN-2021-21,application/octet-stream,1154690,1153785,0.0439\nCC-MAIN-2021-21,application/octetstream,7931,7930,0.0003\nCC-MAIN-2021-21,application/pdf,27382345,27329757,1.0403\nCC-MAIN-2021-21,application/pgp-encrypted,1247,1246,0.0000\nCC-MAIN-2021-21,application/pgp-signature,28171,28171,0.0011\nCC-MAIN-2021-21,application/postscript,4802,4801,0.0002\nCC-MAIN-2021-21,application/rdf+xml,67871,67837,0.0026\nCC-MAIN-2021-21,application/rss+xml,1866220,1864071,0.0709\nCC-MAIN-2021-21,application/rtf,29893,29881,0.0011\nCC-MAIN-2021-21,application/save-to-disk,58,58,0.0000\nCC-MAIN-2021-21,application/text,82836,82707,0.0031\nCC-MAIN-2021-21,application/unknown,30858,30858,0.0012\nCC-MAIN-2021-21,application/vnd.android.package-archive,15442,15375,0.0006\nCC-MAIN-2021-21,application/vnd.google-earth.kml+xml,42302,42294,0.0016\nCC-MAIN-2021-21,application/vnd.google-earth.kmz,9635,9632,0.0004\nCC-MAIN-2021-21,application/vnd.ms-excel,56487,56427,0.0021\nCC-MAIN-2021-21,application/vnd.ms-powerpoint,30135,30130,0.0011\nCC-MAIN-2021-21,application/vnd.ms-word,13211,13210,0.0005\nCC-MAIN-2021-21,application/vnd.oasis.opendocument.text,26556,26524,0.0010\nCC-MAIN-2021-21,application/vnd.openxmlformats-officedocument.presentationml.presentation,6632,6601,0.0003\nCC-MAIN-2021-21,application/vnd.openxmlformats-officedocument.spreadsheetml.sheet,33713,33662,0.0013\nCC-MAIN-2021-21,application/vnd.openxmlformats-officedocument.wordprocessingml.document,70123,69543,0.0027\nCC-MAIN-2021-21,application/vnd.wap.xhtml+xml,2396,2384,0.0001\nCC-MAIN-2021-21,application/x-bibtex,56052,56044,0.0021\nCC-MAIN-2021-21,application/x-bittorrent,4874,4874,0.0002\nCC-MAIN-2021-21,application/x-debian-package,321,321,0.0000\nCC-MAIN-2021-21,application/x-download,19919,19805,0.0008\nCC-MAIN-2021-21,application/x-endnote-refer,109007,108890,0.0041\nCC-MAIN-2021-21,application/x-gzip,27294,27290,0.0010\nCC-MAIN-2021-21,application/x-httpd-php,18121,18069,0.0007\nCC-MAI
N-2021-21,application/x-java-jnlp-file,10087,10078,0.0004\nCC-MAIN-2021-21,application/x-javascript,7866,7780,0.0003\nCC-MAIN-2021-21,application/x-json,108,108,0.0000\nCC-MAIN-2021-21,application/x-mobipocket-ebook,5204,5198,0.0002\nCC-MAIN-2021-21,application/x-msdownload,7056,6863,0.0003\nCC-MAIN-2021-21,application/x-netcdf,5481,5481,0.0002\nCC-MAIN-2021-21,application/x-research-info-systems,186563,186534,0.0071\nCC-MAIN-2021-21,application/x-shockwave-flash,10695,10663,0.0004\nCC-MAIN-2021-21,application/x-tar,6791,6789,0.0003\nCC-MAIN-2021-21,application/x-tex,3980,3980,0.0002\nCC-MAIN-2021-21,application/x-troff-man,8813,8808,0.0003\nCC-MAIN-2021-21,application/x-zip-compressed,15935,15781,0.0006\nCC-MAIN-2021-21,application/xhtml+xml,1357122,1354898,0.0516\nCC-MAIN-2021-21,application/xml,823881,822017,0.0313\nCC-MAIN-2021-21,application/zip,105621,105237,0.0040\nCC-MAIN-2021-21,audio/mpeg,92966,91357,0.0035\nCC-MAIN-2021-21,audio/x-mpegurl,24777,24755,0.0009\nCC-MAIN-2021-21,audio/x-scpls,5228,5211,0.0002\nCC-MAIN-2021-21,audio/x-wav,2746,2623,0.0001\nCC-MAIN-2021-21,binary/octet-stream,24457,24410,0.0009\nCC-MAIN-2021-21,image/gif,119521,119149,0.0045\nCC-MAIN-2021-21,image/jp2,333,333,0.0000\nCC-MAIN-2021-21,image/jpeg,3914167,3906308,0.1487\nCC-MAIN-2021-21,image/jpg,76743,76591,0.0029\nCC-MAIN-2021-21,image/pjpeg,12168,12122,0.0005\nCC-MAIN-2021-21,image/png,722530,719955,0.0275\nCC-MAIN-2021-21,image/svg+xml,17195,17185,0.0007\nCC-MAIN-2021-21,image/tiff,10621,10617,0.0004\nCC-MAIN-2021-21,image/vnd.djvu,4318,4317,0.0002\nCC-MAIN-2021-21,image/webp,8243,8243,0.0003\nCC-MAIN-2021-21,message/rfc822,11695,11686,0.0004\nCC-MAIN-2021-21,text/calendar,713791,713663,0.0271\nCC-MAIN-2021-21,text/css,10803,10798,0.0004\nCC-MAIN-2021-21,text/csv,108908,108884,0.0041\nCC-MAIN-2021-21,text/directory,7642,7641,0.0003\nCC-MAIN-2021-21,text/enriched,34340,34248,0.0013\nCC-MAIN-2021-21,text/html,2583928003,2568161605,98.1682\nCC-MAIN-2021-21,text/javascript,6944,6944
,0.0003\nCC-MAIN-2021-21,text/markdown,2895,2894,0.0001\nCC-MAIN-2021-21,text/pdf,104,104,0.0000\nCC-MAIN-2021-21,text/plain,1550642,1549398,0.0589\nCC-MAIN-2021-21,text/prs.lines.tag,946,946,0.0000\nCC-MAIN-2021-21,text/tab-separated-values,16354,16354,0.0006\nCC-MAIN-2021-21,text/turtle,23388,23381,0.0009\nCC-MAIN-2021-21,text/vcard,30269,30258,0.0011\nCC-MAIN-2021-21,text/x-bibtex,15496,15488,0.0006\nCC-MAIN-2021-21,text/x-c,3358,3346,0.0001\nCC-MAIN-2021-21,text/x-csrc,14511,14510,0.0006\nCC-MAIN-2021-21,text/x-diff,11230,11222,0.0004\nCC-MAIN-2021-21,text/x-patch,15408,15405,0.0006\nCC-MAIN-2021-21,text/x-perl,2753,2752,0.0001\nCC-MAIN-2021-21,text/x-vcalendar,8681,8680,0.0003\nCC-MAIN-2021-21,text/x-vcard,55103,55091,0.0021\nCC-MAIN-2021-21,text/xml,1918910,1915559,0.0729\nCC-MAIN-2021-21,unknown/unknown,7361,7360,0.0003\nCC-MAIN-2021-21,video/mp4,57408,57003,0.0022\nCC-MAIN-2021-21,video/webm,2839,2838,0.0001\nCC-MAIN-2021-21,video/x-ms-asf,13208,13203,0.0005\nCC-MAIN-2021-25,<other>,2025220,2020019,0.0824\nCC-MAIN-2021-25,application/atom+xml,1888160,1887888,0.0768\nCC-MAIN-2021-25,application/calendar,5680,5680,0.0002\nCC-MAIN-2021-25,application/download,58477,58471,0.0024\nCC-MAIN-2021-25,application/epub+zip,34362,34293,0.0014\nCC-MAIN-2021-25,application/force-download,100325,100308,0.0041\nCC-MAIN-2021-25,application/gpx+xml,9338,9335,0.0004\nCC-MAIN-2021-25,application/ics,6072,6072,0.0002\nCC-MAIN-2021-25,application/javascript,9733,9728,0.0004\nCC-MAIN-2021-25,application/json,531198,530715,0.0216\nCC-MAIN-2021-25,application/ld+json,14373,14373,0.0006\nCC-MAIN-2021-25,application/marc,10931,10930,0.0004\nCC-MAIN-2021-25,application/msword,61456,61348,0.0025\nCC-MAIN-2021-25,application/octet-stream,1054421,1053237,0.0429\nCC-MAIN-2021-25,application/octetstream,6377,6368,0.0003\nCC-MAIN-2021-25,application/pdf,13045989,13018582,0.5308\nCC-MAIN-2021-25,application/pgp-encrypted,886,886,0.0000\nCC-MAIN-2021-25,application/pgp-signature,51615,51602,0.
0021\nCC-MAIN-2021-25,application/postscript,4000,4000,0.0002\nCC-MAIN-2021-25,application/rdf+xml,74141,74134,0.0030\nCC-MAIN-2021-25,application/rss+xml,1489301,1488097,0.0606\nCC-MAIN-2021-25,application/rtf,30665,30601,0.0012\nCC-MAIN-2021-25,application/text,54960,54949,0.0022\nCC-MAIN-2021-25,application/unknown,11489,11488,0.0005\nCC-MAIN-2021-25,application/vnd.android.package-archive,6797,6744,0.0003\nCC-MAIN-2021-25,application/vnd.google-earth.kml+xml,31462,31462,0.0013\nCC-MAIN-2021-25,application/vnd.google-earth.kmz,7405,7403,0.0003\nCC-MAIN-2021-25,application/vnd.ms-excel,58204,58098,0.0024\nCC-MAIN-2021-25,application/vnd.ms-powerpoint,28668,28665,0.0012\nCC-MAIN-2021-25,application/vnd.ms-word,10884,10881,0.0004\nCC-MAIN-2021-25,application/vnd.oasis.opendocument.text,24521,24511,0.0010\nCC-MAIN-2021-25,application/vnd.openxmlformats-officedocument.presentationml.presentation,5803,5797,0.0002\nCC-MAIN-2021-25,application/vnd.openxmlformats-officedocument.spreadsheetml.sheet,30729,30394,0.0013\nCC-MAIN-2021-25,application/vnd.openxmlformats-officedocument.wordprocessingml.document,60191,60106,0.0024\nCC-MAIN-2021-25,application/vnd.wap.xhtml+xml,2764,2752,0.0001\nCC-MAIN-2021-25,application/x-bibtex,63274,63273,0.0026\nCC-MAIN-2021-25,application/x-bittorrent,4885,4884,0.0002\nCC-MAIN-2021-25,application/x-debian-package,236,236,0.0000\nCC-MAIN-2021-25,application/x-download,25316,25091,0.0010\nCC-MAIN-2021-25,application/x-endnote-refer,97677,97670,0.0040\nCC-MAIN-2021-25,application/x-gzip,26562,26561,0.0011\nCC-MAIN-2021-25,application/x-httpd-php,7849,7815,0.0003\nCC-MAIN-2021-25,application/x-java-jnlp-file,9015,9012,0.0004\nCC-MAIN-2021-25,application/x-javascript,6568,6560,0.0003\nCC-MAIN-2021-25,application/x-json,19,19,0.0000\nCC-MAIN-2021-25,application/x-mobipocket-ebook,6065,6065,0.0002\nCC-MAIN-2021-25,application/x-msdownload,7432,7382,0.0003\nCC-MAIN-2021-25,application/x-netcdf,9633,9627,0.0004\nCC-MAIN-2021-25,application/x-research
-info-systems,192012,191847,0.0078\nCC-MAIN-2021-25,application/x-shockwave-flash,8200,8180,0.0003\nCC-MAIN-2021-25,application/x-tar,11069,11062,0.0005\nCC-MAIN-2021-25,application/x-tex,3945,3945,0.0002\nCC-MAIN-2021-25,application/x-troff-man,8453,8451,0.0003\nCC-MAIN-2021-25,application/x-zip-compressed,13628,13560,0.0006\nCC-MAIN-2021-25,application/xhtml+xml,1335536,1333294,0.0543\nCC-MAIN-2021-25,application/xml,727697,726919,0.0296\nCC-MAIN-2021-25,application/zip,107860,107337,0.0044\nCC-MAIN-2021-25,audio/mpeg,84611,83819,0.0034\nCC-MAIN-2021-25,audio/x-mpegurl,22197,22078,0.0009\nCC-MAIN-2021-25,audio/x-scpls,3102,3096,0.0001\nCC-MAIN-2021-25,audio/x-wav,3585,3585,0.0001\nCC-MAIN-2021-25,binary/octet-stream,17833,17781,0.0007\nCC-MAIN-2021-25,image/gif,111748,111468,0.0045\nCC-MAIN-2021-25,image/jp2,702,702,0.0000\nCC-MAIN-2021-25,image/jpeg,4402594,4389623,0.1791\nCC-MAIN-2021-25,image/jpg,73578,72901,0.0030\nCC-MAIN-2021-25,image/pjpeg,8777,8763,0.0004\nCC-MAIN-2021-25,image/png,901026,897240,0.0367\nCC-MAIN-2021-25,image/svg+xml,19730,19665,0.0008\nCC-MAIN-2021-25,image/tiff,10637,10635,0.0004\nCC-MAIN-2021-25,image/vnd.djvu,8460,8459,0.0003\nCC-MAIN-2021-25,image/webp,4524,4524,0.0002\nCC-MAIN-2021-25,message/rfc822,9162,9162,0.0004\nCC-MAIN-2021-25,text/calendar,631093,630945,0.0257\nCC-MAIN-2021-25,text/css,6371,6369,0.0003\nCC-MAIN-2021-25,text/csv,99820,99809,0.0041\nCC-MAIN-2021-25,text/directory,6703,6703,0.0003\nCC-MAIN-2021-25,text/enriched,19336,19333,0.0008\nCC-MAIN-2021-25,text/html,2424311412,2409918480,98.6442\nCC-MAIN-2021-25,text/javascript,7066,7065,0.0003\nCC-MAIN-2021-25,text/markdown,2104,2104,0.0001\nCC-MAIN-2021-25,text/pdf,1278,1278,0.0001\nCC-MAIN-2021-25,text/plain,1417231,1415462,0.0577\nCC-MAIN-2021-25,text/prs.lines.tag,2391,2391,0.0001\nCC-MAIN-2021-25,text/tab-separated-values,12511,12511,0.0005\nCC-MAIN-2021-25,text/turtle,26830,26826,0.0011\nCC-MAIN-2021-25,text/vcard,22361,22356,0.0009\nCC-MAIN-2021-25,text/x-bibtex,119
50,11950,0.0005\nCC-MAIN-2021-25,text/x-c,4288,4287,0.0002\nCC-MAIN-2021-25,text/x-csrc,21531,21530,0.0009\nCC-MAIN-2021-25,text/x-diff,9631,9630,0.0004\nCC-MAIN-2021-25,text/x-patch,13078,13078,0.0005\nCC-MAIN-2021-25,text/x-perl,3812,3812,0.0002\nCC-MAIN-2021-25,text/x-vcalendar,7872,7872,0.0003\nCC-MAIN-2021-25,text/x-vcard,41152,41099,0.0017\nCC-MAIN-2021-25,text/xml,1667911,1665423,0.0679\nCC-MAIN-2021-25,unknown/unknown,5895,5895,0.0002\nCC-MAIN-2021-25,video/mp4,63484,63337,0.0026\nCC-MAIN-2021-25,video/webm,2671,2666,0.0001\nCC-MAIN-2021-25,video/x-ms-asf,10180,10175,0.0004\nCC-MAIN-2021-31,<other>,1582648,1576292,0.0500\nCC-MAIN-2021-31,application/atom+xml,2085924,2085547,0.0659\nCC-MAIN-2021-31,application/calendar,6858,6857,0.0002\nCC-MAIN-2021-31,application/download,50355,50345,0.0016\nCC-MAIN-2021-31,application/epub+zip,26624,26615,0.0008\nCC-MAIN-2021-31,application/force-download,77001,76997,0.0024\nCC-MAIN-2021-31,application/gpx+xml,8500,8500,0.0003\nCC-MAIN-2021-31,application/ics,6455,6454,0.0002\nCC-MAIN-2021-31,application/javascript,8714,8712,0.0003\nCC-MAIN-2021-31,application/json,517344,516814,0.0163\nCC-MAIN-2021-31,application/ld+json,17848,17844,0.0006\nCC-MAIN-2021-31,application/marc,8495,8495,0.0003\nCC-MAIN-2021-31,application/msword,60261,60118,0.0019\nCC-MAIN-2021-31,application/octet-stream,861337,860127,0.0272\nCC-MAIN-2021-31,application/octetstream,2918,2918,0.0001\nCC-MAIN-2021-31,application/pdf,8156251,8135596,0.2577\nCC-MAIN-2021-31,application/pgp-encrypted,1878,1878,0.0001\nCC-MAIN-2021-31,application/pgp-signature,25125,25122,0.0008\nCC-MAIN-2021-31,application/postscript,2523,2523,0.0001\nCC-MAIN-2021-31,application/rdf+xml,71560,71550,0.0023\nCC-MAIN-2021-31,application/rss+xml,1604468,1602867,0.0507\nCC-MAIN-2021-31,application/rtf,29670,29662,0.0009\nCC-MAIN-2021-31,application/save-to-disk,3,3,0.0000\nCC-MAIN-2021-31,application/text,53017,53015,0.0017\nCC-MAIN-2021-31,application/unknown,5462,5462,0.0002\nCC-MAIN
-2021-31,application/vnd.android.package-archive,6629,6567,0.0002\nCC-MAIN-2021-31,application/vnd.google-earth.kml+xml,29439,29436,0.0009\nCC-MAIN-2021-31,application/vnd.google-earth.kmz,10254,10254,0.0003\nCC-MAIN-2021-31,application/vnd.ms-excel,35208,35187,0.0011\nCC-MAIN-2021-31,application/vnd.ms-powerpoint,24477,24475,0.0008\nCC-MAIN-2021-31,application/vnd.ms-word,10300,10299,0.0003\nCC-MAIN-2021-31,application/vnd.oasis.opendocument.text,17502,17499,0.0006\nCC-MAIN-2021-31,application/vnd.openxmlformats-officedocument.presentationml.presentation,5938,5929,0.0002\nCC-MAIN-2021-31,application/vnd.openxmlformats-officedocument.spreadsheetml.sheet,30530,30512,0.0010\nCC-MAIN-2021-31,application/vnd.openxmlformats-officedocument.wordprocessingml.document,53926,53828,0.0017\nCC-MAIN-2021-31,application/vnd.wap.xhtml+xml,2276,2265,0.0001\nCC-MAIN-2021-31,application/x-bibtex,51755,51749,0.0016\nCC-MAIN-2021-31,application/x-bittorrent,3349,3343,0.0001\nCC-MAIN-2021-31,application/x-debian-package,154,154,0.0000\nCC-MAIN-2021-31,application/x-download,18632,18024,0.0006\nCC-MAIN-2021-31,application/x-endnote-refer,86835,86828,0.0027\nCC-MAIN-2021-31,application/x-gzip,18804,18799,0.0006\nCC-MAIN-2021-31,application/x-httpd-php,7405,7382,0.0002\nCC-MAIN-2021-31,application/x-java-jnlp-file,6608,6608,0.0002\nCC-MAIN-2021-31,application/x-javascript,7032,7029,0.0002\nCC-MAIN-2021-31,application/x-json,24,24,0.0000\nCC-MAIN-2021-31,application/x-mobipocket-ebook,3875,3875,0.0001\nCC-MAIN-2021-31,application/x-msdownload,5518,5436,0.0002\nCC-MAIN-2021-31,application/x-netcdf,4531,4531,0.0001\nCC-MAIN-2021-31,application/x-research-info-systems,186717,186661,0.0059\nCC-MAIN-2021-31,application/x-shockwave-flash,6096,6072,0.0002\nCC-MAIN-2021-31,application/x-tar,6907,6904,0.0002\nCC-MAIN-2021-31,application/x-tex,3117,3117,0.0001\nCC-MAIN-2021-31,application/x-troff-man,12616,12615,0.0004\nCC-MAIN-2021-31,application/x-zip-compressed,12555,12519,0.0004\nCC-MAIN-2021-31,
application/xhtml+xml,1274710,1272736,0.0403\nCC-MAIN-2021-31,application/xml,678113,677388,0.0214\nCC-MAIN-2021-31,application/zip,87681,87185,0.0028\nCC-MAIN-2021-31,audio/mpeg,61666,61395,0.0019\nCC-MAIN-2021-31,audio/x-mpegurl,16370,16366,0.0005\nCC-MAIN-2021-31,audio/x-scpls,4155,4154,0.0001\nCC-MAIN-2021-31,audio/x-wav,2917,2917,0.0001\nCC-MAIN-2021-31,binary/octet-stream,11667,11638,0.0004\nCC-MAIN-2021-31,image/gif,107449,107048,0.0034\nCC-MAIN-2021-31,image/jp2,1139,1139,0.0000\nCC-MAIN-2021-31,image/jpeg,4563478,4551409,0.1442\nCC-MAIN-2021-31,image/jpg,51210,50980,0.0016\nCC-MAIN-2021-31,image/pjpeg,6172,6086,0.0002\nCC-MAIN-2021-31,image/png,991932,989748,0.0313\nCC-MAIN-2021-31,image/svg+xml,21549,21496,0.0007\nCC-MAIN-2021-31,image/tiff,9514,9511,0.0003\nCC-MAIN-2021-31,image/vnd.djvu,2046,2046,0.0001\nCC-MAIN-2021-31,image/webp,2378,2377,0.0001\nCC-MAIN-2021-31,message/rfc822,9583,9583,0.0003\nCC-MAIN-2021-31,text/calendar,624211,624074,0.0197\nCC-MAIN-2021-31,text/css,8947,8942,0.0003\nCC-MAIN-2021-31,text/csv,98476,98452,0.0031\nCC-MAIN-2021-31,text/directory,5832,5830,0.0002\nCC-MAIN-2021-31,text/enriched,19445,19443,0.0006\nCC-MAIN-2021-31,text/html,3137295751,3120545142,99.1219\nCC-MAIN-2021-31,text/javascript,5844,5838,0.0002\nCC-MAIN-2021-31,text/markdown,2006,2006,0.0001\nCC-MAIN-2021-31,text/pdf,107,107,0.0000\nCC-MAIN-2021-31,text/plain,1319130,1318450,0.0417\nCC-MAIN-2021-31,text/prs.lines.tag,616,616,0.0000\nCC-MAIN-2021-31,text/tab-separated-values,8961,8961,0.0003\nCC-MAIN-2021-31,text/turtle,28260,28259,0.0009\nCC-MAIN-2021-31,text/vcard,24403,24400,0.0008\nCC-MAIN-2021-31,text/x-bibtex,10149,10049,0.0003\nCC-MAIN-2021-31,text/x-c,2610,2606,0.0001\nCC-MAIN-2021-31,text/x-csrc,15418,15418,0.0005\nCC-MAIN-2021-31,text/x-diff,4121,4121,0.0001\nCC-MAIN-2021-31,text/x-patch,15567,15567,0.0005\nCC-MAIN-2021-31,text/x-perl,2493,2493,0.0001\nCC-MAIN-2021-31,text/x-vcalendar,7499,7499,0.0002\nCC-MAIN-2021-31,text/x-vcard,40416,40406,0.0013\nCC-M
AIN-2021-31,text/xml,1633454,1631049,0.0516\nCC-MAIN-2021-31,unknown/unknown,5757,5757,0.0002\nCC-MAIN-2021-31,video/mp4,59009,58936,0.0019\nCC-MAIN-2021-31,video/webm,2234,2232,0.0001\nCC-MAIN-2021-31,video/x-ms-asf,5162,5161,0.0002\nCC-MAIN-2021-39,<other>,1981649,1977462,0.0669\nCC-MAIN-2021-39,application/atom+xml,3569655,3569435,0.1206\nCC-MAIN-2021-39,application/calendar,9568,9568,0.0003\nCC-MAIN-2021-39,application/download,106199,106191,0.0036\nCC-MAIN-2021-39,application/epub+zip,49034,48998,0.0017\nCC-MAIN-2021-39,application/force-download,151980,151957,0.0051\nCC-MAIN-2021-39,application/gpx+xml,14855,14854,0.0005\nCC-MAIN-2021-39,application/ics,18748,18748,0.0006\nCC-MAIN-2021-39,application/javascript,8897,8894,0.0003\nCC-MAIN-2021-39,application/json,708745,708365,0.0239\nCC-MAIN-2021-39,application/ld+json,18538,18523,0.0006\nCC-MAIN-2021-39,application/marc,10975,10975,0.0004\nCC-MAIN-2021-39,application/msword,99356,99147,0.0034\nCC-MAIN-2021-39,application/octet-stream,1338162,1336725,0.0452\nCC-MAIN-2021-39,application/octetstream,9860,9852,0.0003\nCC-MAIN-2021-39,application/pdf,26854739,26775565,0.9073\nCC-MAIN-2021-39,application/pgp-encrypted,2206,2206,0.0001\nCC-MAIN-2021-39,application/pgp-signature,64507,64487,0.0022\nCC-MAIN-2021-39,application/postscript,6873,6868,0.0002\nCC-MAIN-2021-39,application/rdf+xml,98371,98354,0.0033\nCC-MAIN-2021-39,application/rss+xml,2346462,2344615,0.0793\nCC-MAIN-2021-39,application/rtf,36019,35979,0.0012\nCC-MAIN-2021-39,application/save-to-disk,447,447,0.0000\nCC-MAIN-2021-39,application/text,74604,74599,0.0025\nCC-MAIN-2021-39,application/unknown,8797,8790,0.0003\nCC-MAIN-2021-39,application/vnd.android.package-archive,8119,8018,0.0003\nCC-MAIN-2021-39,application/vnd.google-earth.kml+xml,41396,41392,0.0014\nCC-MAIN-2021-39,application/vnd.google-earth.kmz,12185,12184,0.0004\nCC-MAIN-2021-39,application/vnd.ms-excel,62223,62092,0.0021\nCC-MAIN-2021-39,application/vnd.ms-powerpoint,34083,34076,0.0012\nC
C-MAIN-2021-39,application/vnd.ms-word,17102,17102,0.0006\nCC-MAIN-2021-39,application/vnd.oasis.opendocument.text,26303,26291,0.0009\nCC-MAIN-2021-39,application/vnd.openxmlformats-officedocument.presentationml.presentation,10780,10760,0.0004\nCC-MAIN-2021-39,application/vnd.openxmlformats-officedocument.spreadsheetml.sheet,48500,48424,0.0016\nCC-MAIN-2021-39,application/vnd.openxmlformats-officedocument.wordprocessingml.document,91566,91176,0.0031\nCC-MAIN-2021-39,application/vnd.wap.xhtml+xml,9047,8998,0.0003\nCC-MAIN-2021-39,application/x-bibtex,96580,96580,0.0033\nCC-MAIN-2021-39,application/x-bittorrent,5336,5335,0.0002\nCC-MAIN-2021-39,application/x-debian-package,442,442,0.0000\nCC-MAIN-2021-39,application/x-download,31477,30894,0.0011\nCC-MAIN-2021-39,application/x-endnote-refer,115645,115645,0.0039\nCC-MAIN-2021-39,application/x-gzip,29036,29009,0.0010\nCC-MAIN-2021-39,application/x-httpd-php,8477,8455,0.0003\nCC-MAIN-2021-39,application/x-java-jnlp-file,9882,9838,0.0003\nCC-MAIN-2021-39,application/x-javascript,10959,10845,0.0004\nCC-MAIN-2021-39,application/x-json,40,40,0.0000\nCC-MAIN-2021-39,application/x-mobipocket-ebook,7917,7914,0.0003\nCC-MAIN-2021-39,application/x-msdownload,10543,10425,0.0004\nCC-MAIN-2021-39,application/x-netcdf,21883,21883,0.0007\nCC-MAIN-2021-39,application/x-research-info-systems,263572,263539,0.0089\nCC-MAIN-2021-39,application/x-shockwave-flash,11723,11664,0.0004\nCC-MAIN-2021-39,application/x-tar,11645,11642,0.0004\nCC-MAIN-2021-39,application/x-tex,8667,8658,0.0003\nCC-MAIN-2021-39,application/x-troff-man,13381,13381,0.0005\nCC-MAIN-2021-39,application/x-zip-compressed,20088,20002,0.0007\nCC-MAIN-2021-39,application/xhtml+xml,1453998,1451604,0.0491\nCC-MAIN-2021-39,application/xml,957363,956624,0.0323\nCC-MAIN-2021-39,application/zip,151603,150703,0.0051\nCC-MAIN-2021-39,audio/mpeg,117470,116491,0.0040\nCC-MAIN-2021-39,audio/x-mpegurl,19258,19242,0.0007\nCC-MAIN-2021-39,audio/x-scpls,6421,6415,0.0002\nCC-MAIN-2021-39,audi
o/x-wav,5211,5203,0.0002\nCC-MAIN-2021-39,binary/octet-stream,40081,40060,0.0014\nCC-MAIN-2021-39,image/gif,172147,171565,0.0058\nCC-MAIN-2021-39,image/jp2,618,618,0.0000\nCC-MAIN-2021-39,image/jpeg,5337701,5325873,0.1803\nCC-MAIN-2021-39,image/jpg,83323,82862,0.0028\nCC-MAIN-2021-39,image/pjpeg,11858,11828,0.0004\nCC-MAIN-2021-39,image/png,953807,951344,0.0322\nCC-MAIN-2021-39,image/svg+xml,25970,25847,0.0009\nCC-MAIN-2021-39,image/tiff,17322,17318,0.0006\nCC-MAIN-2021-39,image/vnd.djvu,6726,6715,0.0002\nCC-MAIN-2021-39,image/webp,6999,6998,0.0002\nCC-MAIN-2021-39,message/rfc822,15279,15278,0.0005\nCC-MAIN-2021-39,text/calendar,1097236,1096954,0.0371\nCC-MAIN-2021-39,text/css,12936,12929,0.0004\nCC-MAIN-2021-39,text/csv,166420,166394,0.0056\nCC-MAIN-2021-39,text/directory,9288,9288,0.0003\nCC-MAIN-2021-39,text/enriched,24465,24463,0.0008\nCC-MAIN-2021-39,text/html,2906066108,2888650788,98.1811\nCC-MAIN-2021-39,text/javascript,10059,10051,0.0003\nCC-MAIN-2021-39,text/markdown,2825,2825,0.0001\nCC-MAIN-2021-39,text/pdf,272,272,0.0000\nCC-MAIN-2021-39,text/plain,1921704,1920422,0.0649\nCC-MAIN-2021-39,text/prs.lines.tag,27604,27604,0.0009\nCC-MAIN-2021-39,text/tab-separated-values,20191,20191,0.0007\nCC-MAIN-2021-39,text/turtle,35368,35358,0.0012\nCC-MAIN-2021-39,text/vcard,43195,43191,0.0015\nCC-MAIN-2021-39,text/x-bibtex,17825,17825,0.0006\nCC-MAIN-2021-39,text/x-c,9826,9825,0.0003\nCC-MAIN-2021-39,text/x-csrc,16279,16278,0.0005\nCC-MAIN-2021-39,text/x-diff,6441,6440,0.0002\nCC-MAIN-2021-39,text/x-patch,23844,23834,0.0008\nCC-MAIN-2021-39,text/x-perl,4561,4561,0.0002\nCC-MAIN-2021-39,text/x-vcalendar,12648,12647,0.0004\nCC-MAIN-2021-39,text/x-vcard,76487,76396,0.0026\nCC-MAIN-2021-39,text/xml,2186177,2182566,0.0739\nCC-MAIN-2021-39,unknown/unknown,10333,10332,0.0003\nCC-MAIN-2021-39,video/mp4,76581,76466,0.0026\nCC-MAIN-2021-39,video/webm,4019,4007,0.0001\nCC-MAIN-2021-39,video/x-ms-asf,10089,10078,0.0003\nCC-MAIN-2021-43,<other>,2254425,2249327,0.0673\nCC-MAIN-2021
-43,application/atom+xml,2882868,2882714,0.0861\nCC-MAIN-2021-43,application/calendar,8731,8730,0.0003\nCC-MAIN-2021-43,application/download,114467,114456,0.0034\nCC-MAIN-2021-43,application/epub+zip,47654,47623,0.0014\nCC-MAIN-2021-43,application/force-download,155350,155298,0.0046\nCC-MAIN-2021-43,application/gpx+xml,16618,16618,0.0005\nCC-MAIN-2021-43,application/ics,13413,13413,0.0004\nCC-MAIN-2021-43,application/javascript,10267,10264,0.0003\nCC-MAIN-2021-43,application/json,767399,767198,0.0229\nCC-MAIN-2021-43,application/ld+json,19136,19136,0.0006\nCC-MAIN-2021-43,application/marc,12052,12052,0.0004\nCC-MAIN-2021-43,application/msword,110655,110425,0.0033\nCC-MAIN-2021-43,application/octet-stream,1567349,1565678,0.0468\nCC-MAIN-2021-43,application/octetstream,11359,11359,0.0003\nCC-MAIN-2021-43,application/pdf,33777876,33711794,1.0085\nCC-MAIN-2021-43,application/pgp-encrypted,2937,2937,0.0001\nCC-MAIN-2021-43,application/pgp-signature,71510,71444,0.0021\nCC-MAIN-2021-43,application/postscript,7653,7648,0.0002\nCC-MAIN-2021-43,application/rdf+xml,115998,115980,0.0035\nCC-MAIN-2021-43,application/rss+xml,2242826,2241480,0.0670\nCC-MAIN-2021-43,application/rtf,32855,32847,0.0010\nCC-MAIN-2021-43,application/save-to-disk,128,128,0.0000\nCC-MAIN-2021-43,application/text,78905,78904,0.0024\nCC-MAIN-2021-43,application/unknown,15069,15069,0.0004\nCC-MAIN-2021-43,application/vnd.android.package-archive,11883,11781,0.0004\nCC-MAIN-2021-43,application/vnd.google-earth.kml+xml,46500,46485,0.0014\nCC-MAIN-2021-43,application/vnd.google-earth.kmz,11042,11040,0.0003\nCC-MAIN-2021-43,application/vnd.ms-excel,73593,73437,0.0022\nCC-MAIN-2021-43,application/vnd.ms-powerpoint,38752,38727,0.0012\nCC-MAIN-2021-43,application/vnd.ms-word,19855,19855,0.0006\nCC-MAIN-2021-43,application/vnd.oasis.opendocument.text,39887,39875,0.0012\nCC-MAIN-2021-43,application/vnd.openxmlformats-officedocument.presentationml.presentation,9977,9957,0.0003\nCC-MAIN-2021-43,application/vnd.openxmlf
ormats-officedocument.spreadsheetml.sheet,47550,47438,0.0014\nCC-MAIN-2021-43,application/vnd.openxmlformats-officedocument.wordprocessingml.document,107045,106715,0.0032\nCC-MAIN-2021-43,application/vnd.wap.xhtml+xml,8561,8523,0.0003\nCC-MAIN-2021-43,application/x-bibtex,101077,101077,0.0030\nCC-MAIN-2021-43,application/x-bittorrent,6785,6784,0.0002\nCC-MAIN-2021-43,application/x-debian-package,169,169,0.0000\nCC-MAIN-2021-43,application/x-download,42831,42046,0.0013\nCC-MAIN-2021-43,application/x-endnote-refer,125825,125824,0.0038\nCC-MAIN-2021-43,application/x-gzip,43161,43154,0.0013\nCC-MAIN-2021-43,application/x-httpd-php,6750,6723,0.0002\nCC-MAIN-2021-43,application/x-java-jnlp-file,10637,10611,0.0003\nCC-MAIN-2021-43,application/x-javascript,7854,7810,0.0002\nCC-MAIN-2021-43,application/x-json,619,619,0.0000\nCC-MAIN-2021-43,application/x-mobipocket-ebook,5138,5133,0.0002\nCC-MAIN-2021-43,application/x-msdownload,11910,11702,0.0004\nCC-MAIN-2021-43,application/x-netcdf,12465,12465,0.0004\nCC-MAIN-2021-43,application/x-research-info-systems,296807,296779,0.0089\nCC-MAIN-2021-43,application/x-shockwave-flash,11424,11384,0.0003\nCC-MAIN-2021-43,application/x-tar,15234,15222,0.0005\nCC-MAIN-2021-43,application/x-tex,6724,6724,0.0002\nCC-MAIN-2021-43,application/x-troff-man,19748,19741,0.0006\nCC-MAIN-2021-43,application/x-zip-compressed,23965,23842,0.0007\nCC-MAIN-2021-43,application/xhtml+xml,1595525,1593287,0.0476\nCC-MAIN-2021-43,application/xml,940903,940135,0.0281\nCC-MAIN-2021-43,application/zip,172761,171736,0.0052\nCC-MAIN-2021-43,audio/mpeg,114247,113414,0.0034\nCC-MAIN-2021-43,audio/x-mpegurl,19586,19585,0.0006\nCC-MAIN-2021-43,audio/x-scpls,4540,4534,0.0001\nCC-MAIN-2021-43,audio/x-wav,4836,4775,0.0001\nCC-MAIN-2021-43,binary/octet-stream,34749,34709,0.0010\nCC-MAIN-2021-43,image/gif,169056,168282,0.0050\nCC-MAIN-2021-43,image/jp2,776,776,0.0000\nCC-MAIN-2021-43,image/jpeg,5294591,5278911,0.1581\nCC-MAIN-2021-43,image/jpg,77574,76992,0.0023\nCC-MAIN-20
21-43,image/pjpeg,13289,13278,0.0004\nCC-MAIN-2021-43,image/png,905559,900694,0.0270\nCC-MAIN-2021-43,image/svg+xml,27582,27481,0.0008\nCC-MAIN-2021-43,image/tiff,17601,17443,0.0005\nCC-MAIN-2021-43,image/vnd.djvu,12564,12542,0.0004\nCC-MAIN-2021-43,image/webp,10192,10174,0.0003\nCC-MAIN-2021-43,message/rfc822,12489,12487,0.0004\nCC-MAIN-2021-43,text/calendar,1118390,1117926,0.0334\nCC-MAIN-2021-43,text/css,11697,11686,0.0003\nCC-MAIN-2021-43,text/csv,184623,184574,0.0055\nCC-MAIN-2021-43,text/directory,10380,10380,0.0003\nCC-MAIN-2021-43,text/enriched,28979,28978,0.0009\nCC-MAIN-2021-43,text/html,3288141956,3271348940,98.1776\nCC-MAIN-2021-43,text/javascript,9697,9684,0.0003\nCC-MAIN-2021-43,text/markdown,3843,3843,0.0001\nCC-MAIN-2021-43,text/pdf,1670,1670,0.0000\nCC-MAIN-2021-43,text/plain,2153633,2152915,0.0643\nCC-MAIN-2021-43,text/prs.lines.tag,3813,3813,0.0001\nCC-MAIN-2021-43,text/tab-separated-values,21065,21064,0.0006\nCC-MAIN-2021-43,text/turtle,40872,40867,0.0012\nCC-MAIN-2021-43,text/vcard,44965,44960,0.0013\nCC-MAIN-2021-43,text/x-bibtex,16284,16278,0.0005\nCC-MAIN-2021-43,text/x-c,9811,9810,0.0003\nCC-MAIN-2021-43,text/x-csrc,24775,24774,0.0007\nCC-MAIN-2021-43,text/x-diff,16581,16579,0.0005\nCC-MAIN-2021-43,text/x-patch,21765,21760,0.0006\nCC-MAIN-2021-43,text/x-perl,3065,3065,0.0001\nCC-MAIN-2021-43,text/x-vcalendar,12779,12779,0.0004\nCC-MAIN-2021-43,text/x-vcard,69678,69668,0.0021\nCC-MAIN-2021-43,text/xml,2201598,2199179,0.0657\nCC-MAIN-2021-43,unknown/unknown,13221,13217,0.0004\nCC-MAIN-2021-43,video/mp4,71346,70816,0.0021\nCC-MAIN-2021-43,video/webm,4062,4061,0.0001\nCC-MAIN-2021-43,video/x-ms-asf,7779,7778,0.0002\nCC-MAIN-2021-49,<other>,2588504,2582416,0.1024\nCC-MAIN-2021-49,application/atom+xml,3121452,3121224,0.1235\nCC-MAIN-2021-49,application/calendar,12062,12056,0.0005\nCC-MAIN-2021-49,application/download,116046,116031,0.0046\nCC-MAIN-2021-49,application/epub+zip,54086,54066,0.0021\nCC-MAIN-2021-49,application/force-download,160026,160
002,0.0063\nCC-MAIN-2021-49,application/gpx+xml,18269,18267,0.0007\nCC-MAIN-2021-49,application/ics,13865,13865,0.0005\nCC-MAIN-2021-49,application/javascript,8784,8780,0.0003\nCC-MAIN-2021-49,application/json,849482,849166,0.0336\nCC-MAIN-2021-49,application/ld+json,26683,26682,0.0011\nCC-MAIN-2021-49,application/marc,14954,14951,0.0006\nCC-MAIN-2021-49,application/msword,119165,118724,0.0047\nCC-MAIN-2021-49,application/octet-stream,1851580,1849672,0.0733\nCC-MAIN-2021-49,application/octetstream,10046,10042,0.0004\nCC-MAIN-2021-49,application/pdf,34978700,34894692,1.3842\nCC-MAIN-2021-49,application/pgp-encrypted,4699,4698,0.0002\nCC-MAIN-2021-49,application/pgp-signature,74855,74853,0.0030\nCC-MAIN-2021-49,application/postscript,8965,8951,0.0004\nCC-MAIN-2021-49,application/rdf+xml,129928,129923,0.0051\nCC-MAIN-2021-49,application/rss+xml,2171529,2170243,0.0859\nCC-MAIN-2021-49,application/rtf,38978,38963,0.0015\nCC-MAIN-2021-49,application/save-to-disk,312,312,0.0000\nCC-MAIN-2021-49,application/text,71911,71911,0.0028\nCC-MAIN-2021-49,application/unknown,11753,11753,0.0005\nCC-MAIN-2021-49,application/vnd.android.package-archive,12060,11972,0.0005\nCC-MAIN-2021-49,application/vnd.google-earth.kml+xml,56565,56522,0.0022\nCC-MAIN-2021-49,application/vnd.google-earth.kmz,11296,11295,0.0004\nCC-MAIN-2021-49,application/vnd.ms-excel,81439,81254,0.0032\nCC-MAIN-2021-49,application/vnd.ms-powerpoint,36632,36623,0.0014\nCC-MAIN-2021-49,application/vnd.ms-word,22036,22023,0.0009\nCC-MAIN-2021-49,application/vnd.oasis.opendocument.text,33619,33606,0.0013\nCC-MAIN-2021-49,application/vnd.openxmlformats-officedocument.presentationml.presentation,11556,11481,0.0005\nCC-MAIN-2021-49,application/vnd.openxmlformats-officedocument.spreadsheetml.sheet,60534,60229,0.0024\nCC-MAIN-2021-49,application/vnd.openxmlformats-officedocument.wordprocessingml.document,105396,104994,0.0042\nCC-MAIN-2021-49,application/vnd.wap.xhtml+xml,8685,8649,0.0003\nCC-MAIN-2021-49,application/x-bibtex,
110839,110839,0.0044\nCC-MAIN-2021-49,application/x-bittorrent,6498,6497,0.0003\nCC-MAIN-2021-49,application/x-debian-package,412,411,0.0000\nCC-MAIN-2021-49,application/x-download,57742,57342,0.0023\nCC-MAIN-2021-49,application/x-endnote-refer,125038,125036,0.0049\nCC-MAIN-2021-49,application/x-gzip,44686,44673,0.0018\nCC-MAIN-2021-49,application/x-httpd-php,7166,7129,0.0003\nCC-MAIN-2021-49,application/x-java-jnlp-file,13559,13535,0.0005\nCC-MAIN-2021-49,application/x-javascript,7549,7488,0.0003\nCC-MAIN-2021-49,application/x-json,17,17,0.0000\nCC-MAIN-2021-49,application/x-mobipocket-ebook,6061,6057,0.0002\nCC-MAIN-2021-49,application/x-msdownload,10289,10189,0.0004\nCC-MAIN-2021-49,application/x-netcdf,25549,25549,0.0010\nCC-MAIN-2021-49,application/x-research-info-systems,289480,289478,0.0115\nCC-MAIN-2021-49,application/x-shockwave-flash,12489,12458,0.0005\nCC-MAIN-2021-49,application/x-tar,15321,15312,0.0006\nCC-MAIN-2021-49,application/x-tex,7394,7394,0.0003\nCC-MAIN-2021-49,application/x-troff-man,16310,16306,0.0006\nCC-MAIN-2021-49,application/x-zip-compressed,26689,26561,0.0011\nCC-MAIN-2021-49,application/xhtml+xml,1653195,1650782,0.0654\nCC-MAIN-2021-49,application/xml,956493,955532,0.0378\nCC-MAIN-2021-49,application/zip,185505,184665,0.0073\nCC-MAIN-2021-49,audio/mpeg,134021,132432,0.0053\nCC-MAIN-2021-49,audio/x-mpegurl,25936,25923,0.0010\nCC-MAIN-2021-49,audio/x-scpls,4488,4481,0.0002\nCC-MAIN-2021-49,audio/x-wav,6044,5952,0.0002\nCC-MAIN-2021-49,binary/octet-stream,45091,45007,0.0018\nCC-MAIN-2021-49,image/gif,206854,206347,0.0082\nCC-MAIN-2021-49,image/jp2,919,919,0.0000\nCC-MAIN-2021-49,image/jpeg,5719156,5707070,0.2263\nCC-MAIN-2021-49,image/jpg,82544,82273,0.0033\nCC-MAIN-2021-49,image/pjpeg,22523,22452,0.0009\nCC-MAIN-2021-49,image/png,1002821,1000016,0.0397\nCC-MAIN-2021-49,image/svg+xml,29173,29144,0.0012\nCC-MAIN-2021-49,image/tiff,22413,22410,0.0009\nCC-MAIN-2021-49,image/vnd.djvu,14321,14320,0.0006\nCC-MAIN-2021-49,image/webp,18219,18214,
0.0007\nCC-MAIN-2021-49,message/rfc822,24307,24305,0.0010\nCC-MAIN-2021-49,text/calendar,1195548,1195312,0.0473\nCC-MAIN-2021-49,text/css,11985,11926,0.0005\nCC-MAIN-2021-49,text/csv,186108,186054,0.0074\nCC-MAIN-2021-49,text/directory,8295,8295,0.0003\nCC-MAIN-2021-49,text/enriched,28933,28933,0.0011\nCC-MAIN-2021-49,text/html,2462602194,2446291534,97.4487\nCC-MAIN-2021-49,text/javascript,20540,20525,0.0008\nCC-MAIN-2021-49,text/markdown,5162,5157,0.0002\nCC-MAIN-2021-49,text/pdf,1007,1007,0.0000\nCC-MAIN-2021-49,text/plain,2580687,2579544,0.1021\nCC-MAIN-2021-49,text/prs.lines.tag,20395,20395,0.0008\nCC-MAIN-2021-49,text/tab-separated-values,29270,29270,0.0012\nCC-MAIN-2021-49,text/turtle,54389,54388,0.0022\nCC-MAIN-2021-49,text/vcard,48657,48631,0.0019\nCC-MAIN-2021-49,text/x-bibtex,18549,18520,0.0007\nCC-MAIN-2021-49,text/x-c,24064,24063,0.0010\nCC-MAIN-2021-49,text/x-csrc,24384,24383,0.0010\nCC-MAIN-2021-49,text/x-diff,11882,11857,0.0005\nCC-MAIN-2021-49,text/x-patch,23185,23164,0.0009\nCC-MAIN-2021-49,text/x-perl,1935,1935,0.0001\nCC-MAIN-2021-49,text/x-vcalendar,20530,20530,0.0008\nCC-MAIN-2021-49,text/x-vcard,76494,76481,0.0030\nCC-MAIN-2021-49,text/xml,2135484,2133113,0.0845\nCC-MAIN-2021-49,unknown/unknown,14896,14892,0.0006\nCC-MAIN-2021-49,video/mp4,85697,84886,0.0034\nCC-MAIN-2021-49,video/webm,3694,3694,0.0001\nCC-MAIN-2021-49,video/x-ms-asf,8272,8272,0.0003\nCC-MAIN-2022-05,<other>,2496214,2491311,0.0836\nCC-MAIN-2022-05,application/atom+xml,2442704,2442561,0.0818\nCC-MAIN-2022-05,application/calendar,8176,8174,0.0003\nCC-MAIN-2022-05,application/download,88190,88181,0.0030\nCC-MAIN-2022-05,application/epub+zip,60654,60624,0.0020\nCC-MAIN-2022-05,application/force-download,133313,133304,0.0045\nCC-MAIN-2022-05,application/gpx+xml,12956,12956,0.0004\nCC-MAIN-2022-05,application/ics,9289,9289,0.0003\nCC-MAIN-2022-05,application/javascript,6140,6137,0.0002\nCC-MAIN-2022-05,application/json,835105,834888,0.0280\nCC-MAIN-2022-05,application/ld+json,26254,2
6243,0.0009\nCC-MAIN-2022-05,application/marc,14089,14089,0.0005\nCC-MAIN-2022-05,application/msword,100158,99951,0.0034\nCC-MAIN-2022-05,application/octet-stream,1586448,1584890,0.0531\nCC-MAIN-2022-05,application/octetstream,9642,9638,0.0003\nCC-MAIN-2022-05,application/pdf,25020936,24963211,0.8378\nCC-MAIN-2022-05,application/pgp-encrypted,3383,3383,0.0001\nCC-MAIN-2022-05,application/pgp-signature,65144,65143,0.0022\nCC-MAIN-2022-05,application/postscript,5670,5663,0.0002\nCC-MAIN-2022-05,application/rdf+xml,143064,143053,0.0048\nCC-MAIN-2022-05,application/rss+xml,2014466,2013023,0.0675\nCC-MAIN-2022-05,application/rtf,29841,29840,0.0010\nCC-MAIN-2022-05,application/save-to-disk,112,112,0.0000\nCC-MAIN-2022-05,application/text,70343,70342,0.0024\nCC-MAIN-2022-05,application/unknown,11105,11104,0.0004\nCC-MAIN-2022-05,application/vnd.android.package-archive,11683,11609,0.0004\nCC-MAIN-2022-05,application/vnd.google-earth.kml+xml,53786,53759,0.0018\nCC-MAIN-2022-05,application/vnd.google-earth.kmz,24335,24334,0.0008\nCC-MAIN-2022-05,application/vnd.ms-excel,69088,68912,0.0023\nCC-MAIN-2022-05,application/vnd.ms-powerpoint,20671,20668,0.0007\nCC-MAIN-2022-05,application/vnd.ms-word,21260,21260,0.0007\nCC-MAIN-2022-05,application/vnd.oasis.opendocument.text,28004,28000,0.0009\nCC-MAIN-2022-05,application/vnd.openxmlformats-officedocument.presentationml.presentation,8136,8061,0.0003\nCC-MAIN-2022-05,application/vnd.openxmlformats-officedocument.spreadsheetml.sheet,52306,52175,0.0018\nCC-MAIN-2022-05,application/vnd.openxmlformats-officedocument.wordprocessingml.document,78521,78321,0.0026\nCC-MAIN-2022-05,application/vnd.wap.xhtml+xml,6448,6431,0.0002\nCC-MAIN-2022-05,application/x-bibtex,104295,104295,0.0035\nCC-MAIN-2022-05,application/x-bittorrent,6465,6464,0.0002\nCC-MAIN-2022-05,application/x-debian-package,644,643,0.0000\nCC-MAIN-2022-05,application/x-download,55395,54993,0.0019\nCC-MAIN-2022-05,application/x-endnote-refer,125858,125858,0.0042\nCC-MAIN-2022-05
,application/x-gzip,37976,37970,0.0013\nCC-MAIN-2022-05,application/x-httpd-php,8874,8829,0.0003\nCC-MAIN-2022-05,application/x-java-jnlp-file,14449,14398,0.0005\nCC-MAIN-2022-05,application/x-javascript,5977,5917,0.0002\nCC-MAIN-2022-05,application/x-json,45,45,0.0000\nCC-MAIN-2022-05,application/x-mobipocket-ebook,5796,5794,0.0002\nCC-MAIN-2022-05,application/x-msdownload,10981,10840,0.0004\nCC-MAIN-2022-05,application/x-netcdf,13623,13623,0.0005\nCC-MAIN-2022-05,application/x-research-info-systems,284311,284310,0.0095\nCC-MAIN-2022-05,application/x-shockwave-flash,9599,9572,0.0003\nCC-MAIN-2022-05,application/x-tar,23559,23556,0.0008\nCC-MAIN-2022-05,application/x-tex,7085,7082,0.0002\nCC-MAIN-2022-05,application/x-troff-man,18140,18135,0.0006\nCC-MAIN-2022-05,application/x-zip-compressed,28282,28201,0.0009\nCC-MAIN-2022-05,application/xhtml+xml,1659722,1658548,0.0556\nCC-MAIN-2022-05,application/xml,964988,964294,0.0323\nCC-MAIN-2022-05,application/zip,195705,194958,0.0066\nCC-MAIN-2022-05,audio/mpeg,105007,103573,0.0035\nCC-MAIN-2022-05,audio/x-mpegurl,27408,27368,0.0009\nCC-MAIN-2022-05,audio/x-scpls,3559,3549,0.0001\nCC-MAIN-2022-05,audio/x-wav,5077,4969,0.0002\nCC-MAIN-2022-05,binary/octet-stream,21702,21667,0.0007\nCC-MAIN-2022-05,image/gif,172437,172088,0.0058\nCC-MAIN-2022-05,image/jp2,1534,1534,0.0001\nCC-MAIN-2022-05,image/jpeg,4449886,4441925,0.1490\nCC-MAIN-2022-05,image/jpg,75572,75328,0.0025\nCC-MAIN-2022-05,image/pjpeg,62107,62107,0.0021\nCC-MAIN-2022-05,image/png,754835,752819,0.0253\nCC-MAIN-2022-05,image/svg+xml,27601,27584,0.0009\nCC-MAIN-2022-05,image/tiff,16916,16915,0.0006\nCC-MAIN-2022-05,image/vnd.djvu,15026,15024,0.0005\nCC-MAIN-2022-05,image/webp,11718,11609,0.0004\nCC-MAIN-2022-05,message/rfc822,14319,14318,0.0005\nCC-MAIN-2022-05,text/calendar,1024586,1024429,0.0343\nCC-MAIN-2022-05,text/css,12144,12112,0.0004\nCC-MAIN-2022-05,text/csv,171155,171102,0.0057\nCC-MAIN-2022-05,text/directory,9738,9733,0.0003\nCC-MAIN-2022-05,text/enriched,
29158,29158,0.0010\nCC-MAIN-2022-05,text/html,2935178256,2919958170,98.2851\nCC-MAIN-2022-05,text/javascript,11717,11689,0.0004\nCC-MAIN-2022-05,text/markdown,5226,5226,0.0002\nCC-MAIN-2022-05,text/pdf,595,595,0.0000\nCC-MAIN-2022-05,text/plain,2323250,2322491,0.0778\nCC-MAIN-2022-05,text/prs.lines.tag,12825,12825,0.0004\nCC-MAIN-2022-05,text/tab-separated-values,24611,24611,0.0008\nCC-MAIN-2022-05,text/turtle,54722,54719,0.0018\nCC-MAIN-2022-05,text/vcard,39372,39367,0.0013\nCC-MAIN-2022-05,text/x-bibtex,18821,18817,0.0006\nCC-MAIN-2022-05,text/x-c,16775,16775,0.0006\nCC-MAIN-2022-05,text/x-csrc,28118,28118,0.0009\nCC-MAIN-2022-05,text/x-diff,8633,8626,0.0003\nCC-MAIN-2022-05,text/x-patch,26698,26683,0.0009\nCC-MAIN-2022-05,text/x-perl,2958,2958,0.0001\nCC-MAIN-2022-05,text/x-vcalendar,13362,13362,0.0004\nCC-MAIN-2022-05,text/x-vcard,63781,63759,0.0021\nCC-MAIN-2022-05,text/xml,2311054,2308477,0.0774\nCC-MAIN-2022-05,unknown/unknown,15377,15377,0.0005\nCC-MAIN-2022-05,video/mp4,63395,63143,0.0021\nCC-MAIN-2022-05,video/webm,3223,3223,0.0001\nCC-MAIN-2022-05,video/x-ms-asf,8373,8372,0.0003\nCC-MAIN-2022-21,<other>,2084315,2079682,0.0604\nCC-MAIN-2022-21,application/atom+xml,3001754,3001524,0.0870\nCC-MAIN-2022-21,application/calendar,9721,9719,0.0003\nCC-MAIN-2022-21,application/download,96407,96405,0.0028\nCC-MAIN-2022-21,application/epub+zip,41118,41072,0.0012\nCC-MAIN-2022-21,application/force-download,146268,146251,0.0042\nCC-MAIN-2022-21,application/gpx+xml,14570,14568,0.0004\nCC-MAIN-2022-21,application/ics,12819,12819,0.0004\nCC-MAIN-2022-21,application/javascript,6854,6849,0.0002\nCC-MAIN-2022-21,application/json,797498,797246,0.0231\nCC-MAIN-2022-21,application/ld+json,24520,24520,0.0007\nCC-MAIN-2022-21,application/marc,12563,12563,0.0004\nCC-MAIN-2022-21,application/msword,97011,96849,0.0028\nCC-MAIN-2022-21,application/octet-stream,1370374,1369063,0.0397\nCC-MAIN-2022-21,application/octetstream,9461,9456,0.0003\nCC-MAIN-2022-21,application/pdf,26832203,2
6771883,0.7778\nCC-MAIN-2022-21,application/pgp-encrypted,4187,4187,0.0001\nCC-MAIN-2022-21,application/pgp-signature,58458,58449,0.0017\nCC-MAIN-2022-21,application/postscript,5871,5865,0.0002\nCC-MAIN-2022-21,application/rdf+xml,115382,115374,0.0033\nCC-MAIN-2022-21,application/rss+xml,2036550,2034195,0.0590\nCC-MAIN-2022-21,application/rtf,36313,36293,0.0011\nCC-MAIN-2022-21,application/save-to-disk,86,86,0.0000\nCC-MAIN-2022-21,application/text,87823,87812,0.0025\nCC-MAIN-2022-21,application/unknown,10795,10793,0.0003\nCC-MAIN-2022-21,application/vnd.android.package-archive,8303,8243,0.0002\nCC-MAIN-2022-21,application/vnd.google-earth.kml+xml,47280,47259,0.0014\nCC-MAIN-2022-21,application/vnd.google-earth.kmz,10973,10969,0.0003\nCC-MAIN-2022-21,application/vnd.ms-excel,59046,58985,0.0017\nCC-MAIN-2022-21,application/vnd.ms-powerpoint,14465,14465,0.0004\nCC-MAIN-2022-21,application/vnd.ms-word,17335,17335,0.0005\nCC-MAIN-2022-21,application/vnd.oasis.opendocument.text,23573,23529,0.0007\nCC-MAIN-2022-21,application/vnd.openxmlformats-officedocument.presentationml.presentation,7805,7761,0.0002\nCC-MAIN-2022-21,application/vnd.openxmlformats-officedocument.spreadsheetml.sheet,49171,49123,0.0014\nCC-MAIN-2022-21,application/vnd.openxmlformats-officedocument.wordprocessingml.document,75962,75711,0.0022\nCC-MAIN-2022-21,application/vnd.wap.xhtml+xml,17660,17584,0.0005\nCC-MAIN-2022-21,application/x-bibtex,80616,80602,0.0023\nCC-MAIN-2022-21,application/x-bittorrent,5366,5366,0.0002\nCC-MAIN-2022-21,application/x-debian-package,276,276,0.0000\nCC-MAIN-2022-21,application/x-download,42388,42308,0.0012\nCC-MAIN-2022-21,application/x-endnote-refer,111352,111340,0.0032\nCC-MAIN-2022-21,application/x-gzip,52244,52233,0.0015\nCC-MAIN-2022-21,application/x-httpd-php,6003,5943,0.0002\nCC-MAIN-2022-21,application/x-java-jnlp-file,10312,10288,0.0003\nCC-MAIN-2022-21,application/x-javascript,9758,9678,0.0003\nCC-MAIN-2022-21,application/x-json,29,29,0.0000\nCC-MAIN-2022-21,appl
ication/x-mobipocket-ebook,4667,4661,0.0001\nCC-MAIN-2022-21,application/x-msdownload,10778,10678,0.0003\nCC-MAIN-2022-21,application/x-netcdf,25911,25911,0.0008\nCC-MAIN-2022-21,application/x-research-info-systems,204057,204044,0.0059\nCC-MAIN-2022-21,application/x-shockwave-flash,8793,8784,0.0003\nCC-MAIN-2022-21,application/x-tar,18685,18676,0.0005\nCC-MAIN-2022-21,application/x-tex,4870,4869,0.0001\nCC-MAIN-2022-21,application/x-troff-man,15967,15960,0.0005\nCC-MAIN-2022-21,application/x-zip-compressed,20067,19859,0.0006\nCC-MAIN-2022-21,application/xhtml+xml,1765483,1763813,0.0512\nCC-MAIN-2022-21,application/xml,941510,940105,0.0273\nCC-MAIN-2022-21,application/zip,166355,165640,0.0048\nCC-MAIN-2022-21,audio/mpeg,107137,106025,0.0031\nCC-MAIN-2022-21,audio/x-mpegurl,25405,25398,0.0007\nCC-MAIN-2022-21,audio/x-scpls,3488,3484,0.0001\nCC-MAIN-2022-21,audio/x-wav,3920,3746,0.0001\nCC-MAIN-2022-21,binary/octet-stream,13094,13016,0.0004\nCC-MAIN-2022-21,image/gif,199332,198956,0.0058\nCC-MAIN-2022-21,image/jp2,1448,1448,0.0000\nCC-MAIN-2022-21,image/jpeg,6284096,6271676,0.1822\nCC-MAIN-2022-21,image/jpg,72191,70848,0.0021\nCC-MAIN-2022-21,image/pjpeg,31168,31168,0.0009\nCC-MAIN-2022-21,image/png,1443465,1439912,0.0418\nCC-MAIN-2022-21,image/svg+xml,44979,44941,0.0013\nCC-MAIN-2022-21,image/tiff,14080,14056,0.0004\nCC-MAIN-2022-21,image/vnd.djvu,11769,11767,0.0003\nCC-MAIN-2022-21,image/webp,19552,19499,0.0006\nCC-MAIN-2022-21,message/rfc822,8931,8931,0.0003\nCC-MAIN-2022-21,text/calendar,966546,966165,0.0280\nCC-MAIN-2022-21,text/css,13317,13293,0.0004\nCC-MAIN-2022-21,text/csv,157604,157556,0.0046\nCC-MAIN-2022-21,text/directory,8545,8541,0.0002\nCC-MAIN-2022-21,text/enriched,33190,33185,0.0010\nCC-MAIN-2022-21,text/html,3395013929,3373088669,98.4112\nCC-MAIN-2022-21,text/javascript,14911,14891,0.0004\nCC-MAIN-2022-21,text/markdown,5522,5520,0.0002\nCC-MAIN-2022-21,text/pdf,260,260,0.0000\nCC-MAIN-2022-21,text/plain,2001809,2000814,0.0580\nCC-MAIN-2022-21,text/prs
.lines.tag,22095,22095,0.0006\nCC-MAIN-2022-21,text/tab-separated-values,25329,25316,0.0007\nCC-MAIN-2022-21,text/turtle,40937,40918,0.0012\nCC-MAIN-2022-21,text/vcard,42643,42635,0.0012\nCC-MAIN-2022-21,text/x-bibtex,25170,25170,0.0007\nCC-MAIN-2022-21,text/x-c,5585,5584,0.0002\nCC-MAIN-2022-21,text/x-csrc,22975,22974,0.0007\nCC-MAIN-2022-21,text/x-diff,8993,8986,0.0003\nCC-MAIN-2022-21,text/x-patch,17939,17923,0.0005\nCC-MAIN-2022-21,text/x-perl,3555,3555,0.0001\nCC-MAIN-2022-21,text/x-vcalendar,15260,15260,0.0004\nCC-MAIN-2022-21,text/x-vcard,60071,60030,0.0017\nCC-MAIN-2022-21,text/xml,2178194,2174663,0.0631\nCC-MAIN-2022-21,unknown/unknown,6512,6512,0.0002\nCC-MAIN-2022-21,video/mp4,88276,88156,0.0026\nCC-MAIN-2022-21,video/webm,3416,3415,0.0001\nCC-MAIN-2022-21,video/x-ms-asf,7596,7592,0.0002\nCC-MAIN-2022-27,<other>,2200618,2195983,0.0708\nCC-MAIN-2022-27,application/atom+xml,3361465,3361270,0.1081\nCC-MAIN-2022-27,application/calendar,15710,15705,0.0005\nCC-MAIN-2022-27,application/download,116504,116500,0.0037\nCC-MAIN-2022-27,application/epub+zip,46159,46147,0.0015\nCC-MAIN-2022-27,application/force-download,177114,177087,0.0057\nCC-MAIN-2022-27,application/gpx+xml,16142,16141,0.0005\nCC-MAIN-2022-27,application/ics,16079,16075,0.0005\nCC-MAIN-2022-27,application/javascript,7430,7423,0.0002\nCC-MAIN-2022-27,application/json,791372,791144,0.0254\nCC-MAIN-2022-27,application/ld+json,31150,31102,0.0010\nCC-MAIN-2022-27,application/marc,12903,12903,0.0004\nCC-MAIN-2022-27,application/msword,112537,112435,0.0036\nCC-MAIN-2022-27,application/octet-stream,1673631,1671981,0.0538\nCC-MAIN-2022-27,application/octetstream,10503,10502,0.0003\nCC-MAIN-2022-27,application/pdf,30914874,30838517,0.9942\nCC-MAIN-2022-27,application/pgp-encrypted,3536,3536,0.0001\nCC-MAIN-2022-27,application/pgp-signature,62854,62852,0.0020\nCC-MAIN-2022-27,application/postscript,5842,5838,0.0002\nCC-MAIN-2022-27,application/rdf+xml,124672,124641,0.0040\nCC-MAIN-2022-27,application/rss+xml,
2158883,2157096,0.0694\nCC-MAIN-2022-27,application/rtf,35394,35384,0.0011\nCC-MAIN-2022-27,application/save-to-disk,152,152,0.0000\nCC-MAIN-2022-27,application/text,73507,73506,0.0024\nCC-MAIN-2022-27,application/unknown,10812,10812,0.0003\nCC-MAIN-2022-27,application/vnd.android.package-archive,8039,7928,0.0003\nCC-MAIN-2022-27,application/vnd.google-earth.kml+xml,47041,47003,0.0015\nCC-MAIN-2022-27,application/vnd.google-earth.kmz,8444,8441,0.0003\nCC-MAIN-2022-27,application/vnd.ms-excel,76467,76379,0.0025\nCC-MAIN-2022-27,application/vnd.ms-powerpoint,15263,15259,0.0005\nCC-MAIN-2022-27,application/vnd.ms-word,19927,19926,0.0006\nCC-MAIN-2022-27,application/vnd.oasis.opendocument.text,28378,28369,0.0009\nCC-MAIN-2022-27,application/vnd.openxmlformats-officedocument.presentationml.presentation,10376,10337,0.0003\nCC-MAIN-2022-27,application/vnd.openxmlformats-officedocument.spreadsheetml.sheet,56476,56261,0.0018\nCC-MAIN-2022-27,application/vnd.openxmlformats-officedocument.wordprocessingml.document,97400,97188,0.0031\nCC-MAIN-2022-27,application/vnd.wap.xhtml+xml,21987,21880,0.0007\nCC-MAIN-2022-27,application/x-bibtex,90592,90568,0.0029\nCC-MAIN-2022-27,application/x-bittorrent,5563,5561,0.0002\nCC-MAIN-2022-27,application/x-debian-package,638,638,0.0000\nCC-MAIN-2022-27,application/x-download,48205,48200,0.0016\nCC-MAIN-2022-27,application/x-endnote-refer,104025,104009,0.0033\nCC-MAIN-2022-27,application/x-gzip,42763,42689,0.0014\nCC-MAIN-2022-27,application/x-httpd-php,5115,5094,0.0002\nCC-MAIN-2022-27,application/x-java-jnlp-file,4370,4365,0.0001\nCC-MAIN-2022-27,application/x-javascript,10517,10455,0.0003\nCC-MAIN-2022-27,application/x-json,84,84,0.0000\nCC-MAIN-2022-27,application/x-mobipocket-ebook,4901,4901,0.0002\nCC-MAIN-2022-27,application/x-msdownload,13629,13405,0.0004\nCC-MAIN-2022-27,application/x-netcdf,52096,52096,0.0017\nCC-MAIN-2022-27,application/x-research-info-systems,220836,220809,0.0071\nCC-MAIN-2022-27,application/x-shockwave-flash,8159
,8151,0.0003\nCC-MAIN-2022-27,application/x-tar,12678,12672,0.0004\nCC-MAIN-2022-27,application/x-tex,4661,4661,0.0001\nCC-MAIN-2022-27,application/x-troff-man,25100,25100,0.0008\nCC-MAIN-2022-27,application/x-zip-compressed,24873,24727,0.0008\nCC-MAIN-2022-27,application/xhtml+xml,1543912,1542350,0.0496\nCC-MAIN-2022-27,application/xml,996452,995430,0.0320\nCC-MAIN-2022-27,application/zip,196916,196062,0.0063\nCC-MAIN-2022-27,audio/mpeg,127136,125868,0.0041\nCC-MAIN-2022-27,audio/x-mpegurl,32172,32146,0.0010\nCC-MAIN-2022-27,audio/x-scpls,4922,4914,0.0002\nCC-MAIN-2022-27,audio/x-wav,5111,4992,0.0002\nCC-MAIN-2022-27,binary/octet-stream,42933,42919,0.0014\nCC-MAIN-2022-27,image/gif,145481,145119,0.0047\nCC-MAIN-2022-27,image/jp2,689,689,0.0000\nCC-MAIN-2022-27,image/jpeg,5509572,5499230,0.1772\nCC-MAIN-2022-27,image/jpg,86455,86390,0.0028\nCC-MAIN-2022-27,image/pjpeg,34205,34203,0.0011\nCC-MAIN-2022-27,image/png,1101330,1096951,0.0354\nCC-MAIN-2022-27,image/svg+xml,37901,37875,0.0012\nCC-MAIN-2022-27,image/tiff,21731,21731,0.0007\nCC-MAIN-2022-27,image/vnd.djvu,10235,10235,0.0003\nCC-MAIN-2022-27,image/webp,21973,21949,0.0007\nCC-MAIN-2022-27,message/rfc822,9542,9542,0.0003\nCC-MAIN-2022-27,text/calendar,1113605,1113130,0.0358\nCC-MAIN-2022-27,text/css,14543,14522,0.0005\nCC-MAIN-2022-27,text/csv,143612,143559,0.0046\nCC-MAIN-2022-27,text/directory,10079,10079,0.0003\nCC-MAIN-2022-27,text/enriched,25902,25902,0.0008\nCC-MAIN-2022-27,text/html,3050744070,3033044068,98.1070\nCC-MAIN-2022-27,text/javascript,8325,8306,0.0003\nCC-MAIN-2022-27,text/markdown,5621,5620,0.0002\nCC-MAIN-2022-27,text/pdf,480,480,0.0000\nCC-MAIN-2022-27,text/plain,2014936,2013945,0.0648\nCC-MAIN-2022-27,text/prs.lines.tag,22510,22510,0.0007\nCC-MAIN-2022-27,text/tab-separated-values,25636,25636,0.0008\nCC-MAIN-2022-27,text/turtle,39583,39551,0.0013\nCC-MAIN-2022-27,text/vcard,36930,36831,0.0012\nCC-MAIN-2022-27,text/x-bibtex,17417,17417,0.0006\nCC-MAIN-2022-27,text/x-c,9207,9207,0.0003\nCC-MAI
N-2022-27,text/x-csrc,18354,18354,0.0006\nCC-MAIN-2022-27,text/x-diff,5696,5695,0.0002\nCC-MAIN-2022-27,text/x-patch,21009,20990,0.0007\nCC-MAIN-2022-27,text/x-perl,4261,4261,0.0001\nCC-MAIN-2022-27,text/x-vcalendar,14843,14843,0.0005\nCC-MAIN-2022-27,text/x-vcard,69954,69943,0.0022\nCC-MAIN-2022-27,text/xml,2176438,2173916,0.0700\nCC-MAIN-2022-27,unknown/unknown,8062,8061,0.0003\nCC-MAIN-2022-27,video/mp4,69515,69304,0.0022\nCC-MAIN-2022-27,video/webm,6570,6564,0.0002\nCC-MAIN-2022-27,video/x-ms-asf,5400,5398,0.0002\nCC-MAIN-2022-33,<other>,2904953,2899590,0.1122\nCC-MAIN-2022-33,application/atom+xml,2812723,2812550,0.1087\nCC-MAIN-2022-33,application/calendar,9616,9615,0.0004\nCC-MAIN-2022-33,application/download,102599,102586,0.0040\nCC-MAIN-2022-33,application/epub+zip,56465,56451,0.0022\nCC-MAIN-2022-33,application/force-download,203438,203351,0.0079\nCC-MAIN-2022-33,application/gpx+xml,15653,15653,0.0006\nCC-MAIN-2022-33,application/ics,14925,14924,0.0006\nCC-MAIN-2022-33,application/javascript,8242,8238,0.0003\nCC-MAIN-2022-33,application/json,813121,812930,0.0314\nCC-MAIN-2022-33,application/ld+json,31014,31003,0.0012\nCC-MAIN-2022-33,application/marc,11469,11465,0.0004\nCC-MAIN-2022-33,application/msword,113401,113088,0.0044\nCC-MAIN-2022-33,application/octet-stream,1676161,1674438,0.0647\nCC-MAIN-2022-33,application/octetstream,12410,12402,0.0005\nCC-MAIN-2022-33,application/pdf,28497506,28437384,1.1008\nCC-MAIN-2022-33,application/pgp-encrypted,5816,5816,0.0002\nCC-MAIN-2022-33,application/pgp-signature,61614,61609,0.0024\nCC-MAIN-2022-33,application/postscript,6527,6495,0.0003\nCC-MAIN-2022-33,application/rdf+xml,132699,132683,0.0051\nCC-MAIN-2022-33,application/rss+xml,1991615,1989897,0.0769\nCC-MAIN-2022-33,application/rtf,40654,40631,0.0016\nCC-MAIN-2022-33,application/save-to-disk,233,233,0.0000\nCC-MAIN-2022-33,application/text,75166,75158,0.0029\nCC-MAIN-2022-33,application/unknown,12174,12171,0.0005\nCC-MAIN-2022-33,application/vnd.android.package
-archive,5852,5757,0.0002\nCC-MAIN-2022-33,application/vnd.google-earth.kml+xml,43668,43657,0.0017\nCC-MAIN-2022-33,application/vnd.google-earth.kmz,10174,10171,0.0004\nCC-MAIN-2022-33,application/vnd.ms-excel,74486,74296,0.0029\nCC-MAIN-2022-33,application/vnd.ms-powerpoint,18358,18347,0.0007\nCC-MAIN-2022-33,application/vnd.ms-word,20223,20221,0.0008\nCC-MAIN-2022-33,application/vnd.oasis.opendocument.text,28477,28449,0.0011\nCC-MAIN-2022-33,application/vnd.openxmlformats-officedocument.presentationml.presentation,9485,9405,0.0004\nCC-MAIN-2022-33,application/vnd.openxmlformats-officedocument.spreadsheetml.sheet,59576,59296,0.0023\nCC-MAIN-2022-33,application/vnd.openxmlformats-officedocument.wordprocessingml.document,102784,102512,0.0040\nCC-MAIN-2022-33,application/vnd.wap.xhtml+xml,24906,24748,0.0010\nCC-MAIN-2022-33,application/x-bibtex,100050,100020,0.0039\nCC-MAIN-2022-33,application/x-bittorrent,6492,6491,0.0003\nCC-MAIN-2022-33,application/x-debian-package,436,436,0.0000\nCC-MAIN-2022-33,application/x-download,53790,53761,0.0021\nCC-MAIN-2022-33,application/x-endnote-refer,102940,102922,0.0040\nCC-MAIN-2022-33,application/x-gzip,48778,48671,0.0019\nCC-MAIN-2022-33,application/x-httpd-php,11851,11822,0.0005\nCC-MAIN-2022-33,application/x-java-jnlp-file,4493,4489,0.0002\nCC-MAIN-2022-33,application/x-javascript,11060,10985,0.0004\nCC-MAIN-2022-33,application/x-json,29,29,0.0000\nCC-MAIN-2022-33,application/x-mobipocket-ebook,5859,5859,0.0002\nCC-MAIN-2022-33,application/x-msdownload,16034,15886,0.0006\nCC-MAIN-2022-33,application/x-netcdf,58170,58170,0.0022\nCC-MAIN-2022-33,application/x-research-info-systems,218018,217992,0.0084\nCC-MAIN-2022-33,application/x-shockwave-flash,8321,8312,0.0003\nCC-MAIN-2022-33,application/x-tar,10291,10289,0.0004\nCC-MAIN-2022-33,application/x-tex,5249,5249,0.0002\nCC-MAIN-2022-33,application/x-troff-man,20896,20893,0.0008\nCC-MAIN-2022-33,application/x-zip-compressed,25674,25527,0.0010\nCC-MAIN-2022-33,application/xhtml+xml,
1637116,1635336,0.0632\nCC-MAIN-2022-33,application/xml,913400,911582,0.0353\nCC-MAIN-2022-33,application/zip,218648,217690,0.0084\nCC-MAIN-2022-33,audio/mpeg,119622,118353,0.0046\nCC-MAIN-2022-33,audio/x-mpegurl,35828,35789,0.0014\nCC-MAIN-2022-33,audio/x-scpls,3046,3035,0.0001\nCC-MAIN-2022-33,audio/x-wav,7034,6974,0.0003\nCC-MAIN-2022-33,binary/octet-stream,14770,14734,0.0006\nCC-MAIN-2022-33,image/gif,159721,159299,0.0062\nCC-MAIN-2022-33,image/jp2,310,310,0.0000\nCC-MAIN-2022-33,image/jpeg,6467320,6447810,0.2498\nCC-MAIN-2022-33,image/jpg,79930,79756,0.0031\nCC-MAIN-2022-33,image/pjpeg,23488,23487,0.0009\nCC-MAIN-2022-33,image/png,1248562,1243679,0.0482\nCC-MAIN-2022-33,image/svg+xml,42844,42761,0.0017\nCC-MAIN-2022-33,image/tiff,18665,18665,0.0007\nCC-MAIN-2022-33,image/vnd.djvu,14279,14279,0.0006\nCC-MAIN-2022-33,image/webp,24859,24762,0.0010\nCC-MAIN-2022-33,message/rfc822,8610,8610,0.0003\nCC-MAIN-2022-33,text/calendar,1257561,1257265,0.0486\nCC-MAIN-2022-33,text/css,9622,9597,0.0004\nCC-MAIN-2022-33,text/csv,151871,151831,0.0059\nCC-MAIN-2022-33,text/directory,7490,7478,0.0003\nCC-MAIN-2022-33,text/enriched,27351,27348,0.0011\nCC-MAIN-2022-33,text/html,2531107776,2512640796,97.7756\nCC-MAIN-2022-33,text/javascript,16689,16661,0.0006\nCC-MAIN-2022-33,text/markdown,6859,6858,0.0003\nCC-MAIN-2022-33,text/pdf,722,722,0.0000\nCC-MAIN-2022-33,text/plain,2031083,2028607,0.0785\nCC-MAIN-2022-33,text/prs.lines.tag,13034,13034,0.0005\nCC-MAIN-2022-33,text/tab-separated-values,25993,25977,0.0010\nCC-MAIN-2022-33,text/turtle,41337,41329,0.0016\nCC-MAIN-2022-33,text/vcard,36867,36846,0.0014\nCC-MAIN-2022-33,text/x-bibtex,17649,17648,0.0007\nCC-MAIN-2022-33,text/x-c,6564,6556,0.0003\nCC-MAIN-2022-33,text/x-csrc,22440,22439,0.0009\nCC-MAIN-2022-33,text/x-diff,6924,6919,0.0003\nCC-MAIN-2022-33,text/x-patch,21399,21368,0.0008\nCC-MAIN-2022-33,text/x-perl,3675,3675,0.0001\nCC-MAIN-2022-33,text/x-vcalendar,14457,14453,0.0006\nCC-MAIN-2022-33,text/x-vcard,68120,68084,0.0026\n
CC-MAIN-2022-33,text/xml,1958466,1955352,0.0757\nCC-MAIN-2022-33,unknown/unknown,8029,8028,0.0003\nCC-MAIN-2022-33,video/mp4,65225,64995,0.0025\nCC-MAIN-2022-33,video/webm,3969,3951,0.0002\nCC-MAIN-2022-33,video/x-ms-asf,4412,4411,0.0002\nCC-MAIN-2022-40,<other>,2108985,2105527,0.0664\nCC-MAIN-2022-40,application/atom+xml,2233179,2233064,0.0703\nCC-MAIN-2022-40,application/calendar,8973,8970,0.0003\nCC-MAIN-2022-40,application/download,68247,68240,0.0021\nCC-MAIN-2022-40,application/epub+zip,36773,36767,0.0012\nCC-MAIN-2022-40,application/force-download,145930,145904,0.0046\nCC-MAIN-2022-40,application/gpx+xml,11885,11875,0.0004\nCC-MAIN-2022-40,application/ics,10009,10009,0.0003\nCC-MAIN-2022-40,application/javascript,5944,5942,0.0002\nCC-MAIN-2022-40,application/json,772265,772060,0.0243\nCC-MAIN-2022-40,application/ld+json,41426,41109,0.0013\nCC-MAIN-2022-40,application/marc,11201,11200,0.0004\nCC-MAIN-2022-40,application/msword,87686,87570,0.0028\nCC-MAIN-2022-40,application/octet-stream,1530728,1529501,0.0482\nCC-MAIN-2022-40,application/octetstream,9187,9185,0.0003\nCC-MAIN-2022-40,application/pdf,22450733,22397862,0.7067\nCC-MAIN-2022-40,application/pgp-encrypted,3426,3426,0.0001\nCC-MAIN-2022-40,application/pgp-signature,65210,65206,0.0021\nCC-MAIN-2022-40,application/postscript,4525,4516,0.0001\nCC-MAIN-2022-40,application/rdf+xml,133732,133432,0.0042\nCC-MAIN-2022-40,application/rss+xml,1783885,1782247,0.0562\nCC-MAIN-2022-40,application/rtf,36018,36013,0.0011\nCC-MAIN-2022-40,application/save-to-disk,55,55,0.0000\nCC-MAIN-2022-40,application/text,73415,73261,0.0023\nCC-MAIN-2022-40,application/unknown,7754,7754,0.0002\nCC-MAIN-2022-40,application/vnd.android.package-archive,4439,4321,0.0001\nCC-MAIN-2022-40,application/vnd.google-earth.kml+xml,47908,47855,0.0015\nCC-MAIN-2022-40,application/vnd.google-earth.kmz,10840,10839,0.0003\nCC-MAIN-2022-40,application/vnd.ms-excel,58461,58378,0.0018\nCC-MAIN-2022-40,application/vnd.ms-powerpoint,9245,9240,0.0003\nC
C-MAIN-2022-40,application/vnd.ms-word,15107,15107,0.0005\nCC-MAIN-2022-40,application/vnd.oasis.opendocument.text,21729,21710,0.0007\nCC-MAIN-2022-40,application/vnd.openxmlformats-officedocument.presentationml.presentation,6309,6283,0.0002\nCC-MAIN-2022-40,application/vnd.openxmlformats-officedocument.spreadsheetml.sheet,53784,53645,0.0017\nCC-MAIN-2022-40,application/vnd.openxmlformats-officedocument.wordprocessingml.document,74702,74471,0.0024\nCC-MAIN-2022-40,application/vnd.wap.xhtml+xml,27610,27495,0.0009\nCC-MAIN-2022-40,application/x-bibtex,97594,97581,0.0031\nCC-MAIN-2022-40,application/x-bittorrent,5750,5749,0.0002\nCC-MAIN-2022-40,application/x-debian-package,236,236,0.0000\nCC-MAIN-2022-40,application/x-download,52760,52511,0.0017\nCC-MAIN-2022-40,application/x-endnote-refer,109308,109152,0.0034\nCC-MAIN-2022-40,application/x-gzip,40764,40758,0.0013\nCC-MAIN-2022-40,application/x-httpd-php,6661,6638,0.0002\nCC-MAIN-2022-40,application/x-java-jnlp-file,10005,10003,0.0003\nCC-MAIN-2022-40,application/x-javascript,11158,11158,0.0004\nCC-MAIN-2022-40,application/x-json,22,22,0.0000\nCC-MAIN-2022-40,application/x-mobipocket-ebook,5408,5407,0.0002\nCC-MAIN-2022-40,application/x-msdownload,14678,14573,0.0005\nCC-MAIN-2022-40,application/x-netcdf,46938,46935,0.0015\nCC-MAIN-2022-40,application/x-research-info-systems,218904,218890,0.0069\nCC-MAIN-2022-40,application/x-shockwave-flash,5542,5533,0.0002\nCC-MAIN-2022-40,application/x-tar,22729,22723,0.0007\nCC-MAIN-2022-40,application/x-tex,6129,6129,0.0002\nCC-MAIN-2022-40,application/x-troff-man,25582,25582,0.0008\nCC-MAIN-2022-40,application/x-zip-compressed,16325,16089,0.0005\nCC-MAIN-2022-40,application/xhtml+xml,1544489,1542923,0.0486\nCC-MAIN-2022-40,application/xml,838032,836430,0.0264\nCC-MAIN-2022-40,application/zip,195227,193950,0.0061\nCC-MAIN-2022-40,audio/mpeg,97442,96564,0.0031\nCC-MAIN-2022-40,audio/x-mpegurl,29426,29411,0.0009\nCC-MAIN-2022-40,audio/x-scpls,2665,2660,0.0001\nCC-MAIN-2022-40,audio/
x-wav,7623,7621,0.0002\nCC-MAIN-2022-40,binary/octet-stream,15758,15734,0.0005\nCC-MAIN-2022-40,image/gif,134545,134248,0.0042\nCC-MAIN-2022-40,image/jp2,331,330,0.0000\nCC-MAIN-2022-40,image/jpeg,4951710,4940854,0.1559\nCC-MAIN-2022-40,image/jpg,75395,75116,0.0024\nCC-MAIN-2022-40,image/pjpeg,17169,17168,0.0005\nCC-MAIN-2022-40,image/png,993837,990835,0.0313\nCC-MAIN-2022-40,image/svg+xml,31634,31591,0.0010\nCC-MAIN-2022-40,image/tiff,16229,16217,0.0005\nCC-MAIN-2022-40,image/vnd.djvu,13051,13051,0.0004\nCC-MAIN-2022-40,image/webp,30588,30513,0.0010\nCC-MAIN-2022-40,message/rfc822,8083,8082,0.0003\nCC-MAIN-2022-40,text/calendar,1082382,1082029,0.0341\nCC-MAIN-2022-40,text/css,15072,15046,0.0005\nCC-MAIN-2022-40,text/csv,129271,129228,0.0041\nCC-MAIN-2022-40,text/directory,6792,6791,0.0002\nCC-MAIN-2022-40,text/enriched,25679,25677,0.0008\nCC-MAIN-2022-40,text/html,3129332428,3112804018,98.5070\nCC-MAIN-2022-40,text/javascript,6559,6547,0.0002\nCC-MAIN-2022-40,text/markdown,5791,5791,0.0002\nCC-MAIN-2022-40,text/pdf,259,259,0.0000\nCC-MAIN-2022-40,text/plain,2060980,2060355,0.0649\nCC-MAIN-2022-40,text/prs.lines.tag,46257,46257,0.0015\nCC-MAIN-2022-40,text/tab-separated-values,19119,19119,0.0006\nCC-MAIN-2022-40,text/turtle,46950,46664,0.0015\nCC-MAIN-2022-40,text/vcard,29487,29476,0.0009\nCC-MAIN-2022-40,text/x-bibtex,17034,17031,0.0005\nCC-MAIN-2022-40,text/x-c,5479,5479,0.0002\nCC-MAIN-2022-40,text/x-csrc,22308,22307,0.0007\nCC-MAIN-2022-40,text/x-diff,6851,6850,0.0002\nCC-MAIN-2022-40,text/x-patch,13459,13455,0.0004\nCC-MAIN-2022-40,text/x-perl,3680,3678,0.0001\nCC-MAIN-2022-40,text/x-vcalendar,13880,13880,0.0004\nCC-MAIN-2022-40,text/x-vcard,56505,56492,0.0018\nCC-MAIN-2022-40,text/xml,2067214,2064583,0.0651\nCC-MAIN-2022-40,unknown/unknown,6305,6305,0.0002\nCC-MAIN-2022-40,video/mp4,65118,64962,0.0020\nCC-MAIN-2022-40,video/webm,2742,2741,0.0001\nCC-MAIN-2022-40,video/x-ms-asf,4415,4414,0.0001\nCC-MAIN-2022-49,<other>,2419294,2410344,0.0715\nCC-MAIN-2022-49,ap
plication/atom+xml,3085516,3085318,0.0912\nCC-MAIN-2022-49,application/calendar,13881,13881,0.0004\nCC-MAIN-2022-49,application/download,95487,95471,0.0028\nCC-MAIN-2022-49,application/epub+zip,41809,41790,0.0012\nCC-MAIN-2022-49,application/force-download,187110,187094,0.0055\nCC-MAIN-2022-49,application/gpx+xml,16165,16161,0.0005\nCC-MAIN-2022-49,application/ics,16482,16481,0.0005\nCC-MAIN-2022-49,application/javascript,7168,7166,0.0002\nCC-MAIN-2022-49,application/json,844955,844740,0.0250\nCC-MAIN-2022-49,application/ld+json,39559,39538,0.0012\nCC-MAIN-2022-49,application/marc,11846,11846,0.0004\nCC-MAIN-2022-49,application/msword,97857,97727,0.0029\nCC-MAIN-2022-49,application/octet-stream,1676807,1674657,0.0496\nCC-MAIN-2022-49,application/octetstream,8910,8908,0.0003\nCC-MAIN-2022-49,application/pdf,27230038,27164104,0.8052\nCC-MAIN-2022-49,application/pgp-encrypted,4066,4066,0.0001\nCC-MAIN-2022-49,application/pgp-signature,77438,77435,0.0023\nCC-MAIN-2022-49,application/postscript,5285,5279,0.0002\nCC-MAIN-2022-49,application/rdf+xml,129073,129052,0.0038\nCC-MAIN-2022-49,application/rss+xml,2167060,2164777,0.0641\nCC-MAIN-2022-49,application/rtf,43450,43445,0.0013\nCC-MAIN-2022-49,application/save-to-disk,42,42,0.0000\nCC-MAIN-2022-49,application/text,82405,82394,0.0024\nCC-MAIN-2022-49,application/unknown,8339,8339,0.0002\nCC-MAIN-2022-49,application/vnd.android.package-archive,5224,5062,0.0002\nCC-MAIN-2022-49,application/vnd.google-earth.kml+xml,53635,53619,0.0016\nCC-MAIN-2022-49,application/vnd.google-earth.kmz,8671,8669,0.0003\nCC-MAIN-2022-49,application/vnd.ms-excel,61713,61650,0.0018\nCC-MAIN-2022-49,application/vnd.ms-powerpoint,14875,14861,0.0004\nCC-MAIN-2022-49,application/vnd.ms-word,19002,19002,0.0006\nCC-MAIN-2022-49,application/vnd.oasis.opendocument.text,27646,27632,0.0008\nCC-MAIN-2022-49,application/vnd.openxmlformats-officedocument.presentationml.presentation,8916,8886,0.0003\nCC-MAIN-2022-49,application/vnd.openxmlformats-officedocumen
t.spreadsheetml.sheet,58744,58536,0.0017\nCC-MAIN-2022-49,application/vnd.openxmlformats-officedocument.wordprocessingml.document,89646,89324,0.0027\nCC-MAIN-2022-49,application/vnd.wap.xhtml+xml,27577,27441,0.0008\nCC-MAIN-2022-49,application/x-bibtex,96845,96842,0.0029\nCC-MAIN-2022-49,application/x-bittorrent,5100,5099,0.0002\nCC-MAIN-2022-49,application/x-debian-package,59,54,0.0000\nCC-MAIN-2022-49,application/x-download,64363,64354,0.0019\nCC-MAIN-2022-49,application/x-endnote-refer,115638,115624,0.0034\nCC-MAIN-2022-49,application/x-gzip,34192,34173,0.0010\nCC-MAIN-2022-49,application/x-httpd-php,9521,9487,0.0003\nCC-MAIN-2022-49,application/x-java-jnlp-file,2517,2515,0.0001\nCC-MAIN-2022-49,application/x-javascript,12257,12256,0.0004\nCC-MAIN-2022-49,application/x-json,71,71,0.0000\nCC-MAIN-2022-49,application/x-mobipocket-ebook,5506,5490,0.0002\nCC-MAIN-2022-49,application/x-msdownload,11411,11300,0.0003\nCC-MAIN-2022-49,application/x-netcdf,47826,47826,0.0014\nCC-MAIN-2022-49,application/x-research-info-systems,218045,218042,0.0064\nCC-MAIN-2022-49,application/x-shockwave-flash,8214,8201,0.0002\nCC-MAIN-2022-49,application/x-tar,22328,22323,0.0007\nCC-MAIN-2022-49,application/x-tex,6217,6216,0.0002\nCC-MAIN-2022-49,application/x-troff-man,23544,23544,0.0007\nCC-MAIN-2022-49,application/x-zip-compressed,23769,23657,0.0007\nCC-MAIN-2022-49,application/xhtml+xml,1473389,1470633,0.0436\nCC-MAIN-2022-49,application/xml,921784,920564,0.0273\nCC-MAIN-2022-49,application/zip,176787,175613,0.0052\nCC-MAIN-2022-49,audio/mpeg,110528,109506,0.0033\nCC-MAIN-2022-49,audio/x-mpegurl,23433,23406,0.0007\nCC-MAIN-2022-49,audio/x-scpls,3554,3546,0.0001\nCC-MAIN-2022-49,audio/x-wav,7061,7061,0.0002\nCC-MAIN-2022-49,binary/octet-stream,18987,18946,0.0006\nCC-MAIN-2022-49,image/gif,147558,147236,0.0044\nCC-MAIN-2022-49,image/jp2,255,255,0.0000\nCC-MAIN-2022-49,image/jpeg,5046317,5035259,0.1492\nCC-MAIN-2022-49,image/jpg,77767,77239,0.0023\nCC-MAIN-2022-49,image/pjpeg,21709,2170
9,0.0006\nCC-MAIN-2022-49,image/png,889183,886440,0.0263\nCC-MAIN-2022-49,image/svg+xml,30778,30728,0.0009\nCC-MAIN-2022-49,image/tiff,20744,20739,0.0006\nCC-MAIN-2022-49,image/vnd.djvu,7203,7202,0.0002\nCC-MAIN-2022-49,image/webp,40637,40477,0.0012\nCC-MAIN-2022-49,message/rfc822,9265,9263,0.0003\nCC-MAIN-2022-49,text/calendar,1189564,1189279,0.0352\nCC-MAIN-2022-49,text/css,15991,15988,0.0005\nCC-MAIN-2022-49,text/csv,136961,136920,0.0041\nCC-MAIN-2022-49,text/directory,10322,10322,0.0003\nCC-MAIN-2022-49,text/enriched,28571,28559,0.0008\nCC-MAIN-2022-49,text/html,3327116873,3306304727,98.3885\nCC-MAIN-2022-49,text/javascript,7790,7790,0.0002\nCC-MAIN-2022-49,text/markdown,5678,5678,0.0002\nCC-MAIN-2022-49,text/pdf,193,193,0.0000\nCC-MAIN-2022-49,text/plain,2078408,2077443,0.0615\nCC-MAIN-2022-49,text/prs.lines.tag,28897,28897,0.0009\nCC-MAIN-2022-49,text/tab-separated-values,31058,31058,0.0009\nCC-MAIN-2022-49,text/turtle,42282,42262,0.0013\nCC-MAIN-2022-49,text/vcard,34837,34827,0.0010\nCC-MAIN-2022-49,text/x-bibtex,14082,14080,0.0004\nCC-MAIN-2022-49,text/x-c,4215,4215,0.0001\nCC-MAIN-2022-49,text/x-csrc,21069,21066,0.0006\nCC-MAIN-2022-49,text/x-diff,10620,10615,0.0003\nCC-MAIN-2022-49,text/x-patch,14997,14982,0.0004\nCC-MAIN-2022-49,text/x-perl,3697,3696,0.0001\nCC-MAIN-2022-49,text/x-vcalendar,14994,14990,0.0004\nCC-MAIN-2022-49,text/x-vcard,71704,71691,0.0021\nCC-MAIN-2022-49,text/xml,2230896,2227766,0.0660\nCC-MAIN-2022-49,unknown/unknown,8062,8042,0.0002\nCC-MAIN-2022-49,video/mp4,64717,64420,0.0019\nCC-MAIN-2022-49,video/webm,3103,3101,0.0001\nCC-MAIN-2022-49,video/x-ms-asf,3254,3254,0.0001\nCC-MAIN-2023-06,<other>,2264024,2257245,0.0710\nCC-MAIN-2023-06,application/atom+xml,2977461,2977353,0.0933\nCC-MAIN-2023-06,application/calendar,8264,8264,0.0003\nCC-MAIN-2023-06,application/download,83344,83339,0.0026\nCC-MAIN-2023-06,application/epub+zip,35631,35622,0.0011\nCC-MAIN-2023-06,application/force-download,196564,196464,0.0062\nCC-MAIN-2023-06,applicatio
n/gpx+xml,15256,15256,0.0005\nCC-MAIN-2023-06,application/ics,9550,9550,0.0003\nCC-MAIN-2023-06,application/javascript,5821,5817,0.0002\nCC-MAIN-2023-06,application/json,741213,740721,0.0232\nCC-MAIN-2023-06,application/ld+json,38289,38229,0.0012\nCC-MAIN-2023-06,application/marc,11163,11161,0.0003\nCC-MAIN-2023-06,application/msword,93846,93632,0.0029\nCC-MAIN-2023-06,application/octet-stream,1485342,1483896,0.0466\nCC-MAIN-2023-06,application/octetstream,10429,10425,0.0003\nCC-MAIN-2023-06,application/pdf,24918862,24847502,0.7813\nCC-MAIN-2023-06,application/pgp-encrypted,2847,2847,0.0001\nCC-MAIN-2023-06,application/pgp-signature,82156,82110,0.0026\nCC-MAIN-2023-06,application/postscript,4382,4373,0.0001\nCC-MAIN-2023-06,application/rdf+xml,129279,129209,0.0041\nCC-MAIN-2023-06,application/rss+xml,2034157,2032601,0.0638\nCC-MAIN-2023-06,application/rtf,38019,38012,0.0012\nCC-MAIN-2023-06,application/save-to-disk,26,26,0.0000\nCC-MAIN-2023-06,application/text,35165,35165,0.0011\nCC-MAIN-2023-06,application/unknown,8381,8381,0.0003\nCC-MAIN-2023-06,application/vnd.android.package-archive,4214,4085,0.0001\nCC-MAIN-2023-06,application/vnd.google-earth.kml+xml,80796,80783,0.0025\nCC-MAIN-2023-06,application/vnd.google-earth.kmz,10754,10754,0.0003\nCC-MAIN-2023-06,application/vnd.ms-excel,59860,59787,0.0019\nCC-MAIN-2023-06,application/vnd.ms-powerpoint,12169,12166,0.0004\nCC-MAIN-2023-06,application/vnd.ms-word,9631,9630,0.0003\nCC-MAIN-2023-06,application/vnd.oasis.opendocument.text,26571,26551,0.0008\nCC-MAIN-2023-06,application/vnd.openxmlformats-officedocument.presentationml.presentation,7941,7908,0.0002\nCC-MAIN-2023-06,application/vnd.openxmlformats-officedocument.spreadsheetml.sheet,49787,49580,0.0016\nCC-MAIN-2023-06,application/vnd.openxmlformats-officedocument.wordprocessingml.document,81471,81261,0.0026\nCC-MAIN-2023-06,application/vnd.wap.xhtml+xml,26970,26891,0.0008\nCC-MAIN-2023-06,application/x-bibtex,101445,101432,0.0032\nCC-MAIN-2023-06,application/x-
bittorrent,4280,4280,0.0001\nCC-MAIN-2023-06,application/x-debian-package,211,204,0.0000\nCC-MAIN-2023-06,application/x-download,53792,53788,0.0017\nCC-MAIN-2023-06,application/x-endnote-refer,63716,63716,0.0020\nCC-MAIN-2023-06,application/x-gzip,31861,31834,0.0010\nCC-MAIN-2023-06,application/x-httpd-php,8921,8910,0.0003\nCC-MAIN-2023-06,application/x-java-jnlp-file,8825,8823,0.0003\nCC-MAIN-2023-06,application/x-javascript,5658,5657,0.0002\nCC-MAIN-2023-06,application/x-json,7,7,0.0000\nCC-MAIN-2023-06,application/x-mobipocket-ebook,4736,4735,0.0001\nCC-MAIN-2023-06,application/x-msdownload,8231,8160,0.0003\nCC-MAIN-2023-06,application/x-netcdf,91294,91294,0.0029\nCC-MAIN-2023-06,application/x-research-info-systems,217918,217916,0.0068\nCC-MAIN-2023-06,application/x-shockwave-flash,7309,7294,0.0002\nCC-MAIN-2023-06,application/x-tar,26151,26140,0.0008\nCC-MAIN-2023-06,application/x-tex,4368,4367,0.0001\nCC-MAIN-2023-06,application/x-troff-man,18174,18173,0.0006\nCC-MAIN-2023-06,application/x-zip-compressed,23584,23471,0.0007\nCC-MAIN-2023-06,application/xhtml+xml,1107478,1105692,0.0347\nCC-MAIN-2023-06,application/xml,794885,794116,0.0249\nCC-MAIN-2023-06,application/zip,146782,145354,0.0046\nCC-MAIN-2023-06,audio/mpeg,104667,103869,0.0033\nCC-MAIN-2023-06,audio/x-mpegurl,22343,22304,0.0007\nCC-MAIN-2023-06,audio/x-scpls,3091,3080,0.0001\nCC-MAIN-2023-06,audio/x-wav,5039,5037,0.0002\nCC-MAIN-2023-06,binary/octet-stream,21188,21140,0.0007\nCC-MAIN-2023-06,image/gif,126030,125726,0.0040\nCC-MAIN-2023-06,image/jp2,1394,1394,0.0000\nCC-MAIN-2023-06,image/jpeg,4184015,4176158,0.1312\nCC-MAIN-2023-06,image/jpg,77397,76732,0.0024\nCC-MAIN-2023-06,image/pjpeg,16573,16571,0.0005\nCC-MAIN-2023-06,image/png,649843,647745,0.0204\nCC-MAIN-2023-06,image/svg+xml,20462,20438,0.0006\nCC-MAIN-2023-06,image/tiff,18717,18716,0.0006\nCC-MAIN-2023-06,image/vnd.djvu,9514,9513,0.0003\nCC-MAIN-2023-06,image/webp,63658,63543,0.0020\nCC-MAIN-2023-06,message/rfc822,7596,7596,0.0002\nCC-MAIN
-2023-06,text/calendar,943677,942986,0.0296\nCC-MAIN-2023-06,text/css,14730,14727,0.0005\nCC-MAIN-2023-06,text/csv,111293,111275,0.0035\nCC-MAIN-2023-06,text/directory,7448,7447,0.0002\nCC-MAIN-2023-06,text/enriched,13405,13405,0.0004\nCC-MAIN-2023-06,text/html,3140495532,3122485390,98.4612\nCC-MAIN-2023-06,text/javascript,4847,4847,0.0002\nCC-MAIN-2023-06,text/markdown,4128,4128,0.0001\nCC-MAIN-2023-06,text/pdf,689,688,0.0000\nCC-MAIN-2023-06,text/plain,1863648,1862843,0.0584\nCC-MAIN-2023-06,text/prs.lines.tag,76417,76417,0.0024\nCC-MAIN-2023-06,text/tab-separated-values,4364,4364,0.0001\nCC-MAIN-2023-06,text/turtle,39715,39676,0.0012\nCC-MAIN-2023-06,text/vcard,32012,31992,0.0010\nCC-MAIN-2023-06,text/x-bibtex,15235,15234,0.0005\nCC-MAIN-2023-06,text/x-c,4878,4876,0.0002\nCC-MAIN-2023-06,text/x-csrc,11887,11887,0.0004\nCC-MAIN-2023-06,text/x-diff,6822,6660,0.0002\nCC-MAIN-2023-06,text/x-patch,4780,4752,0.0001\nCC-MAIN-2023-06,text/x-perl,2616,2615,0.0001\nCC-MAIN-2023-06,text/x-vcalendar,15426,15424,0.0005\nCC-MAIN-2023-06,text/x-vcard,62097,61982,0.0019\nCC-MAIN-2023-06,text/xml,2122645,2119834,0.0665\nCC-MAIN-2023-06,unknown/unknown,3047,3045,0.0001\nCC-MAIN-2023-06,video/mp4,49675,49455,0.0016\nCC-MAIN-2023-06,video/webm,2679,2679,0.0001\nCC-MAIN-2023-06,video/x-ms-asf,3727,3724,0.0001\nCC-MAIN-2023-14,<other>,2284894,2279427,0.0733\nCC-MAIN-2023-14,application/atom+xml,3422166,3422012,0.1097\nCC-MAIN-2023-14,application/calendar,15058,15058,0.0005\nCC-MAIN-2023-14,application/download,93428,93401,0.0030\nCC-MAIN-2023-14,application/epub+zip,44026,44013,0.0014\nCC-MAIN-2023-14,application/force-download,195039,195018,0.0063\nCC-MAIN-2023-14,application/gpx+xml,15804,15728,0.0005\nCC-MAIN-2023-14,application/ics,13495,13494,0.0004\nCC-MAIN-2023-14,application/javascript,8610,8585,0.0003\nCC-MAIN-2023-14,application/json,721430,721256,0.0231\nCC-MAIN-2023-14,application/ld+json,40664,40571,0.0013\nCC-MAIN-2023-14,application/marc,8711,8711,0.0003\nCC-MAIN-2023-1
4,application/msword,97176,97026,0.0031\nCC-MAIN-2023-14,application/octet-stream,1542395,1541150,0.0495\nCC-MAIN-2023-14,application/octetstream,12953,12942,0.0004\nCC-MAIN-2023-14,application/pdf,28625244,28557445,0.9179\nCC-MAIN-2023-14,application/pgp-encrypted,2671,2670,0.0001\nCC-MAIN-2023-14,application/pgp-signature,83433,83432,0.0027\nCC-MAIN-2023-14,application/postscript,6836,6830,0.0002\nCC-MAIN-2023-14,application/rdf+xml,128702,128621,0.0041\nCC-MAIN-2023-14,application/rss+xml,1985189,1983667,0.0637\nCC-MAIN-2023-14,application/rtf,42618,42607,0.0014\nCC-MAIN-2023-14,application/save-to-disk,19,19,0.0000\nCC-MAIN-2023-14,application/text,25679,25679,0.0008\nCC-MAIN-2023-14,application/unknown,10123,10123,0.0003\nCC-MAIN-2023-14,application/vnd.android.package-archive,3713,3685,0.0001\nCC-MAIN-2023-14,application/vnd.google-earth.kml+xml,74531,74495,0.0024\nCC-MAIN-2023-14,application/vnd.google-earth.kmz,16142,16138,0.0005\nCC-MAIN-2023-14,application/vnd.ms-excel,68042,67104,0.0022\nCC-MAIN-2023-14,application/vnd.ms-powerpoint,20876,20869,0.0007\nCC-MAIN-2023-14,application/vnd.ms-word,8531,8530,0.0003\nCC-MAIN-2023-14,application/vnd.oasis.opendocument.text,27015,27004,0.0009\nCC-MAIN-2023-14,application/vnd.openxmlformats-officedocument.presentationml.presentation,9590,9561,0.0003\nCC-MAIN-2023-14,application/vnd.openxmlformats-officedocument.spreadsheetml.sheet,58342,58136,0.0019\nCC-MAIN-2023-14,application/vnd.openxmlformats-officedocument.wordprocessingml.document,89283,88892,0.0029\nCC-MAIN-2023-14,application/vnd.wap.xhtml+xml,17274,17242,0.0006\nCC-MAIN-2023-14,application/x-bibtex,100629,100627,0.0032\nCC-MAIN-2023-14,application/x-bittorrent,5802,5800,0.0002\nCC-MAIN-2023-14,application/x-debian-package,489,485,0.0000\nCC-MAIN-2023-14,application/x-download,42562,42561,0.0014\nCC-MAIN-2023-14,application/x-endnote-refer,48429,48429,0.0016\nCC-MAIN-2023-14,application/x-gzip,19315,19306,0.0006\nCC-MAIN-2023-14,application/x-httpd-php,11102
,11083,0.0004\nCC-MAIN-2023-14,application/x-java-jnlp-file,3677,3676,0.0001\nCC-MAIN-2023-14,application/x-javascript,5899,5899,0.0002\nCC-MAIN-2023-14,application/x-json,40,40,0.0000\nCC-MAIN-2023-14,application/x-mobipocket-ebook,5092,5088,0.0002\nCC-MAIN-2023-14,application/x-msdownload,8806,8737,0.0003\nCC-MAIN-2023-14,application/x-netcdf,85516,85516,0.0027\nCC-MAIN-2023-14,application/x-research-info-systems,233676,233676,0.0075\nCC-MAIN-2023-14,application/x-shockwave-flash,6899,6890,0.0002\nCC-MAIN-2023-14,application/x-tar,16900,16899,0.0005\nCC-MAIN-2023-14,application/x-tex,4417,4417,0.0001\nCC-MAIN-2023-14,application/x-troff-man,22939,22938,0.0007\nCC-MAIN-2023-14,application/x-zip-compressed,19335,19249,0.0006\nCC-MAIN-2023-14,application/xhtml+xml,731902,730229,0.0235\nCC-MAIN-2023-14,application/xml,784493,783431,0.0252\nCC-MAIN-2023-14,application/zip,103649,103010,0.0033\nCC-MAIN-2023-14,audio/mpeg,74191,73671,0.0024\nCC-MAIN-2023-14,audio/x-mpegurl,29051,29023,0.0009\nCC-MAIN-2023-14,audio/x-scpls,5286,5273,0.0002\nCC-MAIN-2023-14,audio/x-wav,2903,2903,0.0001\nCC-MAIN-2023-14,binary/octet-stream,21305,21249,0.0007\nCC-MAIN-2023-14,image/gif,138496,138205,0.0044\nCC-MAIN-2023-14,image/jp2,1665,1665,0.0001\nCC-MAIN-2023-14,image/jpeg,4630256,4621693,0.1485\nCC-MAIN-2023-14,image/jpg,69569,69568,0.0022\nCC-MAIN-2023-14,image/pjpeg,17085,17080,0.0005\nCC-MAIN-2023-14,image/png,876486,873760,0.0281\nCC-MAIN-2023-14,image/svg+xml,28654,28580,0.0009\nCC-MAIN-2023-14,image/tiff,12767,12767,0.0004\nCC-MAIN-2023-14,image/vnd.djvu,6769,6769,0.0002\nCC-MAIN-2023-14,image/webp,67345,67199,0.0022\nCC-MAIN-2023-14,message/rfc822,4986,4954,0.0002\nCC-MAIN-2023-14,text/calendar,903652,903539,0.0290\nCC-MAIN-2023-14,text/css,17302,17298,0.0006\nCC-MAIN-2023-14,text/csv,114011,113958,0.0037\nCC-MAIN-2023-14,text/directory,8880,8880,0.0003\nCC-MAIN-2023-14,text/enriched,9320,9320,0.0003\nCC-MAIN-2023-14,text/html,3065194839,3047100327,98.2865\nCC-MAIN-2023-14,text/j
avascript,5746,5744,0.0002\nCC-MAIN-2023-14,text/markdown,4513,4512,0.0001\nCC-MAIN-2023-14,text/pdf,310,310,0.0000\nCC-MAIN-2023-14,text/plain,1900662,1899946,0.0609\nCC-MAIN-2023-14,text/prs.lines.tag,45153,45153,0.0014\nCC-MAIN-2023-14,text/tab-separated-values,7286,7286,0.0002\nCC-MAIN-2023-14,text/turtle,46535,46456,0.0015\nCC-MAIN-2023-14,text/vcard,34026,34022,0.0011\nCC-MAIN-2023-14,text/x-bibtex,18444,18439,0.0006\nCC-MAIN-2023-14,text/x-c,7005,6997,0.0002\nCC-MAIN-2023-14,text/x-csrc,14500,14497,0.0005\nCC-MAIN-2023-14,text/x-diff,9217,9215,0.0003\nCC-MAIN-2023-14,text/x-patch,4529,4518,0.0001\nCC-MAIN-2023-14,text/x-perl,2973,2973,0.0001\nCC-MAIN-2023-14,text/x-vcalendar,15944,15940,0.0005\nCC-MAIN-2023-14,text/x-vcard,64979,64969,0.0021\nCC-MAIN-2023-14,text/xml,2088563,2085880,0.0670\nCC-MAIN-2023-14,unknown/unknown,1381,1381,0.0000\nCC-MAIN-2023-14,video/mp4,39635,39553,0.0013\nCC-MAIN-2023-14,video/webm,1853,1853,0.0001\nCC-MAIN-2023-14,video/x-ms-asf,4071,4069,0.0001\nCC-MAIN-2023-23,<other>,2264056,2257986,0.0721\nCC-MAIN-2023-23,application/atom+xml,2948417,2948258,0.0939\nCC-MAIN-2023-23,application/calendar,12290,12290,0.0004\nCC-MAIN-2023-23,application/download,104271,104214,0.0033\nCC-MAIN-2023-23,application/epub+zip,35682,35674,0.0011\nCC-MAIN-2023-23,application/force-download,197754,197738,0.0063\nCC-MAIN-2023-23,application/gpx+xml,13791,13791,0.0004\nCC-MAIN-2023-23,application/ics,12376,12376,0.0004\nCC-MAIN-2023-23,application/javascript,5007,5007,0.0002\nCC-MAIN-2023-23,application/json,735508,735263,0.0234\nCC-MAIN-2023-23,application/ld+json,44187,44179,0.0014\nCC-MAIN-2023-23,application/marc,11580,11579,0.0004\nCC-MAIN-2023-23,application/msword,100101,99853,0.0032\nCC-MAIN-2023-23,application/octet-stream,1361861,1360710,0.0434\nCC-MAIN-2023-23,application/octetstream,9300,9298,0.0003\nCC-MAIN-2023-23,application/pdf,27002645,26941514,0.8598\nCC-MAIN-2023-23,application/pgp-encrypted,3159,3159,0.0001\nCC-MAIN-2023-23,application/
pgp-signature,101593,101590,0.0032\nCC-MAIN-2023-23,application/postscript,4258,4244,0.0001\nCC-MAIN-2023-23,application/rdf+xml,126325,126312,0.0040\nCC-MAIN-2023-23,application/rss+xml,2037740,2035780,0.0649\nCC-MAIN-2023-23,application/rtf,44131,44123,0.0014\nCC-MAIN-2023-23,application/save-to-disk,35,35,0.0000\nCC-MAIN-2023-23,application/text,23521,23521,0.0007\nCC-MAIN-2023-23,application/unknown,7087,7082,0.0002\nCC-MAIN-2023-23,application/vnd.android.package-archive,1922,1907,0.0001\nCC-MAIN-2023-23,application/vnd.google-earth.kml+xml,55013,55005,0.0018\nCC-MAIN-2023-23,application/vnd.google-earth.kmz,12292,12291,0.0004\nCC-MAIN-2023-23,application/vnd.ms-excel,61160,60789,0.0019\nCC-MAIN-2023-23,application/vnd.ms-powerpoint,9926,9916,0.0003\nCC-MAIN-2023-23,application/vnd.ms-word,8566,8563,0.0003\nCC-MAIN-2023-23,application/vnd.oasis.opendocument.text,23114,23097,0.0007\nCC-MAIN-2023-23,application/vnd.openxmlformats-officedocument.presentationml.presentation,8614,8593,0.0003\nCC-MAIN-2023-23,application/vnd.openxmlformats-officedocument.spreadsheetml.sheet,49742,49375,0.0016\nCC-MAIN-2023-23,application/vnd.openxmlformats-officedocument.wordprocessingml.document,71604,71155,0.0023\nCC-MAIN-2023-23,application/vnd.wap.xhtml+xml,16069,16050,0.0005\nCC-MAIN-2023-23,application/x-bibtex,114964,114920,0.0037\nCC-MAIN-2023-23,application/x-bittorrent,5029,5028,0.0002\nCC-MAIN-2023-23,application/x-debian-package,113,113,0.0000\nCC-MAIN-2023-23,application/x-download,48112,48105,0.0015\nCC-MAIN-2023-23,application/x-endnote-refer,56179,56176,0.0018\nCC-MAIN-2023-23,application/x-gzip,12957,12953,0.0004\nCC-MAIN-2023-23,application/x-httpd-php,11942,11936,0.0004\nCC-MAIN-2023-23,application/x-java-jnlp-file,4805,4805,0.0002\nCC-MAIN-2023-23,application/x-javascript,5325,5325,0.0002\nCC-MAIN-2023-23,application/x-json,16,16,0.0000\nCC-MAIN-2023-23,application/x-mobipocket-ebook,4234,4233,0.0001\nCC-MAIN-2023-23,application/x-msdownload,7764,7742,0.0002\nCC-M
AIN-2023-23,application/x-netcdf,43308,43308,0.0014\nCC-MAIN-2023-23,application/x-research-info-systems,240131,240084,0.0076\nCC-MAIN-2023-23,application/x-shockwave-flash,7697,7694,0.0002\nCC-MAIN-2023-23,application/x-tar,5820,5819,0.0002\nCC-MAIN-2023-23,application/x-tex,7498,7496,0.0002\nCC-MAIN-2023-23,application/x-troff-man,22099,22098,0.0007\nCC-MAIN-2023-23,application/x-zip-compressed,13666,13629,0.0004\nCC-MAIN-2023-23,application/xhtml+xml,569280,567873,0.0181\nCC-MAIN-2023-23,application/xml,784989,783682,0.0250\nCC-MAIN-2023-23,application/zip,78406,78047,0.0025\nCC-MAIN-2023-23,audio/mpeg,48238,48057,0.0015\nCC-MAIN-2023-23,audio/x-mpegurl,28107,28065,0.0009\nCC-MAIN-2023-23,audio/x-scpls,4482,4471,0.0001\nCC-MAIN-2023-23,audio/x-wav,1993,1993,0.0001\nCC-MAIN-2023-23,binary/octet-stream,16623,16558,0.0005\nCC-MAIN-2023-23,image/gif,136836,136557,0.0044\nCC-MAIN-2023-23,image/jp2,1832,1832,0.0001\nCC-MAIN-2023-23,image/jpeg,4944558,4934992,0.1574\nCC-MAIN-2023-23,image/jpg,57789,57783,0.0018\nCC-MAIN-2023-23,image/pjpeg,16443,16443,0.0005\nCC-MAIN-2023-23,image/png,981337,978044,0.0312\nCC-MAIN-2023-23,image/svg+xml,27804,27739,0.0009\nCC-MAIN-2023-23,image/tiff,7385,7337,0.0002\nCC-MAIN-2023-23,image/vnd.djvu,6681,6681,0.0002\nCC-MAIN-2023-23,image/webp,67830,67719,0.0022\nCC-MAIN-2023-23,message/rfc822,5765,5765,0.0002\nCC-MAIN-2023-23,text/calendar,968063,967562,0.0308\nCC-MAIN-2023-23,text/css,15837,15835,0.0005\nCC-MAIN-2023-23,text/csv,115103,115004,0.0037\nCC-MAIN-2023-23,text/directory,8169,8168,0.0003\nCC-MAIN-2023-23,text/enriched,8467,8467,0.0003\nCC-MAIN-2023-23,text/html,3089359428,3070797360,98.3693\nCC-MAIN-2023-23,text/javascript,5791,5786,0.0002\nCC-MAIN-2023-23,text/markdown,4620,4619,0.0001\nCC-MAIN-2023-23,text/pdf,610,610,0.0000\nCC-MAIN-2023-23,text/plain,1843360,1842415,0.0587\nCC-MAIN-2023-23,text/prs.lines.tag,61025,61025,0.0019\nCC-MAIN-2023-23,text/tab-separated-values,6589,6584,0.0002\nCC-MAIN-2023-23,text/turtle,46392,463
87,0.0015\nCC-MAIN-2023-23,text/vcard,33334,33326,0.0011\nCC-MAIN-2023-23,text/x-bibtex,18442,18430,0.0006\nCC-MAIN-2023-23,text/x-c,5427,5427,0.0002\nCC-MAIN-2023-23,text/x-csrc,10081,10079,0.0003\nCC-MAIN-2023-23,text/x-diff,13016,13014,0.0004\nCC-MAIN-2023-23,text/x-patch,8779,8767,0.0003\nCC-MAIN-2023-23,text/x-perl,1415,1415,0.0000\nCC-MAIN-2023-23,text/x-vcalendar,16230,16226,0.0005\nCC-MAIN-2023-23,text/x-vcard,68345,68282,0.0022\nCC-MAIN-2023-23,text/xml,2002955,1999964,0.0638\nCC-MAIN-2023-23,unknown/unknown,1214,1214,0.0000\nCC-MAIN-2023-23,video/mp4,23185,23134,0.0007\nCC-MAIN-2023-23,video/webm,1344,1344,0.0000\nCC-MAIN-2023-23,video/x-ms-asf,4013,4012,0.0001\nCC-MAIN-2023-40,<other>,2373159,2362899,0.0689\nCC-MAIN-2023-40,application/atom+xml,3425866,3425555,0.0994\nCC-MAIN-2023-40,application/calendar,13036,13036,0.0004\nCC-MAIN-2023-40,application/download,103714,103612,0.0030\nCC-MAIN-2023-40,application/epub+zip,34225,34206,0.0010\nCC-MAIN-2023-40,application/force-download,218020,217919,0.0063\nCC-MAIN-2023-40,application/gpx+xml,16410,16409,0.0005\nCC-MAIN-2023-40,application/ics,13103,13103,0.0004\nCC-MAIN-2023-40,application/javascript,9965,9949,0.0003\nCC-MAIN-2023-40,application/json,719188,718913,0.0209\nCC-MAIN-2023-40,application/ld+json,47741,47701,0.0014\nCC-MAIN-2023-40,application/marc,10396,10396,0.0003\nCC-MAIN-2023-40,application/msword,108894,108537,0.0032\nCC-MAIN-2023-40,application/octet-stream,1543810,1542355,0.0448\nCC-MAIN-2023-40,application/octetstream,9066,9056,0.0003\nCC-MAIN-2023-40,application/pdf,29836873,29769828,0.8661\nCC-MAIN-2023-40,application/pgp-encrypted,3141,3141,0.0001\nCC-MAIN-2023-40,application/pgp-signature,79691,79671,0.0023\nCC-MAIN-2023-40,application/postscript,5247,5242,0.0002\nCC-MAIN-2023-40,application/rdf+xml,130867,130810,0.0038\nCC-MAIN-2023-40,application/rss+xml,1848790,1846146,0.0537\nCC-MAIN-2023-40,application/rtf,38965,38932,0.0011\nCC-MAIN-2023-40,application/save-to-disk,33,33,0.0000\nC
C-MAIN-2023-40,application/text,19965,19965,0.0006\nCC-MAIN-2023-40,application/unknown,6039,6036,0.0002\nCC-MAIN-2023-40,application/vnd.android.package-archive,2349,2332,0.0001\nCC-MAIN-2023-40,application/vnd.google-earth.kml+xml,86811,86460,0.0025\nCC-MAIN-2023-40,application/vnd.google-earth.kmz,16774,16769,0.0005\nCC-MAIN-2023-40,application/vnd.ms-excel,63212,63092,0.0018\nCC-MAIN-2023-40,application/vnd.ms-powerpoint,10035,10030,0.0003\nCC-MAIN-2023-40,application/vnd.ms-word,10086,10086,0.0003\nCC-MAIN-2023-40,application/vnd.oasis.opendocument.text,26416,26411,0.0008\nCC-MAIN-2023-40,application/vnd.openxmlformats-officedocument.presentationml.presentation,8289,8198,0.0002\nCC-MAIN-2023-40,application/vnd.openxmlformats-officedocument.spreadsheetml.sheet,48134,47932,0.0014\nCC-MAIN-2023-40,application/vnd.openxmlformats-officedocument.wordprocessingml.document,79950,79684,0.0023\nCC-MAIN-2023-40,application/vnd.wap.xhtml+xml,6993,6968,0.0002\nCC-MAIN-2023-40,application/x-bibtex,130715,130678,0.0038\nCC-MAIN-2023-40,application/x-bittorrent,5197,5195,0.0002\nCC-MAIN-2023-40,application/x-debian-package,52,52,0.0000\nCC-MAIN-2023-40,application/x-download,50068,50016,0.0015\nCC-MAIN-2023-40,application/x-endnote-refer,43866,43862,0.0013\nCC-MAIN-2023-40,application/x-gzip,14446,14445,0.0004\nCC-MAIN-2023-40,application/x-httpd-php,17864,17703,0.0005\nCC-MAIN-2023-40,application/x-java-jnlp-file,5612,5593,0.0002\nCC-MAIN-2023-40,application/x-javascript,4071,4069,0.0001\nCC-MAIN-2023-40,application/x-json,67,67,0.0000\nCC-MAIN-2023-40,application/x-mobipocket-ebook,5304,5291,0.0002\nCC-MAIN-2023-40,application/x-msdownload,7422,7394,0.0002\nCC-MAIN-2023-40,application/x-netcdf,47388,47388,0.0014\nCC-MAIN-2023-40,application/x-research-info-systems,259222,259131,0.0075\nCC-MAIN-2023-40,application/x-shockwave-flash,6523,6517,0.0002\nCC-MAIN-2023-40,application/x-tar,7024,7023,0.0002\nCC-MAIN-2023-40,application/x-tex,7036,7035,0.0002\nCC-MAIN-2023-40,applicat
ion/x-troff-man,16462,16452,0.0005\nCC-MAIN-2023-40,application/x-zip-compressed,11202,11162,0.0003\nCC-MAIN-2023-40,application/xhtml+xml,567753,566180,0.0165\nCC-MAIN-2023-40,application/xml,796121,794353,0.0231\nCC-MAIN-2023-40,application/zip,78131,77771,0.0023\nCC-MAIN-2023-40,audio/mpeg,48022,47633,0.0014\nCC-MAIN-2023-40,audio/x-mpegurl,30712,30648,0.0009\nCC-MAIN-2023-40,audio/x-scpls,6358,6327,0.0002\nCC-MAIN-2023-40,audio/x-wav,1760,1760,0.0001\nCC-MAIN-2023-40,binary/octet-stream,22810,22794,0.0007\nCC-MAIN-2023-40,image/gif,122224,121924,0.0035\nCC-MAIN-2023-40,image/jp2,1499,1499,0.0000\nCC-MAIN-2023-40,image/jpeg,5267572,5255233,0.1529\nCC-MAIN-2023-40,image/jpg,53422,53421,0.0016\nCC-MAIN-2023-40,image/pjpeg,16373,16373,0.0005\nCC-MAIN-2023-40,image/png,1024386,1020976,0.0297\nCC-MAIN-2023-40,image/svg+xml,29988,29897,0.0009\nCC-MAIN-2023-40,image/tiff,9310,9309,0.0003\nCC-MAIN-2023-40,image/vnd.djvu,8631,8630,0.0003\nCC-MAIN-2023-40,image/webp,77556,77327,0.0023\nCC-MAIN-2023-40,message/rfc822,5710,5709,0.0002\nCC-MAIN-2023-40,text/calendar,999723,999317,0.0290\nCC-MAIN-2023-40,text/css,18768,18766,0.0005\nCC-MAIN-2023-40,text/csv,119822,119776,0.0035\nCC-MAIN-2023-40,text/directory,8060,8058,0.0002\nCC-MAIN-2023-40,text/enriched,6944,6944,0.0002\nCC-MAIN-2023-40,text/html,3389576748,3363674814,98.3908\nCC-MAIN-2023-40,text/javascript,7991,7989,0.0002\nCC-MAIN-2023-40,text/markdown,4704,4702,0.0001\nCC-MAIN-2023-40,text/pdf,207,207,0.0000\nCC-MAIN-2023-40,text/plain,1980246,1978864,0.0575\nCC-MAIN-2023-40,text/prs.lines.tag,60691,60691,0.0018\nCC-MAIN-2023-40,text/tab-separated-values,5688,5673,0.0002\nCC-MAIN-2023-40,text/turtle,45528,45488,0.0013\nCC-MAIN-2023-40,text/vcard,31540,31526,0.0009\nCC-MAIN-2023-40,text/x-bibtex,20036,19986,0.0006\nCC-MAIN-2023-40,text/x-c,4122,4119,0.0001\nCC-MAIN-2023-40,text/x-csrc,7402,7399,0.0002\nCC-MAIN-2023-40,text/x-diff,9860,9858,0.0003\nCC-MAIN-2023-40,text/x-patch,8446,8431,0.0002\nCC-MAIN-2023-40,text/x-perl
,2101,2101,0.0001\nCC-MAIN-2023-40,text/x-vcalendar,14754,14749,0.0004\nCC-MAIN-2023-40,text/x-vcard,59469,59430,0.0017\nCC-MAIN-2023-40,text/xml,2206179,2201903,0.0640\nCC-MAIN-2023-40,unknown/unknown,955,953,0.0000\nCC-MAIN-2023-40,video/mp4,25346,25309,0.0007\nCC-MAIN-2023-40,video/webm,1509,1508,0.0000\nCC-MAIN-2023-40,video/x-ms-asf,5066,5066,0.0001\nCC-MAIN-2023-50,<other>,2601385,2592461,0.0776\nCC-MAIN-2023-50,application/atom+xml,3219420,3219135,0.0960\nCC-MAIN-2023-50,application/calendar,13245,13243,0.0004\nCC-MAIN-2023-50,application/download,104590,104539,0.0031\nCC-MAIN-2023-50,application/epub+zip,43112,43067,0.0013\nCC-MAIN-2023-50,application/force-download,223474,223268,0.0067\nCC-MAIN-2023-50,application/gpx+xml,20988,20941,0.0006\nCC-MAIN-2023-50,application/ics,12372,12372,0.0004\nCC-MAIN-2023-50,application/javascript,13776,13773,0.0004\nCC-MAIN-2023-50,application/json,735347,735025,0.0219\nCC-MAIN-2023-50,application/ld+json,47991,47858,0.0014\nCC-MAIN-2023-50,application/marc,11735,11735,0.0003\nCC-MAIN-2023-50,application/msword,108263,107979,0.0032\nCC-MAIN-2023-50,application/octet-stream,1565133,1563728,0.0467\nCC-MAIN-2023-50,application/octetstream,7278,7246,0.0002\nCC-MAIN-2023-50,application/pdf,34224671,34141330,1.0204\nCC-MAIN-2023-50,application/pgp-encrypted,2916,2916,0.0001\nCC-MAIN-2023-50,application/pgp-signature,100236,100229,0.0030\nCC-MAIN-2023-50,application/postscript,7172,7142,0.0002\nCC-MAIN-2023-50,application/rdf+xml,124178,123969,0.0037\nCC-MAIN-2023-50,application/rss+xml,1795910,1793710,0.0535\nCC-MAIN-2023-50,application/rtf,38563,38549,0.0011\nCC-MAIN-2023-50,application/save-to-disk,17,17,0.0000\nCC-MAIN-2023-50,application/text,15335,15335,0.0005\nCC-MAIN-2023-50,application/unknown,10850,10850,0.0003\nCC-MAIN-2023-50,application/vnd.android.package-archive,2238,2215,0.0001\nCC-MAIN-2023-50,application/vnd.google-earth.kml+xml,39982,39932,0.0012\nCC-MAIN-2023-50,application/vnd.google-earth.kmz,20230,20224,0.0
006\nCC-MAIN-2023-50,application/vnd.ms-excel,67117,67008,0.0020\nCC-MAIN-2023-50,application/vnd.ms-powerpoint,9432,9415,0.0003\nCC-MAIN-2023-50,application/vnd.ms-word,9676,9676,0.0003\nCC-MAIN-2023-50,application/vnd.oasis.opendocument.text,24410,24384,0.0007\nCC-MAIN-2023-50,application/vnd.openxmlformats-officedocument.presentationml.presentation,8598,8408,0.0003\nCC-MAIN-2023-50,application/vnd.openxmlformats-officedocument.spreadsheetml.sheet,55072,54793,0.0016\nCC-MAIN-2023-50,application/vnd.openxmlformats-officedocument.wordprocessingml.document,83794,83301,0.0025\nCC-MAIN-2023-50,application/vnd.wap.xhtml+xml,17117,16969,0.0005\nCC-MAIN-2023-50,application/x-bibtex,127627,127600,0.0038\nCC-MAIN-2023-50,application/x-bittorrent,4678,4677,0.0001\nCC-MAIN-2023-50,application/x-debian-package,73,72,0.0000\nCC-MAIN-2023-50,application/x-download,45312,45291,0.0014\nCC-MAIN-2023-50,application/x-endnote-refer,39733,39733,0.0012\nCC-MAIN-2023-50,application/x-gzip,20541,20469,0.0006\nCC-MAIN-2023-50,application/x-httpd-php,13374,13333,0.0004\nCC-MAIN-2023-50,application/x-java-jnlp-file,5018,5015,0.0001\nCC-MAIN-2023-50,application/x-javascript,5770,5677,0.0002\nCC-MAIN-2023-50,application/x-json,102,102,0.0000\nCC-MAIN-2023-50,application/x-mobipocket-ebook,8661,8646,0.0003\nCC-MAIN-2023-50,application/x-msdownload,8302,8297,0.0002\nCC-MAIN-2023-50,application/x-netcdf,94848,94848,0.0028\nCC-MAIN-2023-50,application/x-research-info-systems,248835,248791,0.0074\nCC-MAIN-2023-50,application/x-shockwave-flash,7005,7000,0.0002\nCC-MAIN-2023-50,application/x-tar,4605,4605,0.0001\nCC-MAIN-2023-50,application/x-tex,5670,5669,0.0002\nCC-MAIN-2023-50,application/x-troff-man,25086,25084,0.0007\nCC-MAIN-2023-50,application/x-zip-compressed,11895,11828,0.0004\nCC-MAIN-2023-50,application/xhtml+xml,466190,464847,0.0139\nCC-MAIN-2023-50,application/xml,764420,762793,0.0228\nCC-MAIN-2023-50,application/zip,83110,82808,0.0025\nCC-MAIN-2023-50,audio/mpeg,45133,44855,0.0013\nCC-
MAIN-2023-50,audio/x-mpegurl,23631,23625,0.0007\nCC-MAIN-2023-50,audio/x-scpls,4790,4787,0.0001\nCC-MAIN-2023-50,audio/x-wav,2064,2064,0.0001\nCC-MAIN-2023-50,binary/octet-stream,20125,20112,0.0006\nCC-MAIN-2023-50,image/gif,110423,110086,0.0033\nCC-MAIN-2023-50,image/jp2,842,842,0.0000\nCC-MAIN-2023-50,image/jpeg,5251610,5241058,0.1566\nCC-MAIN-2023-50,image/jpg,66400,66394,0.0020\nCC-MAIN-2023-50,image/pjpeg,10340,10339,0.0003\nCC-MAIN-2023-50,image/png,1009285,1005402,0.0301\nCC-MAIN-2023-50,image/svg+xml,34786,34664,0.0010\nCC-MAIN-2023-50,image/tiff,8869,8865,0.0003\nCC-MAIN-2023-50,image/vnd.djvu,11400,11400,0.0003\nCC-MAIN-2023-50,image/webp,92419,92140,0.0028\nCC-MAIN-2023-50,message/rfc822,7846,7844,0.0002\nCC-MAIN-2023-50,text/calendar,1007344,1006469,0.0300\nCC-MAIN-2023-50,text/css,17708,17702,0.0005\nCC-MAIN-2023-50,text/csv,114631,114303,0.0034\nCC-MAIN-2023-50,text/directory,8524,8522,0.0003\nCC-MAIN-2023-50,text/enriched,4837,4837,0.0001\nCC-MAIN-2023-50,text/html,3294349223,3268305088,98.2203\nCC-MAIN-2023-50,text/javascript,7098,7091,0.0002\nCC-MAIN-2023-50,text/markdown,6350,6349,0.0002\nCC-MAIN-2023-50,text/pdf,275,275,0.0000\nCC-MAIN-2023-50,text/plain,1908581,1907415,0.0569\nCC-MAIN-2023-50,text/prs.lines.tag,101137,101137,0.0030\nCC-MAIN-2023-50,text/tab-separated-values,8327,8327,0.0002\nCC-MAIN-2023-50,text/turtle,43045,42972,0.0013\nCC-MAIN-2023-50,text/vcard,33751,33730,0.0010\nCC-MAIN-2023-50,text/x-bibtex,20551,20510,0.0006\nCC-MAIN-2023-50,text/x-c,5798,5787,0.0002\nCC-MAIN-2023-50,text/x-csrc,9306,9305,0.0003\nCC-MAIN-2023-50,text/x-diff,9614,9607,0.0003\nCC-MAIN-2023-50,text/x-patch,8514,8468,0.0003\nCC-MAIN-2023-50,text/x-perl,2657,2650,0.0001\nCC-MAIN-2023-50,text/x-vcalendar,11215,11213,0.0003\nCC-MAIN-2023-50,text/x-vcard,65539,65504,0.0020\nCC-MAIN-2023-50,text/xml,2184434,2180477,0.0651\nCC-MAIN-2023-50,unknown/unknown,1388,1388,0.0000\nCC-MAIN-2023-50,video/mp4,25152,25090,0.0007\nCC-MAIN-2023-50,video/webm,2233,2233,0.0001\nCC
-MAIN-2023-50,video/x-ms-asf,8451,8429,0.0003\nCC-MAIN-2024-10,<other>,2285755,2276465,0.0736\nCC-MAIN-2024-10,application/atom+xml,3069149,3068924,0.0988\nCC-MAIN-2024-10,application/calendar,10793,10793,0.0003\nCC-MAIN-2024-10,application/download,99737,99656,0.0032\nCC-MAIN-2024-10,application/epub+zip,41273,41231,0.0013\nCC-MAIN-2024-10,application/force-download,193026,192941,0.0062\nCC-MAIN-2024-10,application/gpx+xml,17074,17070,0.0005\nCC-MAIN-2024-10,application/ics,12119,12114,0.0004\nCC-MAIN-2024-10,application/javascript,33175,33166,0.0011\nCC-MAIN-2024-10,application/json,702626,702159,0.0226\nCC-MAIN-2024-10,application/ld+json,49231,49146,0.0016\nCC-MAIN-2024-10,application/marc,11915,11915,0.0004\nCC-MAIN-2024-10,application/msword,98739,98547,0.0032\nCC-MAIN-2024-10,application/octet-stream,1219895,1218628,0.0393\nCC-MAIN-2024-10,application/octetstream,6575,6570,0.0002\nCC-MAIN-2024-10,application/pdf,29142507,29069603,0.9381\nCC-MAIN-2024-10,application/pgp-encrypted,1956,1956,0.0001\nCC-MAIN-2024-10,application/pgp-signature,84620,84589,0.0027\nCC-MAIN-2024-10,application/postscript,5979,5976,0.0002\nCC-MAIN-2024-10,application/rdf+xml,125354,125241,0.0040\nCC-MAIN-2024-10,application/rss+xml,1716767,1714605,0.0553\nCC-MAIN-2024-10,application/rtf,40004,39996,0.0013\nCC-MAIN-2024-10,application/save-to-disk,195,195,0.0000\nCC-MAIN-2024-10,application/text,6986,6986,0.0002\nCC-MAIN-2024-10,application/unknown,7498,7498,0.0002\nCC-MAIN-2024-10,application/vnd.android.package-archive,160,158,0.0000\nCC-MAIN-2024-10,application/vnd.google-earth.kml+xml,66152,66055,0.0021\nCC-MAIN-2024-10,application/vnd.google-earth.kmz,12025,11997,0.0004\nCC-MAIN-2024-10,application/vnd.ms-excel,60607,60538,0.0020\nCC-MAIN-2024-10,application/vnd.ms-powerpoint,9280,9258,0.0003\nCC-MAIN-2024-10,application/vnd.ms-word,8900,8899,0.0003\nCC-MAIN-2024-10,application/vnd.oasis.opendocument.text,22722,22710,0.0007\nCC-MAIN-2024-10,application/vnd.openxmlformats-officedocu
ment.presentationml.presentation,8522,8455,0.0003\nCC-MAIN-2024-10,application/vnd.openxmlformats-officedocument.spreadsheetml.sheet,46251,45977,0.0015\nCC-MAIN-2024-10,application/vnd.openxmlformats-officedocument.wordprocessingml.document,81508,81069,0.0026\nCC-MAIN-2024-10,application/vnd.wap.xhtml+xml,23121,23011,0.0007\nCC-MAIN-2024-10,application/x-bibtex,135975,135957,0.0044\nCC-MAIN-2024-10,application/x-bittorrent,3318,3318,0.0001\nCC-MAIN-2024-10,application/x-debian-package,71,71,0.0000\nCC-MAIN-2024-10,application/x-download,43689,43681,0.0014\nCC-MAIN-2024-10,application/x-endnote-refer,30225,30223,0.0010\nCC-MAIN-2024-10,application/x-gzip,19794,19794,0.0006\nCC-MAIN-2024-10,application/x-httpd-php,13637,13605,0.0004\nCC-MAIN-2024-10,application/x-java-jnlp-file,5247,5241,0.0002\nCC-MAIN-2024-10,application/x-javascript,3102,3101,0.0001\nCC-MAIN-2024-10,application/x-json,33,33,0.0000\nCC-MAIN-2024-10,application/x-mobipocket-ebook,8657,8633,0.0003\nCC-MAIN-2024-10,application/x-msdownload,7521,7520,0.0002\nCC-MAIN-2024-10,application/x-netcdf,12490,12490,0.0004\nCC-MAIN-2024-10,application/x-research-info-systems,241071,241004,0.0078\nCC-MAIN-2024-10,application/x-shockwave-flash,7619,7613,0.0002\nCC-MAIN-2024-10,application/x-tar,4440,4440,0.0001\nCC-MAIN-2024-10,application/x-tex,6400,6386,0.0002\nCC-MAIN-2024-10,application/x-troff-man,18275,18275,0.0006\nCC-MAIN-2024-10,application/x-zip-compressed,286,286,0.0000\nCC-MAIN-2024-10,application/xhtml+xml,278612,277300,0.0090\nCC-MAIN-2024-10,application/xml,697365,695979,0.0224\nCC-MAIN-2024-10,application/zip,4690,4557,0.0002\nCC-MAIN-2024-10,audio/mpeg,2155,2151,0.0001\nCC-MAIN-2024-10,audio/x-mpegurl,15980,15978,0.0005\nCC-MAIN-2024-10,audio/x-scpls,4458,4457,0.0001\nCC-MAIN-2024-10,audio/x-wav,42,42,0.0000\nCC-MAIN-2024-10,binary/octet-stream,17650,17643,0.0006\nCC-MAIN-2024-10,image/gif,24262,24262,0.0008\nCC-MAIN-2024-10,image/jp2,8,8,0.0000\nCC-MAIN-2024-10,image/jpeg,11069,10999,0.0004\nCC-MA
IN-2024-10,image/jpg,241,241,0.0000\nCC-MAIN-2024-10,image/pjpeg,17,17,0.0000\nCC-MAIN-2024-10,image/png,6160,6064,0.0002\nCC-MAIN-2024-10,image/svg+xml,83,83,0.0000\nCC-MAIN-2024-10,image/tiff,63,63,0.0000\nCC-MAIN-2024-10,image/webp,66,66,0.0000\nCC-MAIN-2024-10,message/rfc822,6911,6910,0.0002\nCC-MAIN-2024-10,text/calendar,926773,926289,0.0298\nCC-MAIN-2024-10,text/css,20675,20673,0.0007\nCC-MAIN-2024-10,text/csv,101117,101019,0.0033\nCC-MAIN-2024-10,text/directory,6923,6923,0.0002\nCC-MAIN-2024-10,text/enriched,1895,1895,0.0001\nCC-MAIN-2024-10,text/html,3060494990,3035282671,98.5183\nCC-MAIN-2024-10,text/javascript,5396,5390,0.0002\nCC-MAIN-2024-10,text/markdown,4269,4265,0.0001\nCC-MAIN-2024-10,text/pdf,747,747,0.0000\nCC-MAIN-2024-10,text/plain,1866327,1864746,0.0601\nCC-MAIN-2024-10,text/prs.lines.tag,78678,78678,0.0025\nCC-MAIN-2024-10,text/tab-separated-values,6582,6581,0.0002\nCC-MAIN-2024-10,text/turtle,49509,49411,0.0016\nCC-MAIN-2024-10,text/vcard,30422,30391,0.0010\nCC-MAIN-2024-10,text/x-bibtex,18705,18672,0.0006\nCC-MAIN-2024-10,text/x-c,5693,5691,0.0002\nCC-MAIN-2024-10,text/x-csrc,7255,7252,0.0002\nCC-MAIN-2024-10,text/x-diff,10672,10668,0.0003\nCC-MAIN-2024-10,text/x-patch,8144,8124,0.0003\nCC-MAIN-2024-10,text/x-perl,2044,2043,0.0001\nCC-MAIN-2024-10,text/x-vcalendar,13118,13111,0.0004\nCC-MAIN-2024-10,text/x-vcard,60099,60077,0.0019\nCC-MAIN-2024-10,text/xml,1845290,1841771,0.0594\nCC-MAIN-2024-10,unknown/unknown,631,630,0.0000\nCC-MAIN-2024-10,video/mp4,323,322,0.0000\nCC-MAIN-2024-10,video/webm,1,1,0.0000\nCC-MAIN-2024-10,video/x-ms-asf,5410,5403,0.0002\nCC-MAIN-2024-18,<other>,58413132,58327479,2.0961\nCC-MAIN-2024-18,application/atom+xml,2766037,2765846,0.0993\nCC-MAIN-2024-18,application/calendar,11670,11670,0.0004\nCC-MAIN-2024-18,application/download,95302,95261,0.0034\nCC-MAIN-2024-18,application/epub+zip,37610,37565,0.0013\nCC-MAIN-2024-18,application/force-download,189419,189396,0.0068\nCC-MAIN-2024-18,application/gpx+xml,14045,14045,
0.0005\nCC-MAIN-2024-18,application/ics,10340,10339,0.0004\nCC-MAIN-2024-18,application/javascript,27846,27836,0.0010\nCC-MAIN-2024-18,application/json,707416,706862,0.0254\nCC-MAIN-2024-18,application/ld+json,43984,43896,0.0016\nCC-MAIN-2024-18,application/marc,13528,13524,0.0005\nCC-MAIN-2024-18,application/msword,90818,90656,0.0033\nCC-MAIN-2024-18,application/octet-stream,1252156,1251408,0.0449\nCC-MAIN-2024-18,application/octetstream,9234,9231,0.0003\nCC-MAIN-2024-18,application/pdf,24996951,24934852,0.8970\nCC-MAIN-2024-18,application/pgp-encrypted,1624,1624,0.0001\nCC-MAIN-2024-18,application/pgp-signature,79035,79035,0.0028\nCC-MAIN-2024-18,application/postscript,5199,5190,0.0002\nCC-MAIN-2024-18,application/rdf+xml,122004,121870,0.0044\nCC-MAIN-2024-18,application/rss+xml,1548593,1547013,0.0556\nCC-MAIN-2024-18,application/rtf,37583,37570,0.0013\nCC-MAIN-2024-18,application/save-to-disk,76,76,0.0000\nCC-MAIN-2024-18,application/text,7532,7532,0.0003\nCC-MAIN-2024-18,application/unknown,10086,10085,0.0004\nCC-MAIN-2024-18,application/vnd.android.package-archive,164,162,0.0000\nCC-MAIN-2024-18,application/vnd.google-earth.kml+xml,55844,55730,0.0020\nCC-MAIN-2024-18,application/vnd.google-earth.kmz,11661,11658,0.0004\nCC-MAIN-2024-18,application/vnd.ms-excel,59104,59028,0.0021\nCC-MAIN-2024-18,application/vnd.ms-powerpoint,8072,8067,0.0003\nCC-MAIN-2024-18,application/vnd.ms-word,8114,8113,0.0003\nCC-MAIN-2024-18,application/vnd.oasis.opendocument.text,19681,19668,0.0007\nCC-MAIN-2024-18,application/vnd.openxmlformats-officedocument.presentationml.presentation,6020,5999,0.0002\nCC-MAIN-2024-18,application/vnd.openxmlformats-officedocument.spreadsheetml.sheet,43979,43285,0.0016\nCC-MAIN-2024-18,application/vnd.openxmlformats-officedocument.wordprocessingml.document,70237,69911,0.0025\nCC-MAIN-2024-18,application/vnd.wap.xhtml+xml,19795,19692,0.0007\nCC-MAIN-2024-18,application/x-bibtex,137979,137932,0.0050\nCC-MAIN-2024-18,application/x-bittorrent,4237,4235,0.0
002\nCC-MAIN-2024-18,application/x-debian-package,7,7,0.0000\nCC-MAIN-2024-18,application/x-download,47369,47366,0.0017\nCC-MAIN-2024-18,application/x-endnote-refer,31306,31304,0.0011\nCC-MAIN-2024-18,application/x-gzip,6031,6030,0.0002\nCC-MAIN-2024-18,application/x-httpd-php,10371,10341,0.0004\nCC-MAIN-2024-18,application/x-java-jnlp-file,4523,4522,0.0002\nCC-MAIN-2024-18,application/x-javascript,2033,2016,0.0001\nCC-MAIN-2024-18,application/x-json,19,19,0.0000\nCC-MAIN-2024-18,application/x-mobipocket-ebook,7801,7785,0.0003\nCC-MAIN-2024-18,application/x-msdownload,4890,4890,0.0002\nCC-MAIN-2024-18,application/x-netcdf,2979,2979,0.0001\nCC-MAIN-2024-18,application/x-research-info-systems,279892,279843,0.0100\nCC-MAIN-2024-18,application/x-shockwave-flash,7818,7811,0.0003\nCC-MAIN-2024-18,application/x-tar,7820,7820,0.0003\nCC-MAIN-2024-18,application/x-tex,6697,6694,0.0002\nCC-MAIN-2024-18,application/x-troff-man,28031,28026,0.0010\nCC-MAIN-2024-18,application/x-zip-compressed,271,271,0.0000\nCC-MAIN-2024-18,application/xhtml+xml,257763,256637,0.0092\nCC-MAIN-2024-18,application/xml,635084,633862,0.0228\nCC-MAIN-2024-18,application/zip,3975,3972,0.0001\nCC-MAIN-2024-18,audio/mpeg,1214,1214,0.0000\nCC-MAIN-2024-18,audio/x-mpegurl,17275,17263,0.0006\nCC-MAIN-2024-18,audio/x-scpls,3023,3022,0.0001\nCC-MAIN-2024-18,audio/x-wav,12,12,0.0000\nCC-MAIN-2024-18,binary/octet-stream,18671,18625,0.0007\nCC-MAIN-2024-18,image/gif,18569,18569,0.0007\nCC-MAIN-2024-18,image/jp2,4,4,0.0000\nCC-MAIN-2024-18,image/jpeg,8794,8779,0.0003\nCC-MAIN-2024-18,image/jpg,315,315,0.0000\nCC-MAIN-2024-18,image/pjpeg,12,12,0.0000\nCC-MAIN-2024-18,image/png,7253,7243,0.0003\nCC-MAIN-2024-18,image/svg+xml,85,85,0.0000\nCC-MAIN-2024-18,image/tiff,14,14,0.0000\nCC-MAIN-2024-18,image/vnd.djvu,2,2,0.0000\nCC-MAIN-2024-18,image/webp,45,45,0.0000\nCC-MAIN-2024-18,message/rfc822,7025,7025,0.0003\nCC-MAIN-2024-18,text/calendar,831473,831093,0.0298\nCC-MAIN-2024-18,text/css,19840,19837,0.0007\nCC-MAIN-20
24-18,text/csv,89852,89375,0.0032\nCC-MAIN-2024-18,text/directory,6021,6020,0.0002\nCC-MAIN-2024-18,text/enriched,1980,1980,0.0001\nCC-MAIN-2024-18,text/html,2689561019,2671508585,96.5107\nCC-MAIN-2024-18,text/javascript,6398,6395,0.0002\nCC-MAIN-2024-18,text/markdown,4954,4954,0.0002\nCC-MAIN-2024-18,text/pdf,649,649,0.0000\nCC-MAIN-2024-18,text/plain,1856255,1855149,0.0666\nCC-MAIN-2024-18,text/prs.lines.tag,100747,100747,0.0036\nCC-MAIN-2024-18,text/tab-separated-values,5935,5927,0.0002\nCC-MAIN-2024-18,text/turtle,45451,45358,0.0016\nCC-MAIN-2024-18,text/vcard,28483,28470,0.0010\nCC-MAIN-2024-18,text/x-bibtex,18460,18213,0.0007\nCC-MAIN-2024-18,text/x-c,4160,4158,0.0001\nCC-MAIN-2024-18,text/x-csrc,8363,8348,0.0003\nCC-MAIN-2024-18,text/x-diff,13504,13501,0.0005\nCC-MAIN-2024-18,text/x-patch,8442,8429,0.0003\nCC-MAIN-2024-18,text/x-perl,2769,2769,0.0001\nCC-MAIN-2024-18,text/x-vcalendar,10949,10948,0.0004\nCC-MAIN-2024-18,text/x-vcard,58130,58118,0.0021\nCC-MAIN-2024-18,text/xml,1748215,1745442,0.0627\nCC-MAIN-2024-18,unknown/unknown,663,663,0.0000\nCC-MAIN-2024-18,video/mp4,219,219,0.0000\nCC-MAIN-2024-18,video/webm,5,5,0.0000\nCC-MAIN-2024-18,video/x-ms-asf,4021,4019,0.0001\nCC-MAIN-2024-22,<other>,80443843,80333237,2.9685\nCC-MAIN-2024-22,application/atom+xml,2703355,2703161,0.0998\nCC-MAIN-2024-22,application/calendar,10994,10994,0.0004\nCC-MAIN-2024-22,application/download,91275,91264,0.0034\nCC-MAIN-2024-22,application/epub+zip,46308,46128,0.0017\nCC-MAIN-2024-22,application/force-download,170567,170484,0.0063\nCC-MAIN-2024-22,application/gpx+xml,14012,14012,0.0005\nCC-MAIN-2024-22,application/ics,10053,10052,0.0004\nCC-MAIN-2024-22,application/javascript,24813,24805,0.0009\nCC-MAIN-2024-22,application/json,665431,664940,0.0246\nCC-MAIN-2024-22,application/ld+json,47785,47760,0.0018\nCC-MAIN-2024-22,application/marc,12967,12967,0.0005\nCC-MAIN-2024-22,application/msword,80074,79933,0.0030\nCC-MAIN-2024-22,application/octet-stream,1094338,1093908,0.0404\nCC
-MAIN-2024-22,application/octetstream,8115,8115,0.0003\nCC-MAIN-2024-22,application/pdf,20538387,20487308,0.7579\nCC-MAIN-2024-22,application/pgp-encrypted,2131,2131,0.0001\nCC-MAIN-2024-22,application/pgp-signature,89020,89016,0.0033\nCC-MAIN-2024-22,application/postscript,4637,4631,0.0002\nCC-MAIN-2024-22,application/rdf+xml,127395,127326,0.0047\nCC-MAIN-2024-22,application/rss+xml,1466790,1464967,0.0541\nCC-MAIN-2024-22,application/rtf,32816,32807,0.0012\nCC-MAIN-2024-22,application/save-to-disk,12,12,0.0000\nCC-MAIN-2024-22,application/text,6615,6615,0.0002\nCC-MAIN-2024-22,application/unknown,5871,5871,0.0002\nCC-MAIN-2024-22,application/vnd.android.package-archive,285,285,0.0000\nCC-MAIN-2024-22,application/vnd.google-earth.kml+xml,67341,67064,0.0025\nCC-MAIN-2024-22,application/vnd.google-earth.kmz,41286,41286,0.0015\nCC-MAIN-2024-22,application/vnd.ms-excel,50421,50318,0.0019\nCC-MAIN-2024-22,application/vnd.ms-powerpoint,8550,8539,0.0003\nCC-MAIN-2024-22,application/vnd.ms-word,7404,7404,0.0003\nCC-MAIN-2024-22,application/vnd.oasis.opendocument.text,17484,17473,0.0006\nCC-MAIN-2024-22,application/vnd.openxmlformats-officedocument.presentationml.presentation,4753,4723,0.0002\nCC-MAIN-2024-22,application/vnd.openxmlformats-officedocument.spreadsheetml.sheet,35354,35174,0.0013\nCC-MAIN-2024-22,application/vnd.openxmlformats-officedocument.wordprocessingml.document,60004,59719,0.0022\nCC-MAIN-2024-22,application/vnd.wap.xhtml+xml,22146,22047,0.0008\nCC-MAIN-2024-22,application/x-bibtex,135165,135156,0.0050\nCC-MAIN-2024-22,application/x-bittorrent,3585,3585,0.0001\nCC-MAIN-2024-22,application/x-debian-package,88,88,0.0000\nCC-MAIN-2024-22,application/x-download,49895,49878,0.0018\nCC-MAIN-2024-22,application/x-endnote-refer,26320,26319,0.0010\nCC-MAIN-2024-22,application/x-gzip,12117,12116,0.0004\nCC-MAIN-2024-22,application/x-httpd-php,9250,9216,0.0003\nCC-MAIN-2024-22,application/x-java-jnlp-file,8143,8141,0.0003\nCC-MAIN-2024-22,application/x-javascript,237
4,2373,0.0001\nCC-MAIN-2024-22,application/x-json,101,101,0.0000\nCC-MAIN-2024-22,application/x-mobipocket-ebook,16265,16128,0.0006\nCC-MAIN-2024-22,application/x-msdownload,5803,5802,0.0002\nCC-MAIN-2024-22,application/x-netcdf,14247,14247,0.0005\nCC-MAIN-2024-22,application/x-research-info-systems,257258,257240,0.0095\nCC-MAIN-2024-22,application/x-shockwave-flash,7050,7047,0.0003\nCC-MAIN-2024-22,application/x-tar,3622,3622,0.0001\nCC-MAIN-2024-22,application/x-tex,7095,7058,0.0003\nCC-MAIN-2024-22,application/x-troff-man,17119,17116,0.0006\nCC-MAIN-2024-22,application/x-zip-compressed,376,375,0.0000\nCC-MAIN-2024-22,application/xhtml+xml,263880,262821,0.0097\nCC-MAIN-2024-22,application/xml,646792,645708,0.0239\nCC-MAIN-2024-22,application/zip,6013,6008,0.0002\nCC-MAIN-2024-22,audio/mpeg,1273,1272,0.0000\nCC-MAIN-2024-22,audio/x-mpegurl,13500,13498,0.0005\nCC-MAIN-2024-22,audio/x-scpls,2590,2589,0.0001\nCC-MAIN-2024-22,audio/x-wav,22,22,0.0000\nCC-MAIN-2024-22,binary/octet-stream,13655,13633,0.0005\nCC-MAIN-2024-22,image/gif,16104,16103,0.0006\nCC-MAIN-2024-22,image/jp2,7,7,0.0000\nCC-MAIN-2024-22,image/jpeg,8313,8307,0.0003\nCC-MAIN-2024-22,image/jpg,164,164,0.0000\nCC-MAIN-2024-22,image/pjpeg,15,15,0.0000\nCC-MAIN-2024-22,image/png,5426,5419,0.0002\nCC-MAIN-2024-22,image/svg+xml,82,82,0.0000\nCC-MAIN-2024-22,image/tiff,8,8,0.0000\nCC-MAIN-2024-22,image/vnd.djvu,1,1,0.0000\nCC-MAIN-2024-22,image/webp,28,28,0.0000\nCC-MAIN-2024-22,message/rfc822,6041,6041,0.0002\nCC-MAIN-2024-22,text/calendar,755741,755518,0.0279\nCC-MAIN-2024-22,text/css,20595,20591,0.0008\nCC-MAIN-2024-22,text/csv,91778,91647,0.0034\nCC-MAIN-2024-22,text/directory,4648,4648,0.0002\nCC-MAIN-2024-22,text/enriched,2609,2609,0.0001\nCC-MAIN-2024-22,text/html,2595856175,2579093439,95.7924\nCC-MAIN-2024-22,text/javascript,4808,4801,0.0002\nCC-MAIN-2024-22,text/markdown,4456,4451,0.0002\nCC-MAIN-2024-22,text/pdf,530,530,0.0000\nCC-MAIN-2024-22,text/plain,1718144,1716983,0.0634\nCC-MAIN-2024-22,text/p
rs.lines.tag,92951,92951,0.0034\nCC-MAIN-2024-22,text/tab-separated-values,6585,6576,0.0002\nCC-MAIN-2024-22,text/turtle,45276,45241,0.0017\nCC-MAIN-2024-22,text/vcard,25759,25753,0.0010\nCC-MAIN-2024-22,text/x-bibtex,15959,15955,0.0006\nCC-MAIN-2024-22,text/x-c,4301,4300,0.0002\nCC-MAIN-2024-22,text/x-csrc,11211,11205,0.0004\nCC-MAIN-2024-22,text/x-diff,10213,10213,0.0004\nCC-MAIN-2024-22,text/x-patch,8836,8835,0.0003\nCC-MAIN-2024-22,text/x-perl,2049,2049,0.0001\nCC-MAIN-2024-22,text/x-vcalendar,11018,11016,0.0004\nCC-MAIN-2024-22,text/x-vcard,49958,49938,0.0018\nCC-MAIN-2024-22,text/xml,1559052,1556792,0.0575\nCC-MAIN-2024-22,unknown/unknown,741,741,0.0000\nCC-MAIN-2024-22,video/mp4,237,237,0.0000\nCC-MAIN-2024-22,video/webm,2,2,0.0000\nCC-MAIN-2024-22,video/x-ms-asf,1924,1922,0.0001\nCC-MAIN-2024-26,<other>,43808494,43756894,1.5657\nCC-MAIN-2024-26,application/atom+xml,3236943,3236557,0.1157\nCC-MAIN-2024-26,application/calendar,10870,10870,0.0004\nCC-MAIN-2024-26,application/download,73463,73460,0.0026\nCC-MAIN-2024-26,application/epub+zip,46075,45949,0.0016\nCC-MAIN-2024-26,application/force-download,182935,182864,0.0065\nCC-MAIN-2024-26,application/gpx+xml,13107,13107,0.0005\nCC-MAIN-2024-26,application/ics,12017,12015,0.0004\nCC-MAIN-2024-26,application/javascript,23025,23022,0.0008\nCC-MAIN-2024-26,application/json,749827,749461,0.0268\nCC-MAIN-2024-26,application/ld+json,58397,58388,0.0021\nCC-MAIN-2024-26,application/marc,12246,12245,0.0004\nCC-MAIN-2024-26,application/msword,72896,72809,0.0026\nCC-MAIN-2024-26,application/octet-stream,1290646,1289835,0.0461\nCC-MAIN-2024-26,application/octetstream,3698,3698,0.0001\nCC-MAIN-2024-26,application/pdf,19582818,19537516,0.6999\nCC-MAIN-2024-26,application/pgp-encrypted,1709,1709,0.0001\nCC-MAIN-2024-26,application/pgp-signature,78044,78043,0.0028\nCC-MAIN-2024-26,application/postscript,4567,4555,0.0002\nCC-MAIN-2024-26,application/rdf+xml,145524,145453,0.0052\nCC-MAIN-2024-26,application/rss+xml,1604353,160126
7,0.0573\nCC-MAIN-2024-26,application/rtf,39489,39481,0.0014\nCC-MAIN-2024-26,application/save-to-disk,18,18,0.0000\nCC-MAIN-2024-26,application/text,6969,6969,0.0002\nCC-MAIN-2024-26,application/unknown,6135,6135,0.0002\nCC-MAIN-2024-26,application/vnd.android.package-archive,340,340,0.0000\nCC-MAIN-2024-26,application/vnd.google-earth.kml+xml,60827,60769,0.0022\nCC-MAIN-2024-26,application/vnd.google-earth.kmz,10222,10219,0.0004\nCC-MAIN-2024-26,application/vnd.ms-excel,50367,50327,0.0018\nCC-MAIN-2024-26,application/vnd.ms-powerpoint,6810,6807,0.0002\nCC-MAIN-2024-26,application/vnd.ms-word,6745,6745,0.0002\nCC-MAIN-2024-26,application/vnd.oasis.opendocument.text,18661,18655,0.0007\nCC-MAIN-2024-26,application/vnd.openxmlformats-officedocument.presentationml.presentation,5879,5865,0.0002\nCC-MAIN-2024-26,application/vnd.openxmlformats-officedocument.spreadsheetml.sheet,37942,37625,0.0014\nCC-MAIN-2024-26,application/vnd.openxmlformats-officedocument.wordprocessingml.document,60684,60561,0.0022\nCC-MAIN-2024-26,application/vnd.wap.xhtml+xml,20697,20614,0.0007\nCC-MAIN-2024-26,application/x-bibtex,149582,149562,0.0053\nCC-MAIN-2024-26,application/x-bittorrent,3974,3974,0.0001\nCC-MAIN-2024-26,application/x-debian-package,3,3,0.0000\nCC-MAIN-2024-26,application/x-download,51353,51313,0.0018\nCC-MAIN-2024-26,application/x-endnote-refer,30107,30106,0.0011\nCC-MAIN-2024-26,application/x-gzip,12743,12737,0.0005\nCC-MAIN-2024-26,application/x-httpd-php,13775,13716,0.0005\nCC-MAIN-2024-26,application/x-java-jnlp-file,3168,3168,0.0001\nCC-MAIN-2024-26,application/x-javascript,1867,1866,0.0001\nCC-MAIN-2024-26,application/x-json,85,85,0.0000\nCC-MAIN-2024-26,application/x-mobipocket-ebook,15408,15307,0.0006\nCC-MAIN-2024-26,application/x-msdownload,7102,7101,0.0003\nCC-MAIN-2024-26,application/x-netcdf,5782,5782,0.0002\nCC-MAIN-2024-26,application/x-research-info-systems,265982,265955,0.0095\nCC-MAIN-2024-26,application/x-shockwave-flash,4770,4763,0.0002\nCC-MAIN-2024-26,ap
plication/x-tar,5276,5276,0.0002\nCC-MAIN-2024-26,application/x-tex,5097,5095,0.0002\nCC-MAIN-2024-26,application/x-troff-man,21872,21872,0.0008\nCC-MAIN-2024-26,application/x-zip-compressed,383,383,0.0000\nCC-MAIN-2024-26,application/xhtml+xml,269480,268587,0.0096\nCC-MAIN-2024-26,application/xml,660846,659844,0.0236\nCC-MAIN-2024-26,application/zip,5653,5598,0.0002\nCC-MAIN-2024-26,audio/mpeg,1325,1325,0.0000\nCC-MAIN-2024-26,audio/x-mpegurl,14766,14760,0.0005\nCC-MAIN-2024-26,audio/x-scpls,3196,3195,0.0001\nCC-MAIN-2024-26,audio/x-wav,26,26,0.0000\nCC-MAIN-2024-26,binary/octet-stream,12964,12959,0.0005\nCC-MAIN-2024-26,image/gif,15520,15520,0.0006\nCC-MAIN-2024-26,image/jp2,5,5,0.0000\nCC-MAIN-2024-26,image/jpeg,8565,8562,0.0003\nCC-MAIN-2024-26,image/jpg,508,508,0.0000\nCC-MAIN-2024-26,image/pjpeg,26,26,0.0000\nCC-MAIN-2024-26,image/png,3874,3863,0.0001\nCC-MAIN-2024-26,image/svg+xml,89,89,0.0000\nCC-MAIN-2024-26,image/tiff,14,14,0.0000\nCC-MAIN-2024-26,image/vnd.djvu,16,16,0.0000\nCC-MAIN-2024-26,image/webp,23,23,0.0000\nCC-MAIN-2024-26,message/rfc822,7314,7313,0.0003\nCC-MAIN-2024-26,text/calendar,835661,835311,0.0299\nCC-MAIN-2024-26,text/css,22635,22631,0.0008\nCC-MAIN-2024-26,text/csv,103218,103145,0.0037\nCC-MAIN-2024-26,text/directory,5719,5718,0.0002\nCC-MAIN-2024-26,text/enriched,2620,2620,0.0001\nCC-MAIN-2024-26,text/html,2720264139,2702903545,97.2201\nCC-MAIN-2024-26,text/javascript,4600,4597,0.0002\nCC-MAIN-2024-26,text/markdown,4527,4525,0.0002\nCC-MAIN-2024-26,text/pdf,180,180,0.0000\nCC-MAIN-2024-26,text/plain,1821721,1820411,0.0651\nCC-MAIN-2024-26,text/prs.lines.tag,124468,124468,0.0044\nCC-MAIN-2024-26,text/tab-separated-values,6114,6113,0.0002\nCC-MAIN-2024-26,text/turtle,53146,53140,0.0019\nCC-MAIN-2024-26,text/vcard,25717,25710,0.0009\nCC-MAIN-2024-26,text/x-bibtex,16160,16159,0.0006\nCC-MAIN-2024-26,text/x-c,4446,4444,0.0002\nCC-MAIN-2024-26,text/x-csrc,9143,9143,0.0003\nCC-MAIN-2024-26,text/x-diff,11889,11888,0.0004\nCC-MAIN-2024-26,text/x
-patch,9910,9907,0.0004\nCC-MAIN-2024-26,text/x-perl,1471,1471,0.0001\nCC-MAIN-2024-26,text/x-vcalendar,11813,11806,0.0004\nCC-MAIN-2024-26,text/x-vcard,54430,54424,0.0019\nCC-MAIN-2024-26,text/xml,1703093,1701087,0.0609\nCC-MAIN-2024-26,unknown/unknown,995,995,0.0000\nCC-MAIN-2024-26,video/mp4,74,73,0.0000\nCC-MAIN-2024-26,video/webm,3,3,0.0000\nCC-MAIN-2024-26,video/x-ms-asf,3156,3155,0.0001\nCC-MAIN-2024-30,<other>,3058008,3051228,0.1201\nCC-MAIN-2024-30,application/atom+xml,2617937,2617819,0.1028\nCC-MAIN-2024-30,application/calendar,12797,12796,0.0005\nCC-MAIN-2024-30,application/download,81358,81351,0.0032\nCC-MAIN-2024-30,application/epub+zip,44084,43964,0.0017\nCC-MAIN-2024-30,application/force-download,190197,190144,0.0075\nCC-MAIN-2024-30,application/gpx+xml,13804,13802,0.0005\nCC-MAIN-2024-30,application/ics,9432,9428,0.0004\nCC-MAIN-2024-30,application/javascript,4812,4805,0.0002\nCC-MAIN-2024-30,application/json,736143,735846,0.0289\nCC-MAIN-2024-30,application/ld+json,51055,50659,0.0020\nCC-MAIN-2024-30,application/marc,15927,15927,0.0006\nCC-MAIN-2024-30,application/msword,76849,76751,0.0030\nCC-MAIN-2024-30,application/octet-stream,1256383,1255866,0.0493\nCC-MAIN-2024-30,application/octetstream,6346,6341,0.0002\nCC-MAIN-2024-30,application/pdf,23625145,23582024,0.9277\nCC-MAIN-2024-30,application/pgp-encrypted,3124,3124,0.0001\nCC-MAIN-2024-30,application/pgp-signature,93511,93440,0.0037\nCC-MAIN-2024-30,application/postscript,4998,4997,0.0002\nCC-MAIN-2024-30,application/rdf+xml,145384,145033,0.0057\nCC-MAIN-2024-30,application/rss+xml,1480778,1479252,0.0581\nCC-MAIN-2024-30,application/rtf,47849,47842,0.0019\nCC-MAIN-2024-30,application/save-to-disk,18,18,0.0000\nCC-MAIN-2024-30,application/text,5074,5074,0.0002\nCC-MAIN-2024-30,application/unknown,11011,11011,0.0004\nCC-MAIN-2024-30,application/vnd.android.package-archive,470,470,0.0000\nCC-MAIN-2024-30,application/vnd.google-earth.kml+xml,75477,75144,0.0030\nCC-MAIN-2024-30,application/vnd.google
-earth.kmz,19554,19554,0.0008\nCC-MAIN-2024-30,application/vnd.ms-excel,59274,59164,0.0023\nCC-MAIN-2024-30,application/vnd.ms-powerpoint,7167,7160,0.0003\nCC-MAIN-2024-30,application/vnd.ms-word,7083,7081,0.0003\nCC-MAIN-2024-30,application/vnd.oasis.opendocument.text,18277,18271,0.0007\nCC-MAIN-2024-30,application/vnd.openxmlformats-officedocument.presentationml.presentation,6500,6486,0.0003\nCC-MAIN-2024-30,application/vnd.openxmlformats-officedocument.spreadsheetml.sheet,39653,38813,0.0016\nCC-MAIN-2024-30,application/vnd.openxmlformats-officedocument.wordprocessingml.document,64453,64154,0.0025\nCC-MAIN-2024-30,application/vnd.wap.xhtml+xml,14179,14133,0.0006\nCC-MAIN-2024-30,application/x-bibtex,154457,154442,0.0061\nCC-MAIN-2024-30,application/x-bittorrent,3823,3822,0.0002\nCC-MAIN-2024-30,application/x-debian-package,7,7,0.0000\nCC-MAIN-2024-30,application/x-download,54714,54673,0.0021\nCC-MAIN-2024-30,application/x-endnote-refer,29411,29406,0.0012\nCC-MAIN-2024-30,application/x-gzip,8167,8163,0.0003\nCC-MAIN-2024-30,application/x-httpd-php,12869,12854,0.0005\nCC-MAIN-2024-30,application/x-java-jnlp-file,3003,3003,0.0001\nCC-MAIN-2024-30,application/x-javascript,2709,2696,0.0001\nCC-MAIN-2024-30,application/x-json,143,143,0.0000\nCC-MAIN-2024-30,application/x-mobipocket-ebook,13567,13457,0.0005\nCC-MAIN-2024-30,application/x-msdownload,6261,6260,0.0002\nCC-MAIN-2024-30,application/x-netcdf,6356,6356,0.0002\nCC-MAIN-2024-30,application/x-research-info-systems,268404,268346,0.0105\nCC-MAIN-2024-30,application/x-shockwave-flash,6040,6029,0.0002\nCC-MAIN-2024-30,application/x-tar,2919,2919,0.0001\nCC-MAIN-2024-30,application/x-tex,4677,4677,0.0002\nCC-MAIN-2024-30,application/x-troff-man,15576,15575,0.0006\nCC-MAIN-2024-30,application/x-zip-compressed,215,215,0.0000\nCC-MAIN-2024-30,application/xhtml+xml,223143,222304,0.0088\nCC-MAIN-2024-30,application/xml,1641074,1640006,0.0644\nCC-MAIN-2024-30,application/zip,4566,4561,0.0002\nCC-MAIN-2024-30,audio/mpeg,1492,
1492,0.0001\nCC-MAIN-2024-30,audio/x-mpegurl,19766,19763,0.0008\nCC-MAIN-2024-30,audio/x-scpls,3544,3542,0.0001\nCC-MAIN-2024-30,audio/x-wav,29,29,0.0000\nCC-MAIN-2024-30,binary/octet-stream,15536,15460,0.0006\nCC-MAIN-2024-30,image/gif,17936,17936,0.0007\nCC-MAIN-2024-30,image/jp2,2,2,0.0000\nCC-MAIN-2024-30,image/jpeg,9138,9135,0.0004\nCC-MAIN-2024-30,image/jpg,516,516,0.0000\nCC-MAIN-2024-30,image/pjpeg,40,40,0.0000\nCC-MAIN-2024-30,image/png,2231,2222,0.0001\nCC-MAIN-2024-30,image/svg+xml,120,120,0.0000\nCC-MAIN-2024-30,image/tiff,27,27,0.0000\nCC-MAIN-2024-30,image/vnd.djvu,1,1,0.0000\nCC-MAIN-2024-30,image/webp,31,31,0.0000\nCC-MAIN-2024-30,message/rfc822,6074,6074,0.0002\nCC-MAIN-2024-30,text/calendar,786525,786290,0.0309\nCC-MAIN-2024-30,text/css,19299,19297,0.0008\nCC-MAIN-2024-30,text/csv,98288,97517,0.0039\nCC-MAIN-2024-30,text/directory,6425,6424,0.0003\nCC-MAIN-2024-30,text/enriched,1876,1876,0.0001\nCC-MAIN-2024-30,text/html,2505350261,2491200342,98.3790\nCC-MAIN-2024-30,text/javascript,4883,4879,0.0002\nCC-MAIN-2024-30,text/markdown,4310,4310,0.0002\nCC-MAIN-2024-30,text/pdf,740,740,0.0000\nCC-MAIN-2024-30,text/plain,1806136,1804853,0.0709\nCC-MAIN-2024-30,text/prs.lines.tag,136372,136366,0.0054\nCC-MAIN-2024-30,text/tab-separated-values,6529,6526,0.0003\nCC-MAIN-2024-30,text/turtle,54224,53886,0.0021\nCC-MAIN-2024-30,text/vcard,23968,23951,0.0009\nCC-MAIN-2024-30,text/x-bibtex,14749,14748,0.0006\nCC-MAIN-2024-30,text/x-c,3877,3877,0.0002\nCC-MAIN-2024-30,text/x-csrc,7619,7617,0.0003\nCC-MAIN-2024-30,text/x-diff,26841,26838,0.0011\nCC-MAIN-2024-30,text/x-patch,7476,7475,0.0003\nCC-MAIN-2024-30,text/x-perl,1488,1488,0.0001\nCC-MAIN-2024-30,text/x-vcalendar,10892,10891,0.0004\nCC-MAIN-2024-30,text/x-vcard,54092,54075,0.0021\nCC-MAIN-2024-30,text/xml,1754751,1753086,0.0689\nCC-MAIN-2024-30,unknown/unknown,1354,1354,0.0001\nCC-MAIN-2024-30,video/mp4,139,139,0.0000\nCC-MAIN-2024-30,video/webm,13,13,0.0000\nCC-MAIN-2024-30,video/x-ms-asf,4573,4572,0.0002\nC
C-MAIN-2024-33,<other>,2999012,2989557,0.1295\nCC-MAIN-2024-33,application/atom+xml,2548175,2548069,0.1100\nCC-MAIN-2024-33,application/calendar,10563,10563,0.0005\nCC-MAIN-2024-33,application/download,74598,74591,0.0032\nCC-MAIN-2024-33,application/epub+zip,37278,37217,0.0016\nCC-MAIN-2024-33,application/force-download,173150,173089,0.0075\nCC-MAIN-2024-33,application/gpx+xml,16045,16045,0.0007\nCC-MAIN-2024-33,application/ics,8487,8487,0.0004\nCC-MAIN-2024-33,application/javascript,4072,4064,0.0002\nCC-MAIN-2024-33,application/json,722621,722178,0.0312\nCC-MAIN-2024-33,application/ld+json,45181,45165,0.0020\nCC-MAIN-2024-33,application/marc,13872,13869,0.0006\nCC-MAIN-2024-33,application/msword,87685,87516,0.0038\nCC-MAIN-2024-33,application/octet-stream,1263396,1262803,0.0546\nCC-MAIN-2024-33,application/octetstream,7388,7384,0.0003\nCC-MAIN-2024-33,application/pdf,21215916,21170730,0.9161\nCC-MAIN-2024-33,application/pgp-encrypted,3796,3796,0.0002\nCC-MAIN-2024-33,application/pgp-signature,90561,90556,0.0039\nCC-MAIN-2024-33,application/postscript,4475,4465,0.0002\nCC-MAIN-2024-33,application/rdf+xml,139894,139643,0.0060\nCC-MAIN-2024-33,application/rss+xml,1380359,1378893,0.0596\nCC-MAIN-2024-33,application/rtf,39516,39511,0.0017\nCC-MAIN-2024-33,application/save-to-disk,23,23,0.0000\nCC-MAIN-2024-33,application/text,4767,4767,0.0002\nCC-MAIN-2024-33,application/unknown,6472,6472,0.0003\nCC-MAIN-2024-33,application/vnd.android.package-archive,121,121,0.0000\nCC-MAIN-2024-33,application/vnd.google-earth.kml+xml,34726,34572,0.0015\nCC-MAIN-2024-33,application/vnd.google-earth.kmz,17416,17415,0.0008\nCC-MAIN-2024-33,application/vnd.ms-excel,63998,63956,0.0028\nCC-MAIN-2024-33,application/vnd.ms-powerpoint,7295,7268,0.0003\nCC-MAIN-2024-33,application/vnd.ms-word,6632,6631,0.0003\nCC-MAIN-2024-33,application/vnd.oasis.opendocument.text,15437,15393,0.0007\nCC-MAIN-2024-33,application/vnd.openxmlformats-officedocument.presentationml.presentation,5288,5231,0.0002\nCC-
MAIN-2024-33,application/vnd.openxmlformats-officedocument.spreadsheetml.sheet,38104,37962,0.0016\nCC-MAIN-2024-33,application/vnd.openxmlformats-officedocument.wordprocessingml.document,59923,59629,0.0026\nCC-MAIN-2024-33,application/vnd.wap.xhtml+xml,4590,4584,0.0002\nCC-MAIN-2024-33,application/x-bibtex,141568,141491,0.0061\nCC-MAIN-2024-33,application/x-bittorrent,3980,3980,0.0002\nCC-MAIN-2024-33,application/x-debian-package,15,15,0.0000\nCC-MAIN-2024-33,application/x-download,55920,55897,0.0024\nCC-MAIN-2024-33,application/x-endnote-refer,28920,28918,0.0012\nCC-MAIN-2024-33,application/x-gzip,7416,7415,0.0003\nCC-MAIN-2024-33,application/x-httpd-php,11474,11465,0.0005\nCC-MAIN-2024-33,application/x-java-jnlp-file,5519,5519,0.0002\nCC-MAIN-2024-33,application/x-javascript,3315,3315,0.0001\nCC-MAIN-2024-33,application/x-json,75,75,0.0000\nCC-MAIN-2024-33,application/x-mobipocket-ebook,12559,12510,0.0005\nCC-MAIN-2024-33,application/x-msdownload,6868,6868,0.0003\nCC-MAIN-2024-33,application/x-netcdf,7261,7261,0.0003\nCC-MAIN-2024-33,application/x-research-info-systems,255701,255631,0.0110\nCC-MAIN-2024-33,application/x-shockwave-flash,4288,4284,0.0002\nCC-MAIN-2024-33,application/x-tar,4069,4069,0.0002\nCC-MAIN-2024-33,application/x-tex,3521,3521,0.0002\nCC-MAIN-2024-33,application/x-troff-man,18074,18074,0.0008\nCC-MAIN-2024-33,application/x-zip-compressed,363,362,0.0000\nCC-MAIN-2024-33,application/xhtml+xml,214274,213054,0.0093\nCC-MAIN-2024-33,application/xml,678044,677421,0.0293\nCC-MAIN-2024-33,application/zip,3983,3981,0.0002\nCC-MAIN-2024-33,audio/mpeg,1413,1413,0.0001\nCC-MAIN-2024-33,audio/x-mpegurl,12987,12985,0.0006\nCC-MAIN-2024-33,audio/x-scpls,3009,3009,0.0001\nCC-MAIN-2024-33,audio/x-wav,41,41,0.0000\nCC-MAIN-2024-33,binary/octet-stream,17216,17182,0.0007\nCC-MAIN-2024-33,image/gif,15686,15686,0.0007\nCC-MAIN-2024-33,image/jp2,13,13,0.0000\nCC-MAIN-2024-33,image/jpeg,9554,9548,0.0004\nCC-MAIN-2024-33,image/jpg,158,158,0.0000\nCC-MAIN-2024-33,image
/pjpeg,17,17,0.0000\nCC-MAIN-2024-33,image/png,2573,2566,0.0001\nCC-MAIN-2024-33,image/svg+xml,67,67,0.0000\nCC-MAIN-2024-33,image/tiff,43,43,0.0000\nCC-MAIN-2024-33,image/vnd.djvu,1,1,0.0000\nCC-MAIN-2024-33,image/webp,49,49,0.0000\nCC-MAIN-2024-33,message/rfc822,6496,6496,0.0003\nCC-MAIN-2024-33,text/calendar,719728,719517,0.0311\nCC-MAIN-2024-33,text/css,18793,18789,0.0008\nCC-MAIN-2024-33,text/csv,98955,98318,0.0043\nCC-MAIN-2024-33,text/directory,5854,5853,0.0003\nCC-MAIN-2024-33,text/enriched,2691,2691,0.0001\nCC-MAIN-2024-33,text/html,2278703492,2266311813,98.3927\nCC-MAIN-2024-33,text/javascript,4138,4135,0.0002\nCC-MAIN-2024-33,text/markdown,3283,3281,0.0001\nCC-MAIN-2024-33,text/pdf,224,224,0.0000\nCC-MAIN-2024-33,text/plain,1832009,1831138,0.0791\nCC-MAIN-2024-33,text/prs.lines.tag,91685,91685,0.0040\nCC-MAIN-2024-33,text/tab-separated-values,4917,4916,0.0002\nCC-MAIN-2024-33,text/turtle,49045,49027,0.0021\nCC-MAIN-2024-33,text/vcard,21883,21874,0.0009\nCC-MAIN-2024-33,text/x-bibtex,12983,12974,0.0006\nCC-MAIN-2024-33,text/x-c,4498,4497,0.0002\nCC-MAIN-2024-33,text/x-csrc,10456,10453,0.0005\nCC-MAIN-2024-33,text/x-diff,7320,7319,0.0003\nCC-MAIN-2024-33,text/x-patch,9112,9112,0.0004\nCC-MAIN-2024-33,text/x-perl,2225,2225,0.0001\nCC-MAIN-2024-33,text/x-vcalendar,8915,8914,0.0004\nCC-MAIN-2024-33,text/x-vcard,53819,53798,0.0023\nCC-MAIN-2024-33,text/xml,1568864,1567298,0.0677\nCC-MAIN-2024-33,unknown/unknown,1233,1233,0.0001\nCC-MAIN-2024-33,video/mp4,180,180,0.0000\nCC-MAIN-2024-33,video/webm,10,10,0.0000\nCC-MAIN-2024-33,video/x-ms-asf,2742,2741,0.0001\nCC-MAIN-2024-38,<other>,3578250,3570952,0.1278\nCC-MAIN-2024-38,application/atom+xml,2814113,2813932,0.1005\nCC-MAIN-2024-38,application/calendar,9495,9495,0.0003\nCC-MAIN-2024-38,application/download,65049,65047,0.0023\nCC-MAIN-2024-38,application/epub+zip,31669,31581,0.0011\nCC-MAIN-2024-38,application/force-download,160334,160302,0.0057\nCC-MAIN-2024-38,application/gpx+xml,13764,13761,0.0005\nCC-MAIN-202
4-38,application/ics,8379,8361,0.0003\nCC-MAIN-2024-38,application/javascript,4283,4282,0.0002\nCC-MAIN-2024-38,application/json,725520,725007,0.0259\nCC-MAIN-2024-38,application/ld+json,49120,48925,0.0018\nCC-MAIN-2024-38,application/marc,14618,14612,0.0005\nCC-MAIN-2024-38,application/msword,66215,66086,0.0024\nCC-MAIN-2024-38,application/octet-stream,1241810,1241214,0.0443\nCC-MAIN-2024-38,application/octetstream,9643,9637,0.0003\nCC-MAIN-2024-38,application/pdf,16825195,16785575,0.6007\nCC-MAIN-2024-38,application/pgp-encrypted,2806,2806,0.0001\nCC-MAIN-2024-38,application/pgp-signature,76563,76562,0.0027\nCC-MAIN-2024-38,application/postscript,3490,3490,0.0001\nCC-MAIN-2024-38,application/rdf+xml,138856,138655,0.0050\nCC-MAIN-2024-38,application/rss+xml,1393370,1391930,0.0497\nCC-MAIN-2024-38,application/rtf,33437,33427,0.0012\nCC-MAIN-2024-38,application/save-to-disk,11,11,0.0000\nCC-MAIN-2024-38,application/text,5487,5487,0.0002\nCC-MAIN-2024-38,application/unknown,5251,5249,0.0002\nCC-MAIN-2024-38,application/vnd.android.package-archive,149,149,0.0000\nCC-MAIN-2024-38,application/vnd.google-earth.kml+xml,32880,32848,0.0012\nCC-MAIN-2024-38,application/vnd.google-earth.kmz,16673,16672,0.0006\nCC-MAIN-2024-38,application/vnd.ms-excel,50321,50153,0.0018\nCC-MAIN-2024-38,application/vnd.ms-powerpoint,8784,8770,0.0003\nCC-MAIN-2024-38,application/vnd.ms-word,5351,5351,0.0002\nCC-MAIN-2024-38,application/vnd.oasis.opendocument.text,13445,13442,0.0005\nCC-MAIN-2024-38,application/vnd.openxmlformats-officedocument.presentationml.presentation,4502,4479,0.0002\nCC-MAIN-2024-38,application/vnd.openxmlformats-officedocument.spreadsheetml.sheet,33941,33615,0.0012\nCC-MAIN-2024-38,application/vnd.openxmlformats-officedocument.wordprocessingml.document,49523,49209,0.0018\nCC-MAIN-2024-38,application/vnd.wap.xhtml+xml,11021,10908,0.0004\nCC-MAIN-2024-38,application/x-bibtex,145659,145637,0.0052\nCC-MAIN-2024-38,application/x-bittorrent,3324,3323,0.0001\nCC-MAIN-2024-38,appl
ication/x-debian-package,47,47,0.0000\nCC-MAIN-2024-38,application/x-download,50291,50256,0.0018\nCC-MAIN-2024-38,application/x-endnote-refer,28179,28175,0.0010\nCC-MAIN-2024-38,application/x-gzip,7231,7224,0.0003\nCC-MAIN-2024-38,application/x-httpd-php,7949,7932,0.0003\nCC-MAIN-2024-38,application/x-java-jnlp-file,7687,7687,0.0003\nCC-MAIN-2024-38,application/x-javascript,3391,3391,0.0001\nCC-MAIN-2024-38,application/x-json,43,43,0.0000\nCC-MAIN-2024-38,application/x-mobipocket-ebook,9940,9877,0.0004\nCC-MAIN-2024-38,application/x-msdownload,5647,5647,0.0002\nCC-MAIN-2024-38,application/x-netcdf,7074,7074,0.0003\nCC-MAIN-2024-38,application/x-research-info-systems,257351,257292,0.0092\nCC-MAIN-2024-38,application/x-shockwave-flash,4637,4631,0.0002\nCC-MAIN-2024-38,application/x-tar,2630,2630,0.0001\nCC-MAIN-2024-38,application/x-tex,4780,4780,0.0002\nCC-MAIN-2024-38,application/x-troff-man,21300,21299,0.0008\nCC-MAIN-2024-38,application/x-zip-compressed,328,328,0.0000\nCC-MAIN-2024-38,application/xhtml+xml,252983,251907,0.0090\nCC-MAIN-2024-38,application/xml,666834,666229,0.0238\nCC-MAIN-2024-38,application/zip,3684,3678,0.0001\nCC-MAIN-2024-38,audio/mpeg,2414,2414,0.0001\nCC-MAIN-2024-38,audio/x-mpegurl,12102,12095,0.0004\nCC-MAIN-2024-38,audio/x-scpls,3583,3583,0.0001\nCC-MAIN-2024-38,audio/x-wav,63,63,0.0000\nCC-MAIN-2024-38,binary/octet-stream,16362,16302,0.0006\nCC-MAIN-2024-38,image/gif,13430,13428,0.0005\nCC-MAIN-2024-38,image/jp2,1,1,0.0000\nCC-MAIN-2024-38,image/jpeg,8823,8822,0.0003\nCC-MAIN-2024-38,image/jpg,160,160,0.0000\nCC-MAIN-2024-38,image/pjpeg,16,16,0.0000\nCC-MAIN-2024-38,image/png,2025,2024,0.0001\nCC-MAIN-2024-38,image/svg+xml,90,90,0.0000\nCC-MAIN-2024-38,image/tiff,16,16,0.0000\nCC-MAIN-2024-38,image/webp,36,36,0.0000\nCC-MAIN-2024-38,message/rfc822,5908,5906,0.0002\nCC-MAIN-2024-38,text/calendar,691673,691462,0.0247\nCC-MAIN-2024-38,text/css,17415,17413,0.0006\nCC-MAIN-2024-38,text/csv,92318,92088,0.0033\nCC-MAIN-2024-38,text/directory,44
23,4423,0.0002\nCC-MAIN-2024-38,text/enriched,2584,2584,0.0001\nCC-MAIN-2024-38,text/html,2767470215,2753403312,98.8067\nCC-MAIN-2024-38,text/javascript,5072,5071,0.0002\nCC-MAIN-2024-38,text/markdown,3380,3376,0.0001\nCC-MAIN-2024-38,text/pdf,100,100,0.0000\nCC-MAIN-2024-38,text/plain,1678561,1677763,0.0599\nCC-MAIN-2024-38,text/prs.lines.tag,119583,119583,0.0043\nCC-MAIN-2024-38,text/tab-separated-values,4981,4977,0.0002\nCC-MAIN-2024-38,text/turtle,52513,52330,0.0019\nCC-MAIN-2024-38,text/vcard,19940,19936,0.0007\nCC-MAIN-2024-38,text/x-bibtex,16443,16439,0.0006\nCC-MAIN-2024-38,text/x-c,3915,3914,0.0001\nCC-MAIN-2024-38,text/x-csrc,6595,6595,0.0002\nCC-MAIN-2024-38,text/x-diff,7623,7623,0.0003\nCC-MAIN-2024-38,text/x-patch,10040,10040,0.0004\nCC-MAIN-2024-38,text/x-perl,1199,1199,0.0000\nCC-MAIN-2024-38,text/x-vcalendar,10417,10415,0.0004\nCC-MAIN-2024-38,text/x-vcard,54070,54049,0.0019\nCC-MAIN-2024-38,text/xml,1555902,1554057,0.0556\nCC-MAIN-2024-38,unknown/unknown,672,672,0.0000\nCC-MAIN-2024-38,video/mp4,158,158,0.0000\nCC-MAIN-2024-38,video/webm,6,6,0.0000\nCC-MAIN-2024-38,video/x-ms-asf,4329,4325,0.0002\nCC-MAIN-2024-42,<other>,3686798,3653113,0.1478\nCC-MAIN-2024-42,application/atom+xml,2760788,2760648,0.1106\nCC-MAIN-2024-42,application/calendar,13074,13074,0.0005\nCC-MAIN-2024-42,application/download,86347,86346,0.0035\nCC-MAIN-2024-42,application/epub+zip,43551,43383,0.0017\nCC-MAIN-2024-42,application/force-download,203598,203559,0.0082\nCC-MAIN-2024-42,application/gpx+xml,18814,18814,0.0008\nCC-MAIN-2024-42,application/ics,11650,11648,0.0005\nCC-MAIN-2024-42,application/javascript,5349,5342,0.0002\nCC-MAIN-2024-42,application/json,764656,763756,0.0306\nCC-MAIN-2024-42,application/ld+json,50961,50886,0.0020\nCC-MAIN-2024-42,application/marc,14386,14386,0.0006\nCC-MAIN-2024-42,application/msword,84160,84023,0.0034\nCC-MAIN-2024-42,application/octet-stream,1356959,1356498,0.0544\nCC-MAIN-2024-42,application/octetstream,9479,9476,0.0004\nCC-MAIN-2024-42,
application/pdf,25362417,25307923,1.0165\nCC-MAIN-2024-42,application/pgp-encrypted,1945,1945,0.0001\nCC-MAIN-2024-42,application/pgp-signature,88380,88378,0.0035\nCC-MAIN-2024-42,application/postscript,4648,4640,0.0002\nCC-MAIN-2024-42,application/rdf+xml,144464,144393,0.0058\nCC-MAIN-2024-42,application/rss+xml,1439554,1438298,0.0577\nCC-MAIN-2024-42,application/rtf,21717,21715,0.0009\nCC-MAIN-2024-42,application/save-to-disk,14,14,0.0000\nCC-MAIN-2024-42,application/text,5400,5400,0.0002\nCC-MAIN-2024-42,application/unknown,7798,7798,0.0003\nCC-MAIN-2024-42,application/vnd.android.package-archive,222,222,0.0000\nCC-MAIN-2024-42,application/vnd.google-earth.kml+xml,35999,35957,0.0014\nCC-MAIN-2024-42,application/vnd.google-earth.kmz,20886,20882,0.0008\nCC-MAIN-2024-42,application/vnd.ms-excel,47742,47654,0.0019\nCC-MAIN-2024-42,application/vnd.ms-powerpoint,9032,9026,0.0004\nCC-MAIN-2024-42,application/vnd.ms-word,5941,5941,0.0002\nCC-MAIN-2024-42,application/vnd.oasis.opendocument.text,19433,19433,0.0008\nCC-MAIN-2024-42,application/vnd.openxmlformats-officedocument.presentationml.presentation,6283,6238,0.0003\nCC-MAIN-2024-42,application/vnd.openxmlformats-officedocument.spreadsheetml.sheet,42151,41786,0.0017\nCC-MAIN-2024-42,application/vnd.openxmlformats-officedocument.wordprocessingml.document,67810,67547,0.0027\nCC-MAIN-2024-42,application/vnd.wap.xhtml+xml,16032,15881,0.0006\nCC-MAIN-2024-42,application/x-bibtex,158381,158375,0.0063\nCC-MAIN-2024-42,application/x-bittorrent,4103,4103,0.0002\nCC-MAIN-2024-42,application/x-debian-package,11,11,0.0000\nCC-MAIN-2024-42,application/x-download,51408,51395,0.0021\nCC-MAIN-2024-42,application/x-endnote-refer,32987,32984,0.0013\nCC-MAIN-2024-42,application/x-gzip,9095,9094,0.0004\nCC-MAIN-2024-42,application/x-httpd-php,6623,6607,0.0003\nCC-MAIN-2024-42,application/x-java-jnlp-file,8424,8422,0.0003\nCC-MAIN-2024-42,application/x-javascript,1976,1975,0.0001\nCC-MAIN-2024-42,application/x-json,55,55,0.0000\nCC-MAIN-20
24-42,application/x-mobipocket-ebook,14021,13883,0.0006\nCC-MAIN-2024-42,application/x-msdownload,5854,5853,0.0002\nCC-MAIN-2024-42,application/x-netcdf,3447,3447,0.0001\nCC-MAIN-2024-42,application/x-research-info-systems,294384,294356,0.0118\nCC-MAIN-2024-42,application/x-shockwave-flash,5201,5193,0.0002\nCC-MAIN-2024-42,application/x-tar,5220,5220,0.0002\nCC-MAIN-2024-42,application/x-tex,7296,7293,0.0003\nCC-MAIN-2024-42,application/x-troff-man,20140,20140,0.0008\nCC-MAIN-2024-42,application/x-zip-compressed,222,222,0.0000\nCC-MAIN-2024-42,application/xhtml+xml,286364,280375,0.0115\nCC-MAIN-2024-42,application/xml,660877,660251,0.0265\nCC-MAIN-2024-42,application/zip,4838,4801,0.0002\nCC-MAIN-2024-42,audio/mpeg,1464,1464,0.0001\nCC-MAIN-2024-42,audio/x-mpegurl,14120,14113,0.0006\nCC-MAIN-2024-42,audio/x-scpls,2747,2747,0.0001\nCC-MAIN-2024-42,audio/x-wav,31,31,0.0000\nCC-MAIN-2024-42,binary/octet-stream,17099,17075,0.0007\nCC-MAIN-2024-42,image/gif,11727,11726,0.0005\nCC-MAIN-2024-42,image/jp2,1,1,0.0000\nCC-MAIN-2024-42,image/jpeg,9606,9606,0.0004\nCC-MAIN-2024-42,image/jpg,254,254,0.0000\nCC-MAIN-2024-42,image/pjpeg,27,27,0.0000\nCC-MAIN-2024-42,image/png,2650,2644,0.0001\nCC-MAIN-2024-42,image/svg+xml,122,122,0.0000\nCC-MAIN-2024-42,image/tiff,46,46,0.0000\nCC-MAIN-2024-42,image/webp,40,40,0.0000\nCC-MAIN-2024-42,message/rfc822,7162,7160,0.0003\nCC-MAIN-2024-42,text/calendar,837303,837075,0.0336\nCC-MAIN-2024-42,text/css,17199,17196,0.0007\nCC-MAIN-2024-42,text/csv,98444,97646,0.0039\nCC-MAIN-2024-42,text/directory,6337,6336,0.0003\nCC-MAIN-2024-42,text/enriched,1998,1998,0.0001\nCC-MAIN-2024-42,text/html,2452332112,2439301815,98.2824\nCC-MAIN-2024-42,text/javascript,5076,5074,0.0002\nCC-MAIN-2024-42,text/markdown,4794,4792,0.0002\nCC-MAIN-2024-42,text/pdf,662,662,0.0000\nCC-MAIN-2024-42,text/plain,1788085,1787173,0.0717\nCC-MAIN-2024-42,text/prs.lines.tag,102458,102453,0.0041\nCC-MAIN-2024-42,text/tab-separated-values,6820,6819,0.0003\nCC-MAIN-2024-42,text/t
urtle,55016,54952,0.0022\nCC-MAIN-2024-42,text/vcard,25544,25529,0.0010\nCC-MAIN-2024-42,text/x-bibtex,21645,21639,0.0009\nCC-MAIN-2024-42,text/x-c,5511,5509,0.0002\nCC-MAIN-2024-42,text/x-csrc,9546,9546,0.0004\nCC-MAIN-2024-42,text/x-diff,11920,11920,0.0005\nCC-MAIN-2024-42,text/x-patch,11069,11066,0.0004\nCC-MAIN-2024-42,text/x-perl,1204,1204,0.0000\nCC-MAIN-2024-42,text/x-vcalendar,11275,11275,0.0005\nCC-MAIN-2024-42,text/x-vcard,60699,60682,0.0024\nCC-MAIN-2024-42,text/xml,1663653,1662101,0.0667\nCC-MAIN-2024-42,unknown/unknown,704,704,0.0000\nCC-MAIN-2024-42,video/mp4,195,195,0.0000\nCC-MAIN-2024-42,video/webm,22,22,0.0000\nCC-MAIN-2024-42,video/x-ms-asf,5002,5002,0.0002\nCC-MAIN-2024-46,<other>,3741705,3736027,0.1392\nCC-MAIN-2024-46,application/atom+xml,2658410,2658303,0.0989\nCC-MAIN-2024-46,application/calendar,11514,11509,0.0004\nCC-MAIN-2024-46,application/download,86145,86144,0.0032\nCC-MAIN-2024-46,application/epub+zip,45330,45150,0.0017\nCC-MAIN-2024-46,application/force-download,178283,178262,0.0066\nCC-MAIN-2024-46,application/gpx+xml,15225,15225,0.0006\nCC-MAIN-2024-46,application/ics,9212,9212,0.0003\nCC-MAIN-2024-46,application/javascript,4486,4128,0.0002\nCC-MAIN-2024-46,application/json,861707,860943,0.0321\nCC-MAIN-2024-46,application/ld+json,51372,51212,0.0019\nCC-MAIN-2024-46,application/marc,16914,16914,0.0006\nCC-MAIN-2024-46,application/msword,70078,69913,0.0026\nCC-MAIN-2024-46,application/octet-stream,1334118,1333685,0.0496\nCC-MAIN-2024-46,application/octetstream,5008,5005,0.0002\nCC-MAIN-2024-46,application/pdf,20922522,20876804,0.7784\nCC-MAIN-2024-46,application/pgp-encrypted,2224,2224,0.0001\nCC-MAIN-2024-46,application/pgp-signature,89694,89694,0.0033\nCC-MAIN-2024-46,application/postscript,4013,3999,0.0001\nCC-MAIN-2024-46,application/rdf+xml,139363,139191,0.0052\nCC-MAIN-2024-46,application/rss+xml,1410570,1409353,0.0525\nCC-MAIN-2024-46,application/rtf,20114,20111,0.0007\nCC-MAIN-2024-46,application/save-to-disk,23,23,0.0000\nCC
-MAIN-2024-46,application/text,5064,5063,0.0002\nCC-MAIN-2024-46,application/unknown,7720,7718,0.0003\nCC-MAIN-2024-46,application/vnd.android.package-archive,166,166,0.0000\nCC-MAIN-2024-46,application/vnd.google-earth.kml+xml,47621,47033,0.0018\nCC-MAIN-2024-46,application/vnd.google-earth.kmz,20038,20037,0.0007\nCC-MAIN-2024-46,application/vnd.ms-excel,49039,48994,0.0018\nCC-MAIN-2024-46,application/vnd.ms-powerpoint,11874,11870,0.0004\nCC-MAIN-2024-46,application/vnd.ms-word,6409,6409,0.0002\nCC-MAIN-2024-46,application/vnd.oasis.opendocument.text,18722,18719,0.0007\nCC-MAIN-2024-46,application/vnd.openxmlformats-officedocument.presentationml.presentation,5501,5493,0.0002\nCC-MAIN-2024-46,application/vnd.openxmlformats-officedocument.spreadsheetml.sheet,37516,37370,0.0014\nCC-MAIN-2024-46,application/vnd.openxmlformats-officedocument.wordprocessingml.document,63279,63125,0.0024\nCC-MAIN-2024-46,application/vnd.wap.xhtml+xml,16178,16070,0.0006\nCC-MAIN-2024-46,application/x-bibtex,166427,166414,0.0062\nCC-MAIN-2024-46,application/x-bittorrent,5402,5402,0.0002\nCC-MAIN-2024-46,application/x-debian-package,14,14,0.0000\nCC-MAIN-2024-46,application/x-download,53454,53357,0.0020\nCC-MAIN-2024-46,application/x-endnote-refer,36788,36787,0.0014\nCC-MAIN-2024-46,application/x-gzip,7297,7296,0.0003\nCC-MAIN-2024-46,application/x-httpd-php,11811,11800,0.0004\nCC-MAIN-2024-46,application/x-java-jnlp-file,5806,5806,0.0002\nCC-MAIN-2024-46,application/x-javascript,1580,1577,0.0001\nCC-MAIN-2024-46,application/x-json,39,39,0.0000\nCC-MAIN-2024-46,application/x-mobipocket-ebook,15046,14881,0.0006\nCC-MAIN-2024-46,application/x-msdownload,6311,6311,0.0002\nCC-MAIN-2024-46,application/x-netcdf,4358,4358,0.0002\nCC-MAIN-2024-46,application/x-research-info-systems,313903,313867,0.0117\nCC-MAIN-2024-46,application/x-shockwave-flash,4919,4917,0.0002\nCC-MAIN-2024-46,application/x-tar,3691,3691,0.0001\nCC-MAIN-2024-46,application/x-tex,5186,5179,0.0002\nCC-MAIN-2024-46,application/x-t
roff-man,20148,20148,0.0007\nCC-MAIN-2024-46,application/x-zip-compressed,156,156,0.0000\nCC-MAIN-2024-46,application/xhtml+xml,311117,299759,0.0116\nCC-MAIN-2024-46,application/xml,1455489,1454522,0.0542\nCC-MAIN-2024-46,application/zip,3704,3701,0.0001\nCC-MAIN-2024-46,audio/mpeg,1295,1295,0.0000\nCC-MAIN-2024-46,audio/x-mpegurl,11619,11618,0.0004\nCC-MAIN-2024-46,audio/x-scpls,2820,2819,0.0001\nCC-MAIN-2024-46,audio/x-wav,25,25,0.0000\nCC-MAIN-2024-46,binary/octet-stream,20149,20095,0.0007\nCC-MAIN-2024-46,image/gif,13432,13431,0.0005\nCC-MAIN-2024-46,image/jp2,3,3,0.0000\nCC-MAIN-2024-46,image/jpeg,7227,7223,0.0003\nCC-MAIN-2024-46,image/jpg,398,398,0.0000\nCC-MAIN-2024-46,image/pjpeg,16,16,0.0000\nCC-MAIN-2024-46,image/png,3505,3503,0.0001\nCC-MAIN-2024-46,image/svg+xml,36,36,0.0000\nCC-MAIN-2024-46,image/tiff,33,33,0.0000\nCC-MAIN-2024-46,image/vnd.djvu,29,29,0.0000\nCC-MAIN-2024-46,image/webp,49,49,0.0000\nCC-MAIN-2024-46,message/rfc822,7491,7491,0.0003\nCC-MAIN-2024-46,text/calendar,807240,807077,0.0300\nCC-MAIN-2024-46,text/css,14895,14893,0.0006\nCC-MAIN-2024-46,text/csv,94453,93788,0.0035\nCC-MAIN-2024-46,text/directory,5823,5822,0.0002\nCC-MAIN-2024-46,text/enriched,1559,1559,0.0001\nCC-MAIN-2024-46,text/html,2648573839,2635613828,98.5402\nCC-MAIN-2024-46,text/javascript,5594,5593,0.0002\nCC-MAIN-2024-46,text/markdown,5045,5002,0.0002\nCC-MAIN-2024-46,text/pdf,363,363,0.0000\nCC-MAIN-2024-46,text/plain,1749796,1749116,0.0651\nCC-MAIN-2024-46,text/prs.lines.tag,116557,116557,0.0043\nCC-MAIN-2024-46,text/tab-separated-values,8729,8727,0.0003\nCC-MAIN-2024-46,text/turtle,53714,53572,0.0020\nCC-MAIN-2024-46,text/vcard,29594,29585,0.0011\nCC-MAIN-2024-46,text/x-bibtex,24349,24345,0.0009\nCC-MAIN-2024-46,text/x-c,3188,3188,0.0001\nCC-MAIN-2024-46,text/x-csrc,9185,9184,0.0003\nCC-MAIN-2024-46,text/x-diff,12417,12417,0.0005\nCC-MAIN-2024-46,text/x-patch,9849,9849,0.0004\nCC-MAIN-2024-46,text/x-perl,1738,1738,0.0001\nCC-MAIN-2024-46,text/x-vcalendar,12561,12561,0
.0005\nCC-MAIN-2024-46,text/x-vcard,52490,52477,0.0020\nCC-MAIN-2024-46,text/xml,1745486,1743606,0.0649\nCC-MAIN-2024-46,unknown/unknown,466,466,0.0000\nCC-MAIN-2024-46,video/mp4,482,482,0.0000\nCC-MAIN-2024-46,video/x-ms-asf,4405,4401,0.0002\nCC-MAIN-2024-51,<other>,2974274,2968917,0.1129\nCC-MAIN-2024-51,application/atom+xml,2895915,2895419,0.1099\nCC-MAIN-2024-51,application/calendar,11556,11556,0.0004\nCC-MAIN-2024-51,application/download,89543,89538,0.0034\nCC-MAIN-2024-51,application/epub+zip,54248,53966,0.0021\nCC-MAIN-2024-51,application/force-download,191189,191118,0.0073\nCC-MAIN-2024-51,application/gpx+xml,15525,15523,0.0006\nCC-MAIN-2024-51,application/ics,11185,11181,0.0004\nCC-MAIN-2024-51,application/javascript,7699,7208,0.0003\nCC-MAIN-2024-51,application/json,909781,908742,0.0345\nCC-MAIN-2024-51,application/ld+json,60437,60266,0.0023\nCC-MAIN-2024-51,application/marc,22070,22069,0.0008\nCC-MAIN-2024-51,application/msword,73133,73029,0.0028\nCC-MAIN-2024-51,application/octet-stream,1468983,1468498,0.0557\nCC-MAIN-2024-51,application/octetstream,6431,6430,0.0002\nCC-MAIN-2024-51,application/pdf,21537975,21487780,0.8173\nCC-MAIN-2024-51,application/pgp-encrypted,2266,2266,0.0001\nCC-MAIN-2024-51,application/pgp-signature,73432,73430,0.0028\nCC-MAIN-2024-51,application/postscript,4237,4228,0.0002\nCC-MAIN-2024-51,application/rdf+xml,147029,146844,0.0056\nCC-MAIN-2024-51,application/rss+xml,1504643,1503613,0.0571\nCC-MAIN-2024-51,application/rtf,25426,25423,0.0010\nCC-MAIN-2024-51,application/save-to-disk,26,26,0.0000\nCC-MAIN-2024-51,application/text,4212,4212,0.0002\nCC-MAIN-2024-51,application/unknown,6772,6770,0.0003\nCC-MAIN-2024-51,application/vnd.android.package-archive,204,204,0.0000\nCC-MAIN-2024-51,application/vnd.google-earth.kml+xml,36784,36679,0.0014\nCC-MAIN-2024-51,application/vnd.google-earth.kmz,12070,12065,0.0005\nCC-MAIN-2024-51,application/vnd.ms-excel,52318,52264,0.0020\nCC-MAIN-2024-51,application/vnd.ms-powerpoint,6453,6442,0.0002
\nCC-MAIN-2024-51,application/vnd.ms-word,6187,6187,0.0002\nCC-MAIN-2024-51,application/vnd.oasis.opendocument.text,20141,20132,0.0008\nCC-MAIN-2024-51,application/vnd.openxmlformats-officedocument.presentationml.presentation,6411,6393,0.0002\nCC-MAIN-2024-51,application/vnd.openxmlformats-officedocument.spreadsheetml.sheet,38928,38797,0.0015\nCC-MAIN-2024-51,application/vnd.openxmlformats-officedocument.wordprocessingml.document,62833,62658,0.0024\nCC-MAIN-2024-51,application/vnd.wap.xhtml+xml,19235,19071,0.0007\nCC-MAIN-2024-51,application/x-bibtex,175523,175509,0.0067\nCC-MAIN-2024-51,application/x-bittorrent,4260,4256,0.0002\nCC-MAIN-2024-51,application/x-debian-package,126,126,0.0000\nCC-MAIN-2024-51,application/x-download,57978,57901,0.0022\nCC-MAIN-2024-51,application/x-endnote-refer,31978,31978,0.0012\nCC-MAIN-2024-51,application/x-gzip,5283,5282,0.0002\nCC-MAIN-2024-51,application/x-httpd-php,10425,10410,0.0004\nCC-MAIN-2024-51,application/x-java-jnlp-file,8178,8178,0.0003\nCC-MAIN-2024-51,application/x-javascript,1472,1472,0.0001\nCC-MAIN-2024-51,application/x-json,20,20,0.0000\nCC-MAIN-2024-51,application/x-mobipocket-ebook,19037,18759,0.0007\nCC-MAIN-2024-51,application/x-msdownload,9057,9054,0.0003\nCC-MAIN-2024-51,application/x-netcdf,4945,4945,0.0002\nCC-MAIN-2024-51,application/x-research-info-systems,308115,308091,0.0117\nCC-MAIN-2024-51,application/x-shockwave-flash,5290,5289,0.0002\nCC-MAIN-2024-51,application/x-tar,2550,2549,0.0001\nCC-MAIN-2024-51,application/x-tex,4563,4563,0.0002\nCC-MAIN-2024-51,application/x-troff-man,29686,29668,0.0011\nCC-MAIN-2024-51,application/x-zip-compressed,169,169,0.0000\nCC-MAIN-2024-51,application/xhtml+xml,399354,381287,0.0152\nCC-MAIN-2024-51,application/xml,695003,693950,0.0264\nCC-MAIN-2024-51,application/zip,4927,4923,0.0002\nCC-MAIN-2024-51,audio/mpeg,1408,1407,0.0001\nCC-MAIN-2024-51,audio/x-mpegurl,13950,13942,0.0005\nCC-MAIN-2024-51,audio/x-scpls,3217,3217,0.0001\nCC-MAIN-2024-51,audio/x-wav,28,28,0.0000\
nCC-MAIN-2024-51,binary/octet-stream,18108,18100,0.0007\nCC-MAIN-2024-51,image/gif,12878,12877,0.0005\nCC-MAIN-2024-51,image/jpeg,9469,9468,0.0004\nCC-MAIN-2024-51,image/jpg,426,426,0.0000\nCC-MAIN-2024-51,image/pjpeg,48,48,0.0000\nCC-MAIN-2024-51,image/png,2878,2876,0.0001\nCC-MAIN-2024-51,image/svg+xml,33,33,0.0000\nCC-MAIN-2024-51,image/tiff,54,54,0.0000\nCC-MAIN-2024-51,image/vnd.djvu,26,26,0.0000\nCC-MAIN-2024-51,image/webp,82,81,0.0000\nCC-MAIN-2024-51,message/rfc822,7160,7160,0.0003\nCC-MAIN-2024-51,text/calendar,873001,872809,0.0331\nCC-MAIN-2024-51,text/css,14711,14709,0.0006\nCC-MAIN-2024-51,text/csv,105122,104876,0.0040\nCC-MAIN-2024-51,text/directory,5912,5912,0.0002\nCC-MAIN-2024-51,text/enriched,2097,2097,0.0001\nCC-MAIN-2024-51,text/html,2596267567,2582869344,98.5165\nCC-MAIN-2024-51,text/javascript,4775,4771,0.0002\nCC-MAIN-2024-51,text/markdown,5700,5700,0.0002\nCC-MAIN-2024-51,text/pdf,528,528,0.0000\nCC-MAIN-2024-51,text/plain,1771124,1770529,0.0672\nCC-MAIN-2024-51,text/prs.lines.tag,132408,132408,0.0050\nCC-MAIN-2024-51,text/tab-separated-values,11046,11046,0.0004\nCC-MAIN-2024-51,text/turtle,63201,63044,0.0024\nCC-MAIN-2024-51,text/vcard,25605,25596,0.0010\nCC-MAIN-2024-51,text/x-bibtex,19367,19364,0.0007\nCC-MAIN-2024-51,text/x-c,3203,3203,0.0001\nCC-MAIN-2024-51,text/x-csrc,10691,10691,0.0004\nCC-MAIN-2024-51,text/x-diff,7106,7105,0.0003\nCC-MAIN-2024-51,text/x-patch,10175,10175,0.0004\nCC-MAIN-2024-51,text/x-perl,1455,1455,0.0001\nCC-MAIN-2024-51,text/x-vcalendar,14932,14931,0.0006\nCC-MAIN-2024-51,text/x-vcard,55129,55041,0.0021\nCC-MAIN-2024-51,text/xml,1744902,1743201,0.0662\nCC-MAIN-2024-51,unknown/unknown,980,980,0.0000\nCC-MAIN-2024-51,video/mp4,539,539,0.0000\nCC-MAIN-2024-51,video/webm,8,8,0.0000\nCC-MAIN-2024-51,video/x-ms-asf,3817,3816,0.0001\nCC-MAIN-2025-05,<other>,2594437,2589845,0.0856\nCC-MAIN-2025-05,application/atom+xml,3101968,3100241,0.1023\nCC-MAIN-2025-05,application/calendar,12427,12426,0.0004\nCC-MAIN-2025-05,applicati
on/download,78938,78936,0.0026\nCC-MAIN-2025-05,application/epub+zip,37554,37448,0.0012\nCC-MAIN-2025-05,application/force-download,198489,198419,0.0065\nCC-MAIN-2025-05,application/gpx+xml,14915,14912,0.0005\nCC-MAIN-2025-05,application/ics,10615,10615,0.0004\nCC-MAIN-2025-05,application/javascript,5709,5703,0.0002\nCC-MAIN-2025-05,application/json,933993,933178,0.0308\nCC-MAIN-2025-05,application/ld+json,62456,62415,0.0021\nCC-MAIN-2025-05,application/marc,17001,17000,0.0006\nCC-MAIN-2025-05,application/msword,72127,71968,0.0024\nCC-MAIN-2025-05,application/octet-stream,1395780,1395080,0.0460\nCC-MAIN-2025-05,application/octetstream,4736,4732,0.0002\nCC-MAIN-2025-05,application/pdf,19480352,19430329,0.6426\nCC-MAIN-2025-05,application/pgp-encrypted,2733,2733,0.0001\nCC-MAIN-2025-05,application/pgp-signature,95381,95381,0.0031\nCC-MAIN-2025-05,application/postscript,3852,3849,0.0001\nCC-MAIN-2025-05,application/rdf+xml,151978,151922,0.0050\nCC-MAIN-2025-05,application/rss+xml,1530770,1529642,0.0505\nCC-MAIN-2025-05,application/rtf,25907,25903,0.0009\nCC-MAIN-2025-05,application/save-to-disk,59,59,0.0000\nCC-MAIN-2025-05,application/text,4353,4353,0.0001\nCC-MAIN-2025-05,application/unknown,4646,4646,0.0002\nCC-MAIN-2025-05,application/vnd.android.package-archive,76,75,0.0000\nCC-MAIN-2025-05,application/vnd.google-earth.kml+xml,35888,35426,0.0012\nCC-MAIN-2025-05,application/vnd.google-earth.kmz,10452,10442,0.0003\nCC-MAIN-2025-05,application/vnd.ms-excel,52402,52339,0.0017\nCC-MAIN-2025-05,application/vnd.ms-powerpoint,4461,4458,0.0001\nCC-MAIN-2025-05,application/vnd.ms-word,6758,6758,0.0002\nCC-MAIN-2025-05,application/vnd.oasis.opendocument.text,18204,18195,0.0006\nCC-MAIN-2025-05,application/vnd.openxmlformats-officedocument.presentationml.presentation,6080,6054,0.0002\nCC-MAIN-2025-05,application/vnd.openxmlformats-officedocument.spreadsheetml.sheet,38042,37661,0.0013\nCC-MAIN-2025-05,application/vnd.openxmlformats-officedocument.wordprocessingml.document,608
52,60562,0.0020\nCC-MAIN-2025-05,application/vnd.wap.xhtml+xml,17320,17245,0.0006\nCC-MAIN-2025-05,application/x-bibtex,179765,179733,0.0059\nCC-MAIN-2025-05,application/x-bittorrent,4428,4427,0.0001\nCC-MAIN-2025-05,application/x-debian-package,26,26,0.0000\nCC-MAIN-2025-05,application/x-download,59154,58286,0.0020\nCC-MAIN-2025-05,application/x-endnote-refer,24691,24691,0.0008\nCC-MAIN-2025-05,application/x-gzip,6974,6973,0.0002\nCC-MAIN-2025-05,application/x-httpd-php,10261,10238,0.0003\nCC-MAIN-2025-05,application/x-java-jnlp-file,7930,7929,0.0003\nCC-MAIN-2025-05,application/x-javascript,2995,2995,0.0001\nCC-MAIN-2025-05,application/x-json,201,201,0.0000\nCC-MAIN-2025-05,application/x-mobipocket-ebook,10564,10482,0.0003\nCC-MAIN-2025-05,application/x-msdownload,8735,8734,0.0003\nCC-MAIN-2025-05,application/x-netcdf,6143,6143,0.0002\nCC-MAIN-2025-05,application/x-research-info-systems,269526,269501,0.0089\nCC-MAIN-2025-05,application/x-shockwave-flash,5024,5022,0.0002\nCC-MAIN-2025-05,application/x-tar,4045,4045,0.0001\nCC-MAIN-2025-05,application/x-tex,5958,5958,0.0002\nCC-MAIN-2025-05,application/x-troff-man,22981,22981,0.0008\nCC-MAIN-2025-05,application/x-zip-compressed,184,184,0.0000\nCC-MAIN-2025-05,application/xhtml+xml,425715,405471,0.0140\nCC-MAIN-2025-05,application/xml,842481,841788,0.0278\nCC-MAIN-2025-05,application/zip,7504,7499,0.0002\nCC-MAIN-2025-05,audio/mpeg,1650,1650,0.0001\nCC-MAIN-2025-05,audio/x-mpegurl,16046,16043,0.0005\nCC-MAIN-2025-05,audio/x-scpls,3681,3679,0.0001\nCC-MAIN-2025-05,audio/x-wav,24,24,0.0000\nCC-MAIN-2025-05,binary/octet-stream,26712,26697,0.0009\nCC-MAIN-2025-05,image/gif,17462,17460,0.0006\nCC-MAIN-2025-05,image/jp2,1,1,0.0000\nCC-MAIN-2025-05,image/jpeg,10096,10096,0.0003\nCC-MAIN-2025-05,image/jpg,866,866,0.0000\nCC-MAIN-2025-05,image/pjpeg,36,36,0.0000\nCC-MAIN-2025-05,image/png,4056,4054,0.0001\nCC-MAIN-2025-05,image/svg+xml,40,40,0.0000\nCC-MAIN-2025-05,image/tiff,38,38,0.0000\nCC-MAIN-2025-05,image/vnd.djvu,1,1,0
.0000\nCC-MAIN-2025-05,image/webp,63,63,0.0000\nCC-MAIN-2025-05,message/rfc822,9963,9963,0.0003\nCC-MAIN-2025-05,text/calendar,876538,876244,0.0289\nCC-MAIN-2025-05,text/css,18656,18654,0.0006\nCC-MAIN-2025-05,text/csv,109469,109323,0.0036\nCC-MAIN-2025-05,text/directory,5592,5583,0.0002\nCC-MAIN-2025-05,text/enriched,1768,1768,0.0001\nCC-MAIN-2025-05,text/html,2994256124,2978099600,98.7787\nCC-MAIN-2025-05,text/javascript,6234,6227,0.0002\nCC-MAIN-2025-05,text/markdown,4773,4767,0.0002\nCC-MAIN-2025-05,text/pdf,1299,1299,0.0000\nCC-MAIN-2025-05,text/plain,1689043,1688360,0.0557\nCC-MAIN-2025-05,text/prs.lines.tag,185761,185761,0.0061\nCC-MAIN-2025-05,text/tab-separated-values,10052,10036,0.0003\nCC-MAIN-2025-05,text/turtle,60140,60095,0.0020\nCC-MAIN-2025-05,text/vcard,26065,26058,0.0009\nCC-MAIN-2025-05,text/x-bibtex,27114,27113,0.0009\nCC-MAIN-2025-05,text/x-c,3827,3822,0.0001\nCC-MAIN-2025-05,text/x-csrc,4526,4525,0.0001\nCC-MAIN-2025-05,text/x-diff,6248,6246,0.0002\nCC-MAIN-2025-05,text/x-patch,10964,10964,0.0004\nCC-MAIN-2025-05,text/x-perl,997,997,0.0000\nCC-MAIN-2025-05,text/x-vcalendar,12736,12735,0.0004\nCC-MAIN-2025-05,text/x-vcard,52337,52306,0.0017\nCC-MAIN-2025-05,text/xml,1814946,1812814,0.0599\nCC-MAIN-2025-05,unknown/unknown,868,868,0.0000\nCC-MAIN-2025-05,video/mp4,410,410,0.0000\nCC-MAIN-2025-05,video/webm,2,2,0.0000\nCC-MAIN-2025-05,video/x-ms-asf,4117,4111,0.0001\nCC-MAIN-2025-08,<other>,2703810,2699492,0.1009\nCC-MAIN-2025-08,application/atom+xml,3024419,3023884,0.1129\nCC-MAIN-2025-08,application/calendar,15250,15249,0.0006\nCC-MAIN-2025-08,application/download,91638,91635,0.0034\nCC-MAIN-2025-08,application/epub+zip,43784,43461,0.0016\nCC-MAIN-2025-08,application/force-download,228893,228819,0.0085\nCC-MAIN-2025-08,application/gpx+xml,18570,18570,0.0007\nCC-MAIN-2025-08,application/ics,12145,12140,0.0005\nCC-MAIN-2025-08,application/javascript,6002,5996,0.0002\nCC-MAIN-2025-08,application/json,988693,987514,0.0369\nCC-MAIN-2025-08,application
/ld+json,60743,60617,0.0023\nCC-MAIN-2025-08,application/marc,21787,21786,0.0008\nCC-MAIN-2025-08,application/msword,74075,73966,0.0028\nCC-MAIN-2025-08,application/octet-stream,1485309,1484650,0.0554\nCC-MAIN-2025-08,application/octetstream,7109,7109,0.0003\nCC-MAIN-2025-08,application/pdf,20577808,20529959,0.7679\nCC-MAIN-2025-08,application/pgp-encrypted,2179,2179,0.0001\nCC-MAIN-2025-08,application/pgp-signature,86805,86803,0.0032\nCC-MAIN-2025-08,application/postscript,4313,4304,0.0002\nCC-MAIN-2025-08,application/rdf+xml,148402,148248,0.0055\nCC-MAIN-2025-08,application/rss+xml,1539916,1538791,0.0575\nCC-MAIN-2025-08,application/rtf,24844,24838,0.0009\nCC-MAIN-2025-08,application/save-to-disk,43,43,0.0000\nCC-MAIN-2025-08,application/text,4307,4307,0.0002\nCC-MAIN-2025-08,application/unknown,5559,5559,0.0002\nCC-MAIN-2025-08,application/vnd.android.package-archive,349,349,0.0000\nCC-MAIN-2025-08,application/vnd.google-earth.kml+xml,38054,37972,0.0014\nCC-MAIN-2025-08,application/vnd.google-earth.kmz,10665,10662,0.0004\nCC-MAIN-2025-08,application/vnd.ms-excel,53090,53037,0.0020\nCC-MAIN-2025-08,application/vnd.ms-powerpoint,4895,4889,0.0002\nCC-MAIN-2025-08,application/vnd.ms-word,8350,8348,0.0003\nCC-MAIN-2025-08,application/vnd.oasis.opendocument.text,18173,18170,0.0007\nCC-MAIN-2025-08,application/vnd.openxmlformats-officedocument.presentationml.presentation,6091,6066,0.0002\nCC-MAIN-2025-08,application/vnd.openxmlformats-officedocument.spreadsheetml.sheet,36461,36339,0.0014\nCC-MAIN-2025-08,application/vnd.openxmlformats-officedocument.wordprocessingml.document,63426,63300,0.0024\nCC-MAIN-2025-08,application/vnd.wap.xhtml+xml,27851,27759,0.0010\nCC-MAIN-2025-08,application/x-bibtex,187202,187174,0.0070\nCC-MAIN-2025-08,application/x-bittorrent,4450,4448,0.0002\nCC-MAIN-2025-08,application/x-debian-package,9,9,0.0000\nCC-MAIN-2025-08,application/x-download,67622,67567,0.0025\nCC-MAIN-2025-08,application/x-endnote-refer,24054,24054,0.0009\nCC-MAIN-2025-08,ap
plication/x-gzip,3592,3592,0.0001\nCC-MAIN-2025-08,application/x-httpd-php,19228,19206,0.0007\nCC-MAIN-2025-08,application/x-java-jnlp-file,7107,7106,0.0003\nCC-MAIN-2025-08,application/x-javascript,2402,2400,0.0001\nCC-MAIN-2025-08,application/x-json,54,54,0.0000\nCC-MAIN-2025-08,application/x-mobipocket-ebook,17014,16718,0.0006\nCC-MAIN-2025-08,application/x-msdownload,9922,9922,0.0004\nCC-MAIN-2025-08,application/x-netcdf,12929,12929,0.0005\nCC-MAIN-2025-08,application/x-research-info-systems,280693,280657,0.0105\nCC-MAIN-2025-08,application/x-shockwave-flash,5228,5226,0.0002\nCC-MAIN-2025-08,application/x-tar,1525,1525,0.0001\nCC-MAIN-2025-08,application/x-tex,6030,6030,0.0002\nCC-MAIN-2025-08,application/x-troff-man,27282,27282,0.0010\nCC-MAIN-2025-08,application/x-zip-compressed,196,196,0.0000\nCC-MAIN-2025-08,application/xhtml+xml,384947,383906,0.0144\nCC-MAIN-2025-08,application/xml,755695,754866,0.0282\nCC-MAIN-2025-08,application/zip,3915,3902,0.0001\nCC-MAIN-2025-08,audio/mpeg,1882,1882,0.0001\nCC-MAIN-2025-08,audio/x-mpegurl,16193,16187,0.0006\nCC-MAIN-2025-08,audio/x-scpls,3116,3112,0.0001\nCC-MAIN-2025-08,audio/x-wav,13,13,0.0000\nCC-MAIN-2025-08,binary/octet-stream,19835,19826,0.0007\nCC-MAIN-2025-08,image/gif,11435,11435,0.0004\nCC-MAIN-2025-08,image/jp2,17,17,0.0000\nCC-MAIN-2025-08,image/jpeg,8939,8937,0.0003\nCC-MAIN-2025-08,image/jpg,1600,1600,0.0001\nCC-MAIN-2025-08,image/pjpeg,53,53,0.0000\nCC-MAIN-2025-08,image/png,4607,4605,0.0002\nCC-MAIN-2025-08,image/svg+xml,48,48,0.0000\nCC-MAIN-2025-08,image/tiff,38,38,0.0000\nCC-MAIN-2025-08,image/vnd.djvu,1,1,0.0000\nCC-MAIN-2025-08,image/webp,99,99,0.0000\nCC-MAIN-2025-08,message/rfc822,8858,8858,0.0003\nCC-MAIN-2025-08,text/calendar,918771,918401,0.0343\nCC-MAIN-2025-08,text/css,15158,15156,0.0006\nCC-MAIN-2025-08,text/csv,112543,112490,0.0042\nCC-MAIN-2025-08,text/directory,5445,5445,0.0002\nCC-MAIN-2025-08,text/enriched,2024,2024,0.0001\nCC-MAIN-2025-08,text/html,2641170244,2626889205,98.5619\nCC-M
AIN-2025-08,text/javascript,7716,7708,0.0003\nCC-MAIN-2025-08,text/markdown,5451,5450,0.0002\nCC-MAIN-2025-08,text/pdf,336,336,0.0000\nCC-MAIN-2025-08,text/plain,1794042,1793286,0.0669\nCC-MAIN-2025-08,text/prs.lines.tag,159282,159282,0.0059\nCC-MAIN-2025-08,text/tab-separated-values,10178,10178,0.0004\nCC-MAIN-2025-08,text/turtle,65389,65268,0.0024\nCC-MAIN-2025-08,text/vcard,26941,26931,0.0010\nCC-MAIN-2025-08,text/x-bibtex,25165,25165,0.0009\nCC-MAIN-2025-08,text/x-c,5829,5826,0.0002\nCC-MAIN-2025-08,text/x-csrc,7215,7215,0.0003\nCC-MAIN-2025-08,text/x-diff,8181,8181,0.0003\nCC-MAIN-2025-08,text/x-patch,10858,10858,0.0004\nCC-MAIN-2025-08,text/x-perl,1441,1441,0.0001\nCC-MAIN-2025-08,text/x-vcalendar,12789,12786,0.0005\nCC-MAIN-2025-08,text/x-vcard,57215,57199,0.0021\nCC-MAIN-2025-08,text/xml,1936569,1934725,0.0723\nCC-MAIN-2025-08,unknown/unknown,833,833,0.0000\nCC-MAIN-2025-08,video/mp4,180,180,0.0000\nCC-MAIN-2025-08,video/webm,5,5,0.0000\nCC-MAIN-2025-08,video/x-ms-asf,4618,4613,0.0002\nCC-MAIN-2025-13,<other>,2822000,2815790,0.1030\nCC-MAIN-2025-13,application/atom+xml,3050555,3050039,0.1113\nCC-MAIN-2025-13,application/calendar,4964,4963,0.0002\nCC-MAIN-2025-13,application/download,90166,90158,0.0033\nCC-MAIN-2025-13,application/epub+zip,48305,47954,0.0018\nCC-MAIN-2025-13,application/force-download,198012,197946,0.0072\nCC-MAIN-2025-13,application/gpx+xml,14276,14276,0.0005\nCC-MAIN-2025-13,application/ics,8925,8922,0.0003\nCC-MAIN-2025-13,application/javascript,3969,3965,0.0001\nCC-MAIN-2025-13,application/json,896375,896010,0.0327\nCC-MAIN-2025-13,application/ld+json,58291,58179,0.0021\nCC-MAIN-2025-13,application/marc,23511,23511,0.0009\nCC-MAIN-2025-13,application/msword,76981,76824,0.0028\nCC-MAIN-2025-13,application/octet-stream,1546983,1546014,0.0564\nCC-MAIN-2025-13,application/octetstream,7127,7126,0.0003\nCC-MAIN-2025-13,application/pdf,18480241,18435707,0.6743\nCC-MAIN-2025-13,application/pgp-encrypted,3018,3018,0.0001\nCC-MAIN-2025-13,applicati
on/pgp-signature,66383,66383,0.0024\nCC-MAIN-2025-13,application/postscript,4671,4661,0.0002\nCC-MAIN-2025-13,application/rdf+xml,155221,155110,0.0057\nCC-MAIN-2025-13,application/rss+xml,1474693,1473605,0.0538\nCC-MAIN-2025-13,application/rtf,25454,25449,0.0009\nCC-MAIN-2025-13,application/save-to-disk,6,6,0.0000\nCC-MAIN-2025-13,application/text,4043,4043,0.0001\nCC-MAIN-2025-13,application/unknown,5106,5106,0.0002\nCC-MAIN-2025-13,application/vnd.android.package-archive,134,134,0.0000\nCC-MAIN-2025-13,application/vnd.google-earth.kml+xml,33382,33235,0.0012\nCC-MAIN-2025-13,application/vnd.google-earth.kmz,11657,11642,0.0004\nCC-MAIN-2025-13,application/vnd.ms-excel,51126,50835,0.0019\nCC-MAIN-2025-13,application/vnd.ms-powerpoint,4253,4227,0.0002\nCC-MAIN-2025-13,application/vnd.ms-word,7302,7301,0.0003\nCC-MAIN-2025-13,application/vnd.oasis.opendocument.text,15199,15183,0.0006\nCC-MAIN-2025-13,application/vnd.openxmlformats-officedocument.presentationml.presentation,6021,5968,0.0002\nCC-MAIN-2025-13,application/vnd.openxmlformats-officedocument.spreadsheetml.sheet,41441,41316,0.0015\nCC-MAIN-2025-13,application/vnd.openxmlformats-officedocument.wordprocessingml.document,59743,59407,0.0022\nCC-MAIN-2025-13,application/vnd.wap.xhtml+xml,29791,29673,0.0011\nCC-MAIN-2025-13,application/x-bibtex,187594,187544,0.0068\nCC-MAIN-2025-13,application/x-bittorrent,3812,3812,0.0001\nCC-MAIN-2025-13,application/x-debian-package,32,32,0.0000\nCC-MAIN-2025-13,application/x-download,75472,75459,0.0028\nCC-MAIN-2025-13,application/x-endnote-refer,22564,22564,0.0008\nCC-MAIN-2025-13,application/x-gzip,5219,5218,0.0002\nCC-MAIN-2025-13,application/x-httpd-php,12985,12973,0.0005\nCC-MAIN-2025-13,application/x-java-jnlp-file,9629,9629,0.0004\nCC-MAIN-2025-13,application/x-javascript,2729,2729,0.0001\nCC-MAIN-2025-13,application/x-json,14,14,0.0000\nCC-MAIN-2025-13,application/x-mobipocket-ebook,21108,20783,0.0008\nCC-MAIN-2025-13,application/x-msdownload,13005,13005,0.0005\nCC-MAIN-2
025-13,application/x-netcdf,24058,24058,0.0009\nCC-MAIN-2025-13,application/x-research-info-systems,279335,279272,0.0102\nCC-MAIN-2025-13,application/x-shockwave-flash,3817,3816,0.0001\nCC-MAIN-2025-13,application/x-tar,2772,2772,0.0001\nCC-MAIN-2025-13,application/x-tex,4233,4233,0.0002\nCC-MAIN-2025-13,application/x-troff-man,37611,37611,0.0014\nCC-MAIN-2025-13,application/x-zip-compressed,232,232,0.0000\nCC-MAIN-2025-13,application/xhtml+xml,276054,275124,0.0101\nCC-MAIN-2025-13,application/xml,694354,693660,0.0253\nCC-MAIN-2025-13,application/zip,3752,3749,0.0001\nCC-MAIN-2025-13,audio/mpeg,1998,1998,0.0001\nCC-MAIN-2025-13,audio/x-mpegurl,12534,12528,0.0005\nCC-MAIN-2025-13,audio/x-scpls,4218,4217,0.0002\nCC-MAIN-2025-13,audio/x-wav,9,9,0.0000\nCC-MAIN-2025-13,binary/octet-stream,14453,14379,0.0005\nCC-MAIN-2025-13,image/gif,16031,16031,0.0006\nCC-MAIN-2025-13,image/jp2,4,4,0.0000\nCC-MAIN-2025-13,image/jpeg,8795,8794,0.0003\nCC-MAIN-2025-13,image/jpg,1960,1960,0.0001\nCC-MAIN-2025-13,image/pjpeg,18,18,0.0000\nCC-MAIN-2025-13,image/png,18340,18340,0.0007\nCC-MAIN-2025-13,image/svg+xml,61,61,0.0000\nCC-MAIN-2025-13,image/tiff,54,54,0.0000\nCC-MAIN-2025-13,image/vnd.djvu,22080,22079,0.0008\nCC-MAIN-2025-13,image/webp,66,66,0.0000\nCC-MAIN-2025-13,message/rfc822,8673,8669,0.0003\nCC-MAIN-2025-13,text/calendar,849656,849336,0.0310\nCC-MAIN-2025-13,text/css,16545,16541,0.0006\nCC-MAIN-2025-13,text/csv,110532,110442,0.0040\nCC-MAIN-2025-13,text/directory,4822,4821,0.0002\nCC-MAIN-2025-13,text/enriched,1300,1300,0.0000\nCC-MAIN-2025-13,text/html,2704511464,2689682321,98.6744\nCC-MAIN-2025-13,text/javascript,7548,7545,0.0003\nCC-MAIN-2025-13,text/markdown,6699,6697,0.0002\nCC-MAIN-2025-13,text/pdf,415,415,0.0000\nCC-MAIN-2025-13,text/plain,1922942,1922059,0.0702\nCC-MAIN-2025-13,text/prs.lines.tag,248668,248668,0.0091\nCC-MAIN-2025-13,text/tab-separated-values,9932,9932,0.0004\nCC-MAIN-2025-13,text/turtle,63790,63678,0.0023\nCC-MAIN-2025-13,text/vcard,24291,24270,0.000
9\nCC-MAIN-2025-13,text/x-bibtex,9973,9972,0.0004\nCC-MAIN-2025-13,text/x-c,5854,5854,0.0002\nCC-MAIN-2025-13,text/x-csrc,6479,6479,0.0002\nCC-MAIN-2025-13,text/x-diff,7735,7735,0.0003\nCC-MAIN-2025-13,text/x-patch,11864,11864,0.0004\nCC-MAIN-2025-13,text/x-perl,1177,1177,0.0000\nCC-MAIN-2025-13,text/x-vcalendar,13213,13212,0.0005\nCC-MAIN-2025-13,text/x-vcard,54878,54859,0.0020\nCC-MAIN-2025-13,text/xml,1829454,1827524,0.0667\nCC-MAIN-2025-13,unknown/unknown,522,522,0.0000\nCC-MAIN-2025-13,video/mp4,419,419,0.0000\nCC-MAIN-2025-13,video/webm,7,7,0.0000\nCC-MAIN-2025-13,video/x-ms-asf,5008,5008,0.0002\nCC-MAIN-2025-18,<other>,3651419,3647433,0.1329\nCC-MAIN-2025-18,application/atom+xml,2909401,2909074,0.1059\nCC-MAIN-2025-18,application/calendar,4712,4712,0.0002\nCC-MAIN-2025-18,application/download,86851,86830,0.0032\nCC-MAIN-2025-18,application/epub+zip,51674,51367,0.0019\nCC-MAIN-2025-18,application/force-download,205939,205854,0.0075\nCC-MAIN-2025-18,application/gpx+xml,15915,15913,0.0006\nCC-MAIN-2025-18,application/ics,10056,10048,0.0004\nCC-MAIN-2025-18,application/javascript,5533,5527,0.0002\nCC-MAIN-2025-18,application/json,857240,856763,0.0312\nCC-MAIN-2025-18,application/ld+json,60520,60427,0.0022\nCC-MAIN-2025-18,application/marc,23337,23336,0.0008\nCC-MAIN-2025-18,application/msword,72971,72819,0.0027\nCC-MAIN-2025-18,application/octet-stream,1576202,1574568,0.0574\nCC-MAIN-2025-18,application/octetstream,4699,4699,0.0002\nCC-MAIN-2025-18,application/pdf,18206098,18162265,0.6627\nCC-MAIN-2025-18,application/pgp-encrypted,2945,2945,0.0001\nCC-MAIN-2025-18,application/pgp-signature,84841,84815,0.0031\nCC-MAIN-2025-18,application/postscript,3736,3731,0.0001\nCC-MAIN-2025-18,application/rdf+xml,151201,151099,0.0055\nCC-MAIN-2025-18,application/rss+xml,1521746,1520466,0.0554\nCC-MAIN-2025-18,application/rtf,23846,23838,0.0009\nCC-MAIN-2025-18,application/save-to-disk,4,4,0.0000\nCC-MAIN-2025-18,application/text,4435,4430,0.0002\nCC-MAIN-2025-18,application/u
nknown,4805,4805,0.0002\nCC-MAIN-2025-18,application/vnd.android.package-archive,168,168,0.0000\nCC-MAIN-2025-18,application/vnd.google-earth.kml+xml,41652,41563,0.0015\nCC-MAIN-2025-18,application/vnd.google-earth.kmz,8719,8719,0.0003\nCC-MAIN-2025-18,application/vnd.ms-excel,49916,49838,0.0018\nCC-MAIN-2025-18,application/vnd.ms-powerpoint,4903,4895,0.0002\nCC-MAIN-2025-18,application/vnd.ms-word,5994,5994,0.0002\nCC-MAIN-2025-18,application/vnd.oasis.opendocument.text,17151,17144,0.0006\nCC-MAIN-2025-18,application/vnd.openxmlformats-officedocument.presentationml.presentation,6176,6117,0.0002\nCC-MAIN-2025-18,application/vnd.openxmlformats-officedocument.spreadsheetml.sheet,47715,47580,0.0017\nCC-MAIN-2025-18,application/vnd.openxmlformats-officedocument.wordprocessingml.document,61802,61514,0.0022\nCC-MAIN-2025-18,application/vnd.wap.xhtml+xml,29973,29917,0.0011\nCC-MAIN-2025-18,application/x-bibtex,184601,184566,0.0067\nCC-MAIN-2025-18,application/x-bittorrent,3488,3487,0.0001\nCC-MAIN-2025-18,application/x-debian-package,7,7,0.0000\nCC-MAIN-2025-18,application/x-download,69945,69933,0.0025\nCC-MAIN-2025-18,application/x-endnote-refer,17464,17463,0.0006\nCC-MAIN-2025-18,application/x-gzip,3891,3891,0.0001\nCC-MAIN-2025-18,application/x-httpd-php,14082,14023,0.0005\nCC-MAIN-2025-18,application/x-java-jnlp-file,8359,8358,0.0003\nCC-MAIN-2025-18,application/x-javascript,3932,3931,0.0001\nCC-MAIN-2025-18,application/x-json,30,30,0.0000\nCC-MAIN-2025-18,application/x-mobipocket-ebook,18644,18365,0.0007\nCC-MAIN-2025-18,application/x-msdownload,11204,11203,0.0004\nCC-MAIN-2025-18,application/x-netcdf,4713,4713,0.0002\nCC-MAIN-2025-18,application/x-research-info-systems,270376,270321,0.0098\nCC-MAIN-2025-18,application/x-shockwave-flash,3320,3317,0.0001\nCC-MAIN-2025-18,application/x-tar,2849,2849,0.0001\nCC-MAIN-2025-18,application/x-tex,4489,4488,0.0002\nCC-MAIN-2025-18,application/x-troff-man,23859,23859,0.0009\nCC-MAIN-2025-18,application/x-zip-compressed,235,235,
0.0000\nCC-MAIN-2025-18,application/xhtml+xml,279380,278147,0.0102\nCC-MAIN-2025-18,application/xml,660211,657847,0.0240\nCC-MAIN-2025-18,application/zip,4388,4377,0.0002\nCC-MAIN-2025-18,audio/mpeg,3025,3025,0.0001\nCC-MAIN-2025-18,audio/x-mpegurl,12947,12939,0.0005\nCC-MAIN-2025-18,audio/x-scpls,2738,2737,0.0001\nCC-MAIN-2025-18,audio/x-wav,11,11,0.0000\nCC-MAIN-2025-18,binary/octet-stream,15744,15710,0.0006\nCC-MAIN-2025-18,image/gif,13200,13198,0.0005\nCC-MAIN-2025-18,image/jp2,9,9,0.0000\nCC-MAIN-2025-18,image/jpeg,9723,9720,0.0004\nCC-MAIN-2025-18,image/jpg,1865,1865,0.0001\nCC-MAIN-2025-18,image/pjpeg,35,35,0.0000\nCC-MAIN-2025-18,image/png,2306,2305,0.0001\nCC-MAIN-2025-18,image/svg+xml,60,60,0.0000\nCC-MAIN-2025-18,image/tiff,11,11,0.0000\nCC-MAIN-2025-18,image/vnd.djvu,14819,14817,0.0005\nCC-MAIN-2025-18,image/webp,143,143,0.0000\nCC-MAIN-2025-18,message/rfc822,9387,9384,0.0003\nCC-MAIN-2025-18,text/calendar,887885,887534,0.0323\nCC-MAIN-2025-18,text/css,15943,15939,0.0006\nCC-MAIN-2025-18,text/csv,117413,117341,0.0043\nCC-MAIN-2025-18,text/directory,4923,4920,0.0002\nCC-MAIN-2025-18,text/enriched,1292,1292,0.0000\nCC-MAIN-2025-18,text/html,2710183995,2694706774,98.6477\nCC-MAIN-2025-18,text/javascript,8989,8984,0.0003\nCC-MAIN-2025-18,text/markdown,5692,5692,0.0002\nCC-MAIN-2025-18,text/pdf,207,207,0.0000\nCC-MAIN-2025-18,text/plain,1969383,1968521,0.0717\nCC-MAIN-2025-18,text/prs.lines.tag,187112,187112,0.0068\nCC-MAIN-2025-18,text/tab-separated-values,9582,9582,0.0003\nCC-MAIN-2025-18,text/turtle,65757,65678,0.0024\nCC-MAIN-2025-18,text/vcard,25175,25150,0.0009\nCC-MAIN-2025-18,text/x-bibtex,10690,10690,0.0004\nCC-MAIN-2025-18,text/x-c,7381,7381,0.0003\nCC-MAIN-2025-18,text/x-csrc,11577,11574,0.0004\nCC-MAIN-2025-18,text/x-diff,10656,10656,0.0004\nCC-MAIN-2025-18,text/x-patch,10520,10520,0.0004\nCC-MAIN-2025-18,text/x-perl,1443,1443,0.0001\nCC-MAIN-2025-18,text/x-vcalendar,10150,10147,0.0004\nCC-MAIN-2025-18,text/x-vcard,55199,55178,0.0020\nCC-MAIN-2025
-18,text/xml,2241422,2222943,0.0816\nCC-MAIN-2025-18,unknown/unknown,611,611,0.0000\nCC-MAIN-2025-18,video/mp4,300,299,0.0000\nCC-MAIN-2025-18,video/webm,23,23,0.0000\nCC-MAIN-2025-18,video/x-ms-asf,3005,3005,0.0001\nCC-MAIN-2025-21,<other>,4021223,3994563,0.1623\nCC-MAIN-2025-21,application/atom+xml,2594811,2594483,0.1047\nCC-MAIN-2025-21,application/calendar,4467,4467,0.0002\nCC-MAIN-2025-21,application/download,60704,60702,0.0025\nCC-MAIN-2025-21,application/epub+zip,37283,37161,0.0015\nCC-MAIN-2025-21,application/force-download,167454,167430,0.0068\nCC-MAIN-2025-21,application/gpx+xml,15099,15099,0.0006\nCC-MAIN-2025-21,application/ics,7358,7350,0.0003\nCC-MAIN-2025-21,application/javascript,25184,25183,0.0010\nCC-MAIN-2025-21,application/json,591517,590913,0.0239\nCC-MAIN-2025-21,application/ld+json,38170,38153,0.0015\nCC-MAIN-2025-21,application/marc,14115,14115,0.0006\nCC-MAIN-2025-21,application/msword,42308,42035,0.0017\nCC-MAIN-2025-21,application/octet-stream,920864,920129,0.0372\nCC-MAIN-2025-21,application/octetstream,3902,3902,0.0002\nCC-MAIN-2025-21,application/pdf,14543188,14507268,0.5871\nCC-MAIN-2025-21,application/pgp-encrypted,2741,2741,0.0001\nCC-MAIN-2025-21,application/pgp-signature,37924,37914,0.0015\nCC-MAIN-2025-21,application/postscript,3065,3062,0.0001\nCC-MAIN-2025-21,application/rdf+xml,100875,100847,0.0041\nCC-MAIN-2025-21,application/rss+xml,1067774,1066939,0.0431\nCC-MAIN-2025-21,application/rtf,20034,20028,0.0008\nCC-MAIN-2025-21,application/save-to-disk,1,1,0.0000\nCC-MAIN-2025-21,application/text,4070,4067,0.0002\nCC-MAIN-2025-21,application/unknown,3203,3203,0.0001\nCC-MAIN-2025-21,application/vnd.android.package-archive,75,75,0.0000\nCC-MAIN-2025-21,application/vnd.google-earth.kml+xml,29153,29080,0.0012\nCC-MAIN-2025-21,application/vnd.google-earth.kmz,7365,7361,0.0003\nCC-MAIN-2025-21,application/vnd.ms-excel,22814,22716,0.0009\nCC-MAIN-2025-21,application/vnd.ms-powerpoint,3981,3976,0.0002\nCC-MAIN-2025-21,application/vnd.ms-
word,3851,3851,0.0002\nCC-MAIN-2025-21,application/vnd.oasis.opendocument.text,12838,12833,0.0005\nCC-MAIN-2025-21,application/vnd.openxmlformats-officedocument.presentationml.presentation,4832,4804,0.0002\nCC-MAIN-2025-21,application/vnd.openxmlformats-officedocument.spreadsheetml.sheet,29048,28888,0.0012\nCC-MAIN-2025-21,application/vnd.openxmlformats-officedocument.wordprocessingml.document,49660,49347,0.0020\nCC-MAIN-2025-21,application/vnd.wap.xhtml+xml,24804,24747,0.0010\nCC-MAIN-2025-21,application/x-bibtex,172442,172389,0.0070\nCC-MAIN-2025-21,application/x-bittorrent,3453,3453,0.0001\nCC-MAIN-2025-21,application/x-debian-package,4,4,0.0000\nCC-MAIN-2025-21,application/x-download,46535,46386,0.0019\nCC-MAIN-2025-21,application/x-endnote-refer,18200,18197,0.0007\nCC-MAIN-2025-21,application/x-gzip,3107,3106,0.0001\nCC-MAIN-2025-21,application/x-httpd-php,9989,9977,0.0004\nCC-MAIN-2025-21,application/x-java-jnlp-file,6298,6298,0.0003\nCC-MAIN-2025-21,application/x-javascript,2750,2750,0.0001\nCC-MAIN-2025-21,application/x-json,97,97,0.0000\nCC-MAIN-2025-21,application/x-mobipocket-ebook,13369,13268,0.0005\nCC-MAIN-2025-21,application/x-msdownload,5657,5656,0.0002\nCC-MAIN-2025-21,application/x-netcdf,4565,4565,0.0002\nCC-MAIN-2025-21,application/x-research-info-systems,242386,242284,0.0098\nCC-MAIN-2025-21,application/x-shockwave-flash,3186,3183,0.0001\nCC-MAIN-2025-21,application/x-tar,1033,1032,0.0000\nCC-MAIN-2025-21,application/x-tex,2817,2817,0.0001\nCC-MAIN-2025-21,application/x-troff-man,6821,6821,0.0003\nCC-MAIN-2025-21,application/x-zip-compressed,153,153,0.0000\nCC-MAIN-2025-21,application/xhtml+xml,239354,237975,0.0097\nCC-MAIN-2025-21,application/xml,538814,537012,0.0218\nCC-MAIN-2025-21,application/zip,2348,2347,0.0001\nCC-MAIN-2025-21,audio/mpeg,1166,1166,0.0000\nCC-MAIN-2025-21,audio/x-mpegurl,10042,10039,0.0004\nCC-MAIN-2025-21,audio/x-scpls,2592,2591,0.0001\nCC-MAIN-2025-21,audio/x-wav,7,7,0.0000\nCC-MAIN-2025-21,binary/octet-stream,9395,9361,
0.0004\nCC-MAIN-2025-21,image/gif,11589,11589,0.0005\nCC-MAIN-2025-21,image/jp2,1,1,0.0000\nCC-MAIN-2025-21,image/jpeg,6030,6022,0.0002\nCC-MAIN-2025-21,image/jpg,802,802,0.0000\nCC-MAIN-2025-21,image/pjpeg,22,22,0.0000\nCC-MAIN-2025-21,image/png,4200,4195,0.0002\nCC-MAIN-2025-21,image/svg+xml,35,35,0.0000\nCC-MAIN-2025-21,image/tiff,115,115,0.0000\nCC-MAIN-2025-21,image/vnd.djvu,10618,10616,0.0004\nCC-MAIN-2025-21,image/webp,81,81,0.0000\nCC-MAIN-2025-21,message/rfc822,8124,8123,0.0003\nCC-MAIN-2025-21,text/calendar,740366,740114,0.0299\nCC-MAIN-2025-21,text/css,13401,13399,0.0005\nCC-MAIN-2025-21,text/csv,72908,72857,0.0029\nCC-MAIN-2025-21,text/directory,5865,5857,0.0002\nCC-MAIN-2025-21,text/enriched,1952,1952,0.0001\nCC-MAIN-2025-21,text/html,2447548987,2434718826,98.8044\nCC-MAIN-2025-21,text/javascript,6685,6682,0.0003\nCC-MAIN-2025-21,text/markdown,4945,4945,0.0002\nCC-MAIN-2025-21,text/pdf,243,243,0.0000\nCC-MAIN-2025-21,text/plain,1213102,1212257,0.0490\nCC-MAIN-2025-21,text/prs.lines.tag,41588,41588,0.0017\nCC-MAIN-2025-21,text/tab-separated-values,7695,7695,0.0003\nCC-MAIN-2025-21,text/turtle,50318,50296,0.0020\nCC-MAIN-2025-21,text/vcard,23673,23596,0.0010\nCC-MAIN-2025-21,text/x-bibtex,10455,10455,0.0004\nCC-MAIN-2025-21,text/x-c,2528,2526,0.0001\nCC-MAIN-2025-21,text/x-csrc,2612,2611,0.0001\nCC-MAIN-2025-21,text/x-diff,4754,4753,0.0002\nCC-MAIN-2025-21,text/x-patch,5461,5461,0.0002\nCC-MAIN-2025-21,text/x-perl,664,664,0.0000\nCC-MAIN-2025-21,text/x-vcalendar,7808,7808,0.0003\nCC-MAIN-2025-21,text/x-vcard,43366,43347,0.0018\nCC-MAIN-2025-21,text/xml,1447735,1423496,0.0584\nCC-MAIN-2025-21,unknown/unknown,498,498,0.0000\nCC-MAIN-2025-21,video/mp4,528,526,0.0000\nCC-MAIN-2025-21,video/webm,200,200,0.0000\nCC-MAIN-2025-21,video/x-ms-asf,3313,3313,0.0001\nCC-MAIN-2025-26,<other>,4189316,4178915,0.1756\nCC-MAIN-2025-26,application/atom+xml,3061889,3061615,0.1283\nCC-MAIN-2025-26,application/calendar,4169,4169,0.0002\nCC-MAIN-2025-26,application/download,447
64,44756,0.0019\nCC-MAIN-2025-26,application/epub+zip,42683,42544,0.0018\nCC-MAIN-2025-26,application/force-download,158308,158292,0.0066\nCC-MAIN-2025-26,application/gpx+xml,15066,15064,0.0006\nCC-MAIN-2025-26,application/ics,8580,8576,0.0004\nCC-MAIN-2025-26,application/javascript,31851,31842,0.0013\nCC-MAIN-2025-26,application/json,630943,630257,0.0264\nCC-MAIN-2025-26,application/ld+json,40530,40500,0.0017\nCC-MAIN-2025-26,application/marc,11769,11768,0.0005\nCC-MAIN-2025-26,application/msword,46020,45841,0.0019\nCC-MAIN-2025-26,application/octet-stream,964057,963174,0.0404\nCC-MAIN-2025-26,application/octetstream,4291,4291,0.0002\nCC-MAIN-2025-26,application/pdf,14635465,14601266,0.6135\nCC-MAIN-2025-26,application/pgp-encrypted,2392,2392,0.0001\nCC-MAIN-2025-26,application/pgp-signature,43694,43678,0.0018\nCC-MAIN-2025-26,application/postscript,3100,3099,0.0001\nCC-MAIN-2025-26,application/rdf+xml,98734,98688,0.0041\nCC-MAIN-2025-26,application/rss+xml,1038372,1037582,0.0435\nCC-MAIN-2025-26,application/rtf,19651,19638,0.0008\nCC-MAIN-2025-26,application/save-to-disk,12,12,0.0000\nCC-MAIN-2025-26,application/text,4070,4070,0.0002\nCC-MAIN-2025-26,application/unknown,4997,4997,0.0002\nCC-MAIN-2025-26,application/vnd.android.package-archive,148,148,0.0000\nCC-MAIN-2025-26,application/vnd.google-earth.kml+xml,34053,33992,0.0014\nCC-MAIN-2025-26,application/vnd.google-earth.kmz,6591,6588,0.0003\nCC-MAIN-2025-26,application/vnd.ms-excel,21379,21321,0.0009\nCC-MAIN-2025-26,application/vnd.ms-powerpoint,3451,3438,0.0001\nCC-MAIN-2025-26,application/vnd.ms-word,3665,3665,0.0002\nCC-MAIN-2025-26,application/vnd.oasis.opendocument.text,12223,12209,0.0005\nCC-MAIN-2025-26,application/vnd.openxmlformats-officedocument.presentationml.presentation,4938,4891,0.0002\nCC-MAIN-2025-26,application/vnd.openxmlformats-officedocument.spreadsheetml.sheet,32541,32325,0.0014\nCC-MAIN-2025-26,application/vnd.openxmlformats-officedocument.wordprocessingml.document,46804,46533,0.0020\nCC
-MAIN-2025-26,application/vnd.wap.xhtml+xml,4404,4361,0.0002\nCC-MAIN-2025-26,application/x-bibtex,172398,172267,0.0072\nCC-MAIN-2025-26,application/x-bittorrent,3733,3732,0.0002\nCC-MAIN-2025-26,application/x-debian-package,53,53,0.0000\nCC-MAIN-2025-26,application/x-download,48245,48209,0.0020\nCC-MAIN-2025-26,application/x-endnote-refer,19828,19827,0.0008\nCC-MAIN-2025-26,application/x-gzip,1685,1684,0.0001\nCC-MAIN-2025-26,application/x-httpd-php,8618,8605,0.0004\nCC-MAIN-2025-26,application/x-java-jnlp-file,4804,4799,0.0002\nCC-MAIN-2025-26,application/x-javascript,2585,2584,0.0001\nCC-MAIN-2025-26,application/x-json,142,142,0.0000\nCC-MAIN-2025-26,application/x-mobipocket-ebook,12638,12538,0.0005\nCC-MAIN-2025-26,application/x-msdownload,7485,7484,0.0003\nCC-MAIN-2025-26,application/x-netcdf,3290,3290,0.0001\nCC-MAIN-2025-26,application/x-research-info-systems,227481,227331,0.0095\nCC-MAIN-2025-26,application/x-shockwave-flash,2860,2857,0.0001\nCC-MAIN-2025-26,application/x-tar,1035,1035,0.0000\nCC-MAIN-2025-26,application/x-tex,2628,2628,0.0001\nCC-MAIN-2025-26,application/x-troff-man,8632,8632,0.0004\nCC-MAIN-2025-26,application/x-zip-compressed,379,379,0.0000\nCC-MAIN-2025-26,application/xhtml+xml,218343,217579,0.0092\nCC-MAIN-2025-26,application/xml,560670,559822,0.0235\nCC-MAIN-2025-26,application/zip,2132,2132,0.0001\nCC-MAIN-2025-26,audio/mpeg,1034,1034,0.0000\nCC-MAIN-2025-26,audio/x-mpegurl,9988,9984,0.0004\nCC-MAIN-2025-26,audio/x-scpls,2524,2524,0.0001\nCC-MAIN-2025-26,audio/x-wav,40,40,0.0000\nCC-MAIN-2025-26,binary/octet-stream,10888,10772,0.0005\nCC-MAIN-2025-26,image/gif,12263,12263,0.0005\nCC-MAIN-2025-26,image/jp2,4,4,0.0000\nCC-MAIN-2025-26,image/jpeg,6693,6686,0.0003\nCC-MAIN-2025-26,image/jpg,682,679,0.0000\nCC-MAIN-2025-26,image/pjpeg,35,35,0.0000\nCC-MAIN-2025-26,image/png,23249,23247,0.0010\nCC-MAIN-2025-26,image/svg+xml,28,28,0.0000\nCC-MAIN-2025-26,image/tiff,75,75,0.0000\nCC-MAIN-2025-26,image/vnd.djvu,22564,22563,0.0009\nCC-MAIN-2025
-26,image/webp,78,78,0.0000\nCC-MAIN-2025-26,message/rfc822,6004,6004,0.0003\nCC-MAIN-2025-26,text/calendar,748182,747911,0.0314\nCC-MAIN-2025-26,text/css,17439,17437,0.0007\nCC-MAIN-2025-26,text/csv,73324,73192,0.0031\nCC-MAIN-2025-26,text/directory,6085,6085,0.0003\nCC-MAIN-2025-26,text/enriched,1470,1470,0.0001\nCC-MAIN-2025-26,text/html,2355157483,2342742686,98.7237\nCC-MAIN-2025-26,text/javascript,6844,6836,0.0003\nCC-MAIN-2025-26,text/markdown,5987,5984,0.0003\nCC-MAIN-2025-26,text/pdf,190,190,0.0000\nCC-MAIN-2025-26,text/plain,1244444,1243585,0.0522\nCC-MAIN-2025-26,text/prs.lines.tag,34583,34583,0.0014\nCC-MAIN-2025-26,text/tab-separated-values,10920,10917,0.0005\nCC-MAIN-2025-26,text/turtle,49641,49615,0.0021\nCC-MAIN-2025-26,text/vcard,24767,24747,0.0010\nCC-MAIN-2025-26,text/x-bibtex,9810,9795,0.0004\nCC-MAIN-2025-26,text/x-c,1915,1913,0.0001\nCC-MAIN-2025-26,text/x-csrc,3953,3952,0.0002\nCC-MAIN-2025-26,text/x-diff,5537,5537,0.0002\nCC-MAIN-2025-26,text/x-patch,6027,6027,0.0003\nCC-MAIN-2025-26,text/x-perl,1064,1064,0.0000\nCC-MAIN-2025-26,text/x-vcalendar,9186,9183,0.0004\nCC-MAIN-2025-26,text/x-vcard,48793,48776,0.0020\nCC-MAIN-2025-26,text/xml,1452381,1448663,0.0609\nCC-MAIN-2025-26,unknown/unknown,282,282,0.0000\nCC-MAIN-2025-26,video/mp4,371,371,0.0000\nCC-MAIN-2025-26,video/webm,2,2,0.0000\nCC-MAIN-2025-26,video/x-ms-asf,2536,2535,0.0001\nCC-MAIN-2025-30,<other>,1828086,1823151,0.0755\nCC-MAIN-2025-30,application/atom+xml,3174628,3174299,0.1310\nCC-MAIN-2025-30,application/calendar,4224,4224,0.0002\nCC-MAIN-2025-30,application/download,60374,60361,0.0025\nCC-MAIN-2025-30,application/epub+zip,39572,39470,0.0016\nCC-MAIN-2025-30,application/force-download,243978,243724,0.0101\nCC-MAIN-2025-30,application/gpx+xml,14183,14183,0.0006\nCC-MAIN-2025-30,application/ics,9494,9491,0.0004\nCC-MAIN-2025-30,application/javascript,28033,28024,0.0012\nCC-MAIN-2025-30,application/json,665860,665331,0.0275\nCC-MAIN-2025-30,application/ld+json,41504,41476,0.0017\nCC
-MAIN-2025-30,application/marc,12497,12496,0.0005\nCC-MAIN-2025-30,application/msword,52236,52157,0.0022\nCC-MAIN-2025-30,application/octet-stream,1016206,1015644,0.0419\nCC-MAIN-2025-30,application/octetstream,7559,7559,0.0003\nCC-MAIN-2025-30,application/pdf,15488784,15458931,0.6394\nCC-MAIN-2025-30,application/pgp-encrypted,2313,2313,0.0001\nCC-MAIN-2025-30,application/pgp-signature,42796,42795,0.0018\nCC-MAIN-2025-30,application/postscript,4019,4006,0.0002\nCC-MAIN-2025-30,application/rdf+xml,107796,107753,0.0044\nCC-MAIN-2025-30,application/rss+xml,1043584,1042983,0.0431\nCC-MAIN-2025-30,application/rtf,19559,19550,0.0008\nCC-MAIN-2025-30,application/save-to-disk,12,12,0.0000\nCC-MAIN-2025-30,application/text,3696,3696,0.0002\nCC-MAIN-2025-30,application/unknown,4899,4899,0.0002\nCC-MAIN-2025-30,application/vnd.android.package-archive,103,103,0.0000\nCC-MAIN-2025-30,application/vnd.google-earth.kml+xml,28114,28099,0.0012\nCC-MAIN-2025-30,application/vnd.google-earth.kmz,7754,7752,0.0003\nCC-MAIN-2025-30,application/vnd.ms-excel,30596,30567,0.0013\nCC-MAIN-2025-30,application/vnd.ms-powerpoint,4427,4414,0.0002\nCC-MAIN-2025-30,application/vnd.ms-word,4713,4713,0.0002\nCC-MAIN-2025-30,application/vnd.oasis.opendocument.text,14397,14393,0.0006\nCC-MAIN-2025-30,application/vnd.openxmlformats-officedocument.presentationml.presentation,6350,6328,0.0003\nCC-MAIN-2025-30,application/vnd.openxmlformats-officedocument.spreadsheetml.sheet,35872,35785,0.0015\nCC-MAIN-2025-30,application/vnd.openxmlformats-officedocument.wordprocessingml.document,52639,52464,0.0022\nCC-MAIN-2025-30,application/vnd.wap.xhtml+xml,4854,4809,0.0002\nCC-MAIN-2025-30,application/x-bibtex,175520,175398,0.0072\nCC-MAIN-2025-30,application/x-bittorrent,3614,3614,0.0001\nCC-MAIN-2025-30,application/x-debian-package,10,10,0.0000\nCC-MAIN-2025-30,application/x-download,48947,48928,0.0020\nCC-MAIN-2025-30,application/x-endnote-refer,19251,19242,0.0008\nCC-MAIN-2025-30,application/x-gzip,1537,1536,0.0001
\nCC-MAIN-2025-30,application/x-httpd-php,8258,8215,0.0003\nCC-MAIN-2025-30,application/x-java-jnlp-file,2092,2092,0.0001\nCC-MAIN-2025-30,application/x-javascript,2701,2701,0.0001\nCC-MAIN-2025-30,application/x-json,150,150,0.0000\nCC-MAIN-2025-30,application/x-mobipocket-ebook,12313,12212,0.0005\nCC-MAIN-2025-30,application/x-msdownload,7572,7572,0.0003\nCC-MAIN-2025-30,application/x-netcdf,7019,7019,0.0003\nCC-MAIN-2025-30,application/x-research-info-systems,252922,252712,0.0104\nCC-MAIN-2025-30,application/x-shockwave-flash,2335,2335,0.0001\nCC-MAIN-2025-30,application/x-tar,1548,1548,0.0001\nCC-MAIN-2025-30,application/x-tex,3345,3345,0.0001\nCC-MAIN-2025-30,application/x-troff-man,11052,11052,0.0005\nCC-MAIN-2025-30,application/x-zip-compressed,511,508,0.0000\nCC-MAIN-2025-30,application/xhtml+xml,246778,246025,0.0102\nCC-MAIN-2025-30,application/xml,584478,583430,0.0241\nCC-MAIN-2025-30,application/zip,2577,2577,0.0001\nCC-MAIN-2025-30,audio/mpeg,1145,1145,0.0000\nCC-MAIN-2025-30,audio/x-mpegurl,8738,8736,0.0004\nCC-MAIN-2025-30,audio/x-scpls,2678,2677,0.0001\nCC-MAIN-2025-30,audio/x-wav,25,25,0.0000\nCC-MAIN-2025-30,binary/octet-stream,9737,9697,0.0004\nCC-MAIN-2025-30,image/gif,8298,8298,0.0003\nCC-MAIN-2025-30,image/jpeg,8487,8485,0.0004\nCC-MAIN-2025-30,image/jpg,179,179,0.0000\nCC-MAIN-2025-30,image/pjpeg,170,170,0.0000\nCC-MAIN-2025-30,image/png,14543,14538,0.0006\nCC-MAIN-2025-30,image/svg+xml,24,24,0.0000\nCC-MAIN-2025-30,image/tiff,160,160,0.0000\nCC-MAIN-2025-30,image/vnd.djvu,26209,26209,0.0011\nCC-MAIN-2025-30,image/webp,76,76,0.0000\nCC-MAIN-2025-30,message/rfc822,7967,7964,0.0003\nCC-MAIN-2025-30,text/calendar,766538,765835,0.0316\nCC-MAIN-2025-30,text/css,11754,11750,0.0005\nCC-MAIN-2025-30,text/csv,74877,74864,0.0031\nCC-MAIN-2025-30,text/directory,6251,6251,0.0003\nCC-MAIN-2025-30,text/enriched,1064,1064,0.0000\nCC-MAIN-2025-30,text/html,2393010518,2380349242,98.7794\nCC-MAIN-2025-30,text/javascript,7503,7497,0.0003\nCC-MAIN-2025-30,text/mark
down,6079,6075,0.0003\nCC-MAIN-2025-30,text/pdf,400,400,0.0000\nCC-MAIN-2025-30,text/plain,1354879,1353844,0.0559\nCC-MAIN-2025-30,text/prs.lines.tag,49906,49905,0.0021\nCC-MAIN-2025-30,text/tab-separated-values,8057,8057,0.0003\nCC-MAIN-2025-30,text/turtle,50989,50956,0.0021\nCC-MAIN-2025-30,text/vcard,25471,25451,0.0011\nCC-MAIN-2025-30,text/x-bibtex,9636,9634,0.0004\nCC-MAIN-2025-30,text/x-c,1626,1626,0.0001\nCC-MAIN-2025-30,text/x-csrc,7474,7474,0.0003\nCC-MAIN-2025-30,text/x-diff,7661,7661,0.0003\nCC-MAIN-2025-30,text/x-patch,6105,6105,0.0003\nCC-MAIN-2025-30,text/x-perl,1121,1121,0.0000\nCC-MAIN-2025-30,text/x-vcalendar,9639,9637,0.0004\nCC-MAIN-2025-30,text/x-vcard,48444,48429,0.0020\nCC-MAIN-2025-30,text/xml,1521778,1515777,0.0628\nCC-MAIN-2025-30,unknown/unknown,527,527,0.0000\nCC-MAIN-2025-30,video/mp4,321,320,0.0000\nCC-MAIN-2025-30,video/webm,1,1,0.0000\nCC-MAIN-2025-30,video/x-ms-asf,3211,3210,0.0001\nCC-MAIN-2025-33,<other>,1856292,1851685,0.0760\nCC-MAIN-2025-33,application/atom+xml,2893213,2892962,0.1185\nCC-MAIN-2025-33,application/calendar,3741,3741,0.0002\nCC-MAIN-2025-33,application/download,67941,67928,0.0028\nCC-MAIN-2025-33,application/epub+zip,43117,42970,0.0018\nCC-MAIN-2025-33,application/force-download,190692,190663,0.0078\nCC-MAIN-2025-33,application/gpx+xml,13912,13912,0.0006\nCC-MAIN-2025-33,application/ics,7197,7196,0.0003\nCC-MAIN-2025-33,application/javascript,24877,24860,0.0010\nCC-MAIN-2025-33,application/json,637997,637681,0.0261\nCC-MAIN-2025-33,application/ld+json,46737,46724,0.0019\nCC-MAIN-2025-33,application/marc,10667,10666,0.0004\nCC-MAIN-2025-33,application/msword,50039,49949,0.0020\nCC-MAIN-2025-33,application/octet-stream,1041423,1040247,0.0426\nCC-MAIN-2025-33,application/octetstream,4594,4594,0.0002\nCC-MAIN-2025-33,application/pdf,14167416,14138664,0.5800\nCC-MAIN-2025-33,application/pgp-encrypted,2532,2532,0.0001\nCC-MAIN-2025-33,application/pgp-signature,31111,31110,0.0013\nCC-MAIN-2025-33,application/postscript,299
8,2996,0.0001\nCC-MAIN-2025-33,application/rdf+xml,104879,104790,0.0043\nCC-MAIN-2025-33,application/rss+xml,1010239,1009684,0.0414\nCC-MAIN-2025-33,application/rtf,21772,21768,0.0009\nCC-MAIN-2025-33,application/save-to-disk,14,14,0.0000\nCC-MAIN-2025-33,application/text,3322,3322,0.0001\nCC-MAIN-2025-33,application/unknown,4452,4452,0.0002\nCC-MAIN-2025-33,application/vnd.android.package-archive,69,69,0.0000\nCC-MAIN-2025-33,application/vnd.google-earth.kml+xml,28393,28369,0.0012\nCC-MAIN-2025-33,application/vnd.google-earth.kmz,6548,6548,0.0003\nCC-MAIN-2025-33,application/vnd.ms-excel,31065,31061,0.0013\nCC-MAIN-2025-33,application/vnd.ms-powerpoint,3961,3950,0.0002\nCC-MAIN-2025-33,application/vnd.ms-word,4793,4793,0.0002\nCC-MAIN-2025-33,application/vnd.oasis.opendocument.text,12535,12516,0.0005\nCC-MAIN-2025-33,application/vnd.openxmlformats-officedocument.presentationml.presentation,5928,5868,0.0002\nCC-MAIN-2025-33,application/vnd.openxmlformats-officedocument.spreadsheetml.sheet,33732,33681,0.0014\nCC-MAIN-2025-33,application/vnd.openxmlformats-officedocument.wordprocessingml.document,48059,47887,0.0020\nCC-MAIN-2025-33,application/vnd.wap.xhtml+xml,3298,3269,0.0001\nCC-MAIN-2025-33,application/x-bibtex,173494,173345,0.0071\nCC-MAIN-2025-33,application/x-bittorrent,4656,4656,0.0002\nCC-MAIN-2025-33,application/x-debian-package,48,48,0.0000\nCC-MAIN-2025-33,application/x-download,42783,42747,0.0018\nCC-MAIN-2025-33,application/x-endnote-refer,21067,21059,0.0009\nCC-MAIN-2025-33,application/x-gzip,2203,2203,0.0001\nCC-MAIN-2025-33,application/x-httpd-php,7249,7243,0.0003\nCC-MAIN-2025-33,application/x-java-jnlp-file,1689,1685,0.0001\nCC-MAIN-2025-33,application/x-javascript,2239,2239,0.0001\nCC-MAIN-2025-33,application/x-json,61,61,0.0000\nCC-MAIN-2025-33,application/x-mobipocket-ebook,14819,14679,0.0006\nCC-MAIN-2025-33,application/x-msdownload,9371,9370,0.0004\nCC-MAIN-2025-33,application/x-netcdf,18293,18293,0.0007\nCC-MAIN-2025-33,application/x-research-
info-systems,243492,243324,0.0100\nCC-MAIN-2025-33,application/x-shockwave-flash,1777,1774,0.0001\nCC-MAIN-2025-33,application/x-tar,1260,1260,0.0001\nCC-MAIN-2025-33,application/x-tex,4617,4617,0.0002\nCC-MAIN-2025-33,application/x-troff-man,9965,9965,0.0004\nCC-MAIN-2025-33,application/x-zip-compressed,268,268,0.0000\nCC-MAIN-2025-33,application/xhtml+xml,246067,245229,0.0101\nCC-MAIN-2025-33,application/xml,580731,580199,0.0238\nCC-MAIN-2025-33,application/zip,1673,1672,0.0001\nCC-MAIN-2025-33,audio/mpeg,1049,1049,0.0000\nCC-MAIN-2025-33,audio/x-mpegurl,9943,9939,0.0004\nCC-MAIN-2025-33,audio/x-scpls,2622,2621,0.0001\nCC-MAIN-2025-33,audio/x-wav,41,41,0.0000\nCC-MAIN-2025-33,binary/octet-stream,9048,9033,0.0004\nCC-MAIN-2025-33,image/gif,8464,8464,0.0003\nCC-MAIN-2025-33,image/jp2,3,3,0.0000\nCC-MAIN-2025-33,image/jpeg,8528,8525,0.0003\nCC-MAIN-2025-33,image/jpg,303,303,0.0000\nCC-MAIN-2025-33,image/pjpeg,39,39,0.0000\nCC-MAIN-2025-33,image/png,2220,2220,0.0001\nCC-MAIN-2025-33,image/svg+xml,43,43,0.0000\nCC-MAIN-2025-33,image/tiff,155,155,0.0000\nCC-MAIN-2025-33,image/vnd.djvu,2919,2918,0.0001\nCC-MAIN-2025-33,image/webp,35,35,0.0000\nCC-MAIN-2025-33,message/rfc822,8406,8406,0.0003\nCC-MAIN-2025-33,text/calendar,755172,754916,0.0309\nCC-MAIN-2025-33,text/css,11704,11701,0.0005\nCC-MAIN-2025-33,text/csv,77417,77214,0.0032\nCC-MAIN-2025-33,text/directory,4596,4595,0.0002\nCC-MAIN-2025-33,text/enriched,1092,1092,0.0000\nCC-MAIN-2025-33,text/html,2414875942,2402349217,98.8693\nCC-MAIN-2025-33,text/javascript,7033,7031,0.0003\nCC-MAIN-2025-33,text/markdown,8707,8704,0.0004\nCC-MAIN-2025-33,text/pdf,111,111,0.0000\nCC-MAIN-2025-33,text/plain,1211151,1210209,0.0496\nCC-MAIN-2025-33,text/prs.lines.tag,47907,47907,0.0020\nCC-MAIN-2025-33,text/tab-separated-values,8151,8150,0.0003\nCC-MAIN-2025-33,text/turtle,52243,52225,0.0021\nCC-MAIN-2025-33,text/vcard,20530,20513,0.0008\nCC-MAIN-2025-33,text/x-bibtex,8776,8774,0.0004\nCC-MAIN-2025-33,text/x-c,1684,1684,0.0001\nCC-MAIN
-2025-33,text/x-csrc,3689,3688,0.0002\nCC-MAIN-2025-33,text/x-diff,6745,6744,0.0003\nCC-MAIN-2025-33,text/x-patch,5604,5604,0.0002\nCC-MAIN-2025-33,text/x-perl,680,680,0.0000\nCC-MAIN-2025-33,text/x-vcalendar,9604,9600,0.0004\nCC-MAIN-2025-33,text/x-vcard,43486,43465,0.0018\nCC-MAIN-2025-33,text/xml,1465877,1456776,0.0600\nCC-MAIN-2025-33,unknown/unknown,652,652,0.0000\nCC-MAIN-2025-33,video/mp4,580,579,0.0000\nCC-MAIN-2025-33,video/x-ms-asf,3150,3150,0.0001\nCC-MAIN-2025-38,<other>,1661096,1656665,0.0696\nCC-MAIN-2025-38,application/atom+xml,2759384,2759094,0.1157\nCC-MAIN-2025-38,application/calendar,3808,3808,0.0002\nCC-MAIN-2025-38,application/download,63517,63506,0.0027\nCC-MAIN-2025-38,application/epub+zip,36095,35993,0.0015\nCC-MAIN-2025-38,application/force-download,221222,221185,0.0093\nCC-MAIN-2025-38,application/gpx+xml,14264,14263,0.0006\nCC-MAIN-2025-38,application/ics,7645,7645,0.0003\nCC-MAIN-2025-38,application/javascript,34618,34611,0.0015\nCC-MAIN-2025-38,application/json,659934,659660,0.0277\nCC-MAIN-2025-38,application/ld+json,42919,42910,0.0018\nCC-MAIN-2025-38,application/marc,10447,10436,0.0004\nCC-MAIN-2025-38,application/msword,42607,42571,0.0018\nCC-MAIN-2025-38,application/octet-stream,930153,929623,0.0390\nCC-MAIN-2025-38,application/octetstream,4564,4563,0.0002\nCC-MAIN-2025-38,application/pdf,13364916,13337702,0.5601\nCC-MAIN-2025-38,application/pgp-encrypted,1698,1698,0.0001\nCC-MAIN-2025-38,application/pgp-signature,28460,28458,0.0012\nCC-MAIN-2025-38,application/postscript,3389,3387,0.0001\nCC-MAIN-2025-38,application/rdf+xml,101577,101556,0.0043\nCC-MAIN-2025-38,application/rss+xml,962249,961697,0.0403\nCC-MAIN-2025-38,application/rtf,21064,21046,0.0009\nCC-MAIN-2025-38,application/save-to-disk,17,17,0.0000\nCC-MAIN-2025-38,application/text,3322,3322,0.0001\nCC-MAIN-2025-38,application/unknown,4017,4017,0.0002\nCC-MAIN-2025-38,application/vnd.android.package-archive,108,108,0.0000\nCC-MAIN-2025-38,application/vnd.google-earth.kml+xm
l,22464,22449,0.0009\nCC-MAIN-2025-38,application/vnd.google-earth.kmz,4644,4643,0.0002\nCC-MAIN-2025-38,application/vnd.ms-excel,31568,31538,0.0013\nCC-MAIN-2025-38,application/vnd.ms-powerpoint,4143,4137,0.0002\nCC-MAIN-2025-38,application/vnd.ms-word,4742,4742,0.0002\nCC-MAIN-2025-38,application/vnd.oasis.opendocument.text,10028,10026,0.0004\nCC-MAIN-2025-38,application/vnd.openxmlformats-officedocument.presentationml.presentation,5232,5208,0.0002\nCC-MAIN-2025-38,application/vnd.openxmlformats-officedocument.spreadsheetml.sheet,29247,29167,0.0012\nCC-MAIN-2025-38,application/vnd.openxmlformats-officedocument.wordprocessingml.document,44933,44805,0.0019\nCC-MAIN-2025-38,application/vnd.wap.xhtml+xml,16476,16371,0.0007\nCC-MAIN-2025-38,application/x-bibtex,175009,174925,0.0073\nCC-MAIN-2025-38,application/x-bittorrent,3825,3824,0.0002\nCC-MAIN-2025-38,application/x-debian-package,86,86,0.0000\nCC-MAIN-2025-38,application/x-download,40151,40142,0.0017\nCC-MAIN-2025-38,application/x-endnote-refer,19093,19091,0.0008\nCC-MAIN-2025-38,application/x-gzip,1474,1473,0.0001\nCC-MAIN-2025-38,application/x-httpd-php,8328,8317,0.0003\nCC-MAIN-2025-38,application/x-java-jnlp-file,3318,3317,0.0001\nCC-MAIN-2025-38,application/x-javascript,2852,2851,0.0001\nCC-MAIN-2025-38,application/x-json,84,84,0.0000\nCC-MAIN-2025-38,application/x-mobipocket-ebook,12509,12410,0.0005\nCC-MAIN-2025-38,application/x-msdownload,9609,9608,0.0004\nCC-MAIN-2025-38,application/x-netcdf,1538,1538,0.0001\nCC-MAIN-2025-38,application/x-research-info-systems,234944,234829,0.0098\nCC-MAIN-2025-38,application/x-shockwave-flash,1925,1922,0.0001\nCC-MAIN-2025-38,application/x-tar,1783,1783,0.0001\nCC-MAIN-2025-38,application/x-tex,3658,3657,0.0002\nCC-MAIN-2025-38,application/x-troff-man,7486,7486,0.0003\nCC-MAIN-2025-38,application/x-zip-compressed,248,248,0.0000\nCC-MAIN-2025-38,application/xhtml+xml,236079,235469,0.0099\nCC-MAIN-2025-38,application/xml,549402,549029,0.0230\nCC-MAIN-2025-38,application/zi
p,1856,1852,0.0001\nCC-MAIN-2025-38,audio/mpeg,1062,1062,0.0000\nCC-MAIN-2025-38,audio/x-mpegurl,9575,9574,0.0004\nCC-MAIN-2025-38,audio/x-scpls,2975,2974,0.0001\nCC-MAIN-2025-38,audio/x-wav,88,88,0.0000\nCC-MAIN-2025-38,binary/octet-stream,8745,8583,0.0004\nCC-MAIN-2025-38,image/gif,9842,9842,0.0004\nCC-MAIN-2025-38,image/jpeg,6506,6504,0.0003\nCC-MAIN-2025-38,image/jpg,712,712,0.0000\nCC-MAIN-2025-38,image/pjpeg,29,29,0.0000\nCC-MAIN-2025-38,image/png,3307,3304,0.0001\nCC-MAIN-2025-38,image/svg+xml,24,24,0.0000\nCC-MAIN-2025-38,image/tiff,183,183,0.0000\nCC-MAIN-2025-38,image/vnd.djvu,3739,3738,0.0002\nCC-MAIN-2025-38,image/webp,88,87,0.0000\nCC-MAIN-2025-38,message/rfc822,8039,8039,0.0003\nCC-MAIN-2025-38,text/calendar,719613,719362,0.0302\nCC-MAIN-2025-38,text/css,13004,13001,0.0005\nCC-MAIN-2025-38,text/csv,73357,73351,0.0031\nCC-MAIN-2025-38,text/directory,4112,4112,0.0002\nCC-MAIN-2025-38,text/enriched,1006,1006,0.0000\nCC-MAIN-2025-38,text/html,2359778185,2347216275,98.9025\nCC-MAIN-2025-38,text/javascript,6572,6570,0.0003\nCC-MAIN-2025-38,text/markdown,11994,11977,0.0005\nCC-MAIN-2025-38,text/pdf,117,117,0.0000\nCC-MAIN-2025-38,text/plain,1125605,1124996,0.0472\nCC-MAIN-2025-38,text/prs.lines.tag,52892,52892,0.0022\nCC-MAIN-2025-38,text/tab-separated-values,9162,9162,0.0004\nCC-MAIN-2025-38,text/turtle,45736,45730,0.0019\nCC-MAIN-2025-38,text/vcard,23254,23065,0.0010\nCC-MAIN-2025-38,text/x-bibtex,8854,8853,0.0004\nCC-MAIN-2025-38,text/x-c,1982,1982,0.0001\nCC-MAIN-2025-38,text/x-csrc,2552,2551,0.0001\nCC-MAIN-2025-38,text/x-diff,4909,4909,0.0002\nCC-MAIN-2025-38,text/x-patch,5547,5546,0.0002\nCC-MAIN-2025-38,text/x-perl,546,545,0.0000\nCC-MAIN-2025-38,text/x-vcalendar,10296,10295,0.0004\nCC-MAIN-2025-38,text/x-vcard,36854,36837,0.0015\nCC-MAIN-2025-38,text/xml,1495492,1493629,0.0627\nCC-MAIN-2025-38,unknown/unknown,602,602,0.0000\nCC-MAIN-2025-38,video/mp4,158,158,0.0000\nCC-MAIN-2025-38,video/x-ms-asf,5070,5070,0.0002\nCC-MAIN-2025-43,<other>,1878980,1875
145,0.0718\nCC-MAIN-2025-43,application/atom+xml,2486426,2486166,0.0950\nCC-MAIN-2025-43,application/calendar,3778,3778,0.0001\nCC-MAIN-2025-43,application/download,65325,65324,0.0025\nCC-MAIN-2025-43,application/epub+zip,40480,40337,0.0015\nCC-MAIN-2025-43,application/force-download,216149,216107,0.0083\nCC-MAIN-2025-43,application/gpx+xml,15421,15421,0.0006\nCC-MAIN-2025-43,application/ics,8670,8670,0.0003\nCC-MAIN-2025-43,application/javascript,22719,22709,0.0009\nCC-MAIN-2025-43,application/json,626456,626016,0.0239\nCC-MAIN-2025-43,application/ld+json,46665,46662,0.0018\nCC-MAIN-2025-43,application/marc,13370,13367,0.0005\nCC-MAIN-2025-43,application/msword,46970,46834,0.0018\nCC-MAIN-2025-43,application/octet-stream,936051,935452,0.0358\nCC-MAIN-2025-43,application/octetstream,4419,4418,0.0002\nCC-MAIN-2025-43,application/pdf,15020588,14990208,0.5740\nCC-MAIN-2025-43,application/pgp-encrypted,2918,2918,0.0001\nCC-MAIN-2025-43,application/pgp-signature,32353,32353,0.0012\nCC-MAIN-2025-43,application/postscript,3451,3450,0.0001\nCC-MAIN-2025-43,application/rdf+xml,100394,100362,0.0038\nCC-MAIN-2025-43,application/rss+xml,1027904,1027282,0.0393\nCC-MAIN-2025-43,application/rtf,21640,21632,0.0008\nCC-MAIN-2025-43,application/save-to-disk,15,15,0.0000\nCC-MAIN-2025-43,application/text,3403,3403,0.0001\nCC-MAIN-2025-43,application/unknown,4217,4217,0.0002\nCC-MAIN-2025-43,application/vnd.android.package-archive,56,56,0.0000\nCC-MAIN-2025-43,application/vnd.google-earth.kml+xml,25468,25458,0.0010\nCC-MAIN-2025-43,application/vnd.google-earth.kmz,6255,6253,0.0002\nCC-MAIN-2025-43,application/vnd.ms-excel,31176,31117,0.0012\nCC-MAIN-2025-43,application/vnd.ms-powerpoint,4635,4620,0.0002\nCC-MAIN-2025-43,application/vnd.ms-word,4755,4755,0.0002\nCC-MAIN-2025-43,application/vnd.oasis.opendocument.text,11681,11678,0.0004\nCC-MAIN-2025-43,application/vnd.openxmlformats-officedocument.presentationml.presentation,4803,4729,0.0002\nCC-MAIN-2025-43,application/vnd.openxmlforma
ts-officedocument.spreadsheetml.sheet,41942,41831,0.0016\nCC-MAIN-2025-43,application/vnd.openxmlformats-officedocument.wordprocessingml.document,49030,48855,0.0019\nCC-MAIN-2025-43,application/vnd.wap.xhtml+xml,12263,12184,0.0005\nCC-MAIN-2025-43,application/x-bibtex,171553,171457,0.0066\nCC-MAIN-2025-43,application/x-bittorrent,3893,3892,0.0001\nCC-MAIN-2025-43,application/x-debian-package,6,6,0.0000\nCC-MAIN-2025-43,application/x-download,41209,41140,0.0016\nCC-MAIN-2025-43,application/x-endnote-refer,20434,20433,0.0008\nCC-MAIN-2025-43,application/x-gzip,1599,1598,0.0001\nCC-MAIN-2025-43,application/x-httpd-php,10216,10185,0.0004\nCC-MAIN-2025-43,application/x-java-jnlp-file,2585,2584,0.0001\nCC-MAIN-2025-43,application/x-javascript,2572,2572,0.0001\nCC-MAIN-2025-43,application/x-json,239,239,0.0000\nCC-MAIN-2025-43,application/x-mobipocket-ebook,14092,13970,0.0005\nCC-MAIN-2025-43,application/x-msdownload,7592,7592,0.0003\nCC-MAIN-2025-43,application/x-netcdf,8830,8830,0.0003\nCC-MAIN-2025-43,application/x-research-info-systems,233065,232994,0.0089\nCC-MAIN-2025-43,application/x-shockwave-flash,1871,1868,0.0001\nCC-MAIN-2025-43,application/x-tar,2107,2107,0.0001\nCC-MAIN-2025-43,application/x-tex,4309,4309,0.0002\nCC-MAIN-2025-43,application/x-troff-man,8036,8036,0.0003\nCC-MAIN-2025-43,application/x-zip-compressed,92,92,0.0000\nCC-MAIN-2025-43,application/xhtml+xml,272871,271799,0.0104\nCC-MAIN-2025-43,application/xml,581770,581165,0.0222\nCC-MAIN-2025-43,application/zip,2161,2159,0.0001\nCC-MAIN-2025-43,audio/mpeg,990,990,0.0000\nCC-MAIN-2025-43,audio/x-mpegurl,10343,10341,0.0004\nCC-MAIN-2025-43,audio/x-scpls,2796,2796,0.0001\nCC-MAIN-2025-43,audio/x-wav,27,27,0.0000\nCC-MAIN-2025-43,binary/octet-stream,10842,10670,0.0004\nCC-MAIN-2025-43,image/gif,6640,6636,0.0003\nCC-MAIN-2025-43,image/jp2,1,1,0.0000\nCC-MAIN-2025-43,image/jpeg,6953,6950,0.0003\nCC-MAIN-2025-43,image/jpg,349,349,0.0000\nCC-MAIN-2025-43,image/pjpeg,14,14,0.0000\nCC-MAIN-2025-43,image/png,57
72,5771,0.0002\nCC-MAIN-2025-43,image/svg+xml,21,21,0.0000\nCC-MAIN-2025-43,image/tiff,83,83,0.0000\nCC-MAIN-2025-43,image/vnd.djvu,4149,4144,0.0002\nCC-MAIN-2025-43,image/webp,108,108,0.0000\nCC-MAIN-2025-43,message/rfc822,6895,6895,0.0003\nCC-MAIN-2025-43,text/calendar,821116,820820,0.0314\nCC-MAIN-2025-43,text/css,14297,14297,0.0005\nCC-MAIN-2025-43,text/csv,83795,83610,0.0032\nCC-MAIN-2025-43,text/directory,4505,4505,0.0002\nCC-MAIN-2025-43,text/enriched,1058,1058,0.0000\nCC-MAIN-2025-43,text/html,2588706249,2575484605,98.9265\nCC-MAIN-2025-43,text/javascript,6616,6615,0.0003\nCC-MAIN-2025-43,text/markdown,13084,13060,0.0005\nCC-MAIN-2025-43,text/pdf,53,53,0.0000\nCC-MAIN-2025-43,text/plain,1119652,1118854,0.0428\nCC-MAIN-2025-43,text/prs.lines.tag,65694,65694,0.0025\nCC-MAIN-2025-43,text/tab-separated-values,10118,10118,0.0004\nCC-MAIN-2025-43,text/turtle,46711,46703,0.0018\nCC-MAIN-2025-43,text/vcard,26980,26960,0.0010\nCC-MAIN-2025-43,text/x-bibtex,8974,8973,0.0003\nCC-MAIN-2025-43,text/x-c,1593,1593,0.0001\nCC-MAIN-2025-43,text/x-csrc,2898,2870,0.0001\nCC-MAIN-2025-43,text/x-diff,4605,4592,0.0002\nCC-MAIN-2025-43,text/x-patch,4939,4938,0.0002\nCC-MAIN-2025-43,text/x-perl,641,641,0.0000\nCC-MAIN-2025-43,text/x-vcalendar,8549,8549,0.0003\nCC-MAIN-2025-43,text/x-vcard,43872,43836,0.0017\nCC-MAIN-2025-43,text/xml,1524975,1523441,0.0583\nCC-MAIN-2025-43,unknown/unknown,636,636,0.0000\nCC-MAIN-2025-43,video/mp4,344,343,0.0000\nCC-MAIN-2025-43,video/webm,1,1,0.0000\nCC-MAIN-2025-43,video/x-ms-asf,6991,6991,0.0003\nCC-MAIN-2025-47,<other>,1776679,1773113,0.0774\nCC-MAIN-2025-47,application/atom+xml,3289225,3288924,0.1434\nCC-MAIN-2025-47,application/calendar,8381,8380,0.0004\nCC-MAIN-2025-47,application/download,99564,99560,0.0043\nCC-MAIN-2025-47,application/epub+zip,40550,40444,0.0018\nCC-MAIN-2025-47,application/force-download,261602,261576,0.0114\nCC-MAIN-2025-47,application/gpx+xml,15714,15714,0.0007\nCC-MAIN-2025-47,application/ics,10810,10806,0.0005\nCC-MAIN-
2025-47,application/javascript,16448,16399,0.0007\nCC-MAIN-2025-47,application/json,640929,640596,0.0279\nCC-MAIN-2025-47,application/ld+json,41253,41250,0.0018\nCC-MAIN-2025-47,application/marc,8927,8926,0.0004\nCC-MAIN-2025-47,application/msword,51556,51456,0.0022\nCC-MAIN-2025-47,application/octet-stream,940242,938735,0.0410\nCC-MAIN-2025-47,application/octetstream,4636,4636,0.0002\nCC-MAIN-2025-47,application/pdf,15639690,15607123,0.6816\nCC-MAIN-2025-47,application/pgp-encrypted,1870,1870,0.0001\nCC-MAIN-2025-47,application/pgp-signature,31431,31411,0.0014\nCC-MAIN-2025-47,application/postscript,3851,3850,0.0002\nCC-MAIN-2025-47,application/rdf+xml,100261,100235,0.0044\nCC-MAIN-2025-47,application/rss+xml,1006803,1006104,0.0439\nCC-MAIN-2025-47,application/rtf,24064,24055,0.0010\nCC-MAIN-2025-47,application/save-to-disk,24,24,0.0000\nCC-MAIN-2025-47,application/text,3520,3520,0.0002\nCC-MAIN-2025-47,application/unknown,4376,4374,0.0002\nCC-MAIN-2025-47,application/vnd.android.package-archive,363,363,0.0000\nCC-MAIN-2025-47,application/vnd.google-earth.kml+xml,26208,26195,0.0011\nCC-MAIN-2025-47,application/vnd.google-earth.kmz,6049,6047,0.0003\nCC-MAIN-2025-47,application/vnd.ms-excel,32869,32196,0.0014\nCC-MAIN-2025-47,application/vnd.ms-powerpoint,4283,4276,0.0002\nCC-MAIN-2025-47,application/vnd.ms-word,3748,3747,0.0002\nCC-MAIN-2025-47,application/vnd.oasis.opendocument.text,16923,16919,0.0007\nCC-MAIN-2025-47,application/vnd.openxmlformats-officedocument.presentationml.presentation,5216,5141,0.0002\nCC-MAIN-2025-47,application/vnd.openxmlformats-officedocument.spreadsheetml.sheet,37399,36137,0.0016\nCC-MAIN-2025-47,application/vnd.openxmlformats-officedocument.wordprocessingml.document,53540,53375,0.0023\nCC-MAIN-2025-47,application/vnd.wap.xhtml+xml,13977,13901,0.0006\nCC-MAIN-2025-47,application/x-bibtex,176702,176626,0.0077\nCC-MAIN-2025-47,application/x-bittorrent,3157,3156,0.0001\nCC-MAIN-2025-47,application/x-debian-package,6,6,0.0000\nCC-MAIN-2025-4
7,application/x-download,48489,48474,0.0021\nCC-MAIN-2025-47,application/x-endnote-refer,17920,17919,0.0008\nCC-MAIN-2025-47,application/x-gzip,1812,1812,0.0001\nCC-MAIN-2025-47,application/x-httpd-php,10973,10950,0.0005\nCC-MAIN-2025-47,application/x-java-jnlp-file,2713,2711,0.0001\nCC-MAIN-2025-47,application/x-javascript,2714,2713,0.0001\nCC-MAIN-2025-47,application/x-json,82,82,0.0000\nCC-MAIN-2025-47,application/x-mobipocket-ebook,14593,14498,0.0006\nCC-MAIN-2025-47,application/x-msdownload,6160,6160,0.0003\nCC-MAIN-2025-47,application/x-netcdf,6651,6651,0.0003\nCC-MAIN-2025-47,application/x-research-info-systems,244898,244811,0.0107\nCC-MAIN-2025-47,application/x-shockwave-flash,1953,1949,0.0001\nCC-MAIN-2025-47,application/x-tar,855,855,0.0000\nCC-MAIN-2025-47,application/x-tex,3382,3382,0.0001\nCC-MAIN-2025-47,application/x-troff-man,5485,5485,0.0002\nCC-MAIN-2025-47,application/x-zip-compressed,257,257,0.0000\nCC-MAIN-2025-47,application/xhtml+xml,272825,271550,0.0119\nCC-MAIN-2025-47,application/xml,561963,561372,0.0245\nCC-MAIN-2025-47,application/zip,3708,3706,0.0002\nCC-MAIN-2025-47,audio/mpeg,1302,1302,0.0001\nCC-MAIN-2025-47,audio/x-mpegurl,11466,11462,0.0005\nCC-MAIN-2025-47,audio/x-scpls,3283,3283,0.0001\nCC-MAIN-2025-47,audio/x-wav,40,40,0.0000\nCC-MAIN-2025-47,binary/octet-stream,7295,7257,0.0003\nCC-MAIN-2025-47,image/gif,9729,9716,0.0004\nCC-MAIN-2025-47,image/jpeg,6432,6425,0.0003\nCC-MAIN-2025-47,image/jpg,578,578,0.0000\nCC-MAIN-2025-47,image/pjpeg,14,14,0.0000\nCC-MAIN-2025-47,image/png,6223,6220,0.0003\nCC-MAIN-2025-47,image/svg+xml,20,20,0.0000\nCC-MAIN-2025-47,image/tiff,11,11,0.0000\nCC-MAIN-2025-47,image/vnd.djvu,6795,6795,0.0003\nCC-MAIN-2025-47,image/webp,218,218,0.0000\nCC-MAIN-2025-47,message/rfc822,8919,8916,0.0004\nCC-MAIN-2025-47,text/calendar,918842,918276,0.0400\nCC-MAIN-2025-47,text/css,15548,15546,0.0007\nCC-MAIN-2025-47,text/csv,73045,72993,0.0032\nCC-MAIN-2025-47,text/directory,4067,4067,0.0002\nCC-MAIN-2025-47,text/enriche
d,1289,1289,0.0001\nCC-MAIN-2025-47,text/html,2264894869,2253089907,98.7109\nCC-MAIN-2025-47,text/javascript,7114,7112,0.0003\nCC-MAIN-2025-47,text/markdown,12202,12186,0.0005\nCC-MAIN-2025-47,text/pdf,92,92,0.0000\nCC-MAIN-2025-47,text/plain,1136947,1136238,0.0496\nCC-MAIN-2025-47,text/prs.lines.tag,57363,57361,0.0025\nCC-MAIN-2025-47,text/tab-separated-values,11820,11818,0.0005\nCC-MAIN-2025-47,text/turtle,38883,38878,0.0017\nCC-MAIN-2025-47,text/vcard,27380,27314,0.0012\nCC-MAIN-2025-47,text/x-bibtex,10234,10233,0.0004\nCC-MAIN-2025-47,text/x-c,1979,1977,0.0001\nCC-MAIN-2025-47,text/x-csrc,2833,2829,0.0001\nCC-MAIN-2025-47,text/x-diff,4391,4391,0.0002\nCC-MAIN-2025-47,text/x-patch,5156,5156,0.0002\nCC-MAIN-2025-47,text/x-perl,596,596,0.0000\nCC-MAIN-2025-47,text/x-vcalendar,8621,8620,0.0004\nCC-MAIN-2025-47,text/x-vcard,42409,42391,0.0018\nCC-MAIN-2025-47,text/xml,1520810,1518265,0.0663\nCC-MAIN-2025-47,unknown/unknown,597,597,0.0000\nCC-MAIN-2025-47,video/mp4,407,407,0.0000\nCC-MAIN-2025-47,video/webm,2,2,0.0000\nCC-MAIN-2025-47,video/x-ms-asf,2812,2812,0.0001\nCC-MAIN-2025-51,<other>,1548845,1545194,0.0714\nCC-MAIN-2025-51,application/atom+xml,3242647,3242385,0.1495\nCC-MAIN-2025-51,application/calendar,8192,8192,0.0004\nCC-MAIN-2025-51,application/download,69005,69002,0.0032\nCC-MAIN-2025-51,application/epub+zip,35595,35532,0.0016\nCC-MAIN-2025-51,application/force-download,244589,244566,0.0113\nCC-MAIN-2025-51,application/gpx+xml,15945,15945,0.0007\nCC-MAIN-2025-51,application/ics,9153,9151,0.0004\nCC-MAIN-2025-51,application/javascript,16610,16497,0.0008\nCC-MAIN-2025-51,application/json,605710,605391,0.0279\nCC-MAIN-2025-51,application/ld+json,36993,36992,0.0017\nCC-MAIN-2025-51,application/marc,7861,7861,0.0004\nCC-MAIN-2025-51,application/msword,51339,51202,0.0024\nCC-MAIN-2025-51,application/octet-stream,1097662,1096524,0.0506\nCC-MAIN-2025-51,application/octetstream,4404,4404,0.0002\nCC-MAIN-2025-51,application/pdf,15050775,15016526,0.6939\nCC-MAIN-2025
-51,application/pgp-encrypted,1717,1717,0.0001\nCC-MAIN-2025-51,application/pgp-signature,38421,38372,0.0018\nCC-MAIN-2025-51,application/postscript,3513,3512,0.0002\nCC-MAIN-2025-51,application/rdf+xml,91427,91387,0.0042\nCC-MAIN-2025-51,application/rss+xml,952479,951885,0.0439\nCC-MAIN-2025-51,application/rtf,20942,20937,0.0010\nCC-MAIN-2025-51,application/save-to-disk,9,9,0.0000\nCC-MAIN-2025-51,application/text,3537,3537,0.0002\nCC-MAIN-2025-51,application/unknown,4440,4440,0.0002\nCC-MAIN-2025-51,application/vnd.android.package-archive,81,80,0.0000\nCC-MAIN-2025-51,application/vnd.google-earth.kml+xml,24438,24422,0.0011\nCC-MAIN-2025-51,application/vnd.google-earth.kmz,5157,5157,0.0002\nCC-MAIN-2025-51,application/vnd.ms-excel,35175,34995,0.0016\nCC-MAIN-2025-51,application/vnd.ms-powerpoint,4163,4163,0.0002\nCC-MAIN-2025-51,application/vnd.ms-word,4126,4126,0.0002\nCC-MAIN-2025-51,application/vnd.oasis.opendocument.text,11946,11934,0.0006\nCC-MAIN-2025-51,application/vnd.openxmlformats-officedocument.presentationml.presentation,4834,4825,0.0002\nCC-MAIN-2025-51,application/vnd.openxmlformats-officedocument.spreadsheetml.sheet,35899,35530,0.0017\nCC-MAIN-2025-51,application/vnd.openxmlformats-officedocument.wordprocessingml.document,50234,50075,0.0023\nCC-MAIN-2025-51,application/vnd.wap.xhtml+xml,3757,3738,0.0002\nCC-MAIN-2025-51,application/x-bibtex,179206,179125,0.0083\nCC-MAIN-2025-51,application/x-bittorrent,3630,3629,0.0002\nCC-MAIN-2025-51,application/x-debian-package,10,10,0.0000\nCC-MAIN-2025-51,application/x-download,54695,54682,0.0025\nCC-MAIN-2025-51,application/x-endnote-refer,10367,10367,0.0005\nCC-MAIN-2025-51,application/x-gzip,1982,1979,0.0001\nCC-MAIN-2025-51,application/x-httpd-php,6444,6428,0.0003\nCC-MAIN-2025-51,application/x-java-jnlp-file,3361,3361,0.0002\nCC-MAIN-2025-51,application/x-javascript,3139,3139,0.0001\nCC-MAIN-2025-51,application/x-json,152,152,0.0000\nCC-MAIN-2025-51,application/x-mobipocket-ebook,13222,13161,0.0006\nCC-MAIN
-2025-51,application/x-msdownload,6104,6104,0.0003\nCC-MAIN-2025-51,application/x-netcdf,4255,4255,0.0002\nCC-MAIN-2025-51,application/x-research-info-systems,246464,246334,0.0114\nCC-MAIN-2025-51,application/x-shockwave-flash,1059,1056,0.0000\nCC-MAIN-2025-51,application/x-tar,529,529,0.0000\nCC-MAIN-2025-51,application/x-tex,3806,3806,0.0002\nCC-MAIN-2025-51,application/x-troff-man,8491,8491,0.0004\nCC-MAIN-2025-51,application/x-zip-compressed,399,399,0.0000\nCC-MAIN-2025-51,application/xhtml+xml,257888,256533,0.0119\nCC-MAIN-2025-51,application/xml,542254,541467,0.0250\nCC-MAIN-2025-51,application/zip,3574,3574,0.0002\nCC-MAIN-2025-51,audio/mpeg,1366,1366,0.0001\nCC-MAIN-2025-51,audio/x-mpegurl,9370,9366,0.0004\nCC-MAIN-2025-51,audio/x-scpls,2827,2826,0.0001\nCC-MAIN-2025-51,audio/x-wav,33,33,0.0000\nCC-MAIN-2025-51,binary/octet-stream,7344,7339,0.0003\nCC-MAIN-2025-51,image/gif,8736,8735,0.0004\nCC-MAIN-2025-51,image/jpeg,5931,5921,0.0003\nCC-MAIN-2025-51,image/jpg,408,408,0.0000\nCC-MAIN-2025-51,image/pjpeg,22,22,0.0000\nCC-MAIN-2025-51,image/png,3524,3522,0.0002\nCC-MAIN-2025-51,image/svg+xml,29,29,0.0000\nCC-MAIN-2025-51,image/tiff,5,5,0.0000\nCC-MAIN-2025-51,image/vnd.djvu,12941,12941,0.0006\nCC-MAIN-2025-51,image/webp,37,37,0.0000\nCC-MAIN-2025-51,message/rfc822,7335,7335,0.0003\nCC-MAIN-2025-51,text/calendar,836739,836476,0.0386\nCC-MAIN-2025-51,text/css,11370,11370,0.0005\nCC-MAIN-2025-51,text/csv,68891,68839,0.0032\nCC-MAIN-2025-51,text/directory,4099,4099,0.0002\nCC-MAIN-2025-51,text/enriched,1178,1178,0.0001\nCC-MAIN-2025-51,text/html,2140551223,2129474010,98.6844\nCC-MAIN-2025-51,text/javascript,7648,7644,0.0004\nCC-MAIN-2025-51,text/markdown,13756,13706,0.0006\nCC-MAIN-2025-51,text/pdf,505,505,0.0000\nCC-MAIN-2025-51,text/plain,1106070,1105349,0.0510\nCC-MAIN-2025-51,text/prs.lines.tag,52199,52196,0.0024\nCC-MAIN-2025-51,text/tab-separated-values,11029,11029,0.0005\nCC-MAIN-2025-51,text/turtle,36593,36590,0.0017\nCC-MAIN-2025-51,text/vcard,24955,2495
3,0.0012\nCC-MAIN-2025-51,text/x-bibtex,9696,9696,0.0004\nCC-MAIN-2025-51,text/x-c,1544,1542,0.0001\nCC-MAIN-2025-51,text/x-csrc,3557,3555,0.0002\nCC-MAIN-2025-51,text/x-diff,4974,4974,0.0002\nCC-MAIN-2025-51,text/x-patch,5343,5342,0.0002\nCC-MAIN-2025-51,text/x-perl,767,767,0.0000\nCC-MAIN-2025-51,text/x-vcalendar,7811,7810,0.0004\nCC-MAIN-2025-51,text/x-vcard,43648,43628,0.0020\nCC-MAIN-2025-51,text/xml,1527111,1525418,0.0704\nCC-MAIN-2025-51,unknown/unknown,883,883,0.0000\nCC-MAIN-2025-51,video/mp4,449,449,0.0000\nCC-MAIN-2025-51,video/webm,1,1,0.0000\nCC-MAIN-2025-51,video/x-ms-asf,2681,2680,0.0001\nCC-MAIN-2026-04,<other>,1536504,1533914,0.0660\nCC-MAIN-2026-04,application/atom+xml,3116706,3116428,0.1338\nCC-MAIN-2026-04,application/calendar,6052,6052,0.0003\nCC-MAIN-2026-04,application/download,27665,27664,0.0012\nCC-MAIN-2026-04,application/epub+zip,34500,34440,0.0015\nCC-MAIN-2026-04,application/force-download,154717,154634,0.0066\nCC-MAIN-2026-04,application/gpx+xml,16390,16386,0.0007\nCC-MAIN-2026-04,application/ics,8590,8589,0.0004\nCC-MAIN-2026-04,application/javascript,16706,16599,0.0007\nCC-MAIN-2026-04,application/json,563969,563584,0.0242\nCC-MAIN-2026-04,application/ld+json,36394,36393,0.0016\nCC-MAIN-2026-04,application/marc,7631,7631,0.0003\nCC-MAIN-2026-04,application/msword,51028,50960,0.0022\nCC-MAIN-2026-04,application/octet-stream,984499,983960,0.0423\nCC-MAIN-2026-04,application/octetstream,5120,5120,0.0002\nCC-MAIN-2026-04,application/pdf,14468757,14436812,0.6211\nCC-MAIN-2026-04,application/pgp-encrypted,2193,2193,0.0001\nCC-MAIN-2026-04,application/pgp-signature,32553,32553,0.0014\nCC-MAIN-2026-04,application/postscript,3304,3303,0.0001\nCC-MAIN-2026-04,application/rdf+xml,84361,84330,0.0036\nCC-MAIN-2026-04,application/rss+xml,971597,970961,0.0417\nCC-MAIN-2026-04,application/rtf,16891,16886,0.0007\nCC-MAIN-2026-04,application/save-to-disk,24,24,0.0000\nCC-MAIN-2026-04,application/text,3473,3473,0.0001\nCC-MAIN-2026-04,application/unknow
n,3945,3945,0.0002\nCC-MAIN-2026-04,application/vnd.android.package-archive,34,34,0.0000\nCC-MAIN-2026-04,application/vnd.google-earth.kml+xml,25548,25543,0.0011\nCC-MAIN-2026-04,application/vnd.google-earth.kmz,7374,7364,0.0003\nCC-MAIN-2026-04,application/vnd.ms-excel,31668,31528,0.0014\nCC-MAIN-2026-04,application/vnd.ms-powerpoint,2509,2509,0.0001\nCC-MAIN-2026-04,application/vnd.ms-word,3828,3828,0.0002\nCC-MAIN-2026-04,application/vnd.oasis.opendocument.text,13334,13328,0.0006\nCC-MAIN-2026-04,application/vnd.openxmlformats-officedocument.presentationml.presentation,4744,4711,0.0002\nCC-MAIN-2026-04,application/vnd.openxmlformats-officedocument.spreadsheetml.sheet,38661,38495,0.0017\nCC-MAIN-2026-04,application/vnd.openxmlformats-officedocument.wordprocessingml.document,50259,50088,0.0022\nCC-MAIN-2026-04,application/vnd.wap.xhtml+xml,5844,5753,0.0003\nCC-MAIN-2026-04,application/x-bibtex,188560,188516,0.0081\nCC-MAIN-2026-04,application/x-bittorrent,14154,14149,0.0006\nCC-MAIN-2026-04,application/x-debian-package,1,1,0.0000\nCC-MAIN-2026-04,application/x-download,58656,58645,0.0025\nCC-MAIN-2026-04,application/x-endnote-refer,9062,9062,0.0004\nCC-MAIN-2026-04,application/x-gzip,1958,1955,0.0001\nCC-MAIN-2026-04,application/x-httpd-php,4924,4914,0.0002\nCC-MAIN-2026-04,application/x-java-jnlp-file,3445,3445,0.0001\nCC-MAIN-2026-04,application/x-javascript,3371,3371,0.0001\nCC-MAIN-2026-04,application/x-json,212,212,0.0000\nCC-MAIN-2026-04,application/x-mobipocket-ebook,10414,10363,0.0004\nCC-MAIN-2026-04,application/x-msdownload,4835,4835,0.0002\nCC-MAIN-2026-04,application/x-netcdf,6724,6724,0.0003\nCC-MAIN-2026-04,application/x-research-info-systems,250645,250577,0.0108\nCC-MAIN-2026-04,application/x-shockwave-flash,1196,1195,0.0001\nCC-MAIN-2026-04,application/x-tar,1543,1543,0.0001\nCC-MAIN-2026-04,application/x-tex,2897,2896,0.0001\nCC-MAIN-2026-04,application/x-troff-man,8991,8990,0.0004\nCC-MAIN-2026-04,application/x-zip-compressed,374,374,0.0000\nCC-MA
IN-2026-04,application/xhtml+xml,235324,233608,0.0101\nCC-MAIN-2026-04,application/xml,544311,543840,0.0234\nCC-MAIN-2026-04,application/zip,2514,2514,0.0001\nCC-MAIN-2026-04,audio/mpeg,1799,1799,0.0001\nCC-MAIN-2026-04,audio/x-mpegurl,10630,10627,0.0005\nCC-MAIN-2026-04,audio/x-scpls,3150,3150,0.0001\nCC-MAIN-2026-04,audio/x-wav,12,12,0.0000\nCC-MAIN-2026-04,binary/octet-stream,10800,10733,0.0005\nCC-MAIN-2026-04,image/gif,11861,11861,0.0005\nCC-MAIN-2026-04,image/jp2,2,2,0.0000\nCC-MAIN-2026-04,image/jpeg,6696,6689,0.0003\nCC-MAIN-2026-04,image/jpg,255,255,0.0000\nCC-MAIN-2026-04,image/pjpeg,10,10,0.0000\nCC-MAIN-2026-04,image/png,4601,4599,0.0002\nCC-MAIN-2026-04,image/svg+xml,18,18,0.0000\nCC-MAIN-2026-04,image/tiff,39,39,0.0000\nCC-MAIN-2026-04,image/vnd.djvu,5351,5350,0.0002\nCC-MAIN-2026-04,image/webp,85,85,0.0000\nCC-MAIN-2026-04,message/rfc822,4819,4819,0.0002\nCC-MAIN-2026-04,text/calendar,800947,800655,0.0344\nCC-MAIN-2026-04,text/css,13571,13569,0.0006\nCC-MAIN-2026-04,text/csv,74933,74479,0.0032\nCC-MAIN-2026-04,text/directory,4458,4458,0.0002\nCC-MAIN-2026-04,text/enriched,1130,1130,0.0000\nCC-MAIN-2026-04,text/html,2302267098,2290783436,98.8254\nCC-MAIN-2026-04,text/javascript,6945,6942,0.0003\nCC-MAIN-2026-04,text/markdown,22169,22066,0.0010\nCC-MAIN-2026-04,text/pdf,110,110,0.0000\nCC-MAIN-2026-04,text/plain,1064267,1063326,0.0457\nCC-MAIN-2026-04,text/prs.lines.tag,50378,50375,0.0022\nCC-MAIN-2026-04,text/tab-separated-values,9778,9773,0.0004\nCC-MAIN-2026-04,text/turtle,30073,30073,0.0013\nCC-MAIN-2026-04,text/vcard,22196,22185,0.0010\nCC-MAIN-2026-04,text/x-bibtex,10223,10221,0.0004\nCC-MAIN-2026-04,text/x-c,1486,1486,0.0001\nCC-MAIN-2026-04,text/x-csrc,3052,3051,0.0001\nCC-MAIN-2026-04,text/x-diff,6637,6637,0.0003\nCC-MAIN-2026-04,text/x-patch,4397,4397,0.0002\nCC-MAIN-2026-04,text/x-perl,599,599,0.0000\nCC-MAIN-2026-04,text/x-vcalendar,6818,6817,0.0003\nCC-MAIN-2026-04,text/x-vcard,39757,39740,0.0017\nCC-MAIN-2026-04,text/xml,1434930,1433211,0.
0616\nCC-MAIN-2026-04,unknown/unknown,460,460,0.0000\nCC-MAIN-2026-04,video/mp4,258,258,0.0000\nCC-MAIN-2026-04,video/webm,2,2,0.0000\nCC-MAIN-2026-04,video/x-ms-asf,2472,2471,0.0001\nCC-MAIN-2026-08,<other>,1390280,1386883,0.0642\nCC-MAIN-2026-08,application/atom+xml,3165598,3165245,0.1461\nCC-MAIN-2026-08,application/calendar,5872,5872,0.0003\nCC-MAIN-2026-08,application/download,42288,42286,0.0020\nCC-MAIN-2026-08,application/epub+zip,36065,35981,0.0017\nCC-MAIN-2026-08,application/force-download,193605,193551,0.0089\nCC-MAIN-2026-08,application/gpx+xml,17887,17887,0.0008\nCC-MAIN-2026-08,application/ics,8971,8970,0.0004\nCC-MAIN-2026-08,application/javascript,16777,16767,0.0008\nCC-MAIN-2026-08,application/json,567636,566833,0.0262\nCC-MAIN-2026-08,application/ld+json,31942,31941,0.0015\nCC-MAIN-2026-08,application/marc,6895,6893,0.0003\nCC-MAIN-2026-08,application/msword,53511,53450,0.0025\nCC-MAIN-2026-08,application/octet-stream,972560,972054,0.0449\nCC-MAIN-2026-08,application/octetstream,4483,4483,0.0002\nCC-MAIN-2026-08,application/pdf,15883645,15851168,0.7330\nCC-MAIN-2026-08,application/pgp-encrypted,2472,2472,0.0001\nCC-MAIN-2026-08,application/pgp-signature,30617,30616,0.0014\nCC-MAIN-2026-08,application/postscript,3522,3521,0.0002\nCC-MAIN-2026-08,application/rdf+xml,83143,83098,0.0038\nCC-MAIN-2026-08,application/rss+xml,931452,930960,0.0430\nCC-MAIN-2026-08,application/rtf,17400,17398,0.0008\nCC-MAIN-2026-08,application/save-to-disk,14,14,0.0000\nCC-MAIN-2026-08,application/text,3114,3114,0.0001\nCC-MAIN-2026-08,application/unknown,5120,5120,0.0002\nCC-MAIN-2026-08,application/vnd.android.package-archive,40,40,0.0000\nCC-MAIN-2026-08,application/vnd.google-earth.kml+xml,25608,25601,0.0012\nCC-MAIN-2026-08,application/vnd.google-earth.kmz,6260,6256,0.0003\nCC-MAIN-2026-08,application/vnd.ms-excel,31171,31061,0.0014\nCC-MAIN-2026-08,application/vnd.ms-powerpoint,3104,3102,0.0001\nCC-MAIN-2026-08,application/vnd.ms-word,3384,3384,0.0002\nCC-MAIN-2026-0
8,application/vnd.oasis.opendocument.text,14253,14248,0.0007\nCC-MAIN-2026-08,application/vnd.openxmlformats-officedocument.presentationml.presentation,5218,5208,0.0002\nCC-MAIN-2026-08,application/vnd.openxmlformats-officedocument.spreadsheetml.sheet,40095,39968,0.0019\nCC-MAIN-2026-08,application/vnd.openxmlformats-officedocument.wordprocessingml.document,53051,52815,0.0024\nCC-MAIN-2026-08,application/vnd.wap.xhtml+xml,10775,10702,0.0005\nCC-MAIN-2026-08,application/x-bibtex,185821,185766,0.0086\nCC-MAIN-2026-08,application/x-bittorrent,2347,2341,0.0001\nCC-MAIN-2026-08,application/x-debian-package,222,222,0.0000\nCC-MAIN-2026-08,application/x-download,56246,56219,0.0026\nCC-MAIN-2026-08,application/x-endnote-refer,8034,8033,0.0004\nCC-MAIN-2026-08,application/x-gzip,5600,5599,0.0003\nCC-MAIN-2026-08,application/x-httpd-php,6327,6311,0.0003\nCC-MAIN-2026-08,application/x-java-jnlp-file,2980,2980,0.0001\nCC-MAIN-2026-08,application/x-javascript,4122,4119,0.0002\nCC-MAIN-2026-08,application/x-json,274,274,0.0000\nCC-MAIN-2026-08,application/x-mobipocket-ebook,11379,11320,0.0005\nCC-MAIN-2026-08,application/x-msdownload,5832,5831,0.0003\nCC-MAIN-2026-08,application/x-netcdf,2984,2984,0.0001\nCC-MAIN-2026-08,application/x-research-info-systems,248121,248046,0.0115\nCC-MAIN-2026-08,application/x-shockwave-flash,1210,1208,0.0001\nCC-MAIN-2026-08,application/x-tar,935,935,0.0000\nCC-MAIN-2026-08,application/x-tex,3205,3205,0.0001\nCC-MAIN-2026-08,application/x-troff-man,7913,7911,0.0004\nCC-MAIN-2026-08,application/x-zip-compressed,340,340,0.0000\nCC-MAIN-2026-08,application/xhtml+xml,240707,238956,0.0111\nCC-MAIN-2026-08,application/xml,629775,629013,0.0291\nCC-MAIN-2026-08,application/zip,2380,2369,0.0001\nCC-MAIN-2026-08,audio/mpeg,2051,2051,0.0001\nCC-MAIN-2026-08,audio/x-mpegurl,11631,11602,0.0005\nCC-MAIN-2026-08,audio/x-scpls,3356,3356,0.0002\nCC-MAIN-2026-08,audio/x-wav,24,24,0.0000\nCC-MAIN-2026-08,binary/octet-stream,10411,10368,0.0005\nCC-MAIN-2026-08,image/g
if,9194,9194,0.0004\nCC-MAIN-2026-08,image/jpeg,5447,5446,0.0003\nCC-MAIN-2026-08,image/jpg,268,268,0.0000\nCC-MAIN-2026-08,image/pjpeg,16,16,0.0000\nCC-MAIN-2026-08,image/png,4277,4273,0.0002\nCC-MAIN-2026-08,image/svg+xml,49,49,0.0000\nCC-MAIN-2026-08,image/tiff,33,33,0.0000\nCC-MAIN-2026-08,image/vnd.djvu,12372,12370,0.0006\nCC-MAIN-2026-08,image/webp,59,59,0.0000\nCC-MAIN-2026-08,message/rfc822,5372,5372,0.0002\nCC-MAIN-2026-08,text/calendar,811520,811227,0.0374\nCC-MAIN-2026-08,text/css,12959,12955,0.0006\nCC-MAIN-2026-08,text/csv,74595,74448,0.0034\nCC-MAIN-2026-08,text/directory,4363,4363,0.0002\nCC-MAIN-2026-08,text/enriched,976,976,0.0000\nCC-MAIN-2026-08,text/html,2138213621,2126869186,98.6720\nCC-MAIN-2026-08,text/javascript,7874,7872,0.0004\nCC-MAIN-2026-08,text/markdown,27197,27123,0.0013\nCC-MAIN-2026-08,text/pdf,1138,1138,0.0001\nCC-MAIN-2026-08,text/plain,1128757,1127416,0.0521\nCC-MAIN-2026-08,text/prs.lines.tag,54739,54737,0.0025\nCC-MAIN-2026-08,text/tab-separated-values,10290,10285,0.0005\nCC-MAIN-2026-08,text/turtle,30040,30037,0.0014\nCC-MAIN-2026-08,text/vcard,24290,24280,0.0011\nCC-MAIN-2026-08,text/x-bibtex,13032,13031,0.0006\nCC-MAIN-2026-08,text/x-c,1773,1772,0.0001\nCC-MAIN-2026-08,text/x-csrc,3005,3005,0.0001\nCC-MAIN-2026-08,text/x-diff,4964,4962,0.0002\nCC-MAIN-2026-08,text/x-patch,5625,5624,0.0003\nCC-MAIN-2026-08,text/x-perl,731,729,0.0000\nCC-MAIN-2026-08,text/x-vcalendar,7424,7423,0.0003\nCC-MAIN-2026-08,text/x-vcard,42705,42697,0.0020\nCC-MAIN-2026-08,text/xml,1347875,1346771,0.0622\nCC-MAIN-2026-08,unknown/unknown,410,410,0.0000\nCC-MAIN-2026-08,video/mp4,149,149,0.0000\nCC-MAIN-2026-08,video/webm,2,2,0.0000\nCC-MAIN-2026-08,video/x-ms-asf,2526,2522,0.0001\nCC-MAIN-2026-12,<other>,1274810,1270416,0.0646\nCC-MAIN-2026-12,application/atom+xml,2983600,2983316,0.1511\nCC-MAIN-2026-12,application/calendar,4073,4073,0.0002\nCC-MAIN-2026-12,application/download,25629,25625,0.0013\nCC-MAIN-2026-12,application/epub+zip,37562,37488,0.0019\
nCC-MAIN-2026-12,application/force-download,148682,148653,0.0075\nCC-MAIN-2026-12,application/gpx+xml,15234,15232,0.0008\nCC-MAIN-2026-12,application/ics,7695,7693,0.0004\nCC-MAIN-2026-12,application/javascript,15798,15789,0.0008\nCC-MAIN-2026-12,application/json,505457,504710,0.0256\nCC-MAIN-2026-12,application/ld+json,27130,27130,0.0014\nCC-MAIN-2026-12,application/marc,6175,6175,0.0003\nCC-MAIN-2026-12,application/msword,46119,45980,0.0023\nCC-MAIN-2026-12,application/octet-stream,961531,961055,0.0487\nCC-MAIN-2026-12,application/octetstream,4836,4836,0.0002\nCC-MAIN-2026-12,application/pdf,15775787,15744182,0.7988\nCC-MAIN-2026-12,application/pgp-encrypted,2315,2315,0.0001\nCC-MAIN-2026-12,application/pgp-signature,32511,32509,0.0016\nCC-MAIN-2026-12,application/postscript,3694,3693,0.0002\nCC-MAIN-2026-12,application/rdf+xml,70228,70202,0.0036\nCC-MAIN-2026-12,application/rss+xml,866675,866250,0.0439\nCC-MAIN-2026-12,application/rtf,13416,13415,0.0007\nCC-MAIN-2026-12,application/save-to-disk,2,2,0.0000\nCC-MAIN-2026-12,application/text,2700,2700,0.0001\nCC-MAIN-2026-12,application/unknown,4125,4125,0.0002\nCC-MAIN-2026-12,application/vnd.android.package-archive,38,38,0.0000\nCC-MAIN-2026-12,application/vnd.google-earth.kml+xml,24381,24374,0.0012\nCC-MAIN-2026-12,application/vnd.google-earth.kmz,9209,9208,0.0005\nCC-MAIN-2026-12,application/vnd.ms-excel,28801,28640,0.0015\nCC-MAIN-2026-12,application/vnd.ms-powerpoint,2533,2531,0.0001\nCC-MAIN-2026-12,application/vnd.ms-word,2518,2518,0.0001\nCC-MAIN-2026-12,application/vnd.oasis.opendocument.text,15049,15042,0.0008\nCC-MAIN-2026-12,application/vnd.openxmlformats-officedocument.presentationml.presentation,5003,4968,0.0003\nCC-MAIN-2026-12,application/vnd.openxmlformats-officedocument.spreadsheetml.sheet,34435,34275,0.0017\nCC-MAIN-2026-12,application/vnd.openxmlformats-officedocument.wordprocessingml.document,54444,54220,0.0028\nCC-MAIN-2026-12,application/vnd.wap.xhtml+xml,19988,19907,0.0010\nCC-MAIN-2026-12,a
pplication/x-bibtex,177492,177413,0.0090\nCC-MAIN-2026-12,application/x-bittorrent,2883,2872,0.0001\nCC-MAIN-2026-12,application/x-debian-package,139,139,0.0000\nCC-MAIN-2026-12,application/x-download,49120,49094,0.0025\nCC-MAIN-2026-12,application/x-endnote-refer,8130,8130,0.0004\nCC-MAIN-2026-12,application/x-gzip,4070,4070,0.0002\nCC-MAIN-2026-12,application/x-httpd-php,6672,6657,0.0003\nCC-MAIN-2026-12,application/x-java-jnlp-file,2263,2263,0.0001\nCC-MAIN-2026-12,application/x-javascript,3675,3671,0.0002\nCC-MAIN-2026-12,application/x-json,65,65,0.0000\nCC-MAIN-2026-12,application/x-mobipocket-ebook,12947,12874,0.0007\nCC-MAIN-2026-12,application/x-msdownload,5992,5991,0.0003\nCC-MAIN-2026-12,application/x-netcdf,6364,6364,0.0003\nCC-MAIN-2026-12,application/x-research-info-systems,230947,230870,0.0117\nCC-MAIN-2026-12,application/x-shockwave-flash,1084,1081,0.0001\nCC-MAIN-2026-12,application/x-tar,1144,1144,0.0001\nCC-MAIN-2026-12,application/x-tex,3112,3112,0.0002\nCC-MAIN-2026-12,application/x-troff-man,6647,6647,0.0003\nCC-MAIN-2026-12,application/x-zip-compressed,360,359,0.0000\nCC-MAIN-2026-12,application/xhtml+xml,214321,213404,0.0109\nCC-MAIN-2026-12,application/xml,524480,523449,0.0266\nCC-MAIN-2026-12,application/zip,2218,2218,0.0001\nCC-MAIN-2026-12,audio/mpeg,2828,2828,0.0001\nCC-MAIN-2026-12,audio/x-mpegurl,11259,11254,0.0006\nCC-MAIN-2026-12,audio/x-scpls,2178,2178,0.0001\nCC-MAIN-2026-12,audio/x-wav,14,14,0.0000\nCC-MAIN-2026-12,binary/octet-stream,9033,9007,0.0005\nCC-MAIN-2026-12,image/gif,6664,6664,0.0003\nCC-MAIN-2026-12,image/jp2,1,1,0.0000\nCC-MAIN-2026-12,image/jpeg,7895,7894,0.0004\nCC-MAIN-2026-12,image/jpg,190,190,0.0000\nCC-MAIN-2026-12,image/pjpeg,5,5,0.0000\nCC-MAIN-2026-12,image/png,8086,8085,0.0004\nCC-MAIN-2026-12,image/svg+xml,54,54,0.0000\nCC-MAIN-2026-12,image/tiff,486,486,0.0000\nCC-MAIN-2026-12,image/vnd.djvu,5295,5295,0.0003\nCC-MAIN-2026-12,image/webp,32,32,0.0000\nCC-MAIN-2026-12,message/rfc822,5046,5046,0.0003\nCC-MAIN-2
026-12,text/calendar,755643,755426,0.0383\nCC-MAIN-2026-12,text/css,11713,11712,0.0006\nCC-MAIN-2026-12,text/csv,62400,62371,0.0032\nCC-MAIN-2026-12,text/directory,4331,4331,0.0002\nCC-MAIN-2026-12,text/enriched,897,897,0.0000\nCC-MAIN-2026-12,text/html,1947091170,1936394530,98.5946\nCC-MAIN-2026-12,text/javascript,7298,7295,0.0004\nCC-MAIN-2026-12,text/markdown,66666,66415,0.0034\nCC-MAIN-2026-12,text/pdf,319,319,0.0000\nCC-MAIN-2026-12,text/plain,1068654,1067209,0.0541\nCC-MAIN-2026-12,text/prs.lines.tag,76100,76097,0.0039\nCC-MAIN-2026-12,text/tab-separated-values,7128,7126,0.0004\nCC-MAIN-2026-12,text/turtle,23368,23367,0.0012\nCC-MAIN-2026-12,text/vcard,24582,24575,0.0012\nCC-MAIN-2026-12,text/x-bibtex,9814,9813,0.0005\nCC-MAIN-2026-12,text/x-c,3870,3870,0.0002\nCC-MAIN-2026-12,text/x-csrc,2279,2279,0.0001\nCC-MAIN-2026-12,text/x-diff,5846,5846,0.0003\nCC-MAIN-2026-12,text/x-patch,5480,5480,0.0003\nCC-MAIN-2026-12,text/x-perl,1453,1453,0.0001\nCC-MAIN-2026-12,text/x-vcalendar,7463,7462,0.0004\nCC-MAIN-2026-12,text/x-vcard,38114,38104,0.0019\nCC-MAIN-2026-12,text/xml,1211449,1210381,0.0613\nCC-MAIN-2026-12,unknown/unknown,635,635,0.0000\nCC-MAIN-2026-12,video/mp4,154,154,0.0000\nCC-MAIN-2026-12,video/x-ms-asf,3034,3025,0.0002\nCC-MAIN-2026-17,<other>,1337047,1326275,0.0610\nCC-MAIN-2026-17,application/atom+xml,3220201,3219876,0.1469\nCC-MAIN-2026-17,application/calendar,4839,4839,0.0002\nCC-MAIN-2026-17,application/download,39013,38992,0.0018\nCC-MAIN-2026-17,application/epub+zip,32914,32894,0.0015\nCC-MAIN-2026-17,application/force-download,161035,161013,0.0073\nCC-MAIN-2026-17,application/gpx+xml,19100,19100,0.0009\nCC-MAIN-2026-17,application/ics,7977,7975,0.0004\nCC-MAIN-2026-17,application/javascript,18559,18554,0.0008\nCC-MAIN-2026-17,application/json,550978,550280,0.0251\nCC-MAIN-2026-17,application/ld+json,32075,32075,0.0015\nCC-MAIN-2026-17,application/marc,6932,6932,0.0003\nCC-MAIN-2026-17,application/msword,54353,54212,0.0025\nCC-MAIN-2026-17,applicat
ion/octet-stream,1028918,1028139,0.0469\nCC-MAIN-2026-17,application/octetstream,4890,4890,0.0002\nCC-MAIN-2026-17,application/pdf,18970262,18937817,0.8655\nCC-MAIN-2026-17,application/pgp-encrypted,1742,1742,0.0001\nCC-MAIN-2026-17,application/pgp-signature,43270,43268,0.0020\nCC-MAIN-2026-17,application/postscript,4017,4017,0.0002\nCC-MAIN-2026-17,application/rdf+xml,68042,67965,0.0031\nCC-MAIN-2026-17,application/rss+xml,916499,915799,0.0418\nCC-MAIN-2026-17,application/rtf,11799,11799,0.0005\nCC-MAIN-2026-17,application/save-to-disk,4,4,0.0000\nCC-MAIN-2026-17,application/text,2845,2845,0.0001\nCC-MAIN-2026-17,application/unknown,4268,4268,0.0002\nCC-MAIN-2026-17,application/vnd.android.package-archive,156,156,0.0000\nCC-MAIN-2026-17,application/vnd.google-earth.kml+xml,24012,24008,0.0011\nCC-MAIN-2026-17,application/vnd.google-earth.kmz,10591,10591,0.0005\nCC-MAIN-2026-17,application/vnd.ms-excel,27006,26859,0.0012\nCC-MAIN-2026-17,application/vnd.ms-powerpoint,3559,3557,0.0002\nCC-MAIN-2026-17,application/vnd.ms-word,2655,2655,0.0001\nCC-MAIN-2026-17,application/vnd.oasis.opendocument.text,16334,16328,0.0007\nCC-MAIN-2026-17,application/vnd.openxmlformats-officedocument.presentationml.presentation,5062,5031,0.0002\nCC-MAIN-2026-17,application/vnd.openxmlformats-officedocument.spreadsheetml.sheet,35123,34779,0.0016\nCC-MAIN-2026-17,application/vnd.openxmlformats-officedocument.wordprocessingml.document,61425,61239,0.0028\nCC-MAIN-2026-17,application/vnd.wap.xhtml+xml,19974,19901,0.0009\nCC-MAIN-2026-17,application/x-bibtex,193026,192948,0.0088\nCC-MAIN-2026-17,application/x-bittorrent,2370,2362,0.0001\nCC-MAIN-2026-17,application/x-debian-package,158,158,0.0000\nCC-MAIN-2026-17,application/x-download,47639,47605,0.0022\nCC-MAIN-2026-17,application/x-endnote-refer,6602,6602,0.0003\nCC-MAIN-2026-17,application/x-gzip,4350,4350,0.0002\nCC-MAIN-2026-17,application/x-httpd-php,7643,7633,0.0003\nCC-MAIN-2026-17,application/x-java-jnlp-file,1797,1797,0.0001\nCC-MAIN-2
026-17,application/x-javascript,3074,3069,0.0001\nCC-MAIN-2026-17,application/x-json,190,190,0.0000\nCC-MAIN-2026-17,application/x-mobipocket-ebook,8170,8165,0.0004\nCC-MAIN-2026-17,application/x-msdownload,5604,5603,0.0003\nCC-MAIN-2026-17,application/x-netcdf,9533,9533,0.0004\nCC-MAIN-2026-17,application/x-research-info-systems,254988,254889,0.0116\nCC-MAIN-2026-17,application/x-shockwave-flash,807,807,0.0000\nCC-MAIN-2026-17,application/x-tar,1410,1410,0.0001\nCC-MAIN-2026-17,application/x-tex,2824,2823,0.0001\nCC-MAIN-2026-17,application/x-troff-man,8778,8774,0.0004\nCC-MAIN-2026-17,application/x-zip-compressed,160,160,0.0000\nCC-MAIN-2026-17,application/xhtml+xml,227199,226255,0.0104\nCC-MAIN-2026-17,application/xml,557737,557038,0.0254\nCC-MAIN-2026-17,application/zip,3310,3309,0.0002\nCC-MAIN-2026-17,audio/mpeg,1883,1882,0.0001\nCC-MAIN-2026-17,audio/x-mpegurl,12593,12588,0.0006\nCC-MAIN-2026-17,audio/x-scpls,2500,2499,0.0001\nCC-MAIN-2026-17,audio/x-wav,7,7,0.0000\nCC-MAIN-2026-17,binary/octet-stream,10996,10988,0.0005\nCC-MAIN-2026-17,image/gif,4371,4370,0.0002\nCC-MAIN-2026-17,image/jpeg,5415,5413,0.0002\nCC-MAIN-2026-17,image/jpg,297,297,0.0000\nCC-MAIN-2026-17,image/pjpeg,12,12,0.0000\nCC-MAIN-2026-17,image/png,2675,2674,0.0001\nCC-MAIN-2026-17,image/svg+xml,43,43,0.0000\nCC-MAIN-2026-17,image/tiff,35,35,0.0000\nCC-MAIN-2026-17,image/vnd.djvu,10677,10672,0.0005\nCC-MAIN-2026-17,image/webp,40,40,0.0000\nCC-MAIN-2026-17,message/rfc822,4685,4685,0.0002\nCC-MAIN-2026-17,text/calendar,775287,772032,0.0354\nCC-MAIN-2026-17,text/css,12955,12953,0.0006\nCC-MAIN-2026-17,text/csv,66291,65186,0.0030\nCC-MAIN-2026-17,text/directory,4333,4333,0.0002\nCC-MAIN-2026-17,text/enriched,934,934,0.0000\nCC-MAIN-2026-17,text/html,2159906781,2147463476,98.5388\nCC-MAIN-2026-17,text/javascript,8201,8182,0.0004\nCC-MAIN-2026-17,text/markdown,653246,650507,0.0298\nCC-MAIN-2026-17,text/pdf,218,218,0.0000\nCC-MAIN-2026-17,text/plain,1062989,1061235,0.0485\nCC-MAIN-2026-17,text/prs.
lines.tag,66488,66487,0.0030\nCC-MAIN-2026-17,text/tab-separated-values,7824,7823,0.0004\nCC-MAIN-2026-17,text/turtle,22789,22787,0.0010\nCC-MAIN-2026-17,text/vcard,26484,26471,0.0012\nCC-MAIN-2026-17,text/x-bibtex,11454,11448,0.0005\nCC-MAIN-2026-17,text/x-c,2784,2781,0.0001\nCC-MAIN-2026-17,text/x-csrc,2912,2912,0.0001\nCC-MAIN-2026-17,text/x-diff,6119,5996,0.0003\nCC-MAIN-2026-17,text/x-patch,5202,5202,0.0002\nCC-MAIN-2026-17,text/x-perl,972,972,0.0000\nCC-MAIN-2026-17,text/x-vcalendar,8283,8282,0.0004\nCC-MAIN-2026-17,text/x-vcard,41910,41894,0.0019\nCC-MAIN-2026-17,text/xml,1086597,1085146,0.0496\nCC-MAIN-2026-17,unknown/unknown,485,485,0.0000\nCC-MAIN-2026-17,video/mp4,220,220,0.0000\nCC-MAIN-2026-17,video/webm,2,2,0.0000\nCC-MAIN-2026-17,video/x-ms-asf,3466,3465,0.0002\n"
  },
  {
    "path": "plots/mimetypes.md",
    "content": "---\nlayout: table\ntable_include:\n - mimetypes-top-100.html\n - mimetypes_detected-top-100.html\ntable_sortlist: \"{sortList: [[3,1]]}\"\ntable_searcher: \"Filter for MIME types\"\n---\n\nMIME Types\n==========\n\nThe crawled content is dominated by HTML pages and contains only a small percentage of other document formats. The tables show the percentage of the top 100 media or MIME types of the latest monthly crawls.\n\nWhile the first table is based the `Content-Type` HTTP header, the second uses the MIME type detected by [Apache Tika](https://tika.apache.org/) based on the actual content. The underlying data including page counts is provided in [mimetypes.csv](./mimetypes.csv) resp. [mimetypes_detected.csv](./mimetypes_detected.csv).\n"
  },
  {
    "path": "plots/mimetypes_detected-top-100.html",
    "content": "<table border=\"1\" class=\"dataframe tablesorter tablepercentage tablesearcher\">\n  <thead>\n    <tr style=\"text-align: right;\">\n      <th>crawl</th>\n      <th>CC-MAIN-2026-08</th>\n      <th>CC-MAIN-2026-12</th>\n      <th>CC-MAIN-2026-17</th>\n    </tr>\n    <tr>\n      <th>mimetype_detected</th>\n      <th></th>\n      <th></th>\n      <th></th>\n    </tr>\n  </thead>\n  <tbody>\n    <tr>\n      <th>&lt;other&gt;</th>\n      <td>0.0114</td>\n      <td>0.0122</td>\n      <td>0.0112</td>\n    </tr>\n    <tr>\n      <th>application/atom+xml</th>\n      <td>0.1476</td>\n      <td>0.1527</td>\n      <td>0.1486</td>\n    </tr>\n    <tr>\n      <th>application/epub+zip</th>\n      <td>0.0020</td>\n      <td>0.0022</td>\n      <td>0.0018</td>\n    </tr>\n    <tr>\n      <th>application/gpx+xml</th>\n      <td>0.0008</td>\n      <td>0.0008</td>\n      <td>0.0009</td>\n    </tr>\n    <tr>\n      <th>application/gzip</th>\n      <td>0.0000</td>\n      <td>0.0000</td>\n      <td>0.0000</td>\n    </tr>\n    <tr>\n      <th>application/javascript</th>\n      <td>0.0010</td>\n      <td>0.0011</td>\n      <td>0.0011</td>\n    </tr>\n    <tr>\n      <th>application/json</th>\n      <td>0.0262</td>\n      <td>0.0258</td>\n      <td>0.0252</td>\n    </tr>\n    <tr>\n      <th>application/marc</th>\n      <td>0.0007</td>\n      <td>0.0007</td>\n      <td>0.0007</td>\n    </tr>\n    <tr>\n      <th>application/mbox</th>\n      <td>0.0012</td>\n      <td>0.0014</td>\n      <td>0.0011</td>\n    </tr>\n    <tr>\n      <th>application/msword</th>\n      <td>0.0018</td>\n      <td>0.0017</td>\n      <td>0.0018</td>\n    </tr>\n    <tr>\n      <th>application/octet-stream</th>\n      <td>0.0164</td>\n      <td>0.0155</td>\n      <td>0.0139</td>\n    </tr>\n    <tr>\n      <th>application/pdf</th>\n      <td>0.7460</td>\n      <td>0.8127</td>\n      <td>0.8794</td>\n    </tr>\n    <tr>\n      <th>application/pgp-signature</th>\n      <td>0.0011</td>\n      
<td>0.0016</td>\n      <td>0.0020</td>\n    </tr>\n    <tr>\n      <th>application/pkcs7-signature</th>\n      <td>0.0003</td>\n      <td>0.0004</td>\n      <td>0.0004</td>\n    </tr>\n    <tr>\n      <th>application/postscript</th>\n      <td>0.0002</td>\n      <td>0.0002</td>\n      <td>0.0001</td>\n    </tr>\n    <tr>\n      <th>application/rdf+xml</th>\n      <td>0.0081</td>\n      <td>0.0074</td>\n      <td>0.0063</td>\n    </tr>\n    <tr>\n      <th>application/rss+xml</th>\n      <td>0.0681</td>\n      <td>0.0684</td>\n      <td>0.0660</td>\n    </tr>\n    <tr>\n      <th>application/rtf</th>\n      <td>0.0013</td>\n      <td>0.0013</td>\n      <td>0.0009</td>\n    </tr>\n    <tr>\n      <th>application/text</th>\n      <td>0.0000</td>\n      <td>0.0000</td>\n      <td>0.0000</td>\n    </tr>\n    <tr>\n      <th>application/vnd.android.package-archive</th>\n      <td>0.0000</td>\n      <td>0.0000</td>\n      <td>0.0000</td>\n    </tr>\n    <tr>\n      <th>application/vnd.google-earth.kml+xml</th>\n      <td>0.0024</td>\n      <td>0.0025</td>\n      <td>0.0024</td>\n    </tr>\n    <tr>\n      <th>application/vnd.google-earth.kmz</th>\n      <td>0.0003</td>\n      <td>0.0005</td>\n      <td>0.0005</td>\n    </tr>\n    <tr>\n      <th>application/vnd.ms-excel</th>\n      <td>0.0008</td>\n      <td>0.0007</td>\n      <td>0.0007</td>\n    </tr>\n    <tr>\n      <th>application/vnd.ms-powerpoint</th>\n      <td>0.0001</td>\n      <td>0.0001</td>\n      <td>0.0002</td>\n    </tr>\n    <tr>\n      <th>application/vnd.oasis.opendocument.spreadsheet</th>\n      <td>0.0004</td>\n      <td>0.0004</td>\n      <td>0.0003</td>\n    </tr>\n    <tr>\n      <th>application/vnd.oasis.opendocument.text</th>\n      <td>0.0008</td>\n      <td>0.0009</td>\n      <td>0.0009</td>\n    </tr>\n    <tr>\n      <th>application/vnd.openxmlformats-officedocument.presentationml.presentation</th>\n      <td>0.0002</td>\n      <td>0.0003</td>\n      <td>0.0002</td>\n    </tr>\n    <tr>\n     
 <th>application/vnd.openxmlformats-officedocument.spreadsheetml.sheet</th>\n      <td>0.0018</td>\n      <td>0.0017</td>\n      <td>0.0016</td>\n    </tr>\n    <tr>\n      <th>application/vnd.openxmlformats-officedocument.wordprocessingml.document</th>\n      <td>0.0025</td>\n      <td>0.0028</td>\n      <td>0.0028</td>\n    </tr>\n    <tr>\n      <th>application/x-bibtex-text-file</th>\n      <td>0.0143</td>\n      <td>0.0143</td>\n      <td>0.0127</td>\n    </tr>\n    <tr>\n      <th>application/x-bittorrent</th>\n      <td>0.0002</td>\n      <td>0.0002</td>\n      <td>0.0002</td>\n    </tr>\n    <tr>\n      <th>application/x-bzip2</th>\n      <td>NaN</td>\n      <td>0.0000</td>\n      <td>NaN</td>\n    </tr>\n    <tr>\n      <th>application/x-endnote-refer</th>\n      <td>0.0016</td>\n      <td>0.0016</td>\n      <td>0.0014</td>\n    </tr>\n    <tr>\n      <th>application/x-mobipocket-ebook</th>\n      <td>0.0007</td>\n      <td>0.0008</td>\n      <td>0.0006</td>\n    </tr>\n    <tr>\n      <th>application/x-ms-asx</th>\n      <td>0.0001</td>\n      <td>0.0002</td>\n      <td>0.0002</td>\n    </tr>\n    <tr>\n      <th>application/x-msdownload</th>\n      <td>0.0000</td>\n      <td>0.0000</td>\n      <td>0.0000</td>\n    </tr>\n    <tr>\n      <th>application/x-pds</th>\n      <td>0.0012</td>\n      <td>0.0012</td>\n      <td>0.0012</td>\n    </tr>\n    <tr>\n      <th>application/x-rar-compressed</th>\n      <td>0.0000</td>\n      <td>NaN</td>\n      <td>0.0000</td>\n    </tr>\n    <tr>\n      <th>application/x-research-info-systems</th>\n      <td>0.0000</td>\n      <td>0.0000</td>\n      <td>0.0000</td>\n    </tr>\n    <tr>\n      <th>application/x-sh</th>\n      <td>0.0007</td>\n      <td>0.0010</td>\n      <td>0.0011</td>\n    </tr>\n    <tr>\n      <th>application/x-shockwave-flash</th>\n      <td>0.0001</td>\n      <td>0.0001</td>\n      <td>0.0000</td>\n    </tr>\n    <tr>\n      <th>application/x-stata-do</th>\n      <td>0.0005</td>\n      
<td>0.0004</td>\n      <td>0.0004</td>\n    </tr>\n    <tr>\n      <th>application/x-tex</th>\n      <td>0.0003</td>\n      <td>0.0003</td>\n      <td>0.0003</td>\n    </tr>\n    <tr>\n      <th>application/x-tex-tfm</th>\n      <td>0.0003</td>\n      <td>0.0003</td>\n      <td>0.0004</td>\n    </tr>\n    <tr>\n      <th>application/x-tika-msoffice</th>\n      <td>0.0023</td>\n      <td>0.0028</td>\n      <td>0.0024</td>\n    </tr>\n    <tr>\n      <th>application/x-tika-ooxml</th>\n      <td>0.0017</td>\n      <td>0.0018</td>\n      <td>0.0019</td>\n    </tr>\n    <tr>\n      <th>application/x-wais-source</th>\n      <td>0.0001</td>\n      <td>0.0001</td>\n      <td>0.0001</td>\n    </tr>\n    <tr>\n      <th>application/xhtml+xml</th>\n      <td>8.4156</td>\n      <td>8.6282</td>\n      <td>8.1569</td>\n    </tr>\n    <tr>\n      <th>application/xml</th>\n      <td>0.0714</td>\n      <td>0.0697</td>\n      <td>0.0584</td>\n    </tr>\n    <tr>\n      <th>application/zip</th>\n      <td>0.0000</td>\n      <td>0.0000</td>\n      <td>0.0000</td>\n    </tr>\n    <tr>\n      <th>application/zlib</th>\n      <td>0.0001</td>\n      <td>0.0002</td>\n      <td>0.0003</td>\n    </tr>\n    <tr>\n      <th>audio/mp4</th>\n      <td>NaN</td>\n      <td>0.0000</td>\n      <td>0.0000</td>\n    </tr>\n    <tr>\n      <th>audio/mpeg</th>\n      <td>0.0000</td>\n      <td>0.0001</td>\n      <td>0.0000</td>\n    </tr>\n    <tr>\n      <th>audio/vnd.wave</th>\n      <td>0.0000</td>\n      <td>0.0000</td>\n      <td>0.0000</td>\n    </tr>\n    <tr>\n      <th>audio/x-mpegurl</th>\n      <td>0.0000</td>\n      <td>0.0000</td>\n      <td>0.0000</td>\n    </tr>\n    <tr>\n      <th>image/gif</th>\n      <td>0.0000</td>\n      <td>0.0000</td>\n      <td>0.0000</td>\n    </tr>\n    <tr>\n      <th>image/jpeg</th>\n      <td>0.0001</td>\n      <td>0.0002</td>\n      <td>0.0001</td>\n    </tr>\n    <tr>\n      <th>image/png</th>\n      <td>0.0000</td>\n      <td>0.0000</td>\n      
<td>0.0000</td>\n    </tr>\n    <tr>\n      <th>image/svg+xml</th>\n      <td>0.0000</td>\n      <td>0.0000</td>\n      <td>0.0000</td>\n    </tr>\n    <tr>\n      <th>image/tiff</th>\n      <td>NaN</td>\n      <td>NaN</td>\n      <td>0.0000</td>\n    </tr>\n    <tr>\n      <th>image/vnd.djvu</th>\n      <td>0.0008</td>\n      <td>0.0004</td>\n      <td>0.0007</td>\n    </tr>\n    <tr>\n      <th>image/webp</th>\n      <td>0.0000</td>\n      <td>0.0000</td>\n      <td>0.0000</td>\n    </tr>\n    <tr>\n      <th>message/rfc822</th>\n      <td>0.0008</td>\n      <td>0.0007</td>\n      <td>0.0007</td>\n    </tr>\n    <tr>\n      <th>text/asp</th>\n      <td>0.0000</td>\n      <td>0.0000</td>\n      <td>NaN</td>\n    </tr>\n    <tr>\n      <th>text/aspdotnet</th>\n      <td>NaN</td>\n      <td>0.0000</td>\n      <td>NaN</td>\n    </tr>\n    <tr>\n      <th>text/calendar</th>\n      <td>0.0449</td>\n      <td>0.0456</td>\n      <td>0.0424</td>\n    </tr>\n    <tr>\n      <th>text/css</th>\n      <td>0.0006</td>\n      <td>0.0006</td>\n      <td>0.0006</td>\n    </tr>\n    <tr>\n      <th>text/csv</th>\n      <td>0.0034</td>\n      <td>0.0032</td>\n      <td>0.0030</td>\n    </tr>\n    <tr>\n      <th>text/html</th>\n      <td>90.2830</td>\n      <td>89.9924</td>\n      <td>90.4072</td>\n    </tr>\n    <tr>\n      <th>text/markdown</th>\n      <td>0.0003</td>\n      <td>0.0024</td>\n      <td>0.0284</td>\n    </tr>\n    <tr>\n      <th>text/plain</th>\n      <td>0.0871</td>\n      <td>0.0898</td>\n      <td>0.0832</td>\n    </tr>\n    <tr>\n      <th>text/prs.lines.tag</th>\n      <td>0.0049</td>\n      <td>0.0067</td>\n      <td>0.0054</td>\n    </tr>\n    <tr>\n      <th>text/tab-separated-values</th>\n      <td>0.0005</td>\n      <td>0.0004</td>\n      <td>0.0004</td>\n    </tr>\n    <tr>\n      <th>text/troff</th>\n      <td>0.0005</td>\n      <td>0.0005</td>\n      <td>0.0005</td>\n    </tr>\n    <tr>\n      <th>text/turtle</th>\n      <td>0.0014</td>\n      
<td>0.0012</td>\n      <td>0.0010</td>\n    </tr>\n    <tr>\n      <th>text/vtt</th>\n      <td>0.0009</td>\n      <td>0.0008</td>\n      <td>0.0008</td>\n    </tr>\n    <tr>\n      <th>text/x-c++src</th>\n      <td>0.0002</td>\n      <td>0.0002</td>\n      <td>0.0001</td>\n    </tr>\n    <tr>\n      <th>text/x-chdr</th>\n      <td>0.0006</td>\n      <td>0.0006</td>\n      <td>0.0005</td>\n    </tr>\n    <tr>\n      <th>text/x-csrc</th>\n      <td>0.0005</td>\n      <td>0.0007</td>\n      <td>0.0006</td>\n    </tr>\n    <tr>\n      <th>text/x-diff</th>\n      <td>0.0011</td>\n      <td>0.0010</td>\n      <td>0.0009</td>\n    </tr>\n    <tr>\n      <th>text/x-jsp</th>\n      <td>0.0001</td>\n      <td>0.0001</td>\n      <td>0.0001</td>\n    </tr>\n    <tr>\n      <th>text/x-log</th>\n      <td>0.0017</td>\n      <td>0.0016</td>\n      <td>0.0016</td>\n    </tr>\n    <tr>\n      <th>text/x-matlab</th>\n      <td>0.0010</td>\n      <td>0.0010</td>\n      <td>0.0013</td>\n    </tr>\n    <tr>\n      <th>text/x-perl</th>\n      <td>0.0012</td>\n      <td>0.0013</td>\n      <td>0.0008</td>\n    </tr>\n    <tr>\n      <th>text/x-php</th>\n      <td>0.0032</td>\n      <td>0.0033</td>\n      <td>0.0034</td>\n    </tr>\n    <tr>\n      <th>text/x-python</th>\n      <td>0.0003</td>\n      <td>0.0004</td>\n      <td>0.0003</td>\n    </tr>\n    <tr>\n      <th>text/x-vcalendar</th>\n      <td>0.0004</td>\n      <td>0.0004</td>\n      <td>0.0004</td>\n    </tr>\n    <tr>\n      <th>text/x-vcard</th>\n      <td>0.0036</td>\n      <td>0.0037</td>\n      <td>0.0036</td>\n    </tr>\n    <tr>\n      <th>text/x-web-markdown</th>\n      <td>0.0014</td>\n      <td>0.0013</td>\n      <td>0.0019</td>\n    </tr>\n    <tr>\n      <th>text/x-yaml</th>\n      <td>0.0003</td>\n      <td>0.0004</td>\n      <td>0.0004</td>\n    </tr>\n    <tr>\n      <th>video/mp4</th>\n      <td>0.0000</td>\n      <td>0.0000</td>\n      <td>0.0000</td>\n    </tr>\n    <tr>\n      <th>video/quicktime</th>\n      
<td>0.0000</td>\n      <td>NaN</td>\n      <td>0.0000</td>\n    </tr>\n    <tr>\n      <th>video/webm</th>\n      <td>NaN</td>\n      <td>NaN</td>\n      <td>0.0000</td>\n    </tr>\n  </tbody>\n</table>"
  },
  {
    "path": "plots/mimetypes_detected.csv",
    "content": "crawl,mimetype_detected,pages,urls,%pages/crawl\nCC-MAIN-2008-2009,<unknown>,1798158091,1798158091,100.0000\nCC-MAIN-2009-2010,<unknown>,2863495211,2863495211,100.0000\nCC-MAIN-2012,<unknown>,3828539877,3828539877,100.0000\nCC-MAIN-2013-20,<unknown>,1796098643,1796098643,100.0000\nCC-MAIN-2013-48,<unknown>,2245773667,2245773667,100.0000\nCC-MAIN-2014-10,<unknown>,2301223474,2301223474,100.0000\nCC-MAIN-2014-15,<unknown>,2641371316,2641371316,100.0000\nCC-MAIN-2014-23,<unknown>,3608720876,3608720876,100.0000\nCC-MAIN-2014-35,<unknown>,2870692423,2870692423,100.0000\nCC-MAIN-2014-41,<unknown>,2979743543,2979743543,100.0000\nCC-MAIN-2014-42,<unknown>,3722131678,3722131678,100.0000\nCC-MAIN-2014-49,<unknown>,1948510433,1948510433,100.0000\nCC-MAIN-2014-52,<unknown>,2085977207,2085977207,100.0000\nCC-MAIN-2015-06,<unknown>,1826024103,1826024103,100.0000\nCC-MAIN-2015-11,<unknown>,1837196089,1837196089,100.0000\nCC-MAIN-2015-14,<unknown>,1646697534,1646697534,100.0000\nCC-MAIN-2015-18,<unknown>,2115818059,2115818059,100.0000\nCC-MAIN-2015-22,<unknown>,2015461448,2015461448,100.0000\nCC-MAIN-2015-27,<unknown>,1675619098,1675619098,100.0000\nCC-MAIN-2015-32,<unknown>,1815492409,1815492409,100.0000\nCC-MAIN-2015-35,<unknown>,1848022475,1848022475,100.0000\nCC-MAIN-2015-40,<unknown>,1321987379,1321987379,100.0000\nCC-MAIN-2015-48,<unknown>,1824170527,1824170527,100.0000\nCC-MAIN-2016-07,<unknown>,1733285122,1733285122,100.0000\nCC-MAIN-2016-18,<unknown>,1335046923,1335046923,100.0000\nCC-MAIN-2016-22,<unknown>,1466220798,1466220798,100.0000\nCC-MAIN-2016-26,<unknown>,1236815660,1236815660,100.0000\nCC-MAIN-2016-30,<unknown>,1737322304,1737322304,100.0000\nCC-MAIN-2016-36,<unknown>,1611613090,1611613090,100.0000\nCC-MAIN-2016-40,<unknown>,1722656393,1722656393,100.0000\nCC-MAIN-2016-44,<unknown>,3254976731,3254976731,100.0000\nCC-MAIN-2016-50,<unknown>,2866282390,2866282390,100.0000\nCC-MAIN-2017-04,<unknown>,3146498026,3146498026,100.0000\nCC-MAIN-2017-09,<unk
nown>,3084366662,3084366662,100.0000\nCC-MAIN-2017-13,<unknown>,3070720576,3070720576,100.0000\nCC-MAIN-2017-17,<unknown>,2942930482,2942930482,100.0000\nCC-MAIN-2017-22,<other>,425893,424355,0.0144\nCC-MAIN-2017-22,application/atom+xml,7779924,7768743,0.2622\nCC-MAIN-2017-22,application/epub+zip,31786,31585,0.0011\nCC-MAIN-2017-22,application/gpx+xml,1824,1824,0.0001\nCC-MAIN-2017-22,application/gzip,79412,77667,0.0027\nCC-MAIN-2017-22,application/javascript,21186,21171,0.0007\nCC-MAIN-2017-22,application/json,133337,133112,0.0045\nCC-MAIN-2017-22,application/marc,17141,17141,0.0006\nCC-MAIN-2017-22,application/mbox,45942,45923,0.0015\nCC-MAIN-2017-22,application/msword,99138,98298,0.0033\nCC-MAIN-2017-22,application/octet-stream,490408,485460,0.0165\nCC-MAIN-2017-22,application/pdf,18034750,17982913,0.6078\nCC-MAIN-2017-22,application/pgp-signature,22857,22854,0.0008\nCC-MAIN-2017-22,application/pkcs7-signature,3078,3075,0.0001\nCC-MAIN-2017-22,application/postscript,24467,24448,0.0008\nCC-MAIN-2017-22,application/rdf+xml,395450,395047,0.0133\nCC-MAIN-2017-22,application/rss+xml,6158592,6122971,0.2075\nCC-MAIN-2017-22,application/rtf,17323,17276,0.0006\nCC-MAIN-2017-22,application/text,10206,10201,0.0003\nCC-MAIN-2017-22,application/vnd.android.package-archive,25468,25428,0.0009\nCC-MAIN-2017-22,application/vnd.google-earth.kml+xml,59819,59314,0.0020\nCC-MAIN-2017-22,application/vnd.google-earth.kmz,12042,12029,0.0004\nCC-MAIN-2017-22,application/vnd.ms-excel,22739,22427,0.0008\nCC-MAIN-2017-22,application/vnd.ms-powerpoint,18838,18541,0.0006\nCC-MAIN-2017-22,application/vnd.oasis.opendocument.spreadsheet,1782,1777,0.0001\nCC-MAIN-2017-22,application/vnd.oasis.opendocument.text,8107,8093,0.0003\nCC-MAIN-2017-22,application/vnd.openxmlformats-officedocument.presentationml.presentation,4324,4305,0.0001\nCC-MAIN-2017-22,application/vnd.openxmlformats-officedocument.spreadsheetml.sheet,8403,8161,0.0003\nCC-MAIN-2017-22,application/vnd.openxmlformats-officedocument.wor
dprocessingml.document,22955,22565,0.0008\nCC-MAIN-2017-22,application/x-bibtex-text-file,43624,43492,0.0015\nCC-MAIN-2017-22,application/x-bittorrent,5957,5853,0.0002\nCC-MAIN-2017-22,application/x-bzip2,7353,7335,0.0002\nCC-MAIN-2017-22,application/x-dosexec,15528,15401,0.0005\nCC-MAIN-2017-22,application/x-endnote-refer,14735,14734,0.0005\nCC-MAIN-2017-22,application/x-hdf,91,91,0.0000\nCC-MAIN-2017-22,application/x-mobipocket-ebook,13360,13295,0.0005\nCC-MAIN-2017-22,application/x-ms-asx,21359,21262,0.0007\nCC-MAIN-2017-22,application/x-msdownload,7292,7217,0.0002\nCC-MAIN-2017-22,application/x-rar-compressed,11173,11149,0.0004\nCC-MAIN-2017-22,application/x-research-info-systems,46091,46072,0.0016\nCC-MAIN-2017-22,application/x-sh,8893,8794,0.0003\nCC-MAIN-2017-22,application/x-shockwave-flash,20758,20696,0.0007\nCC-MAIN-2017-22,application/x-stata-do,1380,1378,0.0000\nCC-MAIN-2017-22,application/x-tex,6590,6537,0.0002\nCC-MAIN-2017-22,application/x-tex-tfm,759,759,0.0000\nCC-MAIN-2017-22,application/x-tika-msoffice,27838,27785,0.0009\nCC-MAIN-2017-22,application/x-tika-ooxml,13921,13888,0.0005\nCC-MAIN-2017-22,application/x-wais-source,4998,4998,0.0002\nCC-MAIN-2017-22,application/x-xz,37312,37290,0.0013\nCC-MAIN-2017-22,application/xhtml+xml,896923790,887538932,30.2270\nCC-MAIN-2017-22,application/xml,1419859,1414249,0.0479\nCC-MAIN-2017-22,application/zip,173362,172162,0.0058\nCC-MAIN-2017-22,application/zlib,786,775,0.0000\nCC-MAIN-2017-22,audio/mp4,19020,19001,0.0006\nCC-MAIN-2017-22,audio/mpeg,137354,136647,0.0046\nCC-MAIN-2017-22,audio/x-mpegurl,45126,45119,0.0015\nCC-MAIN-2017-22,image/gif,131365,130916,0.0044\nCC-MAIN-2017-22,image/jpeg,4633840,4630130,0.1562\nCC-MAIN-2017-22,image/png,1352618,1350932,0.0456\nCC-MAIN-2017-22,image/svg+xml,4481,4470,0.0002\nCC-MAIN-2017-22,image/tiff,34525,34095,0.0012\nCC-MAIN-2017-22,image/vnd.djvu,34253,34192,0.0012\nCC-MAIN-2017-22,image/vnd.dxf; 
format=ascii,1936,1936,0.0001\nCC-MAIN-2017-22,image/webp,9381,9352,0.0003\nCC-MAIN-2017-22,message/rfc822,56842,56348,0.0019\nCC-MAIN-2017-22,text/asp,1041567,1039810,0.0351\nCC-MAIN-2017-22,text/aspdotnet,544307,541368,0.0183\nCC-MAIN-2017-22,text/calendar,323606,323035,0.0109\nCC-MAIN-2017-22,text/css,6117,6101,0.0002\nCC-MAIN-2017-22,text/csv,22460,22440,0.0008\nCC-MAIN-2017-22,text/html,2020375643,1981618517,68.0882\nCC-MAIN-2017-22,text/plain,1151678,1146421,0.0388\nCC-MAIN-2017-22,text/prs.lines.tag,1369,1369,0.0000\nCC-MAIN-2017-22,text/tab-separated-values,14562,14555,0.0005\nCC-MAIN-2017-22,text/troff,5858,5857,0.0002\nCC-MAIN-2017-22,text/turtle,14368,14366,0.0005\nCC-MAIN-2017-22,text/vtt,74,74,0.0000\nCC-MAIN-2017-22,text/x-c++src,3100,2936,0.0001\nCC-MAIN-2017-22,text/x-cgi,458874,455098,0.0155\nCC-MAIN-2017-22,text/x-chdr,4358,4245,0.0001\nCC-MAIN-2017-22,text/x-coldfusion,306499,305828,0.0103\nCC-MAIN-2017-22,text/x-csrc,8604,8513,0.0003\nCC-MAIN-2017-22,text/x-diff,17300,17103,0.0006\nCC-MAIN-2017-22,text/x-jsp,435699,371105,0.0147\nCC-MAIN-2017-22,text/x-log,11655,11650,0.0004\nCC-MAIN-2017-22,text/x-matlab,15572,15544,0.0005\nCC-MAIN-2017-22,text/x-perl,75433,75345,0.0025\nCC-MAIN-2017-22,text/x-php,3100427,3089755,0.1045\nCC-MAIN-2017-22,text/x-python,5534,5490,0.0002\nCC-MAIN-2017-22,text/x-vcalendar,6844,6635,0.0002\nCC-MAIN-2017-22,text/x-vcard,28404,28070,0.0010\nCC-MAIN-2017-22,text/x-web-markdown,1805,1802,0.0001\nCC-MAIN-2017-22,text/x-yaml,123,123,0.0000\nCC-MAIN-2017-22,video/mp4,20295,20265,0.0007\nCC-MAIN-2017-22,video/quicktime,6848,6834,0.0002\nCC-MAIN-2017-22,video/webm,9692,9690,0.0003\nCC-MAIN-2017-22,video/x-m4v,10283,10277,0.0003\nCC-MAIN-2017-26,<other>,436245,435708,0.0138\nCC-MAIN-2017-26,application/atom+xml,11726061,11706819,0.3705\nCC-MAIN-2017-26,application/epub+zip,30826,30759,0.0010\nCC-MAIN-2017-26,application/gpx+xml,2420,2420,0.0001\nCC-MAIN-2017-26,application/gzip,115220,112536,0.0036\nCC-MAIN-2017-26,application/
javascript,30413,30398,0.0010\nCC-MAIN-2017-26,application/json,153699,153457,0.0049\nCC-MAIN-2017-26,application/marc,16197,16197,0.0005\nCC-MAIN-2017-26,application/mbox,65477,65466,0.0021\nCC-MAIN-2017-26,application/msword,74908,74599,0.0024\nCC-MAIN-2017-26,application/octet-stream,236988,236063,0.0075\nCC-MAIN-2017-26,application/pdf,22997250,22961604,0.7266\nCC-MAIN-2017-26,application/pgp-signature,19994,19962,0.0006\nCC-MAIN-2017-26,application/pkcs7-signature,2682,2680,0.0001\nCC-MAIN-2017-26,application/postscript,22274,22257,0.0007\nCC-MAIN-2017-26,application/rdf+xml,553737,552465,0.0175\nCC-MAIN-2017-26,application/rss+xml,7517436,7490497,0.2375\nCC-MAIN-2017-26,application/rtf,22873,22858,0.0007\nCC-MAIN-2017-26,application/text,9846,9843,0.0003\nCC-MAIN-2017-26,application/vnd.android.package-archive,39457,39378,0.0012\nCC-MAIN-2017-26,application/vnd.google-earth.kml+xml,62003,61940,0.0020\nCC-MAIN-2017-26,application/vnd.google-earth.kmz,13847,13843,0.0004\nCC-MAIN-2017-26,application/vnd.ms-excel,22127,22056,0.0007\nCC-MAIN-2017-26,application/vnd.ms-powerpoint,19695,19649,0.0006\nCC-MAIN-2017-26,application/vnd.oasis.opendocument.spreadsheet,1977,1977,0.0001\nCC-MAIN-2017-26,application/vnd.oasis.opendocument.text,8569,8568,0.0003\nCC-MAIN-2017-26,application/vnd.openxmlformats-officedocument.presentationml.presentation,5683,5678,0.0002\nCC-MAIN-2017-26,application/vnd.openxmlformats-officedocument.spreadsheetml.sheet,8808,8770,0.0003\nCC-MAIN-2017-26,application/vnd.openxmlformats-officedocument.wordprocessingml.document,24098,23914,0.0008\nCC-MAIN-2017-26,application/x-bibtex-text-file,26238,26190,0.0008\nCC-MAIN-2017-26,application/x-bittorrent,5456,5451,0.0002\nCC-MAIN-2017-26,application/x-bzip2,9029,8853,0.0003\nCC-MAIN-2017-26,application/x-dosexec,15718,15387,0.0005\nCC-MAIN-2017-26,application/x-endnote-refer,11350,11348,0.0004\nCC-MAIN-2017-26,application/x-hdf,198,198,0.0000\nCC-MAIN-2017-26,application/x-mobipocket-ebook,11026,11000,0
.0003\nCC-MAIN-2017-26,application/x-ms-asx,18306,18281,0.0006\nCC-MAIN-2017-26,application/x-msdownload,6907,6812,0.0002\nCC-MAIN-2017-26,application/x-rar-compressed,14709,14578,0.0005\nCC-MAIN-2017-26,application/x-research-info-systems,30893,30890,0.0010\nCC-MAIN-2017-26,application/x-sh,21438,21380,0.0007\nCC-MAIN-2017-26,application/x-shockwave-flash,22527,22465,0.0007\nCC-MAIN-2017-26,application/x-stata-do,1038,1035,0.0000\nCC-MAIN-2017-26,application/x-tex,3387,3384,0.0001\nCC-MAIN-2017-26,application/x-tex-tfm,233,233,0.0000\nCC-MAIN-2017-26,application/x-tika-msoffice,34120,34079,0.0011\nCC-MAIN-2017-26,application/x-tika-ooxml,17597,17569,0.0006\nCC-MAIN-2017-26,application/x-wais-source,4262,4262,0.0001\nCC-MAIN-2017-26,application/x-xz,38920,38847,0.0012\nCC-MAIN-2017-26,application/xhtml+xml,1003165441,996351958,31.6934\nCC-MAIN-2017-26,application/xml,1013265,1010451,0.0320\nCC-MAIN-2017-26,application/zip,170414,169923,0.0054\nCC-MAIN-2017-26,application/zlib,2343,2324,0.0001\nCC-MAIN-2017-26,audio/mp4,30421,30364,0.0010\nCC-MAIN-2017-26,audio/mpeg,157503,156793,0.0050\nCC-MAIN-2017-26,audio/x-mpegurl,42186,42169,0.0013\nCC-MAIN-2017-26,image/gif,133652,133396,0.0042\nCC-MAIN-2017-26,image/jpeg,4946296,4944274,0.1563\nCC-MAIN-2017-26,image/png,897731,897231,0.0284\nCC-MAIN-2017-26,image/svg+xml,3752,3747,0.0001\nCC-MAIN-2017-26,image/tiff,27646,27620,0.0009\nCC-MAIN-2017-26,image/vnd.djvu,31413,31398,0.0010\nCC-MAIN-2017-26,image/vnd.dxf; 
format=ascii,4829,4829,0.0002\nCC-MAIN-2017-26,image/webp,2858,2823,0.0001\nCC-MAIN-2017-26,message/rfc822,31171,31152,0.0010\nCC-MAIN-2017-26,text/asp,694674,693419,0.0219\nCC-MAIN-2017-26,text/aspdotnet,197023,196570,0.0062\nCC-MAIN-2017-26,text/calendar,341362,341192,0.0108\nCC-MAIN-2017-26,text/css,8784,8780,0.0003\nCC-MAIN-2017-26,text/csv,12835,12765,0.0004\nCC-MAIN-2017-26,text/html,2105181099,2081107184,66.5099\nCC-MAIN-2017-26,text/plain,768672,767043,0.0243\nCC-MAIN-2017-26,text/prs.lines.tag,1445,1436,0.0000\nCC-MAIN-2017-26,text/tab-separated-values,4892,4892,0.0002\nCC-MAIN-2017-26,text/troff,3011,3010,0.0001\nCC-MAIN-2017-26,text/turtle,22365,22364,0.0007\nCC-MAIN-2017-26,text/vtt,1297,1297,0.0000\nCC-MAIN-2017-26,text/x-c++src,2351,2337,0.0001\nCC-MAIN-2017-26,text/x-cgi,43889,43626,0.0014\nCC-MAIN-2017-26,text/x-chdr,3240,3231,0.0001\nCC-MAIN-2017-26,text/x-coldfusion,208194,207533,0.0066\nCC-MAIN-2017-26,text/x-csrc,9823,9821,0.0003\nCC-MAIN-2017-26,text/x-diff,11725,11712,0.0004\nCC-MAIN-2017-26,text/x-jsp,141767,128812,0.0045\nCC-MAIN-2017-26,text/x-log,13609,13609,0.0004\nCC-MAIN-2017-26,text/x-matlab,16330,16322,0.0005\nCC-MAIN-2017-26,text/x-perl,32511,32476,0.0010\nCC-MAIN-2017-26,text/x-php,2183733,2177512,0.0690\nCC-MAIN-2017-26,text/x-python,4450,4442,0.0001\nCC-MAIN-2017-26,text/x-vcalendar,5318,5317,0.0002\nCC-MAIN-2017-26,text/x-vcard,41876,41811,0.0013\nCC-MAIN-2017-26,text/x-web-markdown,1911,1910,0.0001\nCC-MAIN-2017-26,text/x-yaml,227,227,0.0000\nCC-MAIN-2017-26,video/mp4,24227,24199,0.0008\nCC-MAIN-2017-26,video/quicktime,7271,7244,0.0002\nCC-MAIN-2017-26,video/webm,12798,12795,0.0004\nCC-MAIN-2017-26,video/x-m4v,16294,16281,0.0005\nCC-MAIN-2017-30,<other>,849850,848982,0.0294\nCC-MAIN-2017-30,application/atom+xml,9050774,9046147,0.3129\nCC-MAIN-2017-30,application/epub+zip,47901,47441,0.0017\nCC-MAIN-2017-30,application/gpx+xml,2947,2947,0.0001\nCC-MAIN-2017-30,application/gzip,132149,131007,0.0046\nCC-MAIN-2017-30,application/java
script,78232,78166,0.0027\nCC-MAIN-2017-30,application/json,367228,367064,0.0127\nCC-MAIN-2017-30,application/marc,12154,12154,0.0004\nCC-MAIN-2017-30,application/mbox,198532,198526,0.0069\nCC-MAIN-2017-30,application/msword,166034,164612,0.0057\nCC-MAIN-2017-30,application/octet-stream,763883,762296,0.0264\nCC-MAIN-2017-30,application/pdf,22153905,22090556,0.7660\nCC-MAIN-2017-30,application/pgp-signature,42352,42346,0.0015\nCC-MAIN-2017-30,application/pkcs7-signature,6168,6168,0.0002\nCC-MAIN-2017-30,application/postscript,28912,28883,0.0010\nCC-MAIN-2017-30,application/rdf+xml,489116,488850,0.0169\nCC-MAIN-2017-30,application/rss+xml,6998910,6939347,0.2420\nCC-MAIN-2017-30,application/rtf,31210,30889,0.0011\nCC-MAIN-2017-30,application/text,14658,14656,0.0005\nCC-MAIN-2017-30,application/vnd.android.package-archive,23047,22867,0.0008\nCC-MAIN-2017-30,application/vnd.google-earth.kml+xml,231054,230219,0.0080\nCC-MAIN-2017-30,application/vnd.google-earth.kmz,42871,42867,0.0015\nCC-MAIN-2017-30,application/vnd.ms-excel,38981,37964,0.0013\nCC-MAIN-2017-30,application/vnd.ms-powerpoint,27176,27092,0.0009\nCC-MAIN-2017-30,application/vnd.oasis.opendocument.spreadsheet,2163,2158,0.0001\nCC-MAIN-2017-30,application/vnd.oasis.opendocument.text,10960,10947,0.0004\nCC-MAIN-2017-30,application/vnd.openxmlformats-officedocument.presentationml.presentation,16212,16161,0.0006\nCC-MAIN-2017-30,application/vnd.openxmlformats-officedocument.spreadsheetml.sheet,23491,23432,0.0008\nCC-MAIN-2017-30,application/vnd.openxmlformats-officedocument.wordprocessingml.document,42582,41818,0.0015\nCC-MAIN-2017-30,application/x-bibtex-text-file,75883,75833,0.0026\nCC-MAIN-2017-30,application/x-bittorrent,5140,5134,0.0002\nCC-MAIN-2017-30,application/x-bzip2,8962,8948,0.0003\nCC-MAIN-2017-30,application/x-dosexec,34121,33969,0.0012\nCC-MAIN-2017-30,application/x-endnote-refer,22866,22854,0.0008\nCC-MAIN-2017-30,application/x-hdf,12025,12025,0.0004\nCC-MAIN-2017-30,application/x-mobipocket-ebook
,17396,17232,0.0006\nCC-MAIN-2017-30,application/x-ms-asx,49610,49587,0.0017\nCC-MAIN-2017-30,application/x-msdownload,53046,52887,0.0018\nCC-MAIN-2017-30,application/x-rar-compressed,13529,13409,0.0005\nCC-MAIN-2017-30,application/x-research-info-systems,52232,52202,0.0018\nCC-MAIN-2017-30,application/x-sh,40707,40623,0.0014\nCC-MAIN-2017-30,application/x-shockwave-flash,45047,44928,0.0016\nCC-MAIN-2017-30,application/x-stata-do,4041,4036,0.0001\nCC-MAIN-2017-30,application/x-tex,19931,19927,0.0007\nCC-MAIN-2017-30,application/x-tex-tfm,2551,2551,0.0001\nCC-MAIN-2017-30,application/x-tika-msoffice,48942,48902,0.0017\nCC-MAIN-2017-30,application/x-tika-ooxml,31910,30983,0.0011\nCC-MAIN-2017-30,application/x-wais-source,605,605,0.0000\nCC-MAIN-2017-30,application/x-xz,46176,46151,0.0016\nCC-MAIN-2017-30,application/xhtml+xml,846401467,837380297,29.2648\nCC-MAIN-2017-30,application/xml,1524317,1516867,0.0527\nCC-MAIN-2017-30,application/zip,230884,230477,0.0080\nCC-MAIN-2017-30,application/zlib,1992,1979,0.0001\nCC-MAIN-2017-30,audio/mp4,21740,21695,0.0008\nCC-MAIN-2017-30,audio/mpeg,152037,151698,0.0053\nCC-MAIN-2017-30,audio/vnd.wave,54150,54150,0.0019\nCC-MAIN-2017-30,audio/x-mpegurl,51423,51407,0.0018\nCC-MAIN-2017-30,image/gif,1072559,1070055,0.0371\nCC-MAIN-2017-30,image/jpeg,13479565,13465889,0.4661\nCC-MAIN-2017-30,image/png,3129597,3128262,0.1082\nCC-MAIN-2017-30,image/svg+xml,15209,15205,0.0005\nCC-MAIN-2017-30,image/tiff,24813,24770,0.0009\nCC-MAIN-2017-30,image/vnd.djvu,36744,36701,0.0013\nCC-MAIN-2017-30,image/vnd.dxf; 
format=ascii,6636,6376,0.0002\nCC-MAIN-2017-30,image/webp,34088,34079,0.0012\nCC-MAIN-2017-30,message/rfc822,199939,199907,0.0069\nCC-MAIN-2017-30,text/asp,972082,968466,0.0336\nCC-MAIN-2017-30,text/aspdotnet,799061,797331,0.0276\nCC-MAIN-2017-30,text/calendar,502013,500369,0.0174\nCC-MAIN-2017-30,text/css,31645,31604,0.0011\nCC-MAIN-2017-30,text/csv,62428,62110,0.0022\nCC-MAIN-2017-30,text/html,1971077660,1933434877,68.1512\nCC-MAIN-2017-30,text/markdown,1,1,0.0000\nCC-MAIN-2017-30,text/plain,2598214,2594438,0.0898\nCC-MAIN-2017-30,text/prs.lines.tag,10307,10307,0.0004\nCC-MAIN-2017-30,text/tab-separated-values,51355,51351,0.0018\nCC-MAIN-2017-30,text/troff,94971,94931,0.0033\nCC-MAIN-2017-30,text/turtle,14959,14959,0.0005\nCC-MAIN-2017-30,text/vtt,442,442,0.0000\nCC-MAIN-2017-30,text/x-c++src,37725,37626,0.0013\nCC-MAIN-2017-30,text/x-cgi,90082,89213,0.0031\nCC-MAIN-2017-30,text/x-chdr,91818,91608,0.0032\nCC-MAIN-2017-30,text/x-coldfusion,863180,862306,0.0298\nCC-MAIN-2017-30,text/x-csrc,117869,117687,0.0041\nCC-MAIN-2017-30,text/x-diff,72960,72928,0.0025\nCC-MAIN-2017-30,text/x-jsp,339800,336922,0.0117\nCC-MAIN-2017-30,text/x-log,26195,26193,0.0009\nCC-MAIN-2017-30,text/x-matlab,56634,56627,0.0020\nCC-MAIN-2017-30,text/x-perl,186689,186598,0.0065\nCC-MAIN-2017-30,text/x-php,5059338,5049256,0.1749\nCC-MAIN-2017-30,text/x-python,13057,13051,0.0005\nCC-MAIN-2017-30,text/x-vcalendar,21047,20882,0.0007\nCC-MAIN-2017-30,text/x-vcard,45550,45472,0.0016\nCC-MAIN-2017-30,text/x-web-markdown,3923,3923,0.0001\nCC-MAIN-2017-30,text/x-yaml,522,522,0.0000\nCC-MAIN-2017-30,video/mp4,31278,31243,0.0011\nCC-MAIN-2017-30,video/quicktime,7103,7099,0.0002\nCC-MAIN-2017-30,video/webm,8490,8472,0.0003\nCC-MAIN-2017-30,video/x-m4v,9922,9919,0.0003\nCC-MAIN-2017-34,<other>,305046,304544,0.0093\nCC-MAIN-2017-34,application/atom+xml,12389543,12380604,0.3777\nCC-MAIN-2017-34,application/epub+zip,38434,38197,0.0012\nCC-MAIN-2017-34,application/gpx+xml,1776,1776,0.0001\nCC-MAIN-2017-34,appli
cation/gzip,115728,113785,0.0035\nCC-MAIN-2017-34,application/javascript,32295,32277,0.0010\nCC-MAIN-2017-34,application/json,143790,143718,0.0044\nCC-MAIN-2017-34,application/marc,16208,16208,0.0005\nCC-MAIN-2017-34,application/mbox,53497,53495,0.0016\nCC-MAIN-2017-34,application/msword,81395,81166,0.0025\nCC-MAIN-2017-34,application/octet-stream,184569,183762,0.0056\nCC-MAIN-2017-34,application/pdf,19114561,19091586,0.5827\nCC-MAIN-2017-34,application/pgp-signature,6988,6746,0.0002\nCC-MAIN-2017-34,application/pkcs7-signature,1213,1213,0.0000\nCC-MAIN-2017-34,application/postscript,10968,10963,0.0003\nCC-MAIN-2017-34,application/rdf+xml,425455,425245,0.0130\nCC-MAIN-2017-34,application/rss+xml,6633147,6621743,0.2022\nCC-MAIN-2017-34,application/rtf,12054,12046,0.0004\nCC-MAIN-2017-34,application/text,2559,2559,0.0001\nCC-MAIN-2017-34,application/vnd.android.package-archive,66301,66191,0.0020\nCC-MAIN-2017-34,application/vnd.google-earth.kml+xml,77899,77894,0.0024\nCC-MAIN-2017-34,application/vnd.google-earth.kmz,11089,11086,0.0003\nCC-MAIN-2017-34,application/vnd.ms-excel,24725,23804,0.0008\nCC-MAIN-2017-34,application/vnd.ms-powerpoint,19226,19219,0.0006\nCC-MAIN-2017-34,application/vnd.oasis.opendocument.spreadsheet,1550,1549,0.0000\nCC-MAIN-2017-34,application/vnd.oasis.opendocument.text,7311,7310,0.0002\nCC-MAIN-2017-34,application/vnd.openxmlformats-officedocument.presentationml.presentation,5291,5279,0.0002\nCC-MAIN-2017-34,application/vnd.openxmlformats-officedocument.spreadsheetml.sheet,10374,10346,0.0003\nCC-MAIN-2017-34,application/vnd.openxmlformats-officedocument.wordprocessingml.document,25057,24848,0.0008\nCC-MAIN-2017-34,application/x-bibtex-text-file,14495,14487,0.0004\nCC-MAIN-2017-34,application/x-bittorrent,6114,5965,0.0002\nCC-MAIN-2017-34,application/x-bzip2,8678,8666,0.0003\nCC-MAIN-2017-34,application/x-dosexec,13063,12965,0.0004\nCC-MAIN-2017-34,application/x-endnote-refer,2660,2647,0.0001\nCC-MAIN-2017-34,application/x-hdf,147,147,0.0000\n
CC-MAIN-2017-34,application/x-mobipocket-ebook,7960,7944,0.0002\nCC-MAIN-2017-34,application/x-ms-asx,12434,12358,0.0004\nCC-MAIN-2017-34,application/x-msdownload,4403,4378,0.0001\nCC-MAIN-2017-34,application/x-rar-compressed,14504,14492,0.0004\nCC-MAIN-2017-34,application/x-research-info-systems,25532,25512,0.0008\nCC-MAIN-2017-34,application/x-sh,8419,8412,0.0003\nCC-MAIN-2017-34,application/x-shockwave-flash,16117,16019,0.0005\nCC-MAIN-2017-34,application/x-stata-do,933,930,0.0000\nCC-MAIN-2017-34,application/x-tex,1851,1850,0.0001\nCC-MAIN-2017-34,application/x-tex-tfm,53,53,0.0000\nCC-MAIN-2017-34,application/x-tika-msoffice,24418,24407,0.0007\nCC-MAIN-2017-34,application/x-tika-ooxml,15259,15254,0.0005\nCC-MAIN-2017-34,application/x-wais-source,1291,1291,0.0000\nCC-MAIN-2017-34,application/x-xz,23698,23615,0.0007\nCC-MAIN-2017-34,application/xhtml+xml,1008007589,1003429974,30.7312\nCC-MAIN-2017-34,application/xml,801405,797268,0.0244\nCC-MAIN-2017-34,application/zip,181905,181196,0.0055\nCC-MAIN-2017-34,application/zlib,1505,1492,0.0000\nCC-MAIN-2017-34,audio/mp4,30129,30079,0.0009\nCC-MAIN-2017-34,audio/mpeg,151042,150740,0.0046\nCC-MAIN-2017-34,audio/vnd.wave,61371,61370,0.0019\nCC-MAIN-2017-34,audio/x-mpegurl,31421,31408,0.0010\nCC-MAIN-2017-34,image/gif,154267,154040,0.0047\nCC-MAIN-2017-34,image/jpeg,5133300,5130183,0.1565\nCC-MAIN-2017-34,image/png,1041698,1040882,0.0318\nCC-MAIN-2017-34,image/svg+xml,3528,3511,0.0001\nCC-MAIN-2017-34,image/tiff,17619,17607,0.0005\nCC-MAIN-2017-34,image/vnd.djvu,23915,23879,0.0007\nCC-MAIN-2017-34,image/vnd.dxf; 
format=ascii,4084,4084,0.0001\nCC-MAIN-2017-34,image/webp,3618,3142,0.0001\nCC-MAIN-2017-34,message/rfc822,13318,13305,0.0004\nCC-MAIN-2017-34,text/asp,376350,375486,0.0115\nCC-MAIN-2017-34,text/aspdotnet,101620,101458,0.0031\nCC-MAIN-2017-34,text/calendar,350054,349908,0.0107\nCC-MAIN-2017-34,text/css,10199,10166,0.0003\nCC-MAIN-2017-34,text/csv,7522,7457,0.0002\nCC-MAIN-2017-34,text/html,2220985592,2202369448,67.7113\nCC-MAIN-2017-34,text/plain,526723,526032,0.0161\nCC-MAIN-2017-34,text/prs.lines.tag,1172,1172,0.0000\nCC-MAIN-2017-34,text/tab-separated-values,2591,2591,0.0001\nCC-MAIN-2017-34,text/troff,7084,7084,0.0002\nCC-MAIN-2017-34,text/turtle,10323,10323,0.0003\nCC-MAIN-2017-34,text/vtt,170,170,0.0000\nCC-MAIN-2017-34,text/x-c++src,2015,2012,0.0001\nCC-MAIN-2017-34,text/x-cgi,24797,24278,0.0008\nCC-MAIN-2017-34,text/x-chdr,6396,6393,0.0002\nCC-MAIN-2017-34,text/x-coldfusion,111497,111215,0.0034\nCC-MAIN-2017-34,text/x-csrc,11591,11591,0.0004\nCC-MAIN-2017-34,text/x-diff,6221,6214,0.0002\nCC-MAIN-2017-34,text/x-jsp,41096,40940,0.0013\nCC-MAIN-2017-34,text/x-log,11735,11734,0.0004\nCC-MAIN-2017-34,text/x-matlab,8504,8504,0.0003\nCC-MAIN-2017-34,text/x-perl,31357,31332,0.0010\nCC-MAIN-2017-34,text/x-php,1662708,1658755,0.0507\nCC-MAIN-2017-34,text/x-python,3633,3632,0.0001\nCC-MAIN-2017-34,text/x-vcalendar,7766,7766,0.0002\nCC-MAIN-2017-34,text/x-vcard,32982,32943,0.0010\nCC-MAIN-2017-34,text/x-web-markdown,1786,1785,0.0001\nCC-MAIN-2017-34,text/x-yaml,180,180,0.0000\nCC-MAIN-2017-34,video/mp4,22521,22494,0.0007\nCC-MAIN-2017-34,video/quicktime,6303,6301,0.0002\nCC-MAIN-2017-34,video/webm,11397,11392,0.0003\nCC-MAIN-2017-34,video/x-m4v,15233,15223,0.0005\nCC-MAIN-2017-39,<other>,373171,371822,0.0124\nCC-MAIN-2017-39,application/atom+xml,7191769,7189643,0.2384\nCC-MAIN-2017-39,application/epub+zip,29673,29015,0.0010\nCC-MAIN-2017-39,application/gpx+xml,2411,2411,0.0001\nCC-MAIN-2017-39,application/gzip,99987,99580,0.0033\nCC-MAIN-2017-39,application/javascript,2
7061,27036,0.0009\nCC-MAIN-2017-39,application/json,184065,183783,0.0061\nCC-MAIN-2017-39,application/marc,12103,12099,0.0004\nCC-MAIN-2017-39,application/mbox,15172,15074,0.0005\nCC-MAIN-2017-39,application/msword,136252,135619,0.0045\nCC-MAIN-2017-39,application/octet-stream,340751,338885,0.0113\nCC-MAIN-2017-39,application/pdf,25566236,25499895,0.8474\nCC-MAIN-2017-39,application/pgp-signature,51846,51841,0.0017\nCC-MAIN-2017-39,application/pkcs7-signature,3634,3633,0.0001\nCC-MAIN-2017-39,application/postscript,46224,46117,0.0015\nCC-MAIN-2017-39,application/rdf+xml,407537,407213,0.0135\nCC-MAIN-2017-39,application/rss+xml,5722964,5703256,0.1897\nCC-MAIN-2017-39,application/rtf,22496,22449,0.0007\nCC-MAIN-2017-39,application/text,17022,17009,0.0006\nCC-MAIN-2017-39,application/vnd.android.package-archive,27941,27756,0.0009\nCC-MAIN-2017-39,application/vnd.google-earth.kml+xml,103123,102963,0.0034\nCC-MAIN-2017-39,application/vnd.google-earth.kmz,14166,14155,0.0005\nCC-MAIN-2017-39,application/vnd.ms-excel,30737,30450,0.0010\nCC-MAIN-2017-39,application/vnd.ms-powerpoint,21284,21228,0.0007\nCC-MAIN-2017-39,application/vnd.oasis.opendocument.spreadsheet,3245,3243,0.0001\nCC-MAIN-2017-39,application/vnd.oasis.opendocument.text,17295,17281,0.0006\nCC-MAIN-2017-39,application/vnd.openxmlformats-officedocument.presentationml.presentation,8287,8253,0.0003\nCC-MAIN-2017-39,application/vnd.openxmlformats-officedocument.spreadsheetml.sheet,12951,12765,0.0004\nCC-MAIN-2017-39,application/vnd.openxmlformats-officedocument.wordprocessingml.document,46204,45859,0.0015\nCC-MAIN-2017-39,application/x-bibtex-text-file,59811,59705,0.0020\nCC-MAIN-2017-39,application/x-bittorrent,8532,8528,0.0003\nCC-MAIN-2017-39,application/x-bzip2,7503,7481,0.0002\nCC-MAIN-2017-39,application/x-dosexec,10717,10469,0.0004\nCC-MAIN-2017-39,application/x-endnote-refer,18907,18906,0.0006\nCC-MAIN-2017-39,application/x-hdf,10405,10405,0.0003\nCC-MAIN-2017-39,application/x-mobipocket-ebook,11251,11231
,0.0004\nCC-MAIN-2017-39,application/x-ms-asx,17490,17392,0.0006\nCC-MAIN-2017-39,application/x-msdownload,79365,79309,0.0026\nCC-MAIN-2017-39,application/x-rar-compressed,18371,18168,0.0006\nCC-MAIN-2017-39,application/x-research-info-systems,54587,54577,0.0018\nCC-MAIN-2017-39,application/x-sh,22269,22207,0.0007\nCC-MAIN-2017-39,application/x-shockwave-flash,48921,48868,0.0016\nCC-MAIN-2017-39,application/x-stata-do,3542,3534,0.0001\nCC-MAIN-2017-39,application/x-tex,11850,11804,0.0004\nCC-MAIN-2017-39,application/x-tex-tfm,262,262,0.0000\nCC-MAIN-2017-39,application/x-tika-msoffice,56883,56797,0.0019\nCC-MAIN-2017-39,application/x-tika-ooxml,35456,35422,0.0012\nCC-MAIN-2017-39,application/x-wais-source,26782,26782,0.0009\nCC-MAIN-2017-39,application/x-xz,63391,63296,0.0021\nCC-MAIN-2017-39,application/xhtml+xml,929279332,921717354,30.7996\nCC-MAIN-2017-39,application/xml,1120886,1115555,0.0372\nCC-MAIN-2017-39,application/zip,197577,195134,0.0065\nCC-MAIN-2017-39,application/zlib,13654,13630,0.0005\nCC-MAIN-2017-39,audio/mp4,19553,19499,0.0006\nCC-MAIN-2017-39,audio/mpeg,151153,150571,0.0050\nCC-MAIN-2017-39,audio/vnd.wave,50619,50612,0.0017\nCC-MAIN-2017-39,audio/x-mpegurl,47309,47246,0.0016\nCC-MAIN-2017-39,image/gif,170179,169543,0.0056\nCC-MAIN-2017-39,image/jpeg,5486713,5483500,0.1818\nCC-MAIN-2017-39,image/png,963810,962412,0.0319\nCC-MAIN-2017-39,image/svg+xml,4963,4903,0.0002\nCC-MAIN-2017-39,image/tiff,21711,21610,0.0007\nCC-MAIN-2017-39,image/vnd.djvu,36116,36020,0.0012\nCC-MAIN-2017-39,image/vnd.dxf; 
format=ascii,4259,4259,0.0001\nCC-MAIN-2017-39,image/webp,8015,7875,0.0003\nCC-MAIN-2017-39,message/rfc822,38355,38226,0.0013\nCC-MAIN-2017-39,text/asp,375627,374739,0.0124\nCC-MAIN-2017-39,text/aspdotnet,135206,134695,0.0045\nCC-MAIN-2017-39,text/calendar,384542,384163,0.0127\nCC-MAIN-2017-39,text/css,6858,6856,0.0002\nCC-MAIN-2017-39,text/csv,15085,15040,0.0005\nCC-MAIN-2017-39,text/html,2033632054,2005885431,67.4017\nCC-MAIN-2017-39,text/plain,1088158,1085970,0.0361\nCC-MAIN-2017-39,text/prs.lines.tag,2668,2667,0.0001\nCC-MAIN-2017-39,text/tab-separated-values,8366,8366,0.0003\nCC-MAIN-2017-39,text/troff,7711,7711,0.0003\nCC-MAIN-2017-39,text/turtle,12948,12937,0.0004\nCC-MAIN-2017-39,text/vtt,876,875,0.0000\nCC-MAIN-2017-39,text/x-c++src,3914,3862,0.0001\nCC-MAIN-2017-39,text/x-cgi,70032,64417,0.0023\nCC-MAIN-2017-39,text/x-chdr,4367,4322,0.0001\nCC-MAIN-2017-39,text/x-coldfusion,123256,122593,0.0041\nCC-MAIN-2017-39,text/x-csrc,15520,15501,0.0005\nCC-MAIN-2017-39,text/x-diff,15916,15886,0.0005\nCC-MAIN-2017-39,text/x-jsp,164861,164220,0.0055\nCC-MAIN-2017-39,text/x-log,22833,22833,0.0008\nCC-MAIN-2017-39,text/x-matlab,41562,41527,0.0014\nCC-MAIN-2017-39,text/x-perl,43319,43258,0.0014\nCC-MAIN-2017-39,text/x-php,2166330,2157815,0.0718\nCC-MAIN-2017-39,text/x-python,6930,6918,0.0002\nCC-MAIN-2017-39,text/x-vcalendar,10232,10168,0.0003\nCC-MAIN-2017-39,text/x-vcard,46486,46326,0.0015\nCC-MAIN-2017-39,text/x-web-markdown,2471,2467,0.0001\nCC-MAIN-2017-39,text/x-yaml,228,228,0.0000\nCC-MAIN-2017-39,video/mp4,22205,22090,0.0007\nCC-MAIN-2017-39,video/quicktime,5226,5191,0.0002\nCC-MAIN-2017-39,video/webm,18516,18497,0.0006\nCC-MAIN-2017-39,video/x-m4v,10154,10140,0.0003\nCC-MAIN-2017-43,<other>,320891,320133,0.0088\nCC-MAIN-2017-43,application/atom+xml,7636438,7634889,0.2092\nCC-MAIN-2017-43,application/epub+zip,33992,33727,0.0009\nCC-MAIN-2017-43,application/gpx+xml,2089,2089,0.0001\nCC-MAIN-2017-43,application/gzip,67397,66663,0.0018\nCC-MAIN-2017-43,application/ja
vascript,23176,23159,0.0006\nCC-MAIN-2017-43,application/json,194262,194027,0.0053\nCC-MAIN-2017-43,application/marc,16441,16441,0.0005\nCC-MAIN-2017-43,application/mbox,5240,5227,0.0001\nCC-MAIN-2017-43,application/msword,85655,85187,0.0023\nCC-MAIN-2017-43,application/octet-stream,251510,249896,0.0069\nCC-MAIN-2017-43,application/pdf,16958825,16916708,0.4646\nCC-MAIN-2017-43,application/pgp-signature,19979,19964,0.0005\nCC-MAIN-2017-43,application/pkcs7-signature,3460,3458,0.0001\nCC-MAIN-2017-43,application/postscript,16137,16130,0.0004\nCC-MAIN-2017-43,application/rdf+xml,394288,394068,0.0108\nCC-MAIN-2017-43,application/rss+xml,6274031,6256200,0.1719\nCC-MAIN-2017-43,application/rtf,19128,19119,0.0005\nCC-MAIN-2017-43,application/text,7882,7881,0.0002\nCC-MAIN-2017-43,application/vnd.android.package-archive,35267,35134,0.0010\nCC-MAIN-2017-43,application/vnd.google-earth.kml+xml,81647,81170,0.0022\nCC-MAIN-2017-43,application/vnd.google-earth.kmz,9699,9694,0.0003\nCC-MAIN-2017-43,application/vnd.ms-excel,28650,28566,0.0008\nCC-MAIN-2017-43,application/vnd.ms-powerpoint,18494,18441,0.0005\nCC-MAIN-2017-43,application/vnd.oasis.opendocument.spreadsheet,1468,1467,0.0000\nCC-MAIN-2017-43,application/vnd.oasis.opendocument.text,7906,7899,0.0002\nCC-MAIN-2017-43,application/vnd.openxmlformats-officedocument.presentationml.presentation,4926,4903,0.0001\nCC-MAIN-2017-43,application/vnd.openxmlformats-officedocument.spreadsheetml.sheet,14973,14891,0.0004\nCC-MAIN-2017-43,application/vnd.openxmlformats-officedocument.wordprocessingml.document,28807,28552,0.0008\nCC-MAIN-2017-43,application/x-bibtex-text-file,36354,36288,0.0010\nCC-MAIN-2017-43,application/x-bittorrent,6500,6345,0.0002\nCC-MAIN-2017-43,application/x-bzip2,3772,3759,0.0001\nCC-MAIN-2017-43,application/x-dosexec,15020,14834,0.0004\nCC-MAIN-2017-43,application/x-endnote-refer,11874,11851,0.0003\nCC-MAIN-2017-43,application/x-hdf,97,97,0.0000\nCC-MAIN-2017-43,application/x-mobipocket-ebook,8463,8454,0.0002\nC
C-MAIN-2017-43,application/x-ms-asx,36326,36310,0.0010\nCC-MAIN-2017-43,application/x-msdownload,85732,85705,0.0023\nCC-MAIN-2017-43,application/x-rar-compressed,17102,17090,0.0005\nCC-MAIN-2017-43,application/x-research-info-systems,53166,53144,0.0015\nCC-MAIN-2017-43,application/x-sh,21181,21106,0.0006\nCC-MAIN-2017-43,application/x-shockwave-flash,34331,34271,0.0009\nCC-MAIN-2017-43,application/x-stata-do,3218,3217,0.0001\nCC-MAIN-2017-43,application/x-tex,3841,3823,0.0001\nCC-MAIN-2017-43,application/x-tex-tfm,369,369,0.0000\nCC-MAIN-2017-43,application/x-tika-msoffice,33793,33770,0.0009\nCC-MAIN-2017-43,application/x-tika-ooxml,19694,19681,0.0005\nCC-MAIN-2017-43,application/x-wais-source,6361,6361,0.0002\nCC-MAIN-2017-43,application/x-xz,43538,43468,0.0012\nCC-MAIN-2017-43,application/xhtml+xml,1100032953,1092802841,30.1343\nCC-MAIN-2017-43,application/xml,1151496,1146684,0.0315\nCC-MAIN-2017-43,application/zip,169900,169447,0.0047\nCC-MAIN-2017-43,application/zlib,1527,1511,0.0000\nCC-MAIN-2017-43,audio/mp4,17369,17322,0.0005\nCC-MAIN-2017-43,audio/mpeg,149000,148464,0.0041\nCC-MAIN-2017-43,audio/vnd.wave,65622,65620,0.0018\nCC-MAIN-2017-43,audio/x-mpegurl,38627,38607,0.0011\nCC-MAIN-2017-43,image/gif,1347205,1345101,0.0369\nCC-MAIN-2017-43,image/jpeg,93808666,92110751,2.5698\nCC-MAIN-2017-43,image/png,11391966,11374902,0.3121\nCC-MAIN-2017-43,image/svg+xml,84143,83924,0.0023\nCC-MAIN-2017-43,image/tiff,32528,32518,0.0009\nCC-MAIN-2017-43,image/vnd.djvu,17732,17693,0.0005\nCC-MAIN-2017-43,image/vnd.dxf; 
format=ascii,2035,2035,0.0001\nCC-MAIN-2017-43,image/webp,12325,12196,0.0003\nCC-MAIN-2017-43,message/rfc822,70771,70494,0.0019\nCC-MAIN-2017-43,text/asp,587876,586872,0.0161\nCC-MAIN-2017-43,text/aspdotnet,202800,202485,0.0056\nCC-MAIN-2017-43,text/calendar,430449,430145,0.0118\nCC-MAIN-2017-43,text/css,6412,6343,0.0002\nCC-MAIN-2017-43,text/csv,15551,15543,0.0004\nCC-MAIN-2017-43,text/html,2403241071,2374565793,65.8345\nCC-MAIN-2017-43,text/plain,838980,835927,0.0230\nCC-MAIN-2017-43,text/prs.lines.tag,901,901,0.0000\nCC-MAIN-2017-43,text/tab-separated-values,9301,9301,0.0003\nCC-MAIN-2017-43,text/troff,17604,17599,0.0005\nCC-MAIN-2017-43,text/turtle,15115,15096,0.0004\nCC-MAIN-2017-43,text/vtt,742,742,0.0000\nCC-MAIN-2017-43,text/x-c++src,27847,27783,0.0008\nCC-MAIN-2017-43,text/x-cgi,102057,99625,0.0028\nCC-MAIN-2017-43,text/x-chdr,68321,68278,0.0019\nCC-MAIN-2017-43,text/x-coldfusion,249765,248995,0.0068\nCC-MAIN-2017-43,text/x-csrc,69889,69851,0.0019\nCC-MAIN-2017-43,text/x-diff,16757,16736,0.0005\nCC-MAIN-2017-43,text/x-jsp,214333,206105,0.0059\nCC-MAIN-2017-43,text/x-log,13333,13333,0.0004\nCC-MAIN-2017-43,text/x-matlab,19293,19277,0.0005\nCC-MAIN-2017-43,text/x-perl,61922,61816,0.0017\nCC-MAIN-2017-43,text/x-php,2736112,2730174,0.0750\nCC-MAIN-2017-43,text/x-python,3941,3923,0.0001\nCC-MAIN-2017-43,text/x-vcalendar,9247,9101,0.0003\nCC-MAIN-2017-43,text/x-vcard,33316,33182,0.0009\nCC-MAIN-2017-43,text/x-web-markdown,1832,1831,0.0001\nCC-MAIN-2017-43,text/x-yaml,154,154,0.0000\nCC-MAIN-2017-43,video/mp4,18147,18076,0.0005\nCC-MAIN-2017-43,video/quicktime,4987,4985,0.0001\nCC-MAIN-2017-43,video/webm,8365,8363,0.0002\nCC-MAIN-2017-43,video/x-m4v,6543,6524,0.0002\nCC-MAIN-2017-47,<other>,293716,293087,0.0092\nCC-MAIN-2017-47,application/atom+xml,6551009,6549640,0.2044\nCC-MAIN-2017-47,application/epub+zip,28198,27942,0.0009\nCC-MAIN-2017-47,application/gpx+xml,1688,1688,0.0001\nCC-MAIN-2017-47,application/gzip,49845,49744,0.0016\nCC-MAIN-2017-47,application/jav
ascript,16562,16552,0.0005\nCC-MAIN-2017-47,application/json,191212,191080,0.0060\nCC-MAIN-2017-47,application/marc,12172,12172,0.0004\nCC-MAIN-2017-47,application/mbox,9301,9300,0.0003\nCC-MAIN-2017-47,application/msword,111390,110980,0.0035\nCC-MAIN-2017-47,application/octet-stream,239915,239301,0.0075\nCC-MAIN-2017-47,application/pdf,16415812,16385588,0.5122\nCC-MAIN-2017-47,application/pgp-signature,16080,16077,0.0005\nCC-MAIN-2017-47,application/pkcs7-signature,1712,1711,0.0001\nCC-MAIN-2017-47,application/postscript,16209,16199,0.0005\nCC-MAIN-2017-47,application/rdf+xml,405169,405021,0.0126\nCC-MAIN-2017-47,application/rss+xml,5695027,5683359,0.1777\nCC-MAIN-2017-47,application/rtf,26162,26157,0.0008\nCC-MAIN-2017-47,application/text,17450,17449,0.0005\nCC-MAIN-2017-47,application/vnd.android.package-archive,25945,25725,0.0008\nCC-MAIN-2017-47,application/vnd.google-earth.kml+xml,72940,72864,0.0023\nCC-MAIN-2017-47,application/vnd.google-earth.kmz,9783,9779,0.0003\nCC-MAIN-2017-47,application/vnd.ms-excel,27815,27741,0.0009\nCC-MAIN-2017-47,application/vnd.ms-powerpoint,23029,23003,0.0007\nCC-MAIN-2017-47,application/vnd.oasis.opendocument.spreadsheet,1882,1862,0.0001\nCC-MAIN-2017-47,application/vnd.oasis.opendocument.text,9398,9394,0.0003\nCC-MAIN-2017-47,application/vnd.openxmlformats-officedocument.presentationml.presentation,6341,6334,0.0002\nCC-MAIN-2017-47,application/vnd.openxmlformats-officedocument.spreadsheetml.sheet,11018,10961,0.0003\nCC-MAIN-2017-47,application/vnd.openxmlformats-officedocument.wordprocessingml.document,32890,32750,0.0010\nCC-MAIN-2017-47,application/x-bibtex-text-file,37932,37923,0.0012\nCC-MAIN-2017-47,application/x-bittorrent,9367,9131,0.0003\nCC-MAIN-2017-47,application/x-bzip2,4097,4082,0.0001\nCC-MAIN-2017-47,application/x-dosexec,9641,9394,0.0003\nCC-MAIN-2017-47,application/x-endnote-refer,24372,24366,0.0008\nCC-MAIN-2017-47,application/x-hdf,1085,1085,0.0000\nCC-MAIN-2017-47,application/x-mobipocket-ebook,8054,8041,0.00
03\nCC-MAIN-2017-47,application/x-ms-asx,13254,13240,0.0004\nCC-MAIN-2017-47,application/x-msdownload,15433,15409,0.0005\nCC-MAIN-2017-47,application/x-rar-compressed,19410,19378,0.0006\nCC-MAIN-2017-47,application/x-research-info-systems,46344,46326,0.0014\nCC-MAIN-2017-47,application/x-sh,27198,27149,0.0008\nCC-MAIN-2017-47,application/x-shockwave-flash,30649,30618,0.0010\nCC-MAIN-2017-47,application/x-stata-do,2439,2432,0.0001\nCC-MAIN-2017-47,application/x-tex,2029,2027,0.0001\nCC-MAIN-2017-47,application/x-tex-tfm,176,176,0.0000\nCC-MAIN-2017-47,application/x-tika-msoffice,55722,55698,0.0017\nCC-MAIN-2017-47,application/x-tika-ooxml,32580,32572,0.0010\nCC-MAIN-2017-47,application/x-wais-source,1858,1858,0.0001\nCC-MAIN-2017-47,application/x-xz,24233,24204,0.0008\nCC-MAIN-2017-47,application/xhtml+xml,967898281,962277749,30.2002\nCC-MAIN-2017-47,application/xml,1177954,1174183,0.0368\nCC-MAIN-2017-47,application/zip,165054,163983,0.0051\nCC-MAIN-2017-47,application/zlib,1512,1491,0.0000\nCC-MAIN-2017-47,audio/mp4,21559,21518,0.0007\nCC-MAIN-2017-47,audio/mpeg,171719,170938,0.0054\nCC-MAIN-2017-47,audio/vnd.wave,38572,38569,0.0012\nCC-MAIN-2017-47,audio/x-mpegurl,26509,26502,0.0008\nCC-MAIN-2017-47,image/gif,640257,638326,0.0200\nCC-MAIN-2017-47,image/jpeg,53384700,52366899,1.6657\nCC-MAIN-2017-47,image/png,5590547,5575017,0.1744\nCC-MAIN-2017-47,image/svg+xml,74535,74504,0.0023\nCC-MAIN-2017-47,image/tiff,28907,28899,0.0009\nCC-MAIN-2017-47,image/vnd.djvu,19455,19452,0.0006\nCC-MAIN-2017-47,image/vnd.dxf; 
format=ascii,2121,2121,0.0001\nCC-MAIN-2017-47,image/webp,14589,14535,0.0005\nCC-MAIN-2017-47,message/rfc822,41260,41164,0.0013\nCC-MAIN-2017-47,text/asp,537225,536296,0.0168\nCC-MAIN-2017-47,text/aspdotnet,135003,134709,0.0042\nCC-MAIN-2017-47,text/calendar,423002,422707,0.0132\nCC-MAIN-2017-47,text/css,5430,5423,0.0002\nCC-MAIN-2017-47,text/csv,14899,14899,0.0005\nCC-MAIN-2017-47,text/html,2139627126,2117784581,66.7602\nCC-MAIN-2017-47,text/plain,467693,466603,0.0146\nCC-MAIN-2017-47,text/prs.lines.tag,1360,1360,0.0000\nCC-MAIN-2017-47,text/tab-separated-values,5009,5009,0.0002\nCC-MAIN-2017-47,text/troff,5182,5182,0.0002\nCC-MAIN-2017-47,text/turtle,25247,25245,0.0008\nCC-MAIN-2017-47,text/vtt,2555,2555,0.0001\nCC-MAIN-2017-47,text/x-c++src,8956,8940,0.0003\nCC-MAIN-2017-47,text/x-cgi,95159,91219,0.0030\nCC-MAIN-2017-47,text/x-chdr,19102,19086,0.0006\nCC-MAIN-2017-47,text/x-coldfusion,243319,242558,0.0076\nCC-MAIN-2017-47,text/x-csrc,21982,21975,0.0007\nCC-MAIN-2017-47,text/x-diff,8057,8053,0.0003\nCC-MAIN-2017-47,text/x-jsp,197751,195680,0.0062\nCC-MAIN-2017-47,text/x-log,13667,13665,0.0004\nCC-MAIN-2017-47,text/x-matlab,25340,25059,0.0008\nCC-MAIN-2017-47,text/x-perl,36292,36266,0.0011\nCC-MAIN-2017-47,text/x-php,2863713,2858283,0.0894\nCC-MAIN-2017-47,text/x-python,22945,22939,0.0007\nCC-MAIN-2017-47,text/x-vcalendar,8197,8191,0.0003\nCC-MAIN-2017-47,text/x-vcard,37762,37728,0.0012\nCC-MAIN-2017-47,text/x-web-markdown,2702,2699,0.0001\nCC-MAIN-2017-47,text/x-yaml,238,238,0.0000\nCC-MAIN-2017-47,video/mp4,19195,19129,0.0006\nCC-MAIN-2017-47,video/quicktime,5148,5145,0.0002\nCC-MAIN-2017-47,video/webm,66390,66335,0.0021\nCC-MAIN-2017-47,video/x-m4v,14853,14804,0.0005\nCC-MAIN-2017-51,<other>,167008,166384,0.0057\nCC-MAIN-2017-51,application/atom+xml,3255787,3255061,0.1117\nCC-MAIN-2017-51,application/epub+zip,23036,22977,0.0008\nCC-MAIN-2017-51,application/gpx+xml,2048,2048,0.0001\nCC-MAIN-2017-51,application/gzip,42166,42102,0.0014\nCC-MAIN-2017-51,application/
javascript,11072,11064,0.0004\nCC-MAIN-2017-51,application/json,159062,158830,0.0055\nCC-MAIN-2017-51,application/marc,11909,11909,0.0004\nCC-MAIN-2017-51,application/mbox,6892,6891,0.0002\nCC-MAIN-2017-51,application/msword,37398,37341,0.0013\nCC-MAIN-2017-51,application/octet-stream,118245,117603,0.0041\nCC-MAIN-2017-51,application/pdf,8614399,8603324,0.2956\nCC-MAIN-2017-51,application/pgp-signature,8640,8639,0.0003\nCC-MAIN-2017-51,application/pkcs7-signature,1153,1152,0.0000\nCC-MAIN-2017-51,application/postscript,2736,2736,0.0001\nCC-MAIN-2017-51,application/rdf+xml,140044,139941,0.0048\nCC-MAIN-2017-51,application/rss+xml,4272975,4266535,0.1466\nCC-MAIN-2017-51,application/rtf,9243,9237,0.0003\nCC-MAIN-2017-51,application/text,4648,4648,0.0002\nCC-MAIN-2017-51,application/vnd.android.package-archive,27856,27771,0.0010\nCC-MAIN-2017-51,application/vnd.google-earth.kml+xml,88197,88173,0.0030\nCC-MAIN-2017-51,application/vnd.google-earth.kmz,5576,5572,0.0002\nCC-MAIN-2017-51,application/vnd.ms-excel,14468,14434,0.0005\nCC-MAIN-2017-51,application/vnd.ms-powerpoint,10968,10963,0.0004\nCC-MAIN-2017-51,application/vnd.oasis.opendocument.spreadsheet,919,919,0.0000\nCC-MAIN-2017-51,application/vnd.oasis.opendocument.text,3751,3750,0.0001\nCC-MAIN-2017-51,application/vnd.openxmlformats-officedocument.presentationml.presentation,2501,2494,0.0001\nCC-MAIN-2017-51,application/vnd.openxmlformats-officedocument.spreadsheetml.sheet,7405,7376,0.0003\nCC-MAIN-2017-51,application/vnd.openxmlformats-officedocument.wordprocessingml.document,12486,12463,0.0004\nCC-MAIN-2017-51,application/x-bibtex-text-file,11950,11950,0.0004\nCC-MAIN-2017-51,application/x-bittorrent,4394,3963,0.0002\nCC-MAIN-2017-51,application/x-bzip2,1113,1113,0.0000\nCC-MAIN-2017-51,application/x-dosexec,4089,4021,0.0001\nCC-MAIN-2017-51,application/x-endnote-refer,8645,8641,0.0003\nCC-MAIN-2017-51,application/x-hdf,117,117,0.0000\nCC-MAIN-2017-51,application/x-mobipocket-ebook,4558,4558,0.0002\nCC-MAIN-2017-
51,application/x-ms-asx,6665,6662,0.0002\nCC-MAIN-2017-51,application/x-msdownload,3826,3816,0.0001\nCC-MAIN-2017-51,application/x-rar-compressed,10474,10452,0.0004\nCC-MAIN-2017-51,application/x-research-info-systems,33472,33472,0.0011\nCC-MAIN-2017-51,application/x-sh,7350,7341,0.0003\nCC-MAIN-2017-51,application/x-shockwave-flash,20613,20598,0.0007\nCC-MAIN-2017-51,application/x-stata-do,2714,2559,0.0001\nCC-MAIN-2017-51,application/x-tex,617,617,0.0000\nCC-MAIN-2017-51,application/x-tex-tfm,1,1,0.0000\nCC-MAIN-2017-51,application/x-tika-msoffice,20656,20640,0.0007\nCC-MAIN-2017-51,application/x-tika-ooxml,13948,13939,0.0005\nCC-MAIN-2017-51,application/x-wais-source,2423,2423,0.0001\nCC-MAIN-2017-51,application/x-xz,15361,15339,0.0005\nCC-MAIN-2017-51,application/xhtml+xml,887109811,883320780,30.4430\nCC-MAIN-2017-51,application/xml,1010251,1004911,0.0347\nCC-MAIN-2017-51,application/zip,87445,87239,0.0030\nCC-MAIN-2017-51,application/zlib,417,409,0.0000\nCC-MAIN-2017-51,audio/mp4,15725,15683,0.0005\nCC-MAIN-2017-51,audio/mpeg,106097,105399,0.0036\nCC-MAIN-2017-51,audio/vnd.wave,26886,26885,0.0009\nCC-MAIN-2017-51,audio/x-mpegurl,14350,14331,0.0005\nCC-MAIN-2017-51,image/gif,625838,621590,0.0215\nCC-MAIN-2017-51,image/jpeg,54231426,53156202,1.8611\nCC-MAIN-2017-51,image/png,5821625,5802004,0.1998\nCC-MAIN-2017-51,image/svg+xml,88001,87971,0.0030\nCC-MAIN-2017-51,image/tiff,14999,14992,0.0005\nCC-MAIN-2017-51,image/vnd.djvu,10414,10414,0.0004\nCC-MAIN-2017-51,image/vnd.dxf; 
format=ascii,1104,1104,0.0000\nCC-MAIN-2017-51,image/webp,10342,10338,0.0004\nCC-MAIN-2017-51,message/rfc822,16681,16601,0.0006\nCC-MAIN-2017-51,text/asp,386858,386175,0.0133\nCC-MAIN-2017-51,text/aspdotnet,106238,106150,0.0036\nCC-MAIN-2017-51,text/calendar,350987,350891,0.0120\nCC-MAIN-2017-51,text/css,4733,4730,0.0002\nCC-MAIN-2017-51,text/csv,4641,4640,0.0002\nCC-MAIN-2017-51,text/html,1944009699,1929453456,66.7127\nCC-MAIN-2017-51,text/plain,220481,219850,0.0076\nCC-MAIN-2017-51,text/prs.lines.tag,509,509,0.0000\nCC-MAIN-2017-51,text/tab-separated-values,1436,1436,0.0000\nCC-MAIN-2017-51,text/troff,1288,1288,0.0000\nCC-MAIN-2017-51,text/turtle,8227,8227,0.0003\nCC-MAIN-2017-51,text/vtt,1362,1362,0.0000\nCC-MAIN-2017-51,text/x-c++src,1120,1120,0.0000\nCC-MAIN-2017-51,text/x-cgi,55364,54828,0.0019\nCC-MAIN-2017-51,text/x-chdr,2627,2624,0.0001\nCC-MAIN-2017-51,text/x-coldfusion,159762,159401,0.0055\nCC-MAIN-2017-51,text/x-csrc,5421,5419,0.0002\nCC-MAIN-2017-51,text/x-diff,5155,5150,0.0002\nCC-MAIN-2017-51,text/x-jsp,125511,122044,0.0043\nCC-MAIN-2017-51,text/x-log,5498,5498,0.0002\nCC-MAIN-2017-51,text/x-matlab,11593,11590,0.0004\nCC-MAIN-2017-51,text/x-perl,23533,23529,0.0008\nCC-MAIN-2017-51,text/x-php,1988386,1985606,0.0682\nCC-MAIN-2017-51,text/x-python,1346,1346,0.0000\nCC-MAIN-2017-51,text/x-vcalendar,4990,4988,0.0002\nCC-MAIN-2017-51,text/x-vcard,20946,20942,0.0007\nCC-MAIN-2017-51,text/x-web-markdown,1315,1315,0.0000\nCC-MAIN-2017-51,text/x-yaml,87,87,0.0000\nCC-MAIN-2017-51,video/mp4,11875,11737,0.0004\nCC-MAIN-2017-51,video/quicktime,3460,3459,0.0001\nCC-MAIN-2017-51,video/webm,41573,41544,0.0014\nCC-MAIN-2017-51,video/x-m4v,11416,11403,0.0004\nCC-MAIN-2018-05,<other>,746976,745927,0.0216\nCC-MAIN-2018-05,application/atom+xml,5942275,5940972,0.1715\nCC-MAIN-2018-05,application/epub+zip,59982,58611,0.0017\nCC-MAIN-2018-05,application/gpx+xml,5436,5436,0.0002\nCC-MAIN-2018-05,application/gzip,112865,112633,0.0033\nCC-MAIN-2018-05,application/javascript,206
00,20585,0.0006\nCC-MAIN-2018-05,application/json,322168,322025,0.0093\nCC-MAIN-2018-05,application/marc,9775,9775,0.0003\nCC-MAIN-2018-05,application/mbox,125513,125508,0.0036\nCC-MAIN-2018-05,application/msword,187708,185973,0.0054\nCC-MAIN-2018-05,application/octet-stream,604350,602847,0.0174\nCC-MAIN-2018-05,application/pdf,29870025,29801719,0.8622\nCC-MAIN-2018-05,application/pgp-signature,61867,61771,0.0018\nCC-MAIN-2018-05,application/pkcs7-signature,8594,8593,0.0002\nCC-MAIN-2018-05,application/postscript,31982,31877,0.0009\nCC-MAIN-2018-05,application/rdf+xml,347623,347418,0.0100\nCC-MAIN-2018-05,application/rss+xml,6698078,6684349,0.1933\nCC-MAIN-2018-05,application/rtf,28076,27870,0.0008\nCC-MAIN-2018-05,application/text,12592,12592,0.0004\nCC-MAIN-2018-05,application/vnd.android.package-archive,78486,77927,0.0023\nCC-MAIN-2018-05,application/vnd.google-earth.kml+xml,216788,216751,0.0063\nCC-MAIN-2018-05,application/vnd.google-earth.kmz,40817,40812,0.0012\nCC-MAIN-2018-05,application/vnd.ms-excel,43349,43221,0.0013\nCC-MAIN-2018-05,application/vnd.ms-powerpoint,27896,27819,0.0008\nCC-MAIN-2018-05,application/vnd.oasis.opendocument.spreadsheet,5681,5679,0.0002\nCC-MAIN-2018-05,application/vnd.oasis.opendocument.text,18815,18752,0.0005\nCC-MAIN-2018-05,application/vnd.openxmlformats-officedocument.presentationml.presentation,16804,16765,0.0005\nCC-MAIN-2018-05,application/vnd.openxmlformats-officedocument.spreadsheetml.sheet,26838,26723,0.0008\nCC-MAIN-2018-05,application/vnd.openxmlformats-officedocument.wordprocessingml.document,58559,58101,0.0017\nCC-MAIN-2018-05,application/x-bibtex-text-file,74394,74375,0.0021\nCC-MAIN-2018-05,application/x-bittorrent,20183,18934,0.0006\nCC-MAIN-2018-05,application/x-bzip2,9109,9104,0.0003\nCC-MAIN-2018-05,application/x-dosexec,18008,17377,0.0005\nCC-MAIN-2018-05,application/x-endnote-refer,18733,18718,0.0005\nCC-MAIN-2018-05,application/x-hdf,826,826,0.0000\nCC-MAIN-2018-05,application/x-mobipocket-ebook,19822,19812,0
.0006\nCC-MAIN-2018-05,application/x-ms-asx,46935,46924,0.0014\nCC-MAIN-2018-05,application/x-msdownload,7361,7331,0.0002\nCC-MAIN-2018-05,application/x-rar-compressed,30915,30651,0.0009\nCC-MAIN-2018-05,application/x-research-info-systems,48206,48202,0.0014\nCC-MAIN-2018-05,application/x-sh,28699,28639,0.0008\nCC-MAIN-2018-05,application/x-shockwave-flash,35782,35711,0.0010\nCC-MAIN-2018-05,application/x-stata-do,4673,4617,0.0001\nCC-MAIN-2018-05,application/x-tex,13753,13743,0.0004\nCC-MAIN-2018-05,application/x-tex-tfm,2013,2013,0.0001\nCC-MAIN-2018-05,application/x-tika-msoffice,83895,83846,0.0024\nCC-MAIN-2018-05,application/x-tika-ooxml,51402,51379,0.0015\nCC-MAIN-2018-05,application/x-wais-source,34087,34087,0.0010\nCC-MAIN-2018-05,application/x-xz,66987,66871,0.0019\nCC-MAIN-2018-05,application/xhtml+xml,1012360463,1005619090,29.2207\nCC-MAIN-2018-05,application/xml,1768242,1757268,0.0510\nCC-MAIN-2018-05,application/zip,358139,343257,0.0103\nCC-MAIN-2018-05,application/zlib,2762,2733,0.0001\nCC-MAIN-2018-05,audio/mp4,35827,35648,0.0010\nCC-MAIN-2018-05,audio/mpeg,241557,238956,0.0070\nCC-MAIN-2018-05,audio/vnd.wave,30813,30808,0.0009\nCC-MAIN-2018-05,audio/x-mpegurl,62944,62913,0.0018\nCC-MAIN-2018-05,image/gif,758280,756710,0.0219\nCC-MAIN-2018-05,image/jpeg,61639883,60839652,1.7792\nCC-MAIN-2018-05,image/png,7363930,7354917,0.2126\nCC-MAIN-2018-05,image/svg+xml,89814,89729,0.0026\nCC-MAIN-2018-05,image/tiff,20402,20393,0.0006\nCC-MAIN-2018-05,image/vnd.djvu,34330,34324,0.0010\nCC-MAIN-2018-05,image/vnd.dxf; 
format=ascii,7473,7462,0.0002\nCC-MAIN-2018-05,image/webp,30050,30048,0.0009\nCC-MAIN-2018-05,message/rfc822,189258,189173,0.0055\nCC-MAIN-2018-05,text/asp,552400,551247,0.0159\nCC-MAIN-2018-05,text/aspdotnet,261553,260715,0.0075\nCC-MAIN-2018-05,text/calendar,521806,521498,0.0151\nCC-MAIN-2018-05,text/css,5908,5899,0.0002\nCC-MAIN-2018-05,text/csv,43551,43531,0.0013\nCC-MAIN-2018-05,text/html,2324524466,2300705171,67.0948\nCC-MAIN-2018-05,text/markdown,1,1,0.0000\nCC-MAIN-2018-05,text/plain,1687693,1685705,0.0487\nCC-MAIN-2018-05,text/prs.lines.tag,10946,10927,0.0003\nCC-MAIN-2018-05,text/tab-separated-values,36593,36593,0.0011\nCC-MAIN-2018-05,text/troff,44986,44945,0.0013\nCC-MAIN-2018-05,text/turtle,15523,15508,0.0004\nCC-MAIN-2018-05,text/vtt,1593,1593,0.0000\nCC-MAIN-2018-05,text/x-c++src,5197,5196,0.0002\nCC-MAIN-2018-05,text/x-cgi,134585,133467,0.0039\nCC-MAIN-2018-05,text/x-chdr,11762,11759,0.0003\nCC-MAIN-2018-05,text/x-coldfusion,232943,232296,0.0067\nCC-MAIN-2018-05,text/x-csrc,32966,32949,0.0010\nCC-MAIN-2018-05,text/x-diff,60560,60521,0.0017\nCC-MAIN-2018-05,text/x-jsp,214816,210907,0.0062\nCC-MAIN-2018-05,text/x-log,40301,40262,0.0012\nCC-MAIN-2018-05,text/x-matlab,46624,46113,0.0013\nCC-MAIN-2018-05,text/x-perl,126876,126555,0.0037\nCC-MAIN-2018-05,text/x-php,4351521,4342090,0.1256\nCC-MAIN-2018-05,text/x-python,10819,10808,0.0003\nCC-MAIN-2018-05,text/x-vcalendar,20353,20341,0.0006\nCC-MAIN-2018-05,text/x-vcard,55929,55881,0.0016\nCC-MAIN-2018-05,text/x-web-markdown,4903,4897,0.0001\nCC-MAIN-2018-05,text/x-yaml,540,540,0.0000\nCC-MAIN-2018-05,video/mp4,36071,35773,0.0010\nCC-MAIN-2018-05,video/quicktime,8739,8735,0.0003\nCC-MAIN-2018-05,video/webm,72417,72226,0.0021\nCC-MAIN-2018-05,video/x-m4v,21796,21658,0.0006\nCC-MAIN-2018-09,<other>,350604,349924,0.0101\nCC-MAIN-2018-09,application/atom+xml,6601676,6598507,0.1892\nCC-MAIN-2018-09,application/epub+zip,30626,30186,0.0009\nCC-MAIN-2018-09,application/gpx+xml,2733,2733,0.0001\nCC-MAIN-2018-09,appli
cation/gzip,87651,87463,0.0025\nCC-MAIN-2018-09,application/javascript,21479,21452,0.0006\nCC-MAIN-2018-09,application/json,218958,218737,0.0063\nCC-MAIN-2018-09,application/marc,13192,13192,0.0004\nCC-MAIN-2018-09,application/mbox,22897,22897,0.0007\nCC-MAIN-2018-09,application/msword,118288,117905,0.0034\nCC-MAIN-2018-09,application/octet-stream,292603,290386,0.0084\nCC-MAIN-2018-09,application/pdf,21725339,21650480,0.6228\nCC-MAIN-2018-09,application/pgp-signature,60640,60632,0.0017\nCC-MAIN-2018-09,application/pkcs7-signature,2547,2547,0.0001\nCC-MAIN-2018-09,application/postscript,12492,12477,0.0004\nCC-MAIN-2018-09,application/rdf+xml,581328,580803,0.0167\nCC-MAIN-2018-09,application/rss+xml,6440947,6421277,0.1846\nCC-MAIN-2018-09,application/rtf,20879,20836,0.0006\nCC-MAIN-2018-09,application/text,7383,7383,0.0002\nCC-MAIN-2018-09,application/vnd.android.package-archive,55784,55398,0.0016\nCC-MAIN-2018-09,application/vnd.google-earth.kml+xml,84592,84538,0.0024\nCC-MAIN-2018-09,application/vnd.google-earth.kmz,12296,12290,0.0004\nCC-MAIN-2018-09,application/vnd.ms-excel,30776,30578,0.0009\nCC-MAIN-2018-09,application/vnd.ms-powerpoint,18237,18200,0.0005\nCC-MAIN-2018-09,application/vnd.oasis.opendocument.spreadsheet,2631,2630,0.0001\nCC-MAIN-2018-09,application/vnd.oasis.opendocument.text,13404,13391,0.0004\nCC-MAIN-2018-09,application/vnd.openxmlformats-officedocument.presentationml.presentation,10195,10160,0.0003\nCC-MAIN-2018-09,application/vnd.openxmlformats-officedocument.spreadsheetml.sheet,19341,19085,0.0006\nCC-MAIN-2018-09,application/vnd.openxmlformats-officedocument.wordprocessingml.document,48333,47909,0.0014\nCC-MAIN-2018-09,application/x-bibtex-text-file,23719,23671,0.0007\nCC-MAIN-2018-09,application/x-bittorrent,10012,9722,0.0003\nCC-MAIN-2018-09,application/x-bzip2,5147,5131,0.0001\nCC-MAIN-2018-09,application/x-dosexec,9306,8935,0.0003\nCC-MAIN-2018-09,application/x-endnote-refer,12936,12934,0.0004\nCC-MAIN-2018-09,application/x-hdf,932,932,0
.0000\nCC-MAIN-2018-09,application/x-mobipocket-ebook,7185,7146,0.0002\nCC-MAIN-2018-09,application/x-ms-asx,11750,11733,0.0003\nCC-MAIN-2018-09,application/x-msdownload,9324,9262,0.0003\nCC-MAIN-2018-09,application/x-rar-compressed,23853,23728,0.0007\nCC-MAIN-2018-09,application/x-research-info-systems,34860,34859,0.0010\nCC-MAIN-2018-09,application/x-sh,10925,10902,0.0003\nCC-MAIN-2018-09,application/x-shockwave-flash,16177,16083,0.0005\nCC-MAIN-2018-09,application/x-stata-do,14166,14122,0.0004\nCC-MAIN-2018-09,application/x-tex,4341,4339,0.0001\nCC-MAIN-2018-09,application/x-tex-tfm,29,29,0.0000\nCC-MAIN-2018-09,application/x-tika-msoffice,54359,54318,0.0016\nCC-MAIN-2018-09,application/x-tika-ooxml,36492,36460,0.0010\nCC-MAIN-2018-09,application/x-wais-source,10746,10746,0.0003\nCC-MAIN-2018-09,application/x-xz,69343,69303,0.0020\nCC-MAIN-2018-09,application/xhtml+xml,1039648402,1033462173,29.8025\nCC-MAIN-2018-09,application/xml,1463277,1453526,0.0419\nCC-MAIN-2018-09,application/zip,178984,177311,0.0051\nCC-MAIN-2018-09,application/zlib,1565,1545,0.0000\nCC-MAIN-2018-09,audio/mp4,28258,28135,0.0008\nCC-MAIN-2018-09,audio/mpeg,185001,183668,0.0053\nCC-MAIN-2018-09,audio/vnd.wave,18432,18429,0.0005\nCC-MAIN-2018-09,audio/x-mpegurl,39607,39577,0.0011\nCC-MAIN-2018-09,image/gif,773959,770305,0.0222\nCC-MAIN-2018-09,image/jpeg,64728989,63693236,1.8555\nCC-MAIN-2018-09,image/png,7739504,7711071,0.2219\nCC-MAIN-2018-09,image/svg+xml,91431,91312,0.0026\nCC-MAIN-2018-09,image/tiff,10290,10284,0.0003\nCC-MAIN-2018-09,image/vnd.djvu,18688,18682,0.0005\nCC-MAIN-2018-09,image/vnd.dxf; 
format=ascii,5009,5008,0.0001\nCC-MAIN-2018-09,image/webp,14924,14918,0.0004\nCC-MAIN-2018-09,message/rfc822,22718,22632,0.0007\nCC-MAIN-2018-09,text/asp,452744,451452,0.0130\nCC-MAIN-2018-09,text/aspdotnet,170984,170168,0.0049\nCC-MAIN-2018-09,text/calendar,517893,517270,0.0148\nCC-MAIN-2018-09,text/css,6774,6769,0.0002\nCC-MAIN-2018-09,text/csv,10814,10801,0.0003\nCC-MAIN-2018-09,text/html,2330008752,2306706785,66.7918\nCC-MAIN-2018-09,text/markdown,17,17,0.0000\nCC-MAIN-2018-09,text/plain,826674,825213,0.0237\nCC-MAIN-2018-09,text/prs.lines.tag,2104,2088,0.0001\nCC-MAIN-2018-09,text/tab-separated-values,4093,4092,0.0001\nCC-MAIN-2018-09,text/troff,8783,8769,0.0003\nCC-MAIN-2018-09,text/turtle,20101,20074,0.0006\nCC-MAIN-2018-09,text/vtt,2076,2076,0.0001\nCC-MAIN-2018-09,text/x-c++src,2008,2008,0.0001\nCC-MAIN-2018-09,text/x-cgi,71928,71596,0.0021\nCC-MAIN-2018-09,text/x-chdr,3376,3374,0.0001\nCC-MAIN-2018-09,text/x-coldfusion,231656,230931,0.0066\nCC-MAIN-2018-09,text/x-csrc,9781,9779,0.0003\nCC-MAIN-2018-09,text/x-diff,15711,15706,0.0005\nCC-MAIN-2018-09,text/x-jsp,134487,134193,0.0039\nCC-MAIN-2018-09,text/x-log,16500,16499,0.0005\nCC-MAIN-2018-09,text/x-matlab,15628,15609,0.0004\nCC-MAIN-2018-09,text/x-perl,48910,48830,0.0014\nCC-MAIN-2018-09,text/x-php,3464866,3455752,0.0993\nCC-MAIN-2018-09,text/x-python,4257,4256,0.0001\nCC-MAIN-2018-09,text/x-vcalendar,9573,9572,0.0003\nCC-MAIN-2018-09,text/x-vcard,50748,50634,0.0015\nCC-MAIN-2018-09,text/x-web-markdown,3032,3032,0.0001\nCC-MAIN-2018-09,text/x-yaml,445,445,0.0000\nCC-MAIN-2018-09,video/mp4,31189,31001,0.0009\nCC-MAIN-2018-09,video/quicktime,8478,8440,0.0002\nCC-MAIN-2018-09,video/webm,50975,50864,0.0015\nCC-MAIN-2018-09,video/x-m4v,15471,15394,0.0004\nCC-MAIN-2018-13,<other>,350548,349468,0.0108\nCC-MAIN-2018-13,application/atom+xml,11984069,11978463,0.3707\nCC-MAIN-2018-13,application/epub+zip,33237,33067,0.0010\nCC-MAIN-2018-13,application/gpx+xml,2600,2599,0.0001\nCC-MAIN-2018-13,application/gzip,60098,
59942,0.0019\nCC-MAIN-2018-13,application/javascript,26201,25986,0.0008\nCC-MAIN-2018-13,application/json,231381,230389,0.0072\nCC-MAIN-2018-13,application/marc,9112,9112,0.0003\nCC-MAIN-2018-13,application/mbox,30498,30494,0.0009\nCC-MAIN-2018-13,application/msword,91849,91400,0.0028\nCC-MAIN-2018-13,application/octet-stream,360889,359227,0.0112\nCC-MAIN-2018-13,application/pdf,17184636,17123257,0.5316\nCC-MAIN-2018-13,application/pgp-signature,28810,28800,0.0009\nCC-MAIN-2018-13,application/pkcs7-signature,2571,2571,0.0001\nCC-MAIN-2018-13,application/postscript,20851,20804,0.0006\nCC-MAIN-2018-13,application/rdf+xml,489471,488930,0.0151\nCC-MAIN-2018-13,application/rss+xml,5237387,5213228,0.1620\nCC-MAIN-2018-13,application/rtf,20769,20734,0.0006\nCC-MAIN-2018-13,application/text,8060,8060,0.0002\nCC-MAIN-2018-13,application/vnd.android.package-archive,47250,47093,0.0015\nCC-MAIN-2018-13,application/vnd.google-earth.kml+xml,67901,67828,0.0021\nCC-MAIN-2018-13,application/vnd.google-earth.kmz,9105,9089,0.0003\nCC-MAIN-2018-13,application/vnd.ms-excel,28069,27854,0.0009\nCC-MAIN-2018-13,application/vnd.ms-powerpoint,14550,14519,0.0005\nCC-MAIN-2018-13,application/vnd.oasis.opendocument.spreadsheet,1989,1983,0.0001\nCC-MAIN-2018-13,application/vnd.oasis.opendocument.text,9098,9047,0.0003\nCC-MAIN-2018-13,application/vnd.openxmlformats-officedocument.presentationml.presentation,6159,6149,0.0002\nCC-MAIN-2018-13,application/vnd.openxmlformats-officedocument.spreadsheetml.sheet,13047,12938,0.0004\nCC-MAIN-2018-13,application/vnd.openxmlformats-officedocument.wordprocessingml.document,41431,41033,0.0013\nCC-MAIN-2018-13,application/x-bibtex-text-file,34278,34175,0.0011\nCC-MAIN-2018-13,application/x-bittorrent,10781,10489,0.0003\nCC-MAIN-2018-13,application/x-bzip2,2700,2682,0.0001\nCC-MAIN-2018-13,application/x-dosexec,10265,9788,0.0003\nCC-MAIN-2018-13,application/x-endnote-refer,14412,14408,0.0004\nCC-MAIN-2018-13,application/x-hdf,209,209,0.0000\nCC-MAIN-2018-13,app
lication/x-mobipocket-ebook,10954,10826,0.0003\nCC-MAIN-2018-13,application/x-ms-asx,19553,19527,0.0006\nCC-MAIN-2018-13,application/x-msdownload,8783,8722,0.0003\nCC-MAIN-2018-13,application/x-rar-compressed,19451,19335,0.0006\nCC-MAIN-2018-13,application/x-research-info-systems,29718,29709,0.0009\nCC-MAIN-2018-13,application/x-sh,13788,13767,0.0004\nCC-MAIN-2018-13,application/x-shockwave-flash,26661,26351,0.0008\nCC-MAIN-2018-13,application/x-stata-do,8150,8135,0.0003\nCC-MAIN-2018-13,application/x-tex,8525,8511,0.0003\nCC-MAIN-2018-13,application/x-tex-tfm,195,195,0.0000\nCC-MAIN-2018-13,application/x-tika-msoffice,49404,49345,0.0015\nCC-MAIN-2018-13,application/x-tika-ooxml,28918,28894,0.0009\nCC-MAIN-2018-13,application/x-wais-source,14844,14844,0.0005\nCC-MAIN-2018-13,application/x-xz,31762,31705,0.0010\nCC-MAIN-2018-13,application/xhtml+xml,916093244,909557676,28.3380\nCC-MAIN-2018-13,application/xml,1415872,1405169,0.0438\nCC-MAIN-2018-13,application/zip,186205,182451,0.0058\nCC-MAIN-2018-13,application/zlib,1691,1654,0.0001\nCC-MAIN-2018-13,audio/mp4,22502,22362,0.0007\nCC-MAIN-2018-13,audio/mpeg,159688,158361,0.0049\nCC-MAIN-2018-13,audio/vnd.wave,16634,16631,0.0005\nCC-MAIN-2018-13,audio/x-mpegurl,48494,48444,0.0015\nCC-MAIN-2018-13,image/gif,711214,703879,0.0220\nCC-MAIN-2018-13,image/jpeg,66271699,63577153,2.0500\nCC-MAIN-2018-13,image/png,7013508,6969339,0.2170\nCC-MAIN-2018-13,image/svg+xml,66071,65909,0.0020\nCC-MAIN-2018-13,image/tiff,9814,9801,0.0003\nCC-MAIN-2018-13,image/vnd.djvu,18891,18890,0.0006\nCC-MAIN-2018-13,image/vnd.dxf; 
format=ascii,3650,3649,0.0001\nCC-MAIN-2018-13,image/webp,10191,10187,0.0003\nCC-MAIN-2018-13,message/rfc822,30231,30195,0.0009\nCC-MAIN-2018-13,text/asp,424108,422186,0.0131\nCC-MAIN-2018-13,text/aspdotnet,160416,160005,0.0050\nCC-MAIN-2018-13,text/calendar,429354,429054,0.0133\nCC-MAIN-2018-13,text/css,8028,8019,0.0002\nCC-MAIN-2018-13,text/csv,18722,18615,0.0006\nCC-MAIN-2018-13,text/html,2198457800,2173776914,68.0061\nCC-MAIN-2018-13,text/markdown,1,1,0.0000\nCC-MAIN-2018-13,text/plain,726451,725058,0.0225\nCC-MAIN-2018-13,text/prs.lines.tag,1756,1755,0.0001\nCC-MAIN-2018-13,text/tab-separated-values,8672,8672,0.0003\nCC-MAIN-2018-13,text/troff,6279,6276,0.0002\nCC-MAIN-2018-13,text/turtle,9045,9037,0.0003\nCC-MAIN-2018-13,text/vtt,1638,1634,0.0001\nCC-MAIN-2018-13,text/x-c++src,1895,1893,0.0001\nCC-MAIN-2018-13,text/x-cgi,76608,76253,0.0024\nCC-MAIN-2018-13,text/x-chdr,5892,5886,0.0002\nCC-MAIN-2018-13,text/x-coldfusion,182863,181927,0.0057\nCC-MAIN-2018-13,text/x-csrc,12668,12659,0.0004\nCC-MAIN-2018-13,text/x-diff,20111,20069,0.0006\nCC-MAIN-2018-13,text/x-jsp,108138,107757,0.0033\nCC-MAIN-2018-13,text/x-log,14221,14154,0.0004\nCC-MAIN-2018-13,text/x-matlab,27409,27398,0.0008\nCC-MAIN-2018-13,text/x-perl,62862,62794,0.0019\nCC-MAIN-2018-13,text/x-php,3003084,2993631,0.0929\nCC-MAIN-2018-13,text/x-python,4561,4552,0.0001\nCC-MAIN-2018-13,text/x-vcalendar,9934,9934,0.0003\nCC-MAIN-2018-13,text/x-vcard,37067,36993,0.0011\nCC-MAIN-2018-13,text/x-web-markdown,2849,2848,0.0001\nCC-MAIN-2018-13,text/x-yaml,341,341,0.0000\nCC-MAIN-2018-13,video/mp4,28515,28390,0.0009\nCC-MAIN-2018-13,video/quicktime,6887,6885,0.0002\nCC-MAIN-2018-13,video/webm,34081,34038,0.0011\nCC-MAIN-2018-13,video/x-m4v,11176,11121,0.0003\nCC-MAIN-2018-17,<other>,279500,279065,0.0090\nCC-MAIN-2018-17,application/atom+xml,5496197,5494403,0.1772\nCC-MAIN-2018-17,application/epub+zip,19641,19498,0.0006\nCC-MAIN-2018-17,application/gpx+xml,2070,2070,0.0001\nCC-MAIN-2018-17,application/gzip,77959,7693
8,0.0025\nCC-MAIN-2018-17,application/javascript,18009,17986,0.0006\nCC-MAIN-2018-17,application/json,176678,176572,0.0057\nCC-MAIN-2018-17,application/marc,18040,18040,0.0006\nCC-MAIN-2018-17,application/mbox,55258,55256,0.0018\nCC-MAIN-2018-17,application/msword,95814,95453,0.0031\nCC-MAIN-2018-17,application/octet-stream,307808,307030,0.0099\nCC-MAIN-2018-17,application/pdf,14383572,14350371,0.4638\nCC-MAIN-2018-17,application/pgp-signature,24609,24566,0.0008\nCC-MAIN-2018-17,application/pkcs7-signature,2013,2013,0.0001\nCC-MAIN-2018-17,application/postscript,13504,13498,0.0004\nCC-MAIN-2018-17,application/rdf+xml,297524,297310,0.0096\nCC-MAIN-2018-17,application/rss+xml,5818908,5808461,0.1876\nCC-MAIN-2018-17,application/rtf,20909,20646,0.0007\nCC-MAIN-2018-17,application/text,6702,6702,0.0002\nCC-MAIN-2018-17,application/vnd.android.package-archive,52574,52407,0.0017\nCC-MAIN-2018-17,application/vnd.google-earth.kml+xml,48801,48770,0.0016\nCC-MAIN-2018-17,application/vnd.google-earth.kmz,6770,6770,0.0002\nCC-MAIN-2018-17,application/vnd.ms-excel,30215,29553,0.0010\nCC-MAIN-2018-17,application/vnd.ms-powerpoint,17044,17018,0.0005\nCC-MAIN-2018-17,application/vnd.oasis.opendocument.spreadsheet,1740,1739,0.0001\nCC-MAIN-2018-17,application/vnd.oasis.opendocument.text,8540,8538,0.0003\nCC-MAIN-2018-17,application/vnd.openxmlformats-officedocument.presentationml.presentation,6851,6842,0.0002\nCC-MAIN-2018-17,application/vnd.openxmlformats-officedocument.spreadsheetml.sheet,11673,11607,0.0004\nCC-MAIN-2018-17,application/vnd.openxmlformats-officedocument.wordprocessingml.document,41195,41017,0.0013\nCC-MAIN-2018-17,application/x-bibtex-text-file,24846,24832,0.0008\nCC-MAIN-2018-17,application/x-bittorrent,10280,10133,0.0003\nCC-MAIN-2018-17,application/x-bzip2,2554,2540,0.0001\nCC-MAIN-2018-17,application/x-dosexec,7536,7217,0.0002\nCC-MAIN-2018-17,application/x-endnote-refer,11172,11172,0.0004\nCC-MAIN-2018-17,application/x-hdf,141,141,0.0000\nCC-MAIN-2018-17,applic
ation/x-mobipocket-ebook,7316,7316,0.0002\nCC-MAIN-2018-17,application/x-ms-asx,13210,13157,0.0004\nCC-MAIN-2018-17,application/x-msdownload,6082,6050,0.0002\nCC-MAIN-2018-17,application/x-rar-compressed,19559,19411,0.0006\nCC-MAIN-2018-17,application/x-research-info-systems,18141,18140,0.0006\nCC-MAIN-2018-17,application/x-sh,15530,15523,0.0005\nCC-MAIN-2018-17,application/x-shockwave-flash,23977,23835,0.0008\nCC-MAIN-2018-17,application/x-stata-do,4391,4389,0.0001\nCC-MAIN-2018-17,application/x-tex,3272,3272,0.0001\nCC-MAIN-2018-17,application/x-tex-tfm,176,176,0.0000\nCC-MAIN-2018-17,application/x-tika-msoffice,56476,56444,0.0018\nCC-MAIN-2018-17,application/x-tika-ooxml,33713,33684,0.0011\nCC-MAIN-2018-17,application/x-wais-source,2654,2654,0.0001\nCC-MAIN-2018-17,application/x-xz,37649,37643,0.0012\nCC-MAIN-2018-17,application/xhtml+xml,925495160,920260861,29.8416\nCC-MAIN-2018-17,application/xml,1358892,1351715,0.0438\nCC-MAIN-2018-17,application/zip,154501,153892,0.0050\nCC-MAIN-2018-17,application/zlib,1357,1339,0.0000\nCC-MAIN-2018-17,audio/mp4,17337,17220,0.0006\nCC-MAIN-2018-17,audio/mpeg,162872,162065,0.0053\nCC-MAIN-2018-17,audio/vnd.wave,21611,21611,0.0007\nCC-MAIN-2018-17,audio/x-mpegurl,23135,23109,0.0007\nCC-MAIN-2018-17,image/gif,220198,218975,0.0071\nCC-MAIN-2018-17,image/jpeg,15914923,15519573,0.5132\nCC-MAIN-2018-17,image/png,1827926,1822135,0.0589\nCC-MAIN-2018-17,image/svg+xml,14116,14046,0.0005\nCC-MAIN-2018-17,image/tiff,9708,9706,0.0003\nCC-MAIN-2018-17,image/vnd.djvu,15901,15901,0.0005\nCC-MAIN-2018-17,image/vnd.dxf; 
format=ascii,2811,2810,0.0001\nCC-MAIN-2018-17,image/webp,3627,3626,0.0001\nCC-MAIN-2018-17,message/rfc822,66349,66338,0.0021\nCC-MAIN-2018-17,text/asp,410213,409241,0.0132\nCC-MAIN-2018-17,text/aspdotnet,140229,139886,0.0045\nCC-MAIN-2018-17,text/calendar,469836,469435,0.0151\nCC-MAIN-2018-17,text/css,6291,6259,0.0002\nCC-MAIN-2018-17,text/csv,13317,12977,0.0004\nCC-MAIN-2018-17,text/html,2123419429,2103571073,68.4675\nCC-MAIN-2018-17,text/markdown,8,8,0.0000\nCC-MAIN-2018-17,text/plain,574831,573984,0.0185\nCC-MAIN-2018-17,text/prs.lines.tag,1631,1631,0.0001\nCC-MAIN-2018-17,text/tab-separated-values,4805,4805,0.0002\nCC-MAIN-2018-17,text/troff,1125,1125,0.0000\nCC-MAIN-2018-17,text/turtle,20883,20876,0.0007\nCC-MAIN-2018-17,text/vtt,2436,2436,0.0001\nCC-MAIN-2018-17,text/x-c++src,1023,1023,0.0000\nCC-MAIN-2018-17,text/x-cgi,58692,58430,0.0019\nCC-MAIN-2018-17,text/x-chdr,1740,1740,0.0001\nCC-MAIN-2018-17,text/x-coldfusion,211284,210606,0.0068\nCC-MAIN-2018-17,text/x-csrc,4646,4645,0.0001\nCC-MAIN-2018-17,text/x-diff,6932,6930,0.0002\nCC-MAIN-2018-17,text/x-jsp,122277,122079,0.0039\nCC-MAIN-2018-17,text/x-log,9679,9679,0.0003\nCC-MAIN-2018-17,text/x-matlab,15060,15056,0.0005\nCC-MAIN-2018-17,text/x-perl,28227,28186,0.0009\nCC-MAIN-2018-17,text/x-php,2753341,2745434,0.0888\nCC-MAIN-2018-17,text/x-python,3204,3204,0.0001\nCC-MAIN-2018-17,text/x-vcalendar,8587,8587,0.0003\nCC-MAIN-2018-17,text/x-vcard,42631,42616,0.0014\nCC-MAIN-2018-17,text/x-web-markdown,2737,2737,0.0001\nCC-MAIN-2018-17,text/x-yaml,475,475,0.0000\nCC-MAIN-2018-17,video/mp4,19438,19318,0.0006\nCC-MAIN-2018-17,video/quicktime,6001,6001,0.0002\nCC-MAIN-2018-17,video/webm,33712,33660,0.0011\nCC-MAIN-2018-17,video/x-m4v,10052,10006,0.0003\nCC-MAIN-2018-22,<other>,245564,245147,0.0088\nCC-MAIN-2018-22,application/atom+xml,4892432,4890575,0.1755\nCC-MAIN-2018-22,application/epub+zip,19224,19136,0.0007\nCC-MAIN-2018-22,application/gpx+xml,1213,1213,0.0000\nCC-MAIN-2018-22,application/gzip,57865,55344,0.00
21\nCC-MAIN-2018-22,application/javascript,23695,23673,0.0008\nCC-MAIN-2018-22,application/json,198010,197881,0.0071\nCC-MAIN-2018-22,application/marc,10261,10261,0.0004\nCC-MAIN-2018-22,application/mbox,33865,33864,0.0012\nCC-MAIN-2018-22,application/msword,91252,91033,0.0033\nCC-MAIN-2018-22,application/octet-stream,317895,316124,0.0114\nCC-MAIN-2018-22,application/pdf,11885965,11849949,0.4263\nCC-MAIN-2018-22,application/pgp-signature,56351,56349,0.0020\nCC-MAIN-2018-22,application/pkcs7-signature,2493,2493,0.0001\nCC-MAIN-2018-22,application/postscript,8606,8593,0.0003\nCC-MAIN-2018-22,application/rdf+xml,264643,264450,0.0095\nCC-MAIN-2018-22,application/rss+xml,4222106,4212573,0.1514\nCC-MAIN-2018-22,application/rtf,21835,21810,0.0008\nCC-MAIN-2018-22,application/text,10012,10012,0.0004\nCC-MAIN-2018-22,application/vnd.android.package-archive,26956,26632,0.0010\nCC-MAIN-2018-22,application/vnd.google-earth.kml+xml,52549,52511,0.0019\nCC-MAIN-2018-22,application/vnd.google-earth.kmz,7638,7636,0.0003\nCC-MAIN-2018-22,application/vnd.ms-excel,27589,27454,0.0010\nCC-MAIN-2018-22,application/vnd.ms-powerpoint,13242,13228,0.0005\nCC-MAIN-2018-22,application/vnd.oasis.opendocument.spreadsheet,2006,2006,0.0001\nCC-MAIN-2018-22,application/vnd.oasis.opendocument.text,8929,8924,0.0003\nCC-MAIN-2018-22,application/vnd.openxmlformats-officedocument.presentationml.presentation,6467,6430,0.0002\nCC-MAIN-2018-22,application/vnd.openxmlformats-officedocument.spreadsheetml.sheet,13862,13769,0.0005\nCC-MAIN-2018-22,application/vnd.openxmlformats-officedocument.wordprocessingml.document,42363,42151,0.0015\nCC-MAIN-2018-22,application/x-bibtex-text-file,23901,23899,0.0009\nCC-MAIN-2018-22,application/x-bittorrent,12102,11901,0.0004\nCC-MAIN-2018-22,application/x-bzip2,2839,2829,0.0001\nCC-MAIN-2018-22,application/x-dosexec,8696,8354,0.0003\nCC-MAIN-2018-22,application/x-endnote-refer,17805,17805,0.0006\nCC-MAIN-2018-22,application/x-hdf,872,872,0.0000\nCC-MAIN-2018-22,application/
x-mobipocket-ebook,4045,4023,0.0001\nCC-MAIN-2018-22,application/x-ms-asx,6986,6979,0.0003\nCC-MAIN-2018-22,application/x-msdownload,4752,4676,0.0002\nCC-MAIN-2018-22,application/x-rar-compressed,16721,16640,0.0006\nCC-MAIN-2018-22,application/x-research-info-systems,25884,25883,0.0009\nCC-MAIN-2018-22,application/x-sh,11742,11719,0.0004\nCC-MAIN-2018-22,application/x-shockwave-flash,20901,20868,0.0007\nCC-MAIN-2018-22,application/x-stata-do,3934,3932,0.0001\nCC-MAIN-2018-22,application/x-tex,1546,1543,0.0001\nCC-MAIN-2018-22,application/x-tex-tfm,2,2,0.0000\nCC-MAIN-2018-22,application/x-tika-msoffice,44625,44592,0.0016\nCC-MAIN-2018-22,application/x-tika-ooxml,33622,33595,0.0012\nCC-MAIN-2018-22,application/x-wais-source,5441,5441,0.0002\nCC-MAIN-2018-22,application/x-xz,64098,64092,0.0023\nCC-MAIN-2018-22,application/xhtml+xml,792930117,787575940,28.4369\nCC-MAIN-2018-22,application/xml,1271044,1264937,0.0456\nCC-MAIN-2018-22,application/zip,127753,127061,0.0046\nCC-MAIN-2018-22,application/zlib,960,936,0.0000\nCC-MAIN-2018-22,audio/mp4,21643,21460,0.0008\nCC-MAIN-2018-22,audio/mpeg,193509,192338,0.0069\nCC-MAIN-2018-22,audio/vnd.wave,15661,15659,0.0006\nCC-MAIN-2018-22,audio/x-mpegurl,17657,17619,0.0006\nCC-MAIN-2018-22,image/gif,252858,251272,0.0091\nCC-MAIN-2018-22,image/jpeg,24493811,24264663,0.8784\nCC-MAIN-2018-22,image/png,2994372,2984908,0.1074\nCC-MAIN-2018-22,image/svg+xml,35306,35283,0.0013\nCC-MAIN-2018-22,image/tiff,7572,7565,0.0003\nCC-MAIN-2018-22,image/vnd.djvu,10166,10165,0.0004\nCC-MAIN-2018-22,image/vnd.dxf; 
format=ascii,1595,1595,0.0001\nCC-MAIN-2018-22,image/webp,6698,6694,0.0002\nCC-MAIN-2018-22,message/rfc822,30414,30397,0.0011\nCC-MAIN-2018-22,text/asp,344448,342578,0.0124\nCC-MAIN-2018-22,text/aspdotnet,134770,134287,0.0048\nCC-MAIN-2018-22,text/calendar,421984,421630,0.0151\nCC-MAIN-2018-22,text/css,7552,7550,0.0003\nCC-MAIN-2018-22,text/csv,8739,8714,0.0003\nCC-MAIN-2018-22,text/html,1938438066,1916235134,69.5182\nCC-MAIN-2018-22,text/markdown,16,16,0.0000\nCC-MAIN-2018-22,text/plain,386411,385459,0.0139\nCC-MAIN-2018-22,text/prs.lines.tag,1367,1364,0.0000\nCC-MAIN-2018-22,text/tab-separated-values,3144,3144,0.0001\nCC-MAIN-2018-22,text/troff,1612,1591,0.0001\nCC-MAIN-2018-22,text/turtle,13710,13696,0.0005\nCC-MAIN-2018-22,text/vtt,2046,2045,0.0001\nCC-MAIN-2018-22,text/x-c++src,2363,2363,0.0001\nCC-MAIN-2018-22,text/x-cgi,62326,61391,0.0022\nCC-MAIN-2018-22,text/x-chdr,1271,1270,0.0000\nCC-MAIN-2018-22,text/x-coldfusion,181994,181096,0.0065\nCC-MAIN-2018-22,text/x-csrc,3583,3566,0.0001\nCC-MAIN-2018-22,text/x-diff,4955,4954,0.0002\nCC-MAIN-2018-22,text/x-jsp,99072,98825,0.0036\nCC-MAIN-2018-22,text/x-log,5348,5348,0.0002\nCC-MAIN-2018-22,text/x-matlab,12784,12769,0.0005\nCC-MAIN-2018-22,text/x-perl,25458,25393,0.0009\nCC-MAIN-2018-22,text/x-php,2810721,2798973,0.1008\nCC-MAIN-2018-22,text/x-python,2062,2055,0.0001\nCC-MAIN-2018-22,text/x-vcalendar,8654,8652,0.0003\nCC-MAIN-2018-22,text/x-vcard,33364,33319,0.0012\nCC-MAIN-2018-22,text/x-web-markdown,2395,2392,0.0001\nCC-MAIN-2018-22,text/x-yaml,126,126,0.0000\nCC-MAIN-2018-22,video/mp4,26579,26468,0.0010\nCC-MAIN-2018-22,video/quicktime,7167,7163,0.0003\nCC-MAIN-2018-22,video/webm,34252,34203,0.0012\nCC-MAIN-2018-22,video/x-m4v,13130,13111,0.0005\nCC-MAIN-2018-26,<other>,425550,424450,0.0139\nCC-MAIN-2018-26,application/atom+xml,5623155,5621236,0.1832\nCC-MAIN-2018-26,application/epub+zip,32260,31966,0.0011\nCC-MAIN-2018-26,application/gpx+xml,3110,3110,0.0001\nCC-MAIN-2018-26,application/gzip,91815,89276,0.0030
\nCC-MAIN-2018-26,application/javascript,17059,17038,0.0006\nCC-MAIN-2018-26,application/json,259845,259517,0.0085\nCC-MAIN-2018-26,application/marc,10598,10598,0.0003\nCC-MAIN-2018-26,application/mbox,53755,53755,0.0018\nCC-MAIN-2018-26,application/msword,98412,98113,0.0032\nCC-MAIN-2018-26,application/octet-stream,392685,390458,0.0128\nCC-MAIN-2018-26,application/pdf,17213107,17177496,0.5608\nCC-MAIN-2018-26,application/pgp-signature,62066,62060,0.0020\nCC-MAIN-2018-26,application/pkcs7-signature,3698,3698,0.0001\nCC-MAIN-2018-26,application/postscript,18778,18764,0.0006\nCC-MAIN-2018-26,application/rdf+xml,354007,353773,0.0115\nCC-MAIN-2018-26,application/rss+xml,5001589,4990204,0.1629\nCC-MAIN-2018-26,application/rtf,22413,22393,0.0007\nCC-MAIN-2018-26,application/text,10611,10611,0.0003\nCC-MAIN-2018-26,application/vnd.android.package-archive,23777,23530,0.0008\nCC-MAIN-2018-26,application/vnd.google-earth.kml+xml,79794,79740,0.0026\nCC-MAIN-2018-26,application/vnd.google-earth.kmz,20350,20339,0.0007\nCC-MAIN-2018-26,application/vnd.ms-excel,29641,29527,0.0010\nCC-MAIN-2018-26,application/vnd.ms-powerpoint,17721,17617,0.0006\nCC-MAIN-2018-26,application/vnd.oasis.opendocument.spreadsheet,2045,2044,0.0001\nCC-MAIN-2018-26,application/vnd.oasis.opendocument.text,10715,10709,0.0003\nCC-MAIN-2018-26,application/vnd.openxmlformats-officedocument.presentationml.presentation,8864,8848,0.0003\nCC-MAIN-2018-26,application/vnd.openxmlformats-officedocument.spreadsheetml.sheet,21242,21072,0.0007\nCC-MAIN-2018-26,application/vnd.openxmlformats-officedocument.wordprocessingml.document,40214,40054,0.0013\nCC-MAIN-2018-26,application/x-bibtex-text-file,41817,41796,0.0014\nCC-MAIN-2018-26,application/x-bittorrent,14519,14245,0.0005\nCC-MAIN-2018-26,application/x-bzip2,4470,4455,0.0001\nCC-MAIN-2018-26,application/x-dosexec,9418,8954,0.0003\nCC-MAIN-2018-26,application/x-endnote-refer,20327,20326,0.0007\nCC-MAIN-2018-26,application/x-hdf,515,515,0.0000\nCC-MAIN-2018-26,applicat
ion/x-mobipocket-ebook,10161,10147,0.0003\nCC-MAIN-2018-26,application/x-ms-asx,25337,25332,0.0008\nCC-MAIN-2018-26,application/x-msdownload,6348,6305,0.0002\nCC-MAIN-2018-26,application/x-rar-compressed,20476,20279,0.0007\nCC-MAIN-2018-26,application/x-research-info-systems,31082,31082,0.0010\nCC-MAIN-2018-26,application/x-sh,20575,20551,0.0007\nCC-MAIN-2018-26,application/x-shockwave-flash,26208,26161,0.0009\nCC-MAIN-2018-26,application/x-stata-do,4076,4058,0.0001\nCC-MAIN-2018-26,application/x-tex,6786,6785,0.0002\nCC-MAIN-2018-26,application/x-tex-tfm,873,873,0.0000\nCC-MAIN-2018-26,application/x-tika-msoffice,51935,51912,0.0017\nCC-MAIN-2018-26,application/x-tika-ooxml,34389,34374,0.0011\nCC-MAIN-2018-26,application/x-wais-source,7786,7786,0.0003\nCC-MAIN-2018-26,application/x-xz,66941,66923,0.0022\nCC-MAIN-2018-26,application/xhtml+xml,870780523,862262319,28.3696\nCC-MAIN-2018-26,application/xml,2328094,2321622,0.0758\nCC-MAIN-2018-26,application/zip,181652,180770,0.0059\nCC-MAIN-2018-26,application/zlib,1715,1671,0.0001\nCC-MAIN-2018-26,audio/mp4,20716,20485,0.0007\nCC-MAIN-2018-26,audio/mpeg,160269,159081,0.0052\nCC-MAIN-2018-26,audio/vnd.wave,19220,19182,0.0006\nCC-MAIN-2018-26,audio/x-mpegurl,32084,32070,0.0010\nCC-MAIN-2018-26,image/gif,332190,330349,0.0108\nCC-MAIN-2018-26,image/jpeg,29371045,29181665,0.9569\nCC-MAIN-2018-26,image/png,4075555,4061273,0.1328\nCC-MAIN-2018-26,image/svg+xml,47931,47895,0.0016\nCC-MAIN-2018-26,image/tiff,8360,8354,0.0003\nCC-MAIN-2018-26,image/vnd.djvu,20603,20600,0.0007\nCC-MAIN-2018-26,image/vnd.dxf; 
format=ascii,2726,2724,0.0001\nCC-MAIN-2018-26,image/webp,11107,11104,0.0004\nCC-MAIN-2018-26,message/rfc822,105608,105534,0.0034\nCC-MAIN-2018-26,text/asp,371789,369942,0.0121\nCC-MAIN-2018-26,text/aspdotnet,234664,234143,0.0076\nCC-MAIN-2018-26,text/calendar,529988,529404,0.0173\nCC-MAIN-2018-26,text/css,7030,7020,0.0002\nCC-MAIN-2018-26,text/csv,31507,31500,0.0010\nCC-MAIN-2018-26,text/html,2125724328,2100370754,69.2550\nCC-MAIN-2018-26,text/markdown,1,1,0.0000\nCC-MAIN-2018-26,text/plain,884887,883737,0.0288\nCC-MAIN-2018-26,text/prs.lines.tag,5905,5904,0.0002\nCC-MAIN-2018-26,text/tab-separated-values,22060,22060,0.0007\nCC-MAIN-2018-26,text/troff,22484,22459,0.0007\nCC-MAIN-2018-26,text/turtle,10412,10393,0.0003\nCC-MAIN-2018-26,text/vtt,2207,2207,0.0001\nCC-MAIN-2018-26,text/x-c++src,1913,1913,0.0001\nCC-MAIN-2018-26,text/x-cgi,66411,66143,0.0022\nCC-MAIN-2018-26,text/x-chdr,7949,7943,0.0003\nCC-MAIN-2018-26,text/x-coldfusion,159762,158987,0.0052\nCC-MAIN-2018-26,text/x-csrc,15156,15145,0.0005\nCC-MAIN-2018-26,text/x-diff,35617,35606,0.0012\nCC-MAIN-2018-26,text/x-jsp,123103,122850,0.0040\nCC-MAIN-2018-26,text/x-log,17642,17642,0.0006\nCC-MAIN-2018-26,text/x-matlab,28425,28422,0.0009\nCC-MAIN-2018-26,text/x-perl,79532,79392,0.0026\nCC-MAIN-2018-26,text/x-php,3040706,3033632,0.0991\nCC-MAIN-2018-26,text/x-python,5561,5560,0.0002\nCC-MAIN-2018-26,text/x-vcalendar,15089,15087,0.0005\nCC-MAIN-2018-26,text/x-vcard,38864,38815,0.0013\nCC-MAIN-2018-26,text/x-web-markdown,3602,3591,0.0001\nCC-MAIN-2018-26,text/x-yaml,673,673,0.0000\nCC-MAIN-2018-26,video/mp4,27129,27037,0.0009\nCC-MAIN-2018-26,video/quicktime,5943,5937,0.0002\nCC-MAIN-2018-26,video/webm,32689,32627,0.0011\nCC-MAIN-2018-26,video/x-m4v,8906,8884,0.0003\nCC-MAIN-2018-30,<other>,348164,346156,0.0107\nCC-MAIN-2018-30,application/atom+xml,6517097,6513533,0.1997\nCC-MAIN-2018-30,application/epub+zip,30048,29727,0.0009\nCC-MAIN-2018-30,application/gpx+xml,2595,2592,0.0001\nCC-MAIN-2018-30,application/gzip,96
061,95557,0.0029\nCC-MAIN-2018-30,application/javascript,17908,17879,0.0005\nCC-MAIN-2018-30,application/json,171547,171361,0.0053\nCC-MAIN-2018-30,application/marc,514,514,0.0000\nCC-MAIN-2018-30,application/mbox,8378,8365,0.0003\nCC-MAIN-2018-30,application/msword,118185,117778,0.0036\nCC-MAIN-2018-30,application/octet-stream,358866,357608,0.0110\nCC-MAIN-2018-30,application/pdf,17699076,17641285,0.5423\nCC-MAIN-2018-30,application/pgp-signature,80489,80480,0.0025\nCC-MAIN-2018-30,application/pkcs7-signature,2881,2880,0.0001\nCC-MAIN-2018-30,application/postscript,16497,16460,0.0005\nCC-MAIN-2018-30,application/rdf+xml,329267,328805,0.0101\nCC-MAIN-2018-30,application/rss+xml,4038331,4023923,0.1237\nCC-MAIN-2018-30,application/rtf,22169,22126,0.0007\nCC-MAIN-2018-30,application/text,7782,7780,0.0002\nCC-MAIN-2018-30,application/vnd.android.package-archive,26578,26119,0.0008\nCC-MAIN-2018-30,application/vnd.google-earth.kml+xml,66484,66463,0.0020\nCC-MAIN-2018-30,application/vnd.google-earth.kmz,11098,11077,0.0003\nCC-MAIN-2018-30,application/vnd.ms-excel,44612,44448,0.0014\nCC-MAIN-2018-30,application/vnd.ms-powerpoint,15350,15236,0.0005\nCC-MAIN-2018-30,application/vnd.oasis.opendocument.spreadsheet,2262,2236,0.0001\nCC-MAIN-2018-30,application/vnd.oasis.opendocument.text,10018,10014,0.0003\nCC-MAIN-2018-30,application/vnd.openxmlformats-officedocument.presentationml.presentation,7557,7539,0.0002\nCC-MAIN-2018-30,application/vnd.openxmlformats-officedocument.spreadsheetml.sheet,20464,20289,0.0006\nCC-MAIN-2018-30,application/vnd.openxmlformats-officedocument.wordprocessingml.document,55095,54796,0.0017\nCC-MAIN-2018-30,application/x-bibtex-text-file,28747,28666,0.0009\nCC-MAIN-2018-30,application/x-bittorrent,17903,17560,0.0005\nCC-MAIN-2018-30,application/x-bzip2,5299,5283,0.0002\nCC-MAIN-2018-30,application/x-dosexec,16372,14161,0.0005\nCC-MAIN-2018-30,application/x-endnote-refer,13197,13195,0.0004\nCC-MAIN-2018-30,application/x-hdf,768,768,0.0000\nCC-MAIN-2018
-30,application/x-mobipocket-ebook,9339,9307,0.0003\nCC-MAIN-2018-30,application/x-ms-asx,15121,15038,0.0005\nCC-MAIN-2018-30,application/x-msdownload,5121,5053,0.0002\nCC-MAIN-2018-30,application/x-rar-compressed,24885,24791,0.0008\nCC-MAIN-2018-30,application/x-research-info-systems,20343,20336,0.0006\nCC-MAIN-2018-30,application/x-sh,10511,10491,0.0003\nCC-MAIN-2018-30,application/x-shockwave-flash,88652,88154,0.0027\nCC-MAIN-2018-30,application/x-stata-do,3946,3923,0.0001\nCC-MAIN-2018-30,application/x-tex,2510,2502,0.0001\nCC-MAIN-2018-30,application/x-tex-tfm,10,10,0.0000\nCC-MAIN-2018-30,application/x-tika-msoffice,49376,49347,0.0015\nCC-MAIN-2018-30,application/x-tika-ooxml,30949,30916,0.0009\nCC-MAIN-2018-30,application/x-wais-source,29799,29799,0.0009\nCC-MAIN-2018-30,application/x-xz,89103,89087,0.0027\nCC-MAIN-2018-30,application/xhtml+xml,912662972,901617777,27.9618\nCC-MAIN-2018-30,application/xml,1552076,1542277,0.0476\nCC-MAIN-2018-30,application/zip,177241,173740,0.0054\nCC-MAIN-2018-30,application/zlib,3995,3966,0.0001\nCC-MAIN-2018-30,audio/mp4,24183,23863,0.0007\nCC-MAIN-2018-30,audio/mpeg,268266,266249,0.0082\nCC-MAIN-2018-30,audio/vnd.wave,14136,14129,0.0004\nCC-MAIN-2018-30,audio/x-mpegurl,39838,39789,0.0012\nCC-MAIN-2018-30,image/gif,402760,400649,0.0123\nCC-MAIN-2018-30,image/jpeg,26995236,25536677,0.8271\nCC-MAIN-2018-30,image/png,2648171,2637294,0.0811\nCC-MAIN-2018-30,image/svg+xml,58978,58945,0.0018\nCC-MAIN-2018-30,image/tiff,8501,8491,0.0003\nCC-MAIN-2018-30,image/vnd.djvu,12253,12252,0.0004\nCC-MAIN-2018-30,image/vnd.dxf; 
format=ascii,5065,5064,0.0002\nCC-MAIN-2018-30,image/webp,5166,5165,0.0002\nCC-MAIN-2018-30,message/rfc822,48722,48701,0.0015\nCC-MAIN-2018-30,text/asp,390463,388373,0.0120\nCC-MAIN-2018-30,text/aspdotnet,148236,147558,0.0045\nCC-MAIN-2018-30,text/calendar,470557,469885,0.0144\nCC-MAIN-2018-30,text/css,8868,8863,0.0003\nCC-MAIN-2018-30,text/csv,13316,13312,0.0004\nCC-MAIN-2018-30,text/html,2282746079,2247854485,69.9380\nCC-MAIN-2018-30,text/markdown,4,4,0.0000\nCC-MAIN-2018-30,text/plain,555762,553918,0.0170\nCC-MAIN-2018-30,text/prs.lines.tag,2059,2058,0.0001\nCC-MAIN-2018-30,text/tab-separated-values,2151,2151,0.0001\nCC-MAIN-2018-30,text/troff,1529,1529,0.0000\nCC-MAIN-2018-30,text/turtle,1504,1492,0.0000\nCC-MAIN-2018-30,text/vtt,2286,2284,0.0001\nCC-MAIN-2018-30,text/x-c++src,1466,1466,0.0000\nCC-MAIN-2018-30,text/x-cgi,115887,115342,0.0036\nCC-MAIN-2018-30,text/x-chdr,5352,5352,0.0002\nCC-MAIN-2018-30,text/x-coldfusion,113827,112936,0.0035\nCC-MAIN-2018-30,text/x-csrc,8610,8603,0.0003\nCC-MAIN-2018-30,text/x-diff,12160,12149,0.0004\nCC-MAIN-2018-30,text/x-jsp,126514,126254,0.0039\nCC-MAIN-2018-30,text/x-log,17061,17060,0.0005\nCC-MAIN-2018-30,text/x-matlab,13368,13364,0.0004\nCC-MAIN-2018-30,text/x-perl,35431,35302,0.0011\nCC-MAIN-2018-30,text/x-php,3473784,3461456,0.1064\nCC-MAIN-2018-30,text/x-python,4290,4288,0.0001\nCC-MAIN-2018-30,text/x-vcalendar,9823,9823,0.0003\nCC-MAIN-2018-30,text/x-vcard,41622,41479,0.0013\nCC-MAIN-2018-30,text/x-web-markdown,3370,3321,0.0001\nCC-MAIN-2018-30,text/x-yaml,395,395,0.0000\nCC-MAIN-2018-30,video/mp4,61134,60929,0.0019\nCC-MAIN-2018-30,video/quicktime,7298,7272,0.0002\nCC-MAIN-2018-30,video/webm,36109,36016,0.0011\nCC-MAIN-2018-30,video/x-m4v,13002,12934,0.0004\nCC-MAIN-2018-34,<other>,1060971,1055524,0.0395\nCC-MAIN-2018-34,application/atom+xml,2968509,2961679,0.1105\nCC-MAIN-2018-34,application/epub+zip,17659,17516,0.0007\nCC-MAIN-2018-34,application/gpx+xml,1529,1528,0.0001\nCC-MAIN-2018-34,application/gzip,308924,308
253,0.0115\nCC-MAIN-2018-34,application/javascript,41557,41421,0.0015\nCC-MAIN-2018-34,application/json,169974,169478,0.0063\nCC-MAIN-2018-34,application/marc,814,814,0.0000\nCC-MAIN-2018-34,application/mbox,9371,9327,0.0003\nCC-MAIN-2018-34,application/msword,913594,913047,0.0340\nCC-MAIN-2018-34,application/octet-stream,306719,305499,0.0114\nCC-MAIN-2018-34,application/pdf,12558985,12525324,0.4675\nCC-MAIN-2018-34,application/pgp-signature,13476,13457,0.0005\nCC-MAIN-2018-34,application/pkcs7-signature,1545,1544,0.0001\nCC-MAIN-2018-34,application/postscript,20667,20649,0.0008\nCC-MAIN-2018-34,application/rdf+xml,252515,251903,0.0094\nCC-MAIN-2018-34,application/rss+xml,3490681,3473439,0.1299\nCC-MAIN-2018-34,application/rtf,75391,75346,0.0028\nCC-MAIN-2018-34,application/text,8382,8382,0.0003\nCC-MAIN-2018-34,application/vnd.android.package-archive,15258,15108,0.0006\nCC-MAIN-2018-34,application/vnd.google-earth.kml+xml,53207,53112,0.0020\nCC-MAIN-2018-34,application/vnd.google-earth.kmz,8006,7995,0.0003\nCC-MAIN-2018-34,application/vnd.ms-excel,221255,220921,0.0082\nCC-MAIN-2018-34,application/vnd.ms-powerpoint,132911,132846,0.0049\nCC-MAIN-2018-34,application/vnd.oasis.opendocument.spreadsheet,1280,1280,0.0000\nCC-MAIN-2018-34,application/vnd.oasis.opendocument.text,7363,7360,0.0003\nCC-MAIN-2018-34,application/vnd.openxmlformats-officedocument.presentationml.presentation,68655,68613,0.0026\nCC-MAIN-2018-34,application/vnd.openxmlformats-officedocument.spreadsheetml.sheet,117665,117491,0.0044\nCC-MAIN-2018-34,application/vnd.openxmlformats-officedocument.wordprocessingml.document,432344,432054,0.0161\nCC-MAIN-2018-34,application/x-bibtex-text-file,25326,25308,0.0009\nCC-MAIN-2018-34,application/x-bittorrent,32411,32165,0.0012\nCC-MAIN-2018-34,application/x-bzip2,36232,36110,0.0013\nCC-MAIN-2018-34,application/x-dosexec,112733,111299,0.0042\nCC-MAIN-2018-34,application/x-endnote-refer,15957,15953,0.0006\nCC-MAIN-2018-34,application/x-hdf,236,236,0.0000\nCC-MAIN-
2018-34,application/x-mobipocket-ebook,7428,7422,0.0003\nCC-MAIN-2018-34,application/x-ms-asx,9138,9047,0.0003\nCC-MAIN-2018-34,application/x-msdownload,7304,7262,0.0003\nCC-MAIN-2018-34,application/x-rar-compressed,149006,148897,0.0055\nCC-MAIN-2018-34,application/x-research-info-systems,27954,27942,0.0010\nCC-MAIN-2018-34,application/x-sh,6351,6337,0.0002\nCC-MAIN-2018-34,application/x-shockwave-flash,146629,146166,0.0055\nCC-MAIN-2018-34,application/x-stata-do,3292,3274,0.0001\nCC-MAIN-2018-34,application/x-tex,1870,1869,0.0001\nCC-MAIN-2018-34,application/x-tex-tfm,6,6,0.0000\nCC-MAIN-2018-34,application/x-tika-msoffice,41537,41519,0.0015\nCC-MAIN-2018-34,application/x-tika-ooxml,34210,34194,0.0013\nCC-MAIN-2018-34,application/x-wais-source,3144,3142,0.0001\nCC-MAIN-2018-34,application/x-xz,14294,14277,0.0005\nCC-MAIN-2018-34,application/xhtml+xml,668576811,662681869,24.8882\nCC-MAIN-2018-34,application/xml,1680786,1672422,0.0626\nCC-MAIN-2018-34,application/zip,959410,957544,0.0357\nCC-MAIN-2018-34,application/zlib,16529,16258,0.0006\nCC-MAIN-2018-34,audio/mp4,17889,17786,0.0007\nCC-MAIN-2018-34,audio/mpeg,2394822,2386291,0.0891\nCC-MAIN-2018-34,audio/vnd.wave,84919,84855,0.0032\nCC-MAIN-2018-34,audio/x-mpegurl,26122,26086,0.0010\nCC-MAIN-2018-34,image/gif,1109362,1106892,0.0413\nCC-MAIN-2018-34,image/jpeg,86705179,84914592,3.2277\nCC-MAIN-2018-34,image/png,6074452,6057995,0.2261\nCC-MAIN-2018-34,image/svg+xml,79043,78772,0.0029\nCC-MAIN-2018-34,image/tiff,39432,39388,0.0015\nCC-MAIN-2018-34,image/vnd.djvu,8832,8829,0.0003\nCC-MAIN-2018-34,image/vnd.dxf; 
format=ascii,2432,2432,0.0001\nCC-MAIN-2018-34,image/webp,12794,12793,0.0005\nCC-MAIN-2018-34,message/rfc822,27163,27140,0.0010\nCC-MAIN-2018-34,text/calendar,430270,429664,0.0160\nCC-MAIN-2018-34,text/css,20938,20925,0.0008\nCC-MAIN-2018-34,text/csv,35003,34938,0.0013\nCC-MAIN-2018-34,text/html,1892697389,1866045997,70.4568\nCC-MAIN-2018-34,text/markdown,1,1,0.0000\nCC-MAIN-2018-34,text/plain,409782,409043,0.0153\nCC-MAIN-2018-34,text/prs.lines.tag,1096,1095,0.0000\nCC-MAIN-2018-34,text/tab-separated-values,1806,1806,0.0001\nCC-MAIN-2018-34,text/troff,787,787,0.0000\nCC-MAIN-2018-34,text/turtle,2350,2340,0.0001\nCC-MAIN-2018-34,text/vtt,2847,2847,0.0001\nCC-MAIN-2018-34,text/x-c++src,985,982,0.0000\nCC-MAIN-2018-34,text/x-chdr,2948,2948,0.0001\nCC-MAIN-2018-34,text/x-csrc,5952,5947,0.0002\nCC-MAIN-2018-34,text/x-diff,6044,6041,0.0002\nCC-MAIN-2018-34,text/x-jsp,5666,5634,0.0002\nCC-MAIN-2018-34,text/x-log,7143,7142,0.0003\nCC-MAIN-2018-34,text/x-matlab,11440,11435,0.0004\nCC-MAIN-2018-34,text/x-perl,21686,21633,0.0008\nCC-MAIN-2018-34,text/x-php,114058,112811,0.0042\nCC-MAIN-2018-34,text/x-python,1976,1976,0.0001\nCC-MAIN-2018-34,text/x-vcalendar,14415,14413,0.0005\nCC-MAIN-2018-34,text/x-vcard,33330,33178,0.0012\nCC-MAIN-2018-34,text/x-web-markdown,2687,2630,0.0001\nCC-MAIN-2018-34,text/x-yaml,138,138,0.0000\nCC-MAIN-2018-34,video/mp4,592456,591924,0.0221\nCC-MAIN-2018-34,video/quicktime,65031,64968,0.0024\nCC-MAIN-2018-34,video/webm,26487,26432,0.0010\nCC-MAIN-2018-34,video/x-m4v,38405,38338,0.0014\nCC-MAIN-2018-39,<other>,315992,315454,0.0111\nCC-MAIN-2018-39,application/atom+xml,2868631,2866761,0.1010\nCC-MAIN-2018-39,application/epub+zip,21343,21193,0.0008\nCC-MAIN-2018-39,application/gpx+xml,1560,1560,0.0001\nCC-MAIN-2018-39,application/gzip,151927,151429,0.0053\nCC-MAIN-2018-39,application/javascript,25529,25416,0.0009\nCC-MAIN-2018-39,application/json,237185,236941,0.0083\nCC-MAIN-2018-39,application/marc,699,699,0.0000\nCC-MAIN-2018-39,application/mbox,506
0,5039,0.0002\nCC-MAIN-2018-39,application/msword,52085,51977,0.0018\nCC-MAIN-2018-39,application/octet-stream,326959,325619,0.0115\nCC-MAIN-2018-39,application/pdf,4127568,4111170,0.1453\nCC-MAIN-2018-39,application/pgp-signature,13283,13281,0.0005\nCC-MAIN-2018-39,application/pkcs7-signature,1918,1918,0.0001\nCC-MAIN-2018-39,application/postscript,8540,8523,0.0003\nCC-MAIN-2018-39,application/rdf+xml,229771,229375,0.0081\nCC-MAIN-2018-39,application/rss+xml,3495103,3484236,0.1230\nCC-MAIN-2018-39,application/rtf,22492,22480,0.0008\nCC-MAIN-2018-39,application/text,8570,8567,0.0003\nCC-MAIN-2018-39,application/vnd.android.package-archive,16298,16120,0.0006\nCC-MAIN-2018-39,application/vnd.google-earth.kml+xml,49216,49192,0.0017\nCC-MAIN-2018-39,application/vnd.google-earth.kmz,6185,6183,0.0002\nCC-MAIN-2018-39,application/vnd.ms-excel,22067,21994,0.0008\nCC-MAIN-2018-39,application/vnd.ms-powerpoint,5799,5778,0.0002\nCC-MAIN-2018-39,application/vnd.oasis.opendocument.spreadsheet,1486,1484,0.0001\nCC-MAIN-2018-39,application/vnd.oasis.opendocument.text,8314,8307,0.0003\nCC-MAIN-2018-39,application/vnd.openxmlformats-officedocument.presentationml.presentation,6835,6823,0.0002\nCC-MAIN-2018-39,application/vnd.openxmlformats-officedocument.spreadsheetml.sheet,16289,16220,0.0006\nCC-MAIN-2018-39,application/vnd.openxmlformats-officedocument.wordprocessingml.document,53579,53478,0.0019\nCC-MAIN-2018-39,application/x-bibtex-text-file,26738,26717,0.0009\nCC-MAIN-2018-39,application/x-bittorrent,16946,16754,0.0006\nCC-MAIN-2018-39,application/x-bzip2,4788,4781,0.0002\nCC-MAIN-2018-39,application/x-dosexec,13038,12530,0.0005\nCC-MAIN-2018-39,application/x-endnote-refer,15777,15764,0.0006\nCC-MAIN-2018-39,application/x-hdf,106,106,0.0000\nCC-MAIN-2018-39,application/x-mobipocket-ebook,5545,5541,0.0002\nCC-MAIN-2018-39,application/x-ms-asx,7958,7941,0.0003\nCC-MAIN-2018-39,application/x-msdownload,4416,4377,0.0002\nCC-MAIN-2018-39,application/x-rar-compressed,24371,24328,0.000
9\nCC-MAIN-2018-39,application/x-research-info-systems,21927,21925,0.0008\nCC-MAIN-2018-39,application/x-sh,5816,5792,0.0002\nCC-MAIN-2018-39,application/x-shockwave-flash,42775,42584,0.0015\nCC-MAIN-2018-39,application/x-stata-do,2388,2370,0.0001\nCC-MAIN-2018-39,application/x-tex,1366,1363,0.0000\nCC-MAIN-2018-39,application/x-tex-tfm,3,3,0.0000\nCC-MAIN-2018-39,application/x-tika-msoffice,50420,50409,0.0018\nCC-MAIN-2018-39,application/x-tika-ooxml,34963,34941,0.0012\nCC-MAIN-2018-39,application/x-wais-source,4133,4131,0.0001\nCC-MAIN-2018-39,application/x-xz,12591,12589,0.0004\nCC-MAIN-2018-39,application/xhtml+xml,749386478,743688980,26.3758\nCC-MAIN-2018-39,application/xml,1352418,1344490,0.0476\nCC-MAIN-2018-39,application/zip,80880,80503,0.0028\nCC-MAIN-2018-39,application/zlib,10353,10145,0.0004\nCC-MAIN-2018-39,audio/mp4,18432,18322,0.0006\nCC-MAIN-2018-39,audio/mpeg,128207,127318,0.0045\nCC-MAIN-2018-39,audio/vnd.wave,13272,13270,0.0005\nCC-MAIN-2018-39,audio/x-mpegurl,28230,28201,0.0010\nCC-MAIN-2018-39,image/gif,166113,160109,0.0058\nCC-MAIN-2018-39,image/jpeg,6206786,6187410,0.2185\nCC-MAIN-2018-39,image/png,584761,573865,0.0206\nCC-MAIN-2018-39,image/svg+xml,49625,49590,0.0017\nCC-MAIN-2018-39,image/tiff,5684,5677,0.0002\nCC-MAIN-2018-39,image/vnd.djvu,12096,11641,0.0004\nCC-MAIN-2018-39,image/vnd.dxf; 
format=ascii,3271,3271,0.0001\nCC-MAIN-2018-39,image/webp,8663,8660,0.0003\nCC-MAIN-2018-39,message/rfc822,23306,23270,0.0008\nCC-MAIN-2018-39,text/asp,1,1,0.0000\nCC-MAIN-2018-39,text/calendar,470624,470204,0.0166\nCC-MAIN-2018-39,text/css,7822,7813,0.0003\nCC-MAIN-2018-39,text/csv,12320,12300,0.0004\nCC-MAIN-2018-39,text/html,2069467396,2043284749,72.8379\nCC-MAIN-2018-39,text/markdown,9,9,0.0000\nCC-MAIN-2018-39,text/plain,436110,434865,0.0153\nCC-MAIN-2018-39,text/prs.lines.tag,2020,2020,0.0001\nCC-MAIN-2018-39,text/tab-separated-values,4016,4016,0.0001\nCC-MAIN-2018-39,text/troff,643,643,0.0000\nCC-MAIN-2018-39,text/turtle,2105,2075,0.0001\nCC-MAIN-2018-39,text/vtt,2507,2507,0.0001\nCC-MAIN-2018-39,text/x-c++src,1247,1247,0.0000\nCC-MAIN-2018-39,text/x-chdr,2055,2053,0.0001\nCC-MAIN-2018-39,text/x-csrc,5403,5403,0.0002\nCC-MAIN-2018-39,text/x-diff,5672,5671,0.0002\nCC-MAIN-2018-39,text/x-jsp,8088,8049,0.0003\nCC-MAIN-2018-39,text/x-log,9358,9357,0.0003\nCC-MAIN-2018-39,text/x-matlab,12221,12200,0.0004\nCC-MAIN-2018-39,text/x-perl,23078,23047,0.0008\nCC-MAIN-2018-39,text/x-php,98902,97945,0.0035\nCC-MAIN-2018-39,text/x-python,2715,2715,0.0001\nCC-MAIN-2018-39,text/x-vcalendar,12851,12844,0.0005\nCC-MAIN-2018-39,text/x-vcard,37270,37201,0.0013\nCC-MAIN-2018-39,text/x-web-markdown,2650,2623,0.0001\nCC-MAIN-2018-39,text/x-yaml,309,309,0.0000\nCC-MAIN-2018-39,video/mp4,44408,43866,0.0016\nCC-MAIN-2018-39,video/quicktime,6317,6314,0.0002\nCC-MAIN-2018-39,video/webm,31140,31050,0.0011\nCC-MAIN-2018-39,video/x-m4v,10649,10628,0.0004\nCC-MAIN-2018-43,<other>,507213,506121,0.0167\nCC-MAIN-2018-43,application/atom+xml,2781632,2778433,0.0914\nCC-MAIN-2018-43,application/epub+zip,26039,25746,0.0009\nCC-MAIN-2018-43,application/gpx+xml,3657,3656,0.0001\nCC-MAIN-2018-43,application/gzip,184827,184309,0.0061\nCC-MAIN-2018-43,application/javascript,23558,23477,0.0008\nCC-MAIN-2018-43,application/json,301555,287487,0.0099\nCC-MAIN-2018-43,application/marc,907,907,0.0000\nCC-MAIN
-2018-43,application/mbox,7476,7430,0.0002\nCC-MAIN-2018-43,application/msword,130228,129821,0.0043\nCC-MAIN-2018-43,application/octet-stream,511617,509949,0.0168\nCC-MAIN-2018-43,application/pdf,24962489,24903677,0.8207\nCC-MAIN-2018-43,application/pgp-signature,47204,47188,0.0016\nCC-MAIN-2018-43,application/pkcs7-signature,2468,2467,0.0001\nCC-MAIN-2018-43,application/postscript,18391,18364,0.0006\nCC-MAIN-2018-43,application/rdf+xml,322379,321502,0.0106\nCC-MAIN-2018-43,application/rss+xml,3928131,3912468,0.1291\nCC-MAIN-2018-43,application/rtf,34012,33970,0.0011\nCC-MAIN-2018-43,application/text,7183,7182,0.0002\nCC-MAIN-2018-43,application/vnd.android.package-archive,33588,33113,0.0011\nCC-MAIN-2018-43,application/vnd.google-earth.kml+xml,38270,38211,0.0013\nCC-MAIN-2018-43,application/vnd.google-earth.kmz,10222,10210,0.0003\nCC-MAIN-2018-43,application/vnd.ms-excel,47683,47519,0.0016\nCC-MAIN-2018-43,application/vnd.ms-powerpoint,13357,13334,0.0004\nCC-MAIN-2018-43,application/vnd.oasis.opendocument.spreadsheet,3432,3430,0.0001\nCC-MAIN-2018-43,application/vnd.oasis.opendocument.text,14796,14768,0.0005\nCC-MAIN-2018-43,application/vnd.openxmlformats-officedocument.presentationml.presentation,17051,17028,0.0006\nCC-MAIN-2018-43,application/vnd.openxmlformats-officedocument.spreadsheetml.sheet,41442,41256,0.0014\nCC-MAIN-2018-43,application/vnd.openxmlformats-officedocument.wordprocessingml.document,130217,130052,0.0043\nCC-MAIN-2018-43,application/x-bibtex-text-file,29076,29009,0.0010\nCC-MAIN-2018-43,application/x-bittorrent,19705,19354,0.0006\nCC-MAIN-2018-43,application/x-bzip2,15547,15533,0.0005\nCC-MAIN-2018-43,application/x-dosexec,29091,27368,0.0010\nCC-MAIN-2018-43,application/x-endnote-refer,15524,15510,0.0005\nCC-MAIN-2018-43,application/x-hdf,2105,2105,0.0001\nCC-MAIN-2018-43,application/x-mobipocket-ebook,8729,8691,0.0003\nCC-MAIN-2018-43,application/x-ms-asx,12414,12406,0.0004\nCC-MAIN-2018-43,application/x-msdownload,8475,8420,0.0003\nCC-MAIN-201
8-43,application/x-rar-compressed,60263,60159,0.0020\nCC-MAIN-2018-43,application/x-research-info-systems,25714,25707,0.0008\nCC-MAIN-2018-43,application/x-sh,10177,10146,0.0003\nCC-MAIN-2018-43,application/x-shockwave-flash,48816,48563,0.0016\nCC-MAIN-2018-43,application/x-stata-do,4577,4557,0.0002\nCC-MAIN-2018-43,application/x-tex,2836,2835,0.0001\nCC-MAIN-2018-43,application/x-tex-tfm,123,123,0.0000\nCC-MAIN-2018-43,application/x-tika-msoffice,53698,53642,0.0018\nCC-MAIN-2018-43,application/x-tika-ooxml,38080,38020,0.0013\nCC-MAIN-2018-43,application/x-wais-source,10700,10700,0.0004\nCC-MAIN-2018-43,application/x-xz,50398,50358,0.0017\nCC-MAIN-2018-43,application/xhtml+xml,792340037,786350691,26.0485\nCC-MAIN-2018-43,application/xml,1890058,1883662,0.0621\nCC-MAIN-2018-43,application/zip,175659,174910,0.0058\nCC-MAIN-2018-43,application/zlib,11594,11344,0.0004\nCC-MAIN-2018-43,application/zstd,49,49,0.0000\nCC-MAIN-2018-43,audio/mp4,31985,31785,0.0011\nCC-MAIN-2018-43,audio/mpeg,175502,174019,0.0058\nCC-MAIN-2018-43,audio/vnd.wave,22684,22679,0.0007\nCC-MAIN-2018-43,audio/x-mpegurl,37189,37134,0.0012\nCC-MAIN-2018-43,image/gif,156112,154354,0.0051\nCC-MAIN-2018-43,image/jpeg,7388078,7375771,0.2429\nCC-MAIN-2018-43,image/png,638656,635357,0.0210\nCC-MAIN-2018-43,image/svg+xml,89021,88951,0.0029\nCC-MAIN-2018-43,image/tiff,14644,14638,0.0005\nCC-MAIN-2018-43,image/vnd.djvu,19972,19956,0.0007\nCC-MAIN-2018-43,image/vnd.dxf; 
format=ascii,5408,5408,0.0002\nCC-MAIN-2018-43,image/webp,25019,25018,0.0008\nCC-MAIN-2018-43,message/rfc822,33477,33423,0.0011\nCC-MAIN-2018-43,text/asp,1,1,0.0000\nCC-MAIN-2018-43,text/calendar,550773,550427,0.0181\nCC-MAIN-2018-43,text/css,8704,8693,0.0003\nCC-MAIN-2018-43,text/csv,18874,18863,0.0006\nCC-MAIN-2018-43,text/html,2202471755,2176057779,72.4072\nCC-MAIN-2018-43,text/markdown,16,16,0.0000\nCC-MAIN-2018-43,text/plain,619174,618087,0.0204\nCC-MAIN-2018-43,text/prs.lines.tag,2390,2388,0.0001\nCC-MAIN-2018-43,text/tab-separated-values,2732,2732,0.0001\nCC-MAIN-2018-43,text/troff,2341,2340,0.0001\nCC-MAIN-2018-43,text/turtle,2250,2233,0.0001\nCC-MAIN-2018-43,text/vtt,2514,2514,0.0001\nCC-MAIN-2018-43,text/x-c++src,1724,1724,0.0001\nCC-MAIN-2018-43,text/x-chdr,3633,3626,0.0001\nCC-MAIN-2018-43,text/x-csrc,8655,8651,0.0003\nCC-MAIN-2018-43,text/x-diff,10072,10064,0.0003\nCC-MAIN-2018-43,text/x-jsp,9329,9286,0.0003\nCC-MAIN-2018-43,text/x-log,19112,19109,0.0006\nCC-MAIN-2018-43,text/x-matlab,14075,14057,0.0005\nCC-MAIN-2018-43,text/x-perl,30781,30569,0.0010\nCC-MAIN-2018-43,text/x-php,135440,133988,0.0045\nCC-MAIN-2018-43,text/x-python,3709,3709,0.0001\nCC-MAIN-2018-43,text/x-vcalendar,13442,13439,0.0004\nCC-MAIN-2018-43,text/x-vcard,38195,38010,0.0013\nCC-MAIN-2018-43,text/x-web-markdown,2590,2580,0.0001\nCC-MAIN-2018-43,text/x-yaml,1121,1121,0.0000\nCC-MAIN-2018-43,video/mp4,57551,57399,0.0019\nCC-MAIN-2018-43,video/quicktime,12907,12904,0.0004\nCC-MAIN-2018-43,video/webm,64231,64133,0.0021\nCC-MAIN-2018-43,video/x-m4v,24216,24186,0.0008\nCC-MAIN-2018-47,<other>,531289,528170,0.0201\nCC-MAIN-2018-47,application/atom+xml,2776464,2771696,0.1049\nCC-MAIN-2018-47,application/epub+zip,27782,27646,0.0010\nCC-MAIN-2018-47,application/gpx+xml,4827,4825,0.0002\nCC-MAIN-2018-47,application/gzip,139496,138218,0.0053\nCC-MAIN-2018-47,application/javascript,24353,24245,0.0009\nCC-MAIN-2018-47,application/json,246433,246234,0.0093\nCC-MAIN-2018-47,application/marc,726,720
,0.0000\nCC-MAIN-2018-47,application/mbox,17969,17955,0.0007\nCC-MAIN-2018-47,application/msword,283097,282711,0.0107\nCC-MAIN-2018-47,application/octet-stream,787906,785464,0.0298\nCC-MAIN-2018-47,application/pdf,25703997,25634027,0.9712\nCC-MAIN-2018-47,application/pgp-signature,188164,188143,0.0071\nCC-MAIN-2018-47,application/pkcs7-signature,17712,17710,0.0007\nCC-MAIN-2018-47,application/postscript,26531,26495,0.0010\nCC-MAIN-2018-47,application/rdf+xml,310224,309475,0.0117\nCC-MAIN-2018-47,application/rss+xml,3381933,3367131,0.1278\nCC-MAIN-2018-47,application/rtf,22597,22461,0.0009\nCC-MAIN-2018-47,application/text,7704,7703,0.0003\nCC-MAIN-2018-47,application/vnd.android.package-archive,42588,42254,0.0016\nCC-MAIN-2018-47,application/vnd.google-earth.kml+xml,56674,56646,0.0021\nCC-MAIN-2018-47,application/vnd.google-earth.kmz,13357,13224,0.0005\nCC-MAIN-2018-47,application/vnd.ms-excel,88012,87785,0.0033\nCC-MAIN-2018-47,application/vnd.ms-powerpoint,29412,29399,0.0011\nCC-MAIN-2018-47,application/vnd.oasis.opendocument.spreadsheet,3040,3033,0.0001\nCC-MAIN-2018-47,application/vnd.oasis.opendocument.text,13447,13430,0.0005\nCC-MAIN-2018-47,application/vnd.openxmlformats-officedocument.presentationml.presentation,8546,8504,0.0003\nCC-MAIN-2018-47,application/vnd.openxmlformats-officedocument.spreadsheetml.sheet,26887,26598,0.0010\nCC-MAIN-2018-47,application/vnd.openxmlformats-officedocument.wordprocessingml.document,62340,62123,0.0024\nCC-MAIN-2018-47,application/x-bibtex-text-file,36328,36185,0.0014\nCC-MAIN-2018-47,application/x-bittorrent,15998,15667,0.0006\nCC-MAIN-2018-47,application/x-bzip2,7160,7047,0.0003\nCC-MAIN-2018-47,application/x-dosexec,15609,14992,0.0006\nCC-MAIN-2018-47,application/x-endnote-refer,15783,15778,0.0006\nCC-MAIN-2018-47,application/x-hdf,956,956,0.0000\nCC-MAIN-2018-47,application/x-mobipocket-ebook,10108,10096,0.0004\nCC-MAIN-2018-47,application/x-ms-asx,25216,25047,0.0010\nCC-MAIN-2018-47,application/x-msdownload,8005,7901,0.0
003\nCC-MAIN-2018-47,application/x-rar-compressed,27828,27772,0.0011\nCC-MAIN-2018-47,application/x-research-info-systems,27117,27113,0.0010\nCC-MAIN-2018-47,application/x-sh,13812,13774,0.0005\nCC-MAIN-2018-47,application/x-shockwave-flash,56536,56260,0.0021\nCC-MAIN-2018-47,application/x-stata-do,4298,4273,0.0002\nCC-MAIN-2018-47,application/x-tex,3271,3270,0.0001\nCC-MAIN-2018-47,application/x-tex-tfm,13,13,0.0000\nCC-MAIN-2018-47,application/x-tika-msoffice,52708,52676,0.0020\nCC-MAIN-2018-47,application/x-tika-ooxml,37260,37196,0.0014\nCC-MAIN-2018-47,application/x-wais-source,66203,66203,0.0025\nCC-MAIN-2018-47,application/x-xz,192773,192753,0.0073\nCC-MAIN-2018-47,application/xhtml+xml,648394353,642698444,24.4994\nCC-MAIN-2018-47,application/xml,1404796,1394738,0.0531\nCC-MAIN-2018-47,application/zip,335028,333968,0.0127\nCC-MAIN-2018-47,application/zlib,15069,14709,0.0006\nCC-MAIN-2018-47,application/zstd,2,2,0.0000\nCC-MAIN-2018-47,audio/mp4,37340,37203,0.0014\nCC-MAIN-2018-47,audio/mpeg,197814,195616,0.0075\nCC-MAIN-2018-47,audio/vnd.wave,12775,12773,0.0005\nCC-MAIN-2018-47,audio/x-mpegurl,51127,51066,0.0019\nCC-MAIN-2018-47,image/gif,172549,170948,0.0065\nCC-MAIN-2018-47,image/jpeg,8235925,8222865,0.3112\nCC-MAIN-2018-47,image/png,852586,848922,0.0322\nCC-MAIN-2018-47,image/svg+xml,64495,63875,0.0024\nCC-MAIN-2018-47,image/tiff,15827,15815,0.0006\nCC-MAIN-2018-47,image/vnd.djvu,23297,23287,0.0009\nCC-MAIN-2018-47,image/vnd.dxf; 
format=ascii,8253,8253,0.0003\nCC-MAIN-2018-47,image/webp,12480,12479,0.0005\nCC-MAIN-2018-47,message/rfc822,38126,38071,0.0014\nCC-MAIN-2018-47,text/asp,8,8,0.0000\nCC-MAIN-2018-47,text/calendar,372544,372343,0.0141\nCC-MAIN-2018-47,text/css,10350,10344,0.0004\nCC-MAIN-2018-47,text/csv,14079,13876,0.0005\nCC-MAIN-2018-47,text/html,1949326389,1922368668,73.6549\nCC-MAIN-2018-47,text/markdown,5,5,0.0000\nCC-MAIN-2018-47,text/plain,949615,947413,0.0359\nCC-MAIN-2018-47,text/prs.lines.tag,3823,3819,0.0001\nCC-MAIN-2018-47,text/tab-separated-values,2587,2586,0.0001\nCC-MAIN-2018-47,text/troff,2120,2120,0.0001\nCC-MAIN-2018-47,text/turtle,3510,3496,0.0001\nCC-MAIN-2018-47,text/vtt,2267,2267,0.0001\nCC-MAIN-2018-47,text/x-c++src,3464,3464,0.0001\nCC-MAIN-2018-47,text/x-chdr,3976,3975,0.0002\nCC-MAIN-2018-47,text/x-csrc,9747,9738,0.0004\nCC-MAIN-2018-47,text/x-diff,9813,9801,0.0004\nCC-MAIN-2018-47,text/x-jsp,13353,13267,0.0005\nCC-MAIN-2018-47,text/x-log,38815,38815,0.0015\nCC-MAIN-2018-47,text/x-matlab,19223,19213,0.0007\nCC-MAIN-2018-47,text/x-perl,48941,48856,0.0018\nCC-MAIN-2018-47,text/x-php,149642,148143,0.0057\nCC-MAIN-2018-47,text/x-python,4094,4092,0.0002\nCC-MAIN-2018-47,text/x-vcalendar,11089,11089,0.0004\nCC-MAIN-2018-47,text/x-vcard,41293,41151,0.0016\nCC-MAIN-2018-47,text/x-web-markdown,3922,3901,0.0001\nCC-MAIN-2018-47,text/x-yaml,1317,1317,0.0000\nCC-MAIN-2018-47,video/mp4,75805,75646,0.0029\nCC-MAIN-2018-47,video/quicktime,7915,7907,0.0003\nCC-MAIN-2018-47,video/webm,79104,79013,0.0030\nCC-MAIN-2018-47,video/x-m4v,27403,27366,0.0010\nCC-MAIN-2018-51,<other>,515138,513207,0.0163\nCC-MAIN-2018-51,application/atom+xml,2860889,2857546,0.0904\nCC-MAIN-2018-51,application/epub+zip,37486,37329,0.0012\nCC-MAIN-2018-51,application/gpx+xml,6528,6524,0.0002\nCC-MAIN-2018-51,application/gzip,160165,159128,0.0051\nCC-MAIN-2018-51,application/javascript,22267,22144,0.0007\nCC-MAIN-2018-51,application/json,301295,300972,0.0095\nCC-MAIN-2018-51,application/marc,685,684,0
.0000\nCC-MAIN-2018-51,application/mbox,16086,16072,0.0005\nCC-MAIN-2018-51,application/msword,121216,120842,0.0038\nCC-MAIN-2018-51,application/octet-stream,660152,657525,0.0209\nCC-MAIN-2018-51,application/pdf,36718832,36534433,1.1604\nCC-MAIN-2018-51,application/pgp-signature,44443,44365,0.0014\nCC-MAIN-2018-51,application/pkcs7-signature,9248,9246,0.0003\nCC-MAIN-2018-51,application/postscript,23601,23579,0.0007\nCC-MAIN-2018-51,application/rdf+xml,313126,312656,0.0099\nCC-MAIN-2018-51,application/rss+xml,4506576,4486116,0.1424\nCC-MAIN-2018-51,application/rtf,29616,29295,0.0009\nCC-MAIN-2018-51,application/text,8212,8194,0.0003\nCC-MAIN-2018-51,application/vnd.android.package-archive,38530,37483,0.0012\nCC-MAIN-2018-51,application/vnd.google-earth.kml+xml,57637,57331,0.0018\nCC-MAIN-2018-51,application/vnd.google-earth.kmz,12409,12317,0.0004\nCC-MAIN-2018-51,application/vnd.ms-excel,43623,43383,0.0014\nCC-MAIN-2018-51,application/vnd.ms-powerpoint,14160,14125,0.0004\nCC-MAIN-2018-51,application/vnd.oasis.opendocument.spreadsheet,4126,4121,0.0001\nCC-MAIN-2018-51,application/vnd.oasis.opendocument.text,20007,19975,0.0006\nCC-MAIN-2018-51,application/vnd.openxmlformats-officedocument.presentationml.presentation,9380,9355,0.0003\nCC-MAIN-2018-51,application/vnd.openxmlformats-officedocument.spreadsheetml.sheet,27057,26963,0.0009\nCC-MAIN-2018-51,application/vnd.openxmlformats-officedocument.wordprocessingml.document,75867,75553,0.0024\nCC-MAIN-2018-51,application/x-bibtex-text-file,44073,43744,0.0014\nCC-MAIN-2018-51,application/x-bittorrent,14174,13668,0.0004\nCC-MAIN-2018-51,application/x-bzip2,10478,10303,0.0003\nCC-MAIN-2018-51,application/x-dosexec,15989,15537,0.0005\nCC-MAIN-2018-51,application/x-endnote-refer,12924,12916,0.0004\nCC-MAIN-2018-51,application/x-hdf,583,583,0.0000\nCC-MAIN-2018-51,application/x-mobipocket-ebook,13319,13303,0.0004\nCC-MAIN-2018-51,application/x-ms-asx,17183,17086,0.0005\nCC-MAIN-2018-51,application/x-msdownload,8829,8750,0.0003\
nCC-MAIN-2018-51,application/x-rar-compressed,25076,24964,0.0008\nCC-MAIN-2018-51,application/x-research-info-systems,26003,25996,0.0008\nCC-MAIN-2018-51,application/x-sh,17261,17202,0.0005\nCC-MAIN-2018-51,application/x-shockwave-flash,48589,48384,0.0015\nCC-MAIN-2018-51,application/x-stata-do,6542,6537,0.0002\nCC-MAIN-2018-51,application/x-tex,3813,3802,0.0001\nCC-MAIN-2018-51,application/x-tex-tfm,15,15,0.0000\nCC-MAIN-2018-51,application/x-tika-msoffice,63837,63736,0.0020\nCC-MAIN-2018-51,application/x-tika-ooxml,45780,45725,0.0014\nCC-MAIN-2018-51,application/x-wais-source,22375,22375,0.0007\nCC-MAIN-2018-51,application/x-xz,64606,64467,0.0020\nCC-MAIN-2018-51,application/xhtml+xml,772291130,765993479,24.4068\nCC-MAIN-2018-51,application/xml,1665995,1653652,0.0527\nCC-MAIN-2018-51,application/zip,214240,212553,0.0068\nCC-MAIN-2018-51,application/zlib,14460,14118,0.0005\nCC-MAIN-2018-51,application/zstd,70,70,0.0000\nCC-MAIN-2018-51,audio/mp4,63904,63740,0.0020\nCC-MAIN-2018-51,audio/mpeg,206440,203397,0.0065\nCC-MAIN-2018-51,audio/vnd.wave,18027,17991,0.0006\nCC-MAIN-2018-51,audio/x-mpegurl,45954,45888,0.0015\nCC-MAIN-2018-51,image/gif,139267,137908,0.0044\nCC-MAIN-2018-51,image/jpeg,8854459,8838096,0.2798\nCC-MAIN-2018-51,image/png,744626,741610,0.0235\nCC-MAIN-2018-51,image/svg+xml,45123,45052,0.0014\nCC-MAIN-2018-51,image/tiff,12339,12322,0.0004\nCC-MAIN-2018-51,image/vnd.djvu,20240,20160,0.0006\nCC-MAIN-2018-51,image/vnd.dxf; 
format=ascii,6823,6806,0.0002\nCC-MAIN-2018-51,image/webp,15969,15967,0.0005\nCC-MAIN-2018-51,message/rfc822,26562,26507,0.0008\nCC-MAIN-2018-51,text/asp,1,1,0.0000\nCC-MAIN-2018-51,text/calendar,678110,677304,0.0214\nCC-MAIN-2018-51,text/css,7837,7830,0.0002\nCC-MAIN-2018-51,text/csv,16867,16777,0.0005\nCC-MAIN-2018-51,text/html,2330627822,2299878881,73.6550\nCC-MAIN-2018-51,text/markdown,59,59,0.0000\nCC-MAIN-2018-51,text/plain,794234,791893,0.0251\nCC-MAIN-2018-51,text/prs.lines.tag,2271,2269,0.0001\nCC-MAIN-2018-51,text/tab-separated-values,3586,3586,0.0001\nCC-MAIN-2018-51,text/troff,2173,2172,0.0001\nCC-MAIN-2018-51,text/turtle,3034,3009,0.0001\nCC-MAIN-2018-51,text/vtt,2457,2457,0.0001\nCC-MAIN-2018-51,text/x-c++src,1970,1957,0.0001\nCC-MAIN-2018-51,text/x-chdr,3395,3392,0.0001\nCC-MAIN-2018-51,text/x-csrc,10622,10574,0.0003\nCC-MAIN-2018-51,text/x-diff,11174,11161,0.0004\nCC-MAIN-2018-51,text/x-jsp,9957,9888,0.0003\nCC-MAIN-2018-51,text/x-log,41764,41764,0.0013\nCC-MAIN-2018-51,text/x-matlab,16023,16004,0.0005\nCC-MAIN-2018-51,text/x-perl,30458,30397,0.0010\nCC-MAIN-2018-51,text/x-php,134902,133462,0.0043\nCC-MAIN-2018-51,text/x-python,5948,5936,0.0002\nCC-MAIN-2018-51,text/x-vcalendar,17622,17613,0.0006\nCC-MAIN-2018-51,text/x-vcard,100579,100205,0.0032\nCC-MAIN-2018-51,text/x-web-markdown,4032,4020,0.0001\nCC-MAIN-2018-51,text/x-yaml,1471,1470,0.0000\nCC-MAIN-2018-51,video/mp4,57651,57532,0.0018\nCC-MAIN-2018-51,video/quicktime,11018,11007,0.0003\nCC-MAIN-2018-51,video/webm,109622,109300,0.0035\nCC-MAIN-2018-51,video/x-m4v,35542,35439,0.0011\nCC-MAIN-2019-04,<other>,345975,345135,0.0120\nCC-MAIN-2019-04,application/atom+xml,2996123,2993393,0.1037\nCC-MAIN-2019-04,application/epub+zip,35067,34913,0.0012\nCC-MAIN-2019-04,application/gpx+xml,5663,5645,0.0002\nCC-MAIN-2019-04,application/gzip,208974,208652,0.0072\nCC-MAIN-2019-04,application/javascript,22030,21962,0.0008\nCC-MAIN-2019-04,application/json,225008,224579,0.0078\nCC-MAIN-2019-04,application/marc,6
27,627,0.0000\nCC-MAIN-2019-04,application/mbox,11079,11074,0.0004\nCC-MAIN-2019-04,application/msword,143040,142595,0.0049\nCC-MAIN-2019-04,application/octet-stream,286960,286238,0.0099\nCC-MAIN-2019-04,application/pdf,27082692,26994427,0.9372\nCC-MAIN-2019-04,application/pgp-signature,124710,124710,0.0043\nCC-MAIN-2019-04,application/pkcs7-signature,9034,9033,0.0003\nCC-MAIN-2019-04,application/postscript,12945,12869,0.0004\nCC-MAIN-2019-04,application/rdf+xml,204113,203863,0.0071\nCC-MAIN-2019-04,application/rss+xml,3781070,3766057,0.1308\nCC-MAIN-2019-04,application/rtf,35643,35605,0.0012\nCC-MAIN-2019-04,application/text,1257,1257,0.0000\nCC-MAIN-2019-04,application/vnd.android.package-archive,34723,34479,0.0012\nCC-MAIN-2019-04,application/vnd.google-earth.kml+xml,38407,38341,0.0013\nCC-MAIN-2019-04,application/vnd.google-earth.kmz,10660,10625,0.0004\nCC-MAIN-2019-04,application/vnd.ms-excel,45636,45446,0.0016\nCC-MAIN-2019-04,application/vnd.ms-powerpoint,20449,20289,0.0007\nCC-MAIN-2019-04,application/vnd.oasis.opendocument.spreadsheet,3566,3555,0.0001\nCC-MAIN-2019-04,application/vnd.oasis.opendocument.text,16700,16683,0.0006\nCC-MAIN-2019-04,application/vnd.openxmlformats-officedocument.presentationml.presentation,15441,15409,0.0005\nCC-MAIN-2019-04,application/vnd.openxmlformats-officedocument.spreadsheetml.sheet,38366,38234,0.0013\nCC-MAIN-2019-04,application/vnd.openxmlformats-officedocument.wordprocessingml.document,98976,98553,0.0034\nCC-MAIN-2019-04,application/x-bibtex-text-file,44442,44409,0.0015\nCC-MAIN-2019-04,application/x-bittorrent,13654,13151,0.0005\nCC-MAIN-2019-04,application/x-bzip2,9696,9664,0.0003\nCC-MAIN-2019-04,application/x-dosexec,25136,24760,0.0009\nCC-MAIN-2019-04,application/x-endnote-refer,12160,12120,0.0004\nCC-MAIN-2019-04,application/x-hdf,1055,1055,0.0000\nCC-MAIN-2019-04,application/x-mobipocket-ebook,14358,14323,0.0005\nCC-MAIN-2019-04,application/x-ms-asx,6959,6943,0.0002\nCC-MAIN-2019-04,application/x-msdownload,6456,64
01,0.0002\nCC-MAIN-2019-04,application/x-rar-compressed,29863,29803,0.0010\nCC-MAIN-2019-04,application/x-research-info-systems,58,58,0.0000\nCC-MAIN-2019-04,application/x-sh,9224,9086,0.0003\nCC-MAIN-2019-04,application/x-shockwave-flash,106041,105898,0.0037\nCC-MAIN-2019-04,application/x-stata-do,4157,4154,0.0001\nCC-MAIN-2019-04,application/x-tex,4415,4388,0.0002\nCC-MAIN-2019-04,application/x-tex-tfm,61,61,0.0000\nCC-MAIN-2019-04,application/x-tika-msoffice,57793,57708,0.0020\nCC-MAIN-2019-04,application/x-tika-ooxml,46376,46296,0.0016\nCC-MAIN-2019-04,application/x-wais-source,20874,20874,0.0007\nCC-MAIN-2019-04,application/x-xz,139686,139450,0.0048\nCC-MAIN-2019-04,application/xhtml+xml,699580010,694786650,24.2092\nCC-MAIN-2019-04,application/xml,1462988,1457382,0.0506\nCC-MAIN-2019-04,application/zip,244772,242784,0.0085\nCC-MAIN-2019-04,application/zlib,21672,21268,0.0007\nCC-MAIN-2019-04,application/zstd,512,512,0.0000\nCC-MAIN-2019-04,audio/mp4,50031,49824,0.0017\nCC-MAIN-2019-04,audio/mpeg,374686,369216,0.0130\nCC-MAIN-2019-04,audio/vnd.wave,22971,22968,0.0008\nCC-MAIN-2019-04,audio/x-mpegurl,5476,5469,0.0002\nCC-MAIN-2019-04,image/gif,192630,191675,0.0067\nCC-MAIN-2019-04,image/jpeg,7662110,7646750,0.2651\nCC-MAIN-2019-04,image/png,897811,894885,0.0311\nCC-MAIN-2019-04,image/svg+xml,25381,25322,0.0009\nCC-MAIN-2019-04,image/tiff,19212,19188,0.0007\nCC-MAIN-2019-04,image/vnd.djvu,14303,14268,0.0005\nCC-MAIN-2019-04,image/vnd.dxf; 
format=ascii,12746,12730,0.0004\nCC-MAIN-2019-04,image/webp,11850,11850,0.0004\nCC-MAIN-2019-04,message/rfc822,29801,29792,0.0010\nCC-MAIN-2019-04,text/asp,2,2,0.0000\nCC-MAIN-2019-04,text/calendar,771054,770423,0.0267\nCC-MAIN-2019-04,text/css,9408,9402,0.0003\nCC-MAIN-2019-04,text/csv,24146,24121,0.0008\nCC-MAIN-2019-04,text/html,2140034056,2117647674,74.0566\nCC-MAIN-2019-04,text/markdown,38,38,0.0000\nCC-MAIN-2019-04,text/plain,1232830,1229860,0.0427\nCC-MAIN-2019-04,text/prs.lines.tag,2683,2682,0.0001\nCC-MAIN-2019-04,text/tab-separated-values,3078,3078,0.0001\nCC-MAIN-2019-04,text/troff,3703,3703,0.0001\nCC-MAIN-2019-04,text/turtle,3609,3597,0.0001\nCC-MAIN-2019-04,text/vtt,5087,5087,0.0002\nCC-MAIN-2019-04,text/x-c++src,2655,2655,0.0001\nCC-MAIN-2019-04,text/x-chdr,3807,3807,0.0001\nCC-MAIN-2019-04,text/x-csrc,8655,8652,0.0003\nCC-MAIN-2019-04,text/x-diff,12467,12464,0.0004\nCC-MAIN-2019-04,text/x-jsp,4141,4062,0.0001\nCC-MAIN-2019-04,text/x-log,30372,30340,0.0011\nCC-MAIN-2019-04,text/x-matlab,15332,15327,0.0005\nCC-MAIN-2019-04,text/x-perl,29650,29593,0.0010\nCC-MAIN-2019-04,text/x-php,119431,118449,0.0041\nCC-MAIN-2019-04,text/x-python,4015,4012,0.0001\nCC-MAIN-2019-04,text/x-vcalendar,21356,21356,0.0007\nCC-MAIN-2019-04,text/x-vcard,77708,77517,0.0027\nCC-MAIN-2019-04,text/x-web-markdown,3139,3139,0.0001\nCC-MAIN-2019-04,text/x-yaml,797,797,0.0000\nCC-MAIN-2019-04,video/mp4,165702,165337,0.0057\nCC-MAIN-2019-04,video/quicktime,12894,12886,0.0004\nCC-MAIN-2019-04,video/webm,64064,63965,0.0022\nCC-MAIN-2019-04,video/x-m4v,24403,24304,0.0008\nCC-MAIN-2019-09,<other>,605445,604209,0.0208\nCC-MAIN-2019-09,application/atom+xml,3028709,3026302,0.1039\nCC-MAIN-2019-09,application/epub+zip,50257,50058,0.0017\nCC-MAIN-2019-09,application/gpx+xml,6071,6071,0.0002\nCC-MAIN-2019-09,application/gzip,267591,267138,0.0092\nCC-MAIN-2019-09,application/javascript,30791,30769,0.0011\nCC-MAIN-2019-09,application/json,379395,378919,0.0130\nCC-MAIN-2019-09,application/marc,194
5,1945,0.0001\nCC-MAIN-2019-09,application/mbox,16784,16780,0.0006\nCC-MAIN-2019-09,application/msword,223925,223399,0.0077\nCC-MAIN-2019-09,application/octet-stream,343733,342839,0.0118\nCC-MAIN-2019-09,application/pdf,31586278,31465381,1.0840\nCC-MAIN-2019-09,application/pgp-signature,58156,58133,0.0020\nCC-MAIN-2019-09,application/pkcs7-signature,9895,9893,0.0003\nCC-MAIN-2019-09,application/postscript,22493,22447,0.0008\nCC-MAIN-2019-09,application/rdf+xml,240670,240259,0.0083\nCC-MAIN-2019-09,application/rss+xml,4429955,4412929,0.1520\nCC-MAIN-2019-09,application/rtf,54134,54080,0.0019\nCC-MAIN-2019-09,application/text,3100,3100,0.0001\nCC-MAIN-2019-09,application/vnd.android.package-archive,36515,36206,0.0013\nCC-MAIN-2019-09,application/vnd.google-earth.kml+xml,67982,67935,0.0023\nCC-MAIN-2019-09,application/vnd.google-earth.kmz,14870,14860,0.0005\nCC-MAIN-2019-09,application/vnd.ms-excel,80671,80506,0.0028\nCC-MAIN-2019-09,application/vnd.ms-powerpoint,29256,29100,0.0010\nCC-MAIN-2019-09,application/vnd.oasis.opendocument.spreadsheet,5287,5278,0.0002\nCC-MAIN-2019-09,application/vnd.oasis.opendocument.text,18853,18812,0.0006\nCC-MAIN-2019-09,application/vnd.openxmlformats-officedocument.presentationml.presentation,20729,20504,0.0007\nCC-MAIN-2019-09,application/vnd.openxmlformats-officedocument.spreadsheetml.sheet,54547,54415,0.0019\nCC-MAIN-2019-09,application/vnd.openxmlformats-officedocument.wordprocessingml.document,146364,145963,0.0050\nCC-MAIN-2019-09,application/x-bibtex-text-file,64980,64963,0.0022\nCC-MAIN-2019-09,application/x-bittorrent,12541,12209,0.0004\nCC-MAIN-2019-09,application/x-bzip2,16299,16229,0.0006\nCC-MAIN-2019-09,application/x-dosexec,30921,30375,0.0011\nCC-MAIN-2019-09,application/x-endnote-refer,19913,19904,0.0007\nCC-MAIN-2019-09,application/x-hdf,5010,5000,0.0002\nCC-MAIN-2019-09,application/x-mobipocket-ebook,15117,15081,0.0005\nCC-MAIN-2019-09,application/x-ms-asx,16742,16711,0.0006\nCC-MAIN-2019-09,application/x-msdownload,104
43,10385,0.0004\nCC-MAIN-2019-09,application/x-rar-compressed,40769,40719,0.0014\nCC-MAIN-2019-09,application/x-research-info-systems,479,477,0.0000\nCC-MAIN-2019-09,application/x-sh,27751,27709,0.0010\nCC-MAIN-2019-09,application/x-shockwave-flash,123209,123086,0.0042\nCC-MAIN-2019-09,application/x-stata-do,5391,5389,0.0002\nCC-MAIN-2019-09,application/x-tex,5792,5789,0.0002\nCC-MAIN-2019-09,application/x-tex-tfm,52,52,0.0000\nCC-MAIN-2019-09,application/x-tika-msoffice,79237,79030,0.0027\nCC-MAIN-2019-09,application/x-tika-ooxml,57475,57412,0.0020\nCC-MAIN-2019-09,application/x-wais-source,7573,7573,0.0003\nCC-MAIN-2019-09,application/x-xz,98791,98620,0.0034\nCC-MAIN-2019-09,application/xhtml+xml,686860975,681868620,23.5732\nCC-MAIN-2019-09,application/xml,2010153,2002656,0.0690\nCC-MAIN-2019-09,application/zip,376774,375514,0.0129\nCC-MAIN-2019-09,application/zlib,24126,23861,0.0008\nCC-MAIN-2019-09,application/zstd,1200,1200,0.0000\nCC-MAIN-2019-09,audio/mp4,62501,62111,0.0021\nCC-MAIN-2019-09,audio/mpeg,546670,535916,0.0188\nCC-MAIN-2019-09,audio/vnd.wave,28368,28295,0.0010\nCC-MAIN-2019-09,audio/x-mpegurl,5685,5677,0.0002\nCC-MAIN-2019-09,image/gif,253898,252974,0.0087\nCC-MAIN-2019-09,image/jpeg,14448790,14427003,0.4959\nCC-MAIN-2019-09,image/png,1546005,1541996,0.0531\nCC-MAIN-2019-09,image/svg+xml,40518,40395,0.0014\nCC-MAIN-2019-09,image/tiff,23331,23288,0.0008\nCC-MAIN-2019-09,image/vnd.djvu,24517,24515,0.0008\nCC-MAIN-2019-09,image/vnd.dxf; 
format=ascii,13366,13157,0.0005\nCC-MAIN-2019-09,image/webp,11973,11973,0.0004\nCC-MAIN-2019-09,message/rfc822,30370,30329,0.0010\nCC-MAIN-2019-09,text/calendar,871762,870936,0.0299\nCC-MAIN-2019-09,text/css,12651,12649,0.0004\nCC-MAIN-2019-09,text/csv,50812,50742,0.0017\nCC-MAIN-2019-09,text/html,2161428643,2137712866,74.1807\nCC-MAIN-2019-09,text/markdown,50,50,0.0000\nCC-MAIN-2019-09,text/plain,1733993,1731122,0.0595\nCC-MAIN-2019-09,text/prs.lines.tag,7193,7191,0.0002\nCC-MAIN-2019-09,text/tab-separated-values,6666,6662,0.0002\nCC-MAIN-2019-09,text/troff,3786,3786,0.0001\nCC-MAIN-2019-09,text/turtle,8060,8036,0.0003\nCC-MAIN-2019-09,text/vtt,7237,7237,0.0002\nCC-MAIN-2019-09,text/x-c++src,3377,3377,0.0001\nCC-MAIN-2019-09,text/x-chdr,5070,5069,0.0002\nCC-MAIN-2019-09,text/x-csrc,11207,11200,0.0004\nCC-MAIN-2019-09,text/x-diff,19434,19403,0.0007\nCC-MAIN-2019-09,text/x-jsp,8990,8898,0.0003\nCC-MAIN-2019-09,text/x-log,43688,43681,0.0015\nCC-MAIN-2019-09,text/x-matlab,26078,26043,0.0009\nCC-MAIN-2019-09,text/x-perl,40886,40840,0.0014\nCC-MAIN-2019-09,text/x-php,135441,134075,0.0046\nCC-MAIN-2019-09,text/x-python,8181,8159,0.0003\nCC-MAIN-2019-09,text/x-vcalendar,24007,24002,0.0008\nCC-MAIN-2019-09,text/x-vcard,96455,96035,0.0033\nCC-MAIN-2019-09,text/x-web-markdown,5838,5818,0.0002\nCC-MAIN-2019-09,text/x-yaml,3790,3790,0.0001\nCC-MAIN-2019-09,video/mp4,220077,219738,0.0076\nCC-MAIN-2019-09,video/quicktime,19653,19634,0.0007\nCC-MAIN-2019-09,video/webm,111415,111132,0.0038\nCC-MAIN-2019-09,video/x-m4v,36876,36701,0.0013\nCC-MAIN-2019-13,<other>,657345,655922,0.0256\nCC-MAIN-2019-13,application/atom+xml,2830579,2828212,0.1102\nCC-MAIN-2019-13,application/epub+zip,45375,45218,0.0018\nCC-MAIN-2019-13,application/gpx+xml,5082,5081,0.0002\nCC-MAIN-2019-13,application/gzip,278587,278125,0.0108\nCC-MAIN-2019-13,application/javascript,30228,30187,0.0012\nCC-MAIN-2019-13,application/json,297548,297163,0.0116\nCC-MAIN-2019-13,application/marc,1102,1102,0.0000\nCC-MAIN-2019-1
3,application/mbox,18567,18467,0.0007\nCC-MAIN-2019-13,application/msword,182996,182697,0.0071\nCC-MAIN-2019-13,application/octet-stream,171690,171084,0.0067\nCC-MAIN-2019-13,application/pdf,12288145,12247581,0.4782\nCC-MAIN-2019-13,application/pgp-signature,35829,35826,0.0014\nCC-MAIN-2019-13,application/pkcs7-signature,4793,4743,0.0002\nCC-MAIN-2019-13,application/postscript,30144,29969,0.0012\nCC-MAIN-2019-13,application/rdf+xml,194711,194381,0.0076\nCC-MAIN-2019-13,application/rss+xml,3561805,3548201,0.1386\nCC-MAIN-2019-13,application/rtf,74185,74115,0.0029\nCC-MAIN-2019-13,application/text,3915,3915,0.0002\nCC-MAIN-2019-13,application/vnd.android.package-archive,31267,31051,0.0012\nCC-MAIN-2019-13,application/vnd.google-earth.kml+xml,68044,67813,0.0026\nCC-MAIN-2019-13,application/vnd.google-earth.kmz,15722,15702,0.0006\nCC-MAIN-2019-13,application/vnd.ms-excel,56023,55916,0.0022\nCC-MAIN-2019-13,application/vnd.ms-powerpoint,25435,25407,0.0010\nCC-MAIN-2019-13,application/vnd.oasis.opendocument.spreadsheet,5215,5212,0.0002\nCC-MAIN-2019-13,application/vnd.oasis.opendocument.text,20355,20322,0.0008\nCC-MAIN-2019-13,application/vnd.openxmlformats-officedocument.presentationml.presentation,38850,38725,0.0015\nCC-MAIN-2019-13,application/vnd.openxmlformats-officedocument.spreadsheetml.sheet,83116,82873,0.0032\nCC-MAIN-2019-13,application/vnd.openxmlformats-officedocument.wordprocessingml.document,249900,249539,0.0097\nCC-MAIN-2019-13,application/x-bibtex-text-file,71086,71050,0.0028\nCC-MAIN-2019-13,application/x-bittorrent,21069,20015,0.0008\nCC-MAIN-2019-13,application/x-bzip2,51594,51531,0.0020\nCC-MAIN-2019-13,application/x-dosexec,28842,28352,0.0011\nCC-MAIN-2019-13,application/x-endnote-refer,22827,22809,0.0009\nCC-MAIN-2019-13,application/x-hdf,6139,6139,0.0002\nCC-MAIN-2019-13,application/x-mobipocket-ebook,14753,14682,0.0006\nCC-MAIN-2019-13,application/x-ms-asx,15966,15943,0.0006\nCC-MAIN-2019-13,application/x-msdownload,8036,7950,0.0003\nCC-MAIN-2019-1
3,application/x-rar-compressed,74781,74681,0.0029\nCC-MAIN-2019-13,application/x-research-info-systems,661,661,0.0000\nCC-MAIN-2019-13,application/x-sh,16584,16558,0.0006\nCC-MAIN-2019-13,application/x-shockwave-flash,158735,158593,0.0062\nCC-MAIN-2019-13,application/x-stata-do,7741,7739,0.0003\nCC-MAIN-2019-13,application/x-tex,5477,5476,0.0002\nCC-MAIN-2019-13,application/x-tex-tfm,229,229,0.0000\nCC-MAIN-2019-13,application/x-tika-msoffice,76050,75941,0.0030\nCC-MAIN-2019-13,application/x-tika-ooxml,56201,56131,0.0022\nCC-MAIN-2019-13,application/x-wais-source,9106,9106,0.0004\nCC-MAIN-2019-13,application/x-xz,61982,61856,0.0024\nCC-MAIN-2019-13,application/xhtml+xml,600007581,595412984,23.3495\nCC-MAIN-2019-13,application/xml,1457477,1451255,0.0567\nCC-MAIN-2019-13,application/zip,310731,309642,0.0121\nCC-MAIN-2019-13,application/zlib,22700,22430,0.0009\nCC-MAIN-2019-13,application/zstd,854,854,0.0000\nCC-MAIN-2019-13,audio/mp4,27682,27456,0.0011\nCC-MAIN-2019-13,audio/mpeg,576055,565503,0.0224\nCC-MAIN-2019-13,audio/vnd.wave,46950,46931,0.0018\nCC-MAIN-2019-13,audio/x-mpegurl,7092,7083,0.0003\nCC-MAIN-2019-13,image/gif,334008,333140,0.0130\nCC-MAIN-2019-13,image/jpeg,14299708,14281195,0.5565\nCC-MAIN-2019-13,image/png,1623561,1620052,0.0632\nCC-MAIN-2019-13,image/svg+xml,53241,53096,0.0021\nCC-MAIN-2019-13,image/tiff,28658,28624,0.0011\nCC-MAIN-2019-13,image/vnd.djvu,31506,31486,0.0012\nCC-MAIN-2019-13,image/vnd.dxf; 
format=ascii,9342,9341,0.0004\nCC-MAIN-2019-13,image/webp,16954,16953,0.0007\nCC-MAIN-2019-13,message/rfc822,41860,41791,0.0016\nCC-MAIN-2019-13,text/asp,2,2,0.0000\nCC-MAIN-2019-13,text/calendar,852582,851889,0.0332\nCC-MAIN-2019-13,text/css,15637,15622,0.0006\nCC-MAIN-2019-13,text/csv,58135,58109,0.0023\nCC-MAIN-2019-13,text/html,1925557585,1903670751,74.9337\nCC-MAIN-2019-13,text/markdown,40,40,0.0000\nCC-MAIN-2019-13,text/plain,1564052,1560982,0.0609\nCC-MAIN-2019-13,text/prs.lines.tag,5631,5631,0.0002\nCC-MAIN-2019-13,text/tab-separated-values,9469,9469,0.0004\nCC-MAIN-2019-13,text/troff,4663,4660,0.0002\nCC-MAIN-2019-13,text/turtle,10238,10232,0.0004\nCC-MAIN-2019-13,text/vtt,10165,10165,0.0004\nCC-MAIN-2019-13,text/x-c++src,3898,3896,0.0002\nCC-MAIN-2019-13,text/x-chdr,5674,5674,0.0002\nCC-MAIN-2019-13,text/x-csrc,15367,15364,0.0006\nCC-MAIN-2019-13,text/x-diff,28945,28923,0.0011\nCC-MAIN-2019-13,text/x-jsp,8431,8395,0.0003\nCC-MAIN-2019-13,text/x-log,37930,37910,0.0015\nCC-MAIN-2019-13,text/x-matlab,33334,33316,0.0013\nCC-MAIN-2019-13,text/x-perl,40395,40295,0.0016\nCC-MAIN-2019-13,text/x-php,140107,138918,0.0055\nCC-MAIN-2019-13,text/x-python,7797,7793,0.0003\nCC-MAIN-2019-13,text/x-vcalendar,23586,23573,0.0009\nCC-MAIN-2019-13,text/x-vcard,78037,77831,0.0030\nCC-MAIN-2019-13,text/x-web-markdown,4679,4679,0.0002\nCC-MAIN-2019-13,text/x-yaml,1859,1859,0.0001\nCC-MAIN-2019-13,video/mp4,173542,173257,0.0068\nCC-MAIN-2019-13,video/quicktime,14348,14301,0.0006\nCC-MAIN-2019-13,video/webm,47831,47804,0.0019\nCC-MAIN-2019-13,video/x-m4v,17514,17459,0.0007\nCC-MAIN-2019-18,<other>,586784,585862,0.0235\nCC-MAIN-2019-18,application/atom+xml,2757710,2755922,0.1104\nCC-MAIN-2019-18,application/epub+zip,39655,39534,0.0016\nCC-MAIN-2019-18,application/gpx+xml,4989,4985,0.0002\nCC-MAIN-2019-18,application/gzip,62123,61924,0.0025\nCC-MAIN-2019-18,application/javascript,26876,26795,0.0011\nCC-MAIN-2019-18,application/json,370749,370252,0.0148\nCC-MAIN-2019-18,application/ma
rc,1237,1237,0.0000\nCC-MAIN-2019-18,application/mbox,21501,21491,0.0009\nCC-MAIN-2019-18,application/msword,58647,58431,0.0023\nCC-MAIN-2019-18,application/octet-stream,254628,253940,0.0102\nCC-MAIN-2019-18,application/pdf,12960647,12925617,0.5189\nCC-MAIN-2019-18,application/pgp-signature,43772,43760,0.0018\nCC-MAIN-2019-18,application/pkcs7-signature,3656,3655,0.0001\nCC-MAIN-2019-18,application/postscript,26426,26411,0.0011\nCC-MAIN-2019-18,application/rdf+xml,269726,269327,0.0108\nCC-MAIN-2019-18,application/rss+xml,3814506,3802299,0.1527\nCC-MAIN-2019-18,application/rtf,78052,78012,0.0031\nCC-MAIN-2019-18,application/text,6198,6198,0.0002\nCC-MAIN-2019-18,application/vnd.android.package-archive,30452,30327,0.0012\nCC-MAIN-2019-18,application/vnd.google-earth.kml+xml,57093,57068,0.0023\nCC-MAIN-2019-18,application/vnd.google-earth.kmz,10553,10531,0.0004\nCC-MAIN-2019-18,application/vnd.ms-excel,24835,24773,0.0010\nCC-MAIN-2019-18,application/vnd.ms-powerpoint,15541,15524,0.0006\nCC-MAIN-2019-18,application/vnd.oasis.opendocument.spreadsheet,4321,4316,0.0002\nCC-MAIN-2019-18,application/vnd.oasis.opendocument.text,15831,15799,0.0006\nCC-MAIN-2019-18,application/vnd.openxmlformats-officedocument.presentationml.presentation,41966,41919,0.0017\nCC-MAIN-2019-18,application/vnd.openxmlformats-officedocument.spreadsheetml.sheet,79911,79838,0.0032\nCC-MAIN-2019-18,application/vnd.openxmlformats-officedocument.wordprocessingml.document,262208,262025,0.0105\nCC-MAIN-2019-18,application/x-bibtex-text-file,76229,76208,0.0031\nCC-MAIN-2019-18,application/x-bittorrent,16936,16106,0.0007\nCC-MAIN-2019-18,application/x-bzip2,23970,23839,0.0010\nCC-MAIN-2019-18,application/x-dosexec,9957,9639,0.0004\nCC-MAIN-2019-18,application/x-endnote-refer,29846,29817,0.0012\nCC-MAIN-2019-18,application/x-hdf,2027,2027,0.0001\nCC-MAIN-2019-18,application/x-mobipocket-ebook,11384,11359,0.0005\nCC-MAIN-2019-18,application/x-ms-asx,11420,11401,0.0005\nCC-MAIN-2019-18,application/x-msdownload,6
926,6878,0.0003\nCC-MAIN-2019-18,application/x-rar-compressed,90924,90813,0.0036\nCC-MAIN-2019-18,application/x-research-info-systems,1994,1994,0.0001\nCC-MAIN-2019-18,application/x-sh,14091,14056,0.0006\nCC-MAIN-2019-18,application/x-shockwave-flash,31374,31235,0.0013\nCC-MAIN-2019-18,application/x-stata-do,8558,8554,0.0003\nCC-MAIN-2019-18,application/x-tex,7415,7415,0.0003\nCC-MAIN-2019-18,application/x-tex-tfm,1674,1674,0.0001\nCC-MAIN-2019-18,application/x-tika-msoffice,69555,69528,0.0028\nCC-MAIN-2019-18,application/x-tika-ooxml,47588,47568,0.0019\nCC-MAIN-2019-18,application/x-wais-source,6375,6375,0.0003\nCC-MAIN-2019-18,application/x-xz,73486,73421,0.0029\nCC-MAIN-2019-18,application/xhtml+xml,564033765,559648885,22.5811\nCC-MAIN-2019-18,application/xml,1667653,1660679,0.0668\nCC-MAIN-2019-18,application/zip,129192,128168,0.0052\nCC-MAIN-2019-18,application/zlib,18519,18319,0.0007\nCC-MAIN-2019-18,application/zstd,196,196,0.0000\nCC-MAIN-2019-18,audio/mp4,48292,47765,0.0019\nCC-MAIN-2019-18,audio/mpeg,101293,100775,0.0041\nCC-MAIN-2019-18,audio/vnd.wave,51947,51941,0.0021\nCC-MAIN-2019-18,audio/x-mpegurl,5284,5282,0.0002\nCC-MAIN-2019-18,image/gif,68102,67590,0.0027\nCC-MAIN-2019-18,image/jpeg,3471932,3456216,0.1390\nCC-MAIN-2019-18,image/png,586866,584110,0.0235\nCC-MAIN-2019-18,image/svg+xml,13214,13141,0.0005\nCC-MAIN-2019-18,image/tiff,8682,8671,0.0003\nCC-MAIN-2019-18,image/vnd.djvu,18012,18002,0.0007\nCC-MAIN-2019-18,image/vnd.dxf; 
format=ascii,8002,8001,0.0003\nCC-MAIN-2019-18,image/webp,17019,17005,0.0007\nCC-MAIN-2019-18,message/rfc822,34845,34814,0.0014\nCC-MAIN-2019-18,text/calendar,837643,836968,0.0335\nCC-MAIN-2019-18,text/css,10872,10871,0.0004\nCC-MAIN-2019-18,text/csv,58604,58571,0.0023\nCC-MAIN-2019-18,text/html,1901926946,1880669925,76.1435\nCC-MAIN-2019-18,text/markdown,60,60,0.0000\nCC-MAIN-2019-18,text/plain,1708917,1707012,0.0684\nCC-MAIN-2019-18,text/prs.lines.tag,27220,27219,0.0011\nCC-MAIN-2019-18,text/tab-separated-values,10421,10415,0.0004\nCC-MAIN-2019-18,text/troff,7774,7774,0.0003\nCC-MAIN-2019-18,text/turtle,8976,8976,0.0004\nCC-MAIN-2019-18,text/vtt,11598,11597,0.0005\nCC-MAIN-2019-18,text/x-c++src,4228,4224,0.0002\nCC-MAIN-2019-18,text/x-chdr,11774,11773,0.0005\nCC-MAIN-2019-18,text/x-csrc,22543,22538,0.0009\nCC-MAIN-2019-18,text/x-diff,27216,27178,0.0011\nCC-MAIN-2019-18,text/x-jsp,8016,7979,0.0003\nCC-MAIN-2019-18,text/x-log,28471,28463,0.0011\nCC-MAIN-2019-18,text/x-matlab,49097,49080,0.0020\nCC-MAIN-2019-18,text/x-perl,52695,52658,0.0021\nCC-MAIN-2019-18,text/x-php,98495,97521,0.0039\nCC-MAIN-2019-18,text/x-python,7016,7005,0.0003\nCC-MAIN-2019-18,text/x-vcalendar,19894,19884,0.0008\nCC-MAIN-2019-18,text/x-vcard,63176,63111,0.0025\nCC-MAIN-2019-18,text/x-web-markdown,4999,4994,0.0002\nCC-MAIN-2019-18,text/x-yaml,4015,4006,0.0002\nCC-MAIN-2019-18,video/mp4,27692,27518,0.0011\nCC-MAIN-2019-18,video/quicktime,9977,9971,0.0004\nCC-MAIN-2019-18,video/webm,2048,2043,0.0001\nCC-MAIN-2019-18,video/x-m4v,13087,13045,0.0005\nCC-MAIN-2019-22,<other>,391339,389802,0.0146\nCC-MAIN-2019-22,application/atom+xml,4324102,4322098,0.1614\nCC-MAIN-2019-22,application/epub+zip,54795,54503,0.0020\nCC-MAIN-2019-22,application/gpx+xml,7215,7210,0.0003\nCC-MAIN-2019-22,application/gzip,61240,61032,0.0023\nCC-MAIN-2019-22,application/javascript,29630,29576,0.0011\nCC-MAIN-2019-22,application/json,448618,447922,0.0167\nCC-MAIN-2019-22,application/marc,1585,1585,0.0001\nCC-MAIN-2019-22,appl
ication/mbox,35401,35386,0.0013\nCC-MAIN-2019-22,application/msword,91918,91517,0.0034\nCC-MAIN-2019-22,application/octet-stream,356409,355440,0.0133\nCC-MAIN-2019-22,application/pdf,19423997,19368467,0.7248\nCC-MAIN-2019-22,application/pgp-signature,24830,24830,0.0009\nCC-MAIN-2019-22,application/pkcs7-signature,7560,7560,0.0003\nCC-MAIN-2019-22,application/postscript,17314,17299,0.0006\nCC-MAIN-2019-22,application/rdf+xml,260221,259804,0.0097\nCC-MAIN-2019-22,application/rss+xml,3944276,3932475,0.1472\nCC-MAIN-2019-22,application/rtf,53978,53855,0.0020\nCC-MAIN-2019-22,application/text,4940,4940,0.0002\nCC-MAIN-2019-22,application/vnd.android.package-archive,38406,38029,0.0014\nCC-MAIN-2019-22,application/vnd.google-earth.kml+xml,59275,59212,0.0022\nCC-MAIN-2019-22,application/vnd.google-earth.kmz,11994,11992,0.0004\nCC-MAIN-2019-22,application/vnd.ms-excel,36958,36913,0.0014\nCC-MAIN-2019-22,application/vnd.ms-powerpoint,22177,22083,0.0008\nCC-MAIN-2019-22,application/vnd.oasis.opendocument.spreadsheet,4583,4582,0.0002\nCC-MAIN-2019-22,application/vnd.oasis.opendocument.text,18629,18615,0.0007\nCC-MAIN-2019-22,application/vnd.openxmlformats-officedocument.presentationml.presentation,12061,12046,0.0005\nCC-MAIN-2019-22,application/vnd.openxmlformats-officedocument.spreadsheetml.sheet,35468,35387,0.0013\nCC-MAIN-2019-22,application/vnd.openxmlformats-officedocument.wordprocessingml.document,83151,82864,0.0031\nCC-MAIN-2019-22,application/x-bibtex-text-file,81859,81775,0.0031\nCC-MAIN-2019-22,application/x-bittorrent,14565,13714,0.0005\nCC-MAIN-2019-22,application/x-bzip2,11721,11679,0.0004\nCC-MAIN-2019-22,application/x-dosexec,10728,10361,0.0004\nCC-MAIN-2019-22,application/x-endnote-refer,31042,30960,0.0012\nCC-MAIN-2019-22,application/x-hdf,2023,2023,0.0001\nCC-MAIN-2019-22,application/x-mobipocket-ebook,12672,12617,0.0005\nCC-MAIN-2019-22,application/x-ms-asx,9985,9968,0.0004\nCC-MAIN-2019-22,application/x-msdownload,6490,6454,0.0002\nCC-MAIN-2019-22,applicatio
n/x-rar-compressed,27336,27090,0.0010\nCC-MAIN-2019-22,application/x-research-info-systems,1762,1759,0.0001\nCC-MAIN-2019-22,application/x-sh,20777,20736,0.0008\nCC-MAIN-2019-22,application/x-shockwave-flash,25157,25013,0.0009\nCC-MAIN-2019-22,application/x-stata-do,8800,8793,0.0003\nCC-MAIN-2019-22,application/x-tex,6093,6082,0.0002\nCC-MAIN-2019-22,application/x-tex-tfm,2792,2792,0.0001\nCC-MAIN-2019-22,application/x-tika-msoffice,63604,63577,0.0024\nCC-MAIN-2019-22,application/x-tika-ooxml,47457,47394,0.0018\nCC-MAIN-2019-22,application/x-wais-source,9942,9942,0.0004\nCC-MAIN-2019-22,application/x-xz,56504,56426,0.0021\nCC-MAIN-2019-22,application/xhtml+xml,605403020,600637148,22.5918\nCC-MAIN-2019-22,application/xml,1625678,1618435,0.0607\nCC-MAIN-2019-22,application/zip,181213,180155,0.0068\nCC-MAIN-2019-22,application/zlib,31569,31344,0.0012\nCC-MAIN-2019-22,application/zstd,42,42,0.0000\nCC-MAIN-2019-22,audio/mp4,42868,42200,0.0016\nCC-MAIN-2019-22,audio/mpeg,166558,164442,0.0062\nCC-MAIN-2019-22,audio/vnd.wave,23245,23236,0.0009\nCC-MAIN-2019-22,audio/x-mpegurl,5576,5571,0.0002\nCC-MAIN-2019-22,image/gif,89904,88539,0.0034\nCC-MAIN-2019-22,image/jpeg,4158147,4143282,0.1552\nCC-MAIN-2019-22,image/png,633587,628398,0.0236\nCC-MAIN-2019-22,image/svg+xml,12252,12234,0.0005\nCC-MAIN-2019-22,image/tiff,12046,12042,0.0004\nCC-MAIN-2019-22,image/vnd.djvu,20063,20062,0.0007\nCC-MAIN-2019-22,image/vnd.dxf; 
format=ascii,12774,12772,0.0005\nCC-MAIN-2019-22,image/webp,21407,21405,0.0008\nCC-MAIN-2019-22,message/rfc822,31206,31172,0.0012\nCC-MAIN-2019-22,text/asp,2,2,0.0000\nCC-MAIN-2019-22,text/calendar,991193,990426,0.0370\nCC-MAIN-2019-22,text/css,7121,7119,0.0003\nCC-MAIN-2019-22,text/csv,45029,45015,0.0017\nCC-MAIN-2019-22,text/html,2033659795,2011426830,75.8900\nCC-MAIN-2019-22,text/markdown,212,212,0.0000\nCC-MAIN-2019-22,text/plain,1656795,1654247,0.0618\nCC-MAIN-2019-22,text/prs.lines.tag,29740,29735,0.0011\nCC-MAIN-2019-22,text/tab-separated-values,15689,15687,0.0006\nCC-MAIN-2019-22,text/troff,5695,5694,0.0002\nCC-MAIN-2019-22,text/turtle,9969,9968,0.0004\nCC-MAIN-2019-22,text/vtt,13455,13455,0.0005\nCC-MAIN-2019-22,text/x-c++src,5790,5790,0.0002\nCC-MAIN-2019-22,text/x-chdr,12199,12199,0.0005\nCC-MAIN-2019-22,text/x-csrc,19816,19808,0.0007\nCC-MAIN-2019-22,text/x-diff,31391,31297,0.0012\nCC-MAIN-2019-22,text/x-jsp,5766,5733,0.0002\nCC-MAIN-2019-22,text/x-log,50929,50916,0.0019\nCC-MAIN-2019-22,text/x-matlab,42532,42383,0.0016\nCC-MAIN-2019-22,text/x-perl,54284,54248,0.0020\nCC-MAIN-2019-22,text/x-php,104979,104180,0.0039\nCC-MAIN-2019-22,text/x-python,9690,9654,0.0004\nCC-MAIN-2019-22,text/x-vcalendar,26082,25949,0.0010\nCC-MAIN-2019-22,text/x-vcard,77097,77038,0.0029\nCC-MAIN-2019-22,text/x-web-markdown,5194,5189,0.0002\nCC-MAIN-2019-22,text/x-yaml,6479,6479,0.0002\nCC-MAIN-2019-22,video/mp4,43070,42718,0.0016\nCC-MAIN-2019-22,video/quicktime,13084,13073,0.0005\nCC-MAIN-2019-22,video/webm,2540,2524,0.0001\nCC-MAIN-2019-22,video/x-m4v,16099,15948,0.0006\nCC-MAIN-2019-26,<other>,284938,284259,0.0110\nCC-MAIN-2019-26,application/atom+xml,3668074,3667161,0.1414\nCC-MAIN-2019-26,application/epub+zip,36114,36025,0.0014\nCC-MAIN-2019-26,application/gpx+xml,5644,5626,0.0002\nCC-MAIN-2019-26,application/gzip,49346,49240,0.0019\nCC-MAIN-2019-26,application/javascript,24050,23995,0.0009\nCC-MAIN-2019-26,application/json,518263,517657,0.0200\nCC-MAIN-2019-26,application/
marc,2944,2944,0.0001\nCC-MAIN-2019-26,application/mbox,31449,31448,0.0012\nCC-MAIN-2019-26,application/msword,63342,63015,0.0024\nCC-MAIN-2019-26,application/octet-stream,289690,289250,0.0112\nCC-MAIN-2019-26,application/pdf,16109119,16067642,0.6210\nCC-MAIN-2019-26,application/pgp-signature,27999,27999,0.0011\nCC-MAIN-2019-26,application/pkcs7-signature,8782,8781,0.0003\nCC-MAIN-2019-26,application/postscript,14834,14830,0.0006\nCC-MAIN-2019-26,application/rdf+xml,292928,292732,0.0113\nCC-MAIN-2019-26,application/rss+xml,3955218,3946552,0.1525\nCC-MAIN-2019-26,application/rtf,48888,48819,0.0019\nCC-MAIN-2019-26,application/text,3871,3871,0.0001\nCC-MAIN-2019-26,application/vnd.android.package-archive,23148,23017,0.0009\nCC-MAIN-2019-26,application/vnd.google-earth.kml+xml,52124,52093,0.0020\nCC-MAIN-2019-26,application/vnd.google-earth.kmz,10701,10694,0.0004\nCC-MAIN-2019-26,application/vnd.ms-excel,26716,26657,0.0010\nCC-MAIN-2019-26,application/vnd.ms-powerpoint,19746,19740,0.0008\nCC-MAIN-2019-26,application/vnd.oasis.opendocument.spreadsheet,4352,4351,0.0002\nCC-MAIN-2019-26,application/vnd.oasis.opendocument.text,15235,15223,0.0006\nCC-MAIN-2019-26,application/vnd.openxmlformats-officedocument.presentationml.presentation,5735,5726,0.0002\nCC-MAIN-2019-26,application/vnd.openxmlformats-officedocument.spreadsheetml.sheet,23247,23191,0.0009\nCC-MAIN-2019-26,application/vnd.openxmlformats-officedocument.wordprocessingml.document,49501,49384,0.0019\nCC-MAIN-2019-26,application/x-bibtex-text-file,74931,74920,0.0029\nCC-MAIN-2019-26,application/x-bittorrent,10538,9986,0.0004\nCC-MAIN-2019-26,application/x-bzip2,11532,11502,0.0004\nCC-MAIN-2019-26,application/x-dosexec,8493,8207,0.0003\nCC-MAIN-2019-26,application/x-endnote-refer,31923,31891,0.0012\nCC-MAIN-2019-26,application/x-hdf,1984,1984,0.0001\nCC-MAIN-2019-26,application/x-mobipocket-ebook,8795,8790,0.0003\nCC-MAIN-2019-26,application/x-ms-asx,6172,6168,0.0002\nCC-MAIN-2019-26,application/x-msdownload,3684,365
3,0.0001\nCC-MAIN-2019-26,application/x-rar-compressed,13559,13473,0.0005\nCC-MAIN-2019-26,application/x-research-info-systems,1810,1810,0.0001\nCC-MAIN-2019-26,application/x-sh,58096,58069,0.0022\nCC-MAIN-2019-26,application/x-shockwave-flash,23421,23302,0.0009\nCC-MAIN-2019-26,application/x-stata-do,6746,6725,0.0003\nCC-MAIN-2019-26,application/x-tex,5582,5573,0.0002\nCC-MAIN-2019-26,application/x-tex-tfm,2255,2255,0.0001\nCC-MAIN-2019-26,application/x-tika-msoffice,60947,60931,0.0023\nCC-MAIN-2019-26,application/x-tika-ooxml,49386,49356,0.0019\nCC-MAIN-2019-26,application/x-wais-source,5094,5094,0.0002\nCC-MAIN-2019-26,application/x-xz,75681,75460,0.0029\nCC-MAIN-2019-26,application/xhtml+xml,587097886,582888684,22.6306\nCC-MAIN-2019-26,application/xml,1561741,1553877,0.0602\nCC-MAIN-2019-26,application/zip,168977,166295,0.0065\nCC-MAIN-2019-26,application/zlib,32852,32658,0.0013\nCC-MAIN-2019-26,application/zstd,26,26,0.0000\nCC-MAIN-2019-26,audio/mp4,38678,37368,0.0015\nCC-MAIN-2019-26,audio/mpeg,130636,129850,0.0050\nCC-MAIN-2019-26,audio/vnd.wave,13583,13583,0.0005\nCC-MAIN-2019-26,audio/x-mpegurl,3604,3602,0.0001\nCC-MAIN-2019-26,image/gif,80176,79758,0.0031\nCC-MAIN-2019-26,image/jpeg,3781318,3770003,0.1458\nCC-MAIN-2019-26,image/png,528095,524194,0.0204\nCC-MAIN-2019-26,image/svg+xml,13943,13906,0.0005\nCC-MAIN-2019-26,image/tiff,13188,13183,0.0005\nCC-MAIN-2019-26,image/vnd.djvu,21707,21600,0.0008\nCC-MAIN-2019-26,image/vnd.dxf; 
format=ascii,8561,8560,0.0003\nCC-MAIN-2019-26,image/webp,10310,10304,0.0004\nCC-MAIN-2019-26,message/rfc822,34320,34206,0.0013\nCC-MAIN-2019-26,text/asp,1,1,0.0000\nCC-MAIN-2019-26,text/calendar,1046773,1046049,0.0403\nCC-MAIN-2019-26,text/css,4931,4929,0.0002\nCC-MAIN-2019-26,text/csv,42424,42420,0.0016\nCC-MAIN-2019-26,text/html,1971308583,1952626740,75.9873\nCC-MAIN-2019-26,text/markdown,337,337,0.0000\nCC-MAIN-2019-26,text/plain,1582281,1580657,0.0610\nCC-MAIN-2019-26,text/prs.lines.tag,31623,31622,0.0012\nCC-MAIN-2019-26,text/tab-separated-values,13193,13193,0.0005\nCC-MAIN-2019-26,text/troff,10381,10378,0.0004\nCC-MAIN-2019-26,text/turtle,11400,11400,0.0004\nCC-MAIN-2019-26,text/vtt,12124,12123,0.0005\nCC-MAIN-2019-26,text/x-c++src,7553,7552,0.0003\nCC-MAIN-2019-26,text/x-chdr,17680,17680,0.0007\nCC-MAIN-2019-26,text/x-csrc,28895,28894,0.0011\nCC-MAIN-2019-26,text/x-diff,36934,36892,0.0014\nCC-MAIN-2019-26,text/x-jsp,3476,3454,0.0001\nCC-MAIN-2019-26,text/x-log,61797,61783,0.0024\nCC-MAIN-2019-26,text/x-matlab,50775,50751,0.0020\nCC-MAIN-2019-26,text/x-perl,63054,63042,0.0024\nCC-MAIN-2019-26,text/x-php,85896,85323,0.0033\nCC-MAIN-2019-26,text/x-python,7154,7154,0.0003\nCC-MAIN-2019-26,text/x-vcalendar,22469,22454,0.0009\nCC-MAIN-2019-26,text/x-vcard,77395,77324,0.0030\nCC-MAIN-2019-26,text/x-web-markdown,4442,4442,0.0002\nCC-MAIN-2019-26,text/x-yaml,4349,4349,0.0002\nCC-MAIN-2019-26,video/mp4,31100,30912,0.0012\nCC-MAIN-2019-26,video/quicktime,13213,13183,0.0005\nCC-MAIN-2019-26,video/webm,1467,1464,0.0001\nCC-MAIN-2019-26,video/x-m4v,13189,13029,0.0005\nCC-MAIN-2019-30,<other>,319698,318873,0.0123\nCC-MAIN-2019-30,application/atom+xml,4230920,4229991,0.1631\nCC-MAIN-2019-30,application/epub+zip,40443,40354,0.0016\nCC-MAIN-2019-30,application/gpx+xml,4999,4993,0.0002\nCC-MAIN-2019-30,application/gzip,48783,48641,0.0019\nCC-MAIN-2019-30,application/javascript,29370,29355,0.0011\nCC-MAIN-2019-30,application/json,557932,557346,0.0215\nCC-MAIN-2019-30,applicatio
n/marc,3619,3619,0.0001\nCC-MAIN-2019-30,application/mbox,46283,46276,0.0018\nCC-MAIN-2019-30,application/msword,60331,60055,0.0023\nCC-MAIN-2019-30,application/octet-stream,243557,242825,0.0094\nCC-MAIN-2019-30,application/pdf,3453816,3432810,0.1331\nCC-MAIN-2019-30,application/pgp-signature,24281,24281,0.0009\nCC-MAIN-2019-30,application/pkcs7-signature,5650,5649,0.0002\nCC-MAIN-2019-30,application/postscript,3837,3828,0.0001\nCC-MAIN-2019-30,application/rdf+xml,270686,270498,0.0104\nCC-MAIN-2019-30,application/rss+xml,3886045,3876787,0.1498\nCC-MAIN-2019-30,application/rtf,60657,60406,0.0023\nCC-MAIN-2019-30,application/text,8350,8332,0.0003\nCC-MAIN-2019-30,application/vnd.android.package-archive,25729,25509,0.0010\nCC-MAIN-2019-30,application/vnd.google-earth.kml+xml,43879,43855,0.0017\nCC-MAIN-2019-30,application/vnd.google-earth.kmz,6371,6312,0.0002\nCC-MAIN-2019-30,application/vnd.ms-excel,24369,24339,0.0009\nCC-MAIN-2019-30,application/vnd.ms-powerpoint,23301,23277,0.0009\nCC-MAIN-2019-30,application/vnd.oasis.opendocument.spreadsheet,4191,4165,0.0002\nCC-MAIN-2019-30,application/vnd.oasis.opendocument.text,15489,15476,0.0006\nCC-MAIN-2019-30,application/vnd.openxmlformats-officedocument.presentationml.presentation,6299,6284,0.0002\nCC-MAIN-2019-30,application/vnd.openxmlformats-officedocument.spreadsheetml.sheet,28109,28021,0.0011\nCC-MAIN-2019-30,application/vnd.openxmlformats-officedocument.wordprocessingml.document,53398,53186,0.0021\nCC-MAIN-2019-30,application/x-bibtex-text-file,90835,90806,0.0035\nCC-MAIN-2019-30,application/x-bittorrent,9080,8683,0.0003\nCC-MAIN-2019-30,application/x-bzip2,5484,5456,0.0002\nCC-MAIN-2019-30,application/x-dosexec,9942,9585,0.0004\nCC-MAIN-2019-30,application/x-endnote-refer,35542,35502,0.0014\nCC-MAIN-2019-30,application/x-hdf,4051,4051,0.0002\nCC-MAIN-2019-30,application/x-mobipocket-ebook,8393,8388,0.0003\nCC-MAIN-2019-30,application/x-ms-asx,6570,6568,0.0003\nCC-MAIN-2019-30,application/x-msdownload,3420,3399,0.000
1\nCC-MAIN-2019-30,application/x-rar-compressed,13697,13654,0.0005\nCC-MAIN-2019-30,application/x-research-info-systems,2324,2324,0.0001\nCC-MAIN-2019-30,application/x-sh,14986,14957,0.0006\nCC-MAIN-2019-30,application/x-shockwave-flash,24419,24257,0.0009\nCC-MAIN-2019-30,application/x-stata-do,28904,28880,0.0011\nCC-MAIN-2019-30,application/x-tex,5348,5348,0.0002\nCC-MAIN-2019-30,application/x-tex-tfm,1383,1383,0.0001\nCC-MAIN-2019-30,application/x-tika-msoffice,63801,63750,0.0025\nCC-MAIN-2019-30,application/x-tika-ooxml,50792,50751,0.0020\nCC-MAIN-2019-30,application/x-wais-source,4348,4348,0.0002\nCC-MAIN-2019-30,application/x-xz,17037,17032,0.0007\nCC-MAIN-2019-30,application/xhtml+xml,580035774,575837671,22.3538\nCC-MAIN-2019-30,application/xml,1759185,1753638,0.0678\nCC-MAIN-2019-30,application/zip,187679,186206,0.0072\nCC-MAIN-2019-30,application/zlib,34807,34593,0.0013\nCC-MAIN-2019-30,application/zstd,107,107,0.0000\nCC-MAIN-2019-30,audio/mp4,34758,34329,0.0013\nCC-MAIN-2019-30,audio/mpeg,158346,155713,0.0061\nCC-MAIN-2019-30,audio/vnd.wave,16307,16298,0.0006\nCC-MAIN-2019-30,audio/x-mpegurl,3422,3415,0.0001\nCC-MAIN-2019-30,image/gif,71343,70831,0.0027\nCC-MAIN-2019-30,image/jpeg,3556578,3547982,0.1371\nCC-MAIN-2019-30,image/png,495871,492378,0.0191\nCC-MAIN-2019-30,image/svg+xml,9758,9723,0.0004\nCC-MAIN-2019-30,image/tiff,19397,19395,0.0007\nCC-MAIN-2019-30,image/vnd.djvu,16215,16140,0.0006\nCC-MAIN-2019-30,image/vnd.dxf; 
format=ascii,8630,8630,0.0003\nCC-MAIN-2019-30,image/webp,20856,20855,0.0008\nCC-MAIN-2019-30,message/rfc822,33524,33456,0.0013\nCC-MAIN-2019-30,text/asp,26,26,0.0000\nCC-MAIN-2019-30,text/calendar,1079586,1078624,0.0416\nCC-MAIN-2019-30,text/css,5542,5539,0.0002\nCC-MAIN-2019-30,text/csv,53432,53395,0.0021\nCC-MAIN-2019-30,text/html,1990575970,1970948081,76.7141\nCC-MAIN-2019-30,text/markdown,110,110,0.0000\nCC-MAIN-2019-30,text/plain,1977206,1975217,0.0762\nCC-MAIN-2019-30,text/prs.lines.tag,35267,35256,0.0014\nCC-MAIN-2019-30,text/tab-separated-values,14558,14558,0.0006\nCC-MAIN-2019-30,text/troff,8204,8204,0.0003\nCC-MAIN-2019-30,text/turtle,12424,12424,0.0005\nCC-MAIN-2019-30,text/vtt,11911,11908,0.0005\nCC-MAIN-2019-30,text/x-c++src,10006,10005,0.0004\nCC-MAIN-2019-30,text/x-chdr,24480,24480,0.0009\nCC-MAIN-2019-30,text/x-csrc,35985,35984,0.0014\nCC-MAIN-2019-30,text/x-diff,37482,37405,0.0014\nCC-MAIN-2019-30,text/x-jsp,2903,2880,0.0001\nCC-MAIN-2019-30,text/x-log,91692,91690,0.0035\nCC-MAIN-2019-30,text/x-matlab,50922,50675,0.0020\nCC-MAIN-2019-30,text/x-perl,106991,106965,0.0041\nCC-MAIN-2019-30,text/x-php,85866,85074,0.0033\nCC-MAIN-2019-30,text/x-python,6489,6489,0.0003\nCC-MAIN-2019-30,text/x-vcalendar,23313,23311,0.0009\nCC-MAIN-2019-30,text/x-vcard,83625,83499,0.0032\nCC-MAIN-2019-30,text/x-web-markdown,5046,5046,0.0002\nCC-MAIN-2019-30,text/x-yaml,4252,4252,0.0002\nCC-MAIN-2019-30,video/mp4,37730,37467,0.0015\nCC-MAIN-2019-30,video/quicktime,9658,9642,0.0004\nCC-MAIN-2019-30,video/webm,2191,2189,0.0001\nCC-MAIN-2019-30,video/x-m4v,12203,12133,0.0005\nCC-MAIN-2019-35,<other>,339280,338422,0.0115\nCC-MAIN-2019-35,application/atom+xml,4147093,4145898,0.1403\nCC-MAIN-2019-35,application/epub+zip,44428,44315,0.0015\nCC-MAIN-2019-35,application/gpx+xml,6800,6798,0.0002\nCC-MAIN-2019-35,application/gzip,74753,74576,0.0025\nCC-MAIN-2019-35,application/javascript,31912,31901,0.0011\nCC-MAIN-2019-35,application/json,587974,587496,0.0199\nCC-MAIN-2019-35,applicat
ion/marc,4846,4846,0.0002\nCC-MAIN-2019-35,application/mbox,47144,47139,0.0016\nCC-MAIN-2019-35,application/msword,83556,83183,0.0028\nCC-MAIN-2019-35,application/octet-stream,454385,453334,0.0154\nCC-MAIN-2019-35,application/pdf,4236832,4206464,0.1434\nCC-MAIN-2019-35,application/pgp-signature,51979,51979,0.0018\nCC-MAIN-2019-35,application/pkcs7-signature,11864,11859,0.0004\nCC-MAIN-2019-35,application/postscript,4124,4111,0.0001\nCC-MAIN-2019-35,application/rdf+xml,331005,330796,0.0112\nCC-MAIN-2019-35,application/rss+xml,4551061,4537828,0.1540\nCC-MAIN-2019-35,application/rtf,66286,66164,0.0022\nCC-MAIN-2019-35,application/text,10972,10955,0.0004\nCC-MAIN-2019-35,application/vnd.android.package-archive,35198,34910,0.0012\nCC-MAIN-2019-35,application/vnd.google-earth.kml+xml,65451,65427,0.0022\nCC-MAIN-2019-35,application/vnd.google-earth.kmz,12846,12841,0.0004\nCC-MAIN-2019-35,application/vnd.ms-excel,31032,30937,0.0011\nCC-MAIN-2019-35,application/vnd.ms-powerpoint,23613,23593,0.0008\nCC-MAIN-2019-35,application/vnd.oasis.opendocument.spreadsheet,5251,5233,0.0002\nCC-MAIN-2019-35,application/vnd.oasis.opendocument.text,20923,20898,0.0007\nCC-MAIN-2019-35,application/vnd.openxmlformats-officedocument.presentationml.presentation,6672,6652,0.0002\nCC-MAIN-2019-35,application/vnd.openxmlformats-officedocument.spreadsheetml.sheet,33178,33083,0.0011\nCC-MAIN-2019-35,application/vnd.openxmlformats-officedocument.wordprocessingml.document,61735,61441,0.0021\nCC-MAIN-2019-35,application/x-bibtex-text-file,102170,102085,0.0035\nCC-MAIN-2019-35,application/x-bittorrent,13371,12843,0.0005\nCC-MAIN-2019-35,application/x-bzip2,6350,6284,0.0002\nCC-MAIN-2019-35,application/x-dosexec,11420,11055,0.0004\nCC-MAIN-2019-35,application/x-endnote-refer,44472,44449,0.0015\nCC-MAIN-2019-35,application/x-hdf,2668,2668,0.0001\nCC-MAIN-2019-35,application/x-mobipocket-ebook,6841,6840,0.0002\nCC-MAIN-2019-35,application/x-ms-asx,7814,7807,0.0003\nCC-MAIN-2019-35,application/x-msdownload,4
934,4914,0.0002\nCC-MAIN-2019-35,application/x-rar-compressed,15522,15288,0.0005\nCC-MAIN-2019-35,application/x-research-info-systems,2248,2247,0.0001\nCC-MAIN-2019-35,application/x-sh,19565,19548,0.0007\nCC-MAIN-2019-35,application/x-shockwave-flash,18001,17915,0.0006\nCC-MAIN-2019-35,application/x-stata-do,15390,15336,0.0005\nCC-MAIN-2019-35,application/x-tex,5777,5770,0.0002\nCC-MAIN-2019-35,application/x-tex-tfm,2772,2772,0.0001\nCC-MAIN-2019-35,application/x-tika-msoffice,78818,78772,0.0027\nCC-MAIN-2019-35,application/x-tika-ooxml,67765,67690,0.0023\nCC-MAIN-2019-35,application/x-wais-source,6663,6663,0.0002\nCC-MAIN-2019-35,application/x-xz,21828,21827,0.0007\nCC-MAIN-2019-35,application/xhtml+xml,654698175,649959981,22.1568\nCC-MAIN-2019-35,application/xml,1723927,1716347,0.0583\nCC-MAIN-2019-35,application/zip,190434,188907,0.0064\nCC-MAIN-2019-35,application/zlib,40885,40685,0.0014\nCC-MAIN-2019-35,application/zstd,11,11,0.0000\nCC-MAIN-2019-35,audio/mp4,37441,36889,0.0013\nCC-MAIN-2019-35,audio/mpeg,146174,144124,0.0049\nCC-MAIN-2019-35,audio/vnd.wave,16325,16323,0.0006\nCC-MAIN-2019-35,audio/x-mpegurl,5350,5344,0.0002\nCC-MAIN-2019-35,image/gif,78054,77382,0.0026\nCC-MAIN-2019-35,image/jpeg,4018956,4009444,0.1360\nCC-MAIN-2019-35,image/png,594846,591895,0.0201\nCC-MAIN-2019-35,image/svg+xml,17311,17292,0.0006\nCC-MAIN-2019-35,image/tiff,29441,29409,0.0010\nCC-MAIN-2019-35,image/vnd.djvu,17536,17532,0.0006\nCC-MAIN-2019-35,image/vnd.dxf; 
format=ascii,10879,10879,0.0004\nCC-MAIN-2019-35,image/webp,18209,18209,0.0006\nCC-MAIN-2019-35,message/rfc822,41279,40995,0.0014\nCC-MAIN-2019-35,text/asp,8,8,0.0000\nCC-MAIN-2019-35,text/calendar,1296710,1295820,0.0439\nCC-MAIN-2019-35,text/css,5976,5975,0.0002\nCC-MAIN-2019-35,text/csv,57482,57443,0.0019\nCC-MAIN-2019-35,text/html,2272837587,2250657304,76.9192\nCC-MAIN-2019-35,text/markdown,222,222,0.0000\nCC-MAIN-2019-35,text/plain,2323895,2322145,0.0786\nCC-MAIN-2019-35,text/prs.lines.tag,39330,39302,0.0013\nCC-MAIN-2019-35,text/tab-separated-values,16603,16603,0.0006\nCC-MAIN-2019-35,text/troff,6675,6675,0.0002\nCC-MAIN-2019-35,text/turtle,12333,12332,0.0004\nCC-MAIN-2019-35,text/vtt,16595,16595,0.0006\nCC-MAIN-2019-35,text/x-c++src,10050,10049,0.0003\nCC-MAIN-2019-35,text/x-chdr,23561,23559,0.0008\nCC-MAIN-2019-35,text/x-csrc,41669,41660,0.0014\nCC-MAIN-2019-35,text/x-diff,49330,49198,0.0017\nCC-MAIN-2019-35,text/x-jsp,4723,4704,0.0002\nCC-MAIN-2019-35,text/x-log,119883,119881,0.0041\nCC-MAIN-2019-35,text/x-matlab,50271,50157,0.0017\nCC-MAIN-2019-35,text/x-perl,88610,88582,0.0030\nCC-MAIN-2019-35,text/x-php,93537,92736,0.0032\nCC-MAIN-2019-35,text/x-python,7001,7000,0.0002\nCC-MAIN-2019-35,text/x-vcalendar,28303,28298,0.0010\nCC-MAIN-2019-35,text/x-vcard,105340,105247,0.0036\nCC-MAIN-2019-35,text/x-web-markdown,6378,6374,0.0002\nCC-MAIN-2019-35,text/x-yaml,3498,3498,0.0001\nCC-MAIN-2019-35,video/mp4,40385,40182,0.0014\nCC-MAIN-2019-35,video/quicktime,11250,11231,0.0004\nCC-MAIN-2019-35,video/webm,1692,1689,0.0001\nCC-MAIN-2019-35,video/x-m4v,15353,15260,0.0005\nCC-MAIN-2019-39,<other>,350212,348767,0.0137\nCC-MAIN-2019-39,application/atom+xml,3910004,3908886,0.1527\nCC-MAIN-2019-39,application/epub+zip,46919,46652,0.0018\nCC-MAIN-2019-39,application/gpx+xml,6036,6030,0.0002\nCC-MAIN-2019-39,application/gzip,59777,59635,0.0023\nCC-MAIN-2019-39,application/javascript,24285,24278,0.0009\nCC-MAIN-2019-39,application/json,629150,628317,0.0246\nCC-MAIN-2019-39,appl
ication/marc,6960,6946,0.0003\nCC-MAIN-2019-39,application/mbox,56209,56202,0.0022\nCC-MAIN-2019-39,application/msword,82479,81910,0.0032\nCC-MAIN-2019-39,application/octet-stream,445264,444805,0.0174\nCC-MAIN-2019-39,application/pdf,25529661,25450652,0.9968\nCC-MAIN-2019-39,application/pgp-signature,46766,46765,0.0018\nCC-MAIN-2019-39,application/pkcs7-signature,10326,10320,0.0004\nCC-MAIN-2019-39,application/postscript,19728,19711,0.0008\nCC-MAIN-2019-39,application/rdf+xml,325828,325471,0.0127\nCC-MAIN-2019-39,application/rss+xml,3860736,3852612,0.1507\nCC-MAIN-2019-39,application/rtf,69905,69847,0.0027\nCC-MAIN-2019-39,application/text,14048,14033,0.0005\nCC-MAIN-2019-39,application/vnd.android.package-archive,35162,34698,0.0014\nCC-MAIN-2019-39,application/vnd.google-earth.kml+xml,58061,57978,0.0023\nCC-MAIN-2019-39,application/vnd.google-earth.kmz,7480,7469,0.0003\nCC-MAIN-2019-39,application/vnd.ms-excel,35646,35569,0.0014\nCC-MAIN-2019-39,application/vnd.ms-powerpoint,19807,19777,0.0008\nCC-MAIN-2019-39,application/vnd.oasis.opendocument.spreadsheet,6071,6067,0.0002\nCC-MAIN-2019-39,application/vnd.oasis.opendocument.text,22369,22342,0.0009\nCC-MAIN-2019-39,application/vnd.openxmlformats-officedocument.presentationml.presentation,8060,8038,0.0003\nCC-MAIN-2019-39,application/vnd.openxmlformats-officedocument.spreadsheetml.sheet,32140,32016,0.0013\nCC-MAIN-2019-39,application/vnd.openxmlformats-officedocument.wordprocessingml.document,65027,64689,0.0025\nCC-MAIN-2019-39,application/x-bibtex-text-file,113379,113309,0.0044\nCC-MAIN-2019-39,application/x-bittorrent,13221,12714,0.0005\nCC-MAIN-2019-39,application/x-bzip2,18145,18072,0.0007\nCC-MAIN-2019-39,application/x-dosexec,16108,15678,0.0006\nCC-MAIN-2019-39,application/x-endnote-refer,48954,48922,0.0019\nCC-MAIN-2019-39,application/x-hdf,3910,3910,0.0002\nCC-MAIN-2019-39,application/x-mobipocket-ebook,7818,7813,0.0003\nCC-MAIN-2019-39,application/x-ms-asx,7593,7585,0.0003\nCC-MAIN-2019-39,application/x-msdo
wnload,4149,4122,0.0002\nCC-MAIN-2019-39,application/x-rar-compressed,18785,18688,0.0007\nCC-MAIN-2019-39,application/x-research-info-systems,2297,2297,0.0001\nCC-MAIN-2019-39,application/x-sh,27939,27912,0.0011\nCC-MAIN-2019-39,application/x-shockwave-flash,19933,19830,0.0008\nCC-MAIN-2019-39,application/x-stata-do,6449,6426,0.0003\nCC-MAIN-2019-39,application/x-tex,7356,7354,0.0003\nCC-MAIN-2019-39,application/x-tex-tfm,8595,8595,0.0003\nCC-MAIN-2019-39,application/x-tika-msoffice,87754,87722,0.0034\nCC-MAIN-2019-39,application/x-tika-ooxml,69857,69707,0.0027\nCC-MAIN-2019-39,application/x-wais-source,4981,4981,0.0002\nCC-MAIN-2019-39,application/x-xz,11911,11910,0.0005\nCC-MAIN-2019-39,application/xhtml+xml,561870001,557695815,21.9389\nCC-MAIN-2019-39,application/xml,1521248,1515369,0.0594\nCC-MAIN-2019-39,application/zip,226024,224804,0.0088\nCC-MAIN-2019-39,application/zlib,29720,29527,0.0012\nCC-MAIN-2019-39,application/zstd,19,19,0.0000\nCC-MAIN-2019-39,audio/mp4,36751,35789,0.0014\nCC-MAIN-2019-39,audio/mpeg,169971,166576,0.0066\nCC-MAIN-2019-39,audio/vnd.wave,20184,20149,0.0008\nCC-MAIN-2019-39,audio/x-mpegurl,3466,3461,0.0001\nCC-MAIN-2019-39,image/gif,79675,79035,0.0031\nCC-MAIN-2019-39,image/jpeg,4285454,4275456,0.1673\nCC-MAIN-2019-39,image/png,628364,625482,0.0245\nCC-MAIN-2019-39,image/svg+xml,15627,15616,0.0006\nCC-MAIN-2019-39,image/tiff,32804,32791,0.0013\nCC-MAIN-2019-39,image/vnd.djvu,12737,12734,0.0005\nCC-MAIN-2019-39,image/vnd.dxf; 
format=ascii,10938,10937,0.0004\nCC-MAIN-2019-39,image/webp,16223,16223,0.0006\nCC-MAIN-2019-39,message/rfc822,37116,36966,0.0014\nCC-MAIN-2019-39,text/asp,1,1,0.0000\nCC-MAIN-2019-39,text/calendar,1130831,1130146,0.0442\nCC-MAIN-2019-39,text/css,5902,5901,0.0002\nCC-MAIN-2019-39,text/csv,58183,58150,0.0023\nCC-MAIN-2019-39,text/html,1951634806,1933597026,76.2041\nCC-MAIN-2019-39,text/markdown,139,139,0.0000\nCC-MAIN-2019-39,text/plain,2181723,2179837,0.0852\nCC-MAIN-2019-39,text/prs.lines.tag,35576,35404,0.0014\nCC-MAIN-2019-39,text/tab-separated-values,14498,14498,0.0006\nCC-MAIN-2019-39,text/troff,10459,10459,0.0004\nCC-MAIN-2019-39,text/turtle,14703,14703,0.0006\nCC-MAIN-2019-39,text/vtt,15578,15565,0.0006\nCC-MAIN-2019-39,text/x-c++src,9475,9474,0.0004\nCC-MAIN-2019-39,text/x-chdr,28011,28010,0.0011\nCC-MAIN-2019-39,text/x-csrc,47137,47132,0.0018\nCC-MAIN-2019-39,text/x-diff,50862,50770,0.0020\nCC-MAIN-2019-39,text/x-jsp,2836,2834,0.0001\nCC-MAIN-2019-39,text/x-log,98169,98165,0.0038\nCC-MAIN-2019-39,text/x-matlab,55744,55724,0.0022\nCC-MAIN-2019-39,text/x-perl,82999,82983,0.0032\nCC-MAIN-2019-39,text/x-php,86469,85752,0.0034\nCC-MAIN-2019-39,text/x-python,8804,8803,0.0003\nCC-MAIN-2019-39,text/x-vcalendar,25683,25683,0.0010\nCC-MAIN-2019-39,text/x-vcard,103245,103164,0.0040\nCC-MAIN-2019-39,text/x-web-markdown,5400,5396,0.0002\nCC-MAIN-2019-39,text/x-yaml,5887,5887,0.0002\nCC-MAIN-2019-39,video/mp4,43618,43385,0.0017\nCC-MAIN-2019-39,video/quicktime,11119,11105,0.0004\nCC-MAIN-2019-39,video/webm,1956,1947,0.0001\nCC-MAIN-2019-39,video/x-m4v,13527,13382,0.0005\nCC-MAIN-2019-43,<other>,382065,381239,0.0127\nCC-MAIN-2019-43,application/atom+xml,3367971,3366938,0.1116\nCC-MAIN-2019-43,application/epub+zip,38510,38387,0.0013\nCC-MAIN-2019-43,application/gpx+xml,5568,5568,0.0002\nCC-MAIN-2019-43,application/gzip,67086,66923,0.0022\nCC-MAIN-2019-43,application/javascript,34392,34384,0.0011\nCC-MAIN-2019-43,application/json,718691,717731,0.0238\nCC-MAIN-2019-43,applic
ation/marc,8372,8372,0.0003\nCC-MAIN-2019-43,application/mbox,63750,63747,0.0021\nCC-MAIN-2019-43,application/msword,61936,61579,0.0021\nCC-MAIN-2019-43,application/octet-stream,479514,479221,0.0159\nCC-MAIN-2019-43,application/pdf,11780097,11733082,0.3902\nCC-MAIN-2019-43,application/pgp-signature,32233,32233,0.0011\nCC-MAIN-2019-43,application/pkcs7-signature,4516,4516,0.0001\nCC-MAIN-2019-43,application/postscript,16515,16507,0.0005\nCC-MAIN-2019-43,application/rdf+xml,324608,324358,0.0108\nCC-MAIN-2019-43,application/rss+xml,4138660,4129740,0.1371\nCC-MAIN-2019-43,application/rtf,88184,88135,0.0029\nCC-MAIN-2019-43,application/text,20054,20041,0.0007\nCC-MAIN-2019-43,application/vnd.android.package-archive,37524,36963,0.0012\nCC-MAIN-2019-43,application/vnd.google-earth.kml+xml,57628,57604,0.0019\nCC-MAIN-2019-43,application/vnd.google-earth.kmz,9124,9118,0.0003\nCC-MAIN-2019-43,application/vnd.ms-excel,30200,30113,0.0010\nCC-MAIN-2019-43,application/vnd.ms-powerpoint,33718,33597,0.0011\nCC-MAIN-2019-43,application/vnd.oasis.opendocument.spreadsheet,6305,6304,0.0002\nCC-MAIN-2019-43,application/vnd.oasis.opendocument.text,18171,18161,0.0006\nCC-MAIN-2019-43,application/vnd.openxmlformats-officedocument.presentationml.presentation,7009,6984,0.0002\nCC-MAIN-2019-43,application/vnd.openxmlformats-officedocument.spreadsheetml.sheet,30862,30758,0.0010\nCC-MAIN-2019-43,application/vnd.openxmlformats-officedocument.wordprocessingml.document,68569,68283,0.0023\nCC-MAIN-2019-43,application/x-bibtex-text-file,152363,152281,0.0050\nCC-MAIN-2019-43,application/x-bittorrent,16401,15701,0.0005\nCC-MAIN-2019-43,application/x-bzip2,11827,11790,0.0004\nCC-MAIN-2019-43,application/x-dosexec,12121,11593,0.0004\nCC-MAIN-2019-43,application/x-endnote-refer,63929,63811,0.0021\nCC-MAIN-2019-43,application/x-hdf,3162,3162,0.0001\nCC-MAIN-2019-43,application/x-mobipocket-ebook,6939,6937,0.0002\nCC-MAIN-2019-43,application/x-ms-asx,7598,7592,0.0003\nCC-MAIN-2019-43,application/x-msdownlo
ad,3601,3572,0.0001\nCC-MAIN-2019-43,application/x-rar-compressed,13304,13207,0.0004\nCC-MAIN-2019-43,application/x-research-info-systems,4634,4632,0.0002\nCC-MAIN-2019-43,application/x-sh,24088,24081,0.0008\nCC-MAIN-2019-43,application/x-shockwave-flash,19538,19469,0.0006\nCC-MAIN-2019-43,application/x-stata-do,8153,8130,0.0003\nCC-MAIN-2019-43,application/x-tex,6484,6482,0.0002\nCC-MAIN-2019-43,application/x-tex-tfm,5369,5369,0.0002\nCC-MAIN-2019-43,application/x-tika-msoffice,80245,80184,0.0027\nCC-MAIN-2019-43,application/x-tika-ooxml,58026,57962,0.0019\nCC-MAIN-2019-43,application/x-wais-source,4062,4062,0.0001\nCC-MAIN-2019-43,application/x-xz,13749,13747,0.0005\nCC-MAIN-2019-43,application/xhtml+xml,676241086,671478623,22.3992\nCC-MAIN-2019-43,application/xml,1857670,1851428,0.0615\nCC-MAIN-2019-43,application/zip,193880,192539,0.0064\nCC-MAIN-2019-43,application/zlib,25505,25436,0.0008\nCC-MAIN-2019-43,application/zstd,159,159,0.0000\nCC-MAIN-2019-43,audio/mp4,34393,33805,0.0011\nCC-MAIN-2019-43,audio/mpeg,137446,133795,0.0046\nCC-MAIN-2019-43,audio/vnd.wave,26005,26003,0.0009\nCC-MAIN-2019-43,audio/x-mpegurl,6309,6304,0.0002\nCC-MAIN-2019-43,image/gif,81173,80489,0.0027\nCC-MAIN-2019-43,image/jpeg,3758762,3751193,0.1245\nCC-MAIN-2019-43,image/png,560060,557713,0.0186\nCC-MAIN-2019-43,image/svg+xml,13042,13010,0.0004\nCC-MAIN-2019-43,image/tiff,30978,30977,0.0010\nCC-MAIN-2019-43,image/vnd.djvu,12879,12877,0.0004\nCC-MAIN-2019-43,image/vnd.dxf; 
format=ascii,9128,9122,0.0003\nCC-MAIN-2019-43,image/webp,28436,28418,0.0009\nCC-MAIN-2019-43,message/rfc822,35931,35780,0.0012\nCC-MAIN-2019-43,text/calendar,1066195,1065592,0.0353\nCC-MAIN-2019-43,text/css,7569,7564,0.0003\nCC-MAIN-2019-43,text/csv,84712,84699,0.0028\nCC-MAIN-2019-43,text/html,2308918649,2288335354,76.4787\nCC-MAIN-2019-43,text/markdown,178,178,0.0000\nCC-MAIN-2019-43,text/plain,2529349,2526894,0.0838\nCC-MAIN-2019-43,text/prs.lines.tag,44699,44654,0.0015\nCC-MAIN-2019-43,text/tab-separated-values,17356,17355,0.0006\nCC-MAIN-2019-43,text/troff,15403,15402,0.0005\nCC-MAIN-2019-43,text/turtle,24512,24512,0.0008\nCC-MAIN-2019-43,text/vtt,14213,14213,0.0005\nCC-MAIN-2019-43,text/x-c++src,12639,12638,0.0004\nCC-MAIN-2019-43,text/x-chdr,44445,44445,0.0015\nCC-MAIN-2019-43,text/x-csrc,75126,75124,0.0025\nCC-MAIN-2019-43,text/x-diff,80759,80682,0.0027\nCC-MAIN-2019-43,text/x-jsp,3870,3863,0.0001\nCC-MAIN-2019-43,text/x-log,102289,102278,0.0034\nCC-MAIN-2019-43,text/x-matlab,77426,77388,0.0026\nCC-MAIN-2019-43,text/x-perl,115826,115802,0.0038\nCC-MAIN-2019-43,text/x-php,95351,94454,0.0032\nCC-MAIN-2019-43,text/x-python,8100,8100,0.0003\nCC-MAIN-2019-43,text/x-vcalendar,23523,23520,0.0008\nCC-MAIN-2019-43,text/x-vcard,101214,101101,0.0034\nCC-MAIN-2019-43,text/x-web-markdown,7585,7585,0.0003\nCC-MAIN-2019-43,text/x-yaml,7788,7788,0.0003\nCC-MAIN-2019-43,video/mp4,35183,34982,0.0012\nCC-MAIN-2019-43,video/quicktime,8334,8315,0.0003\nCC-MAIN-2019-43,video/webm,1833,1824,0.0001\nCC-MAIN-2019-43,video/x-m4v,12136,12071,0.0004\nCC-MAIN-2019-47,<other>,334421,333430,0.0129\nCC-MAIN-2019-47,application/atom+xml,3261205,3260129,0.1259\nCC-MAIN-2019-47,application/epub+zip,57861,57785,0.0022\nCC-MAIN-2019-47,application/gpx+xml,6047,6047,0.0002\nCC-MAIN-2019-47,application/gzip,70255,70108,0.0027\nCC-MAIN-2019-47,application/javascript,27596,27579,0.0011\nCC-MAIN-2019-47,application/json,633507,633021,0.0245\nCC-MAIN-2019-47,application/marc,5539,5538,0.0002\nCC-MAI
N-2019-47,application/mbox,63038,63032,0.0024\nCC-MAIN-2019-47,application/msword,69081,68702,0.0027\nCC-MAIN-2019-47,application/octet-stream,329265,328777,0.0127\nCC-MAIN-2019-47,application/pdf,12206558,12163646,0.4712\nCC-MAIN-2019-47,application/pgp-signature,39357,39354,0.0015\nCC-MAIN-2019-47,application/pkcs7-signature,6026,6025,0.0002\nCC-MAIN-2019-47,application/postscript,12369,12366,0.0005\nCC-MAIN-2019-47,application/rdf+xml,239943,239797,0.0093\nCC-MAIN-2019-47,application/rss+xml,3424865,3416398,0.1322\nCC-MAIN-2019-47,application/rtf,69344,69307,0.0027\nCC-MAIN-2019-47,application/text,13365,13362,0.0005\nCC-MAIN-2019-47,application/vnd.android.package-archive,39023,38523,0.0015\nCC-MAIN-2019-47,application/vnd.google-earth.kml+xml,55546,55474,0.0021\nCC-MAIN-2019-47,application/vnd.google-earth.kmz,9421,9417,0.0004\nCC-MAIN-2019-47,application/vnd.ms-excel,30147,30096,0.0012\nCC-MAIN-2019-47,application/vnd.ms-powerpoint,40684,40674,0.0016\nCC-MAIN-2019-47,application/vnd.oasis.opendocument.spreadsheet,4716,4706,0.0002\nCC-MAIN-2019-47,application/vnd.oasis.opendocument.text,18911,18885,0.0007\nCC-MAIN-2019-47,application/vnd.openxmlformats-officedocument.presentationml.presentation,6438,6426,0.0002\nCC-MAIN-2019-47,application/vnd.openxmlformats-officedocument.spreadsheetml.sheet,30487,30416,0.0012\nCC-MAIN-2019-47,application/vnd.openxmlformats-officedocument.wordprocessingml.document,61154,60886,0.0024\nCC-MAIN-2019-47,application/x-bibtex-text-file,128140,127982,0.0049\nCC-MAIN-2019-47,application/x-bittorrent,7955,7513,0.0003\nCC-MAIN-2019-47,application/x-bzip2,19119,19049,0.0007\nCC-MAIN-2019-47,application/x-dosexec,12853,12489,0.0005\nCC-MAIN-2019-47,application/x-endnote-refer,49684,49668,0.0019\nCC-MAIN-2019-47,application/x-hdf,5990,5990,0.0002\nCC-MAIN-2019-47,application/x-mobipocket-ebook,11359,11346,0.0004\nCC-MAIN-2019-47,application/x-ms-asx,3199,3197,0.0001\nCC-MAIN-2019-47,application/x-msdownload,2955,2920,0.0001\nCC-MAIN-2019-4
7,application/x-rar-compressed,13932,13814,0.0005\nCC-MAIN-2019-47,application/x-research-info-systems,5528,5495,0.0002\nCC-MAIN-2019-47,application/x-sh,34207,34196,0.0013\nCC-MAIN-2019-47,application/x-shockwave-flash,14016,13949,0.0005\nCC-MAIN-2019-47,application/x-stata-do,6006,5959,0.0002\nCC-MAIN-2019-47,application/x-tex,6157,6156,0.0002\nCC-MAIN-2019-47,application/x-tex-tfm,7143,7143,0.0003\nCC-MAIN-2019-47,application/x-tika-msoffice,74780,74760,0.0029\nCC-MAIN-2019-47,application/x-tika-ooxml,49611,49562,0.0019\nCC-MAIN-2019-47,application/x-wais-source,5305,5305,0.0002\nCC-MAIN-2019-47,application/x-xz,4698,4695,0.0002\nCC-MAIN-2019-47,application/xhtml+xml,555659037,551688296,21.4491\nCC-MAIN-2019-47,application/xml,1713357,1707959,0.0661\nCC-MAIN-2019-47,application/zip,222256,220459,0.0086\nCC-MAIN-2019-47,application/zlib,11303,11211,0.0004\nCC-MAIN-2019-47,application/zstd,329,329,0.0000\nCC-MAIN-2019-47,audio/mp4,37268,36647,0.0014\nCC-MAIN-2019-47,audio/mpeg,147410,142984,0.0057\nCC-MAIN-2019-47,audio/vnd.wave,24501,24345,0.0009\nCC-MAIN-2019-47,audio/x-mpegurl,2654,2649,0.0001\nCC-MAIN-2019-47,image/gif,72788,72143,0.0028\nCC-MAIN-2019-47,image/jpeg,3932068,3923053,0.1518\nCC-MAIN-2019-47,image/png,584080,581194,0.0225\nCC-MAIN-2019-47,image/svg+xml,17713,17696,0.0007\nCC-MAIN-2019-47,image/tiff,54456,54452,0.0021\nCC-MAIN-2019-47,image/vnd.djvu,12508,12504,0.0005\nCC-MAIN-2019-47,image/vnd.dxf; 
format=ascii,8087,8085,0.0003\nCC-MAIN-2019-47,image/webp,23843,23834,0.0009\nCC-MAIN-2019-47,message/rfc822,32313,32168,0.0012\nCC-MAIN-2019-47,text/calendar,959303,958771,0.0370\nCC-MAIN-2019-47,text/css,10935,10933,0.0004\nCC-MAIN-2019-47,text/csv,68436,68422,0.0026\nCC-MAIN-2019-47,text/html,2002557402,1983625070,77.3011\nCC-MAIN-2019-47,text/markdown,180,180,0.0000\nCC-MAIN-2019-47,text/plain,2068745,2067326,0.0799\nCC-MAIN-2019-47,text/prs.lines.tag,41295,41263,0.0016\nCC-MAIN-2019-47,text/tab-separated-values,15719,15715,0.0006\nCC-MAIN-2019-47,text/troff,9453,9452,0.0004\nCC-MAIN-2019-47,text/turtle,17557,17556,0.0007\nCC-MAIN-2019-47,text/vtt,14145,14145,0.0005\nCC-MAIN-2019-47,text/x-c++src,10176,10175,0.0004\nCC-MAIN-2019-47,text/x-chdr,29672,29672,0.0011\nCC-MAIN-2019-47,text/x-csrc,46003,45999,0.0018\nCC-MAIN-2019-47,text/x-diff,55258,55222,0.0021\nCC-MAIN-2019-47,text/x-jsp,3927,3908,0.0002\nCC-MAIN-2019-47,text/x-log,74299,74295,0.0029\nCC-MAIN-2019-47,text/x-matlab,53244,53204,0.0021\nCC-MAIN-2019-47,text/x-perl,80012,80005,0.0031\nCC-MAIN-2019-47,text/x-php,89228,87113,0.0034\nCC-MAIN-2019-47,text/x-python,6753,6751,0.0003\nCC-MAIN-2019-47,text/x-vcalendar,19384,19377,0.0007\nCC-MAIN-2019-47,text/x-vcard,95335,95196,0.0037\nCC-MAIN-2019-47,text/x-web-markdown,7563,7563,0.0003\nCC-MAIN-2019-47,text/x-yaml,5307,5305,0.0002\nCC-MAIN-2019-47,video/mp4,42645,42464,0.0016\nCC-MAIN-2019-47,video/quicktime,11641,11621,0.0004\nCC-MAIN-2019-47,video/webm,1830,1824,0.0001\nCC-MAIN-2019-47,video/x-m4v,14949,14841,0.0006\nCC-MAIN-2019-51,<other>,326872,326110,0.0132\nCC-MAIN-2019-51,application/atom+xml,3292421,3291780,0.1332\nCC-MAIN-2019-51,application/epub+zip,43111,43000,0.0017\nCC-MAIN-2019-51,application/gpx+xml,6394,6392,0.0003\nCC-MAIN-2019-51,application/gzip,61940,61707,0.0025\nCC-MAIN-2019-51,application/javascript,34270,34256,0.0014\nCC-MAIN-2019-51,application/json,602595,602405,0.0244\nCC-MAIN-2019-51,application/marc,7539,7539,0.0003\nCC-MAIN-2019
-51,application/mbox,58293,58277,0.0024\nCC-MAIN-2019-51,application/msword,58085,57824,0.0023\nCC-MAIN-2019-51,application/octet-stream,330491,330189,0.0134\nCC-MAIN-2019-51,application/pdf,3275012,3253269,0.1325\nCC-MAIN-2019-51,application/pgp-signature,22254,22254,0.0009\nCC-MAIN-2019-51,application/pkcs7-signature,9234,9231,0.0004\nCC-MAIN-2019-51,application/postscript,4401,4401,0.0002\nCC-MAIN-2019-51,application/rdf+xml,245634,245428,0.0099\nCC-MAIN-2019-51,application/rss+xml,3502802,3494780,0.1417\nCC-MAIN-2019-51,application/rtf,64460,64419,0.0026\nCC-MAIN-2019-51,application/text,12391,12384,0.0005\nCC-MAIN-2019-51,application/vnd.android.package-archive,36089,35657,0.0015\nCC-MAIN-2019-51,application/vnd.google-earth.kml+xml,54745,54631,0.0022\nCC-MAIN-2019-51,application/vnd.google-earth.kmz,7451,7446,0.0003\nCC-MAIN-2019-51,application/vnd.ms-excel,28764,28701,0.0012\nCC-MAIN-2019-51,application/vnd.ms-powerpoint,21654,21644,0.0009\nCC-MAIN-2019-51,application/vnd.oasis.opendocument.spreadsheet,4952,4948,0.0002\nCC-MAIN-2019-51,application/vnd.oasis.opendocument.text,18617,18605,0.0008\nCC-MAIN-2019-51,application/vnd.openxmlformats-officedocument.presentationml.presentation,6540,6512,0.0003\nCC-MAIN-2019-51,application/vnd.openxmlformats-officedocument.spreadsheetml.sheet,30797,30702,0.0012\nCC-MAIN-2019-51,application/vnd.openxmlformats-officedocument.wordprocessingml.document,57486,57254,0.0023\nCC-MAIN-2019-51,application/x-bibtex-text-file,127477,127350,0.0052\nCC-MAIN-2019-51,application/x-bittorrent,9220,8853,0.0004\nCC-MAIN-2019-51,application/x-bzip2,21470,21413,0.0009\nCC-MAIN-2019-51,application/x-dosexec,11836,11522,0.0005\nCC-MAIN-2019-51,application/x-endnote-refer,48132,48127,0.0019\nCC-MAIN-2019-51,application/x-hdf,10639,10639,0.0004\nCC-MAIN-2019-51,application/x-mobipocket-ebook,7861,7802,0.0003\nCC-MAIN-2019-51,application/x-ms-asx,4380,4376,0.0002\nCC-MAIN-2019-51,application/x-msdownload,3118,3065,0.0001\nCC-MAIN-2019-51,applicat
ion/x-rar-compressed,14870,14685,0.0006\nCC-MAIN-2019-51,application/x-research-info-systems,6194,6163,0.0003\nCC-MAIN-2019-51,application/x-sh,20451,20438,0.0008\nCC-MAIN-2019-51,application/x-shockwave-flash,15495,15431,0.0006\nCC-MAIN-2019-51,application/x-stata-do,7019,6980,0.0003\nCC-MAIN-2019-51,application/x-tex,5417,5417,0.0002\nCC-MAIN-2019-51,application/x-tex-tfm,4235,4235,0.0002\nCC-MAIN-2019-51,application/x-tika-msoffice,76350,76319,0.0031\nCC-MAIN-2019-51,application/x-tika-ooxml,48830,48765,0.0020\nCC-MAIN-2019-51,application/x-wais-source,5608,5608,0.0002\nCC-MAIN-2019-51,application/x-xz,6858,6858,0.0003\nCC-MAIN-2019-51,application/xhtml+xml,535820053,532157219,21.6764\nCC-MAIN-2019-51,application/xml,1895334,1889813,0.0767\nCC-MAIN-2019-51,application/zip,200675,199152,0.0081\nCC-MAIN-2019-51,application/zlib,11799,11745,0.0005\nCC-MAIN-2019-51,application/zstd,61,61,0.0000\nCC-MAIN-2019-51,audio/mp4,33152,32718,0.0013\nCC-MAIN-2019-51,audio/mpeg,150458,146015,0.0061\nCC-MAIN-2019-51,audio/vnd.wave,22607,22125,0.0009\nCC-MAIN-2019-51,audio/x-mpegurl,2997,2991,0.0001\nCC-MAIN-2019-51,image/gif,68298,67677,0.0028\nCC-MAIN-2019-51,image/jpeg,3405050,3396222,0.1378\nCC-MAIN-2019-51,image/png,495169,492477,0.0200\nCC-MAIN-2019-51,image/svg+xml,13275,13264,0.0005\nCC-MAIN-2019-51,image/tiff,26676,26670,0.0011\nCC-MAIN-2019-51,image/vnd.djvu,11636,11628,0.0005\nCC-MAIN-2019-51,image/vnd.dxf; 
format=ascii,12007,12007,0.0005\nCC-MAIN-2019-51,image/webp,21989,21988,0.0009\nCC-MAIN-2019-51,message/rfc822,34911,34754,0.0014\nCC-MAIN-2019-51,text/calendar,1083785,1083102,0.0438\nCC-MAIN-2019-51,text/css,8303,8300,0.0003\nCC-MAIN-2019-51,text/csv,66297,66288,0.0027\nCC-MAIN-2019-51,text/html,1913115275,1896342937,77.3944\nCC-MAIN-2019-51,text/markdown,230,230,0.0000\nCC-MAIN-2019-51,text/plain,1988645,1987364,0.0804\nCC-MAIN-2019-51,text/prs.lines.tag,30904,30898,0.0013\nCC-MAIN-2019-51,text/tab-separated-values,16762,16759,0.0007\nCC-MAIN-2019-51,text/troff,14963,14962,0.0006\nCC-MAIN-2019-51,text/turtle,21382,21380,0.0009\nCC-MAIN-2019-51,text/vtt,10981,10981,0.0004\nCC-MAIN-2019-51,text/x-c++src,8517,8517,0.0003\nCC-MAIN-2019-51,text/x-chdr,31531,31531,0.0013\nCC-MAIN-2019-51,text/x-csrc,47633,47631,0.0019\nCC-MAIN-2019-51,text/x-diff,54426,54391,0.0022\nCC-MAIN-2019-51,text/x-jsp,3907,3903,0.0002\nCC-MAIN-2019-51,text/x-log,65773,65773,0.0027\nCC-MAIN-2019-51,text/x-matlab,53200,53173,0.0022\nCC-MAIN-2019-51,text/x-perl,86489,86471,0.0035\nCC-MAIN-2019-51,text/x-php,80378,80006,0.0033\nCC-MAIN-2019-51,text/x-python,7423,7422,0.0003\nCC-MAIN-2019-51,text/x-vcalendar,21762,21760,0.0009\nCC-MAIN-2019-51,text/x-vcard,102502,102385,0.0041\nCC-MAIN-2019-51,text/x-web-markdown,7583,7579,0.0003\nCC-MAIN-2019-51,text/x-yaml,7306,7306,0.0003\nCC-MAIN-2019-51,video/mp4,38976,38662,0.0016\nCC-MAIN-2019-51,video/quicktime,9680,9673,0.0004\nCC-MAIN-2019-51,video/webm,1332,1328,0.0001\nCC-MAIN-2019-51,video/x-m4v,12119,12040,0.0005\nCC-MAIN-2020-05,<other>,351562,350967,0.0113\nCC-MAIN-2020-05,application/atom+xml,3970607,3969580,0.1280\nCC-MAIN-2020-05,application/epub+zip,40617,40586,0.0013\nCC-MAIN-2020-05,application/gpx+xml,6418,6414,0.0002\nCC-MAIN-2020-05,application/gzip,45949,45733,0.0015\nCC-MAIN-2020-05,application/javascript,37375,37269,0.0012\nCC-MAIN-2020-05,application/json,610185,609831,0.0197\nCC-MAIN-2020-05,application/marc,7629,7627,0.0002\nCC-MAIN-20
20-05,application/mbox,69167,69156,0.0022\nCC-MAIN-2020-05,application/msword,47130,46892,0.0015\nCC-MAIN-2020-05,application/octet-stream,326861,326377,0.0105\nCC-MAIN-2020-05,application/pdf,2716184,2697447,0.0876\nCC-MAIN-2020-05,application/pgp-signature,30666,30666,0.0010\nCC-MAIN-2020-05,application/pkcs7-signature,8025,8023,0.0003\nCC-MAIN-2020-05,application/postscript,3063,3060,0.0001\nCC-MAIN-2020-05,application/rdf+xml,299008,298781,0.0096\nCC-MAIN-2020-05,application/rss+xml,4053670,4043848,0.1307\nCC-MAIN-2020-05,application/rtf,67652,67613,0.0022\nCC-MAIN-2020-05,application/text,15165,15161,0.0005\nCC-MAIN-2020-05,application/vnd.android.package-archive,31861,31429,0.0010\nCC-MAIN-2020-05,application/vnd.google-earth.kml+xml,63483,63444,0.0020\nCC-MAIN-2020-05,application/vnd.google-earth.kmz,11525,11523,0.0004\nCC-MAIN-2020-05,application/vnd.ms-excel,25646,25578,0.0008\nCC-MAIN-2020-05,application/vnd.ms-powerpoint,21910,21907,0.0007\nCC-MAIN-2020-05,application/vnd.oasis.opendocument.spreadsheet,4929,4919,0.0002\nCC-MAIN-2020-05,application/vnd.oasis.opendocument.text,19910,19891,0.0006\nCC-MAIN-2020-05,application/vnd.openxmlformats-officedocument.presentationml.presentation,6817,6808,0.0002\nCC-MAIN-2020-05,application/vnd.openxmlformats-officedocument.spreadsheetml.sheet,30615,30541,0.0010\nCC-MAIN-2020-05,application/vnd.openxmlformats-officedocument.wordprocessingml.document,56769,56509,0.0018\nCC-MAIN-2020-05,application/x-bibtex-text-file,157356,157272,0.0051\nCC-MAIN-2020-05,application/x-bittorrent,9664,9458,0.0003\nCC-MAIN-2020-05,application/x-bzip2,8449,8421,0.0003\nCC-MAIN-2020-05,application/x-dosexec,11136,10850,0.0004\nCC-MAIN-2020-05,application/x-endnote-refer,52832,52822,0.0017\nCC-MAIN-2020-05,application/x-hdf,12675,12675,0.0004\nCC-MAIN-2020-05,application/x-mobipocket-ebook,8413,8409,0.0003\nCC-MAIN-2020-05,application/x-ms-asx,10210,10199,0.0003\nCC-MAIN-2020-05,application/x-msdownload,4543,4506,0.0001\nCC-MAIN-2020-05,appl
ication/x-rar-compressed,13175,12839,0.0004\nCC-MAIN-2020-05,application/x-research-info-systems,6562,6501,0.0002\nCC-MAIN-2020-05,application/x-sh,27644,27631,0.0009\nCC-MAIN-2020-05,application/x-shockwave-flash,15300,15244,0.0005\nCC-MAIN-2020-05,application/x-stata-do,11038,11007,0.0004\nCC-MAIN-2020-05,application/x-tex,4593,4593,0.0001\nCC-MAIN-2020-05,application/x-tex-tfm,6061,6061,0.0002\nCC-MAIN-2020-05,application/x-tika-msoffice,78579,78504,0.0025\nCC-MAIN-2020-05,application/x-tika-ooxml,52856,52828,0.0017\nCC-MAIN-2020-05,application/x-wais-source,4790,4790,0.0002\nCC-MAIN-2020-05,application/x-xz,6236,6232,0.0002\nCC-MAIN-2020-05,application/xhtml+xml,652804795,648152178,21.0508\nCC-MAIN-2020-05,application/xml,2461600,2454536,0.0794\nCC-MAIN-2020-05,application/zip,200387,198872,0.0065\nCC-MAIN-2020-05,application/zlib,10762,10708,0.0003\nCC-MAIN-2020-05,application/zstd,1178,1178,0.0000\nCC-MAIN-2020-05,audio/mp4,28265,27345,0.0009\nCC-MAIN-2020-05,audio/mpeg,134375,131402,0.0043\nCC-MAIN-2020-05,audio/vnd.wave,23300,23270,0.0008\nCC-MAIN-2020-05,audio/x-mpegurl,3939,3939,0.0001\nCC-MAIN-2020-05,image/gif,74390,73766,0.0024\nCC-MAIN-2020-05,image/jpeg,3221238,3213979,0.1039\nCC-MAIN-2020-05,image/png,472382,469752,0.0152\nCC-MAIN-2020-05,image/svg+xml,11735,11728,0.0004\nCC-MAIN-2020-05,image/tiff,16313,16307,0.0005\nCC-MAIN-2020-05,image/vnd.djvu,14901,14900,0.0005\nCC-MAIN-2020-05,image/vnd.dxf; 
format=ascii,8867,8867,0.0003\nCC-MAIN-2020-05,image/webp,19578,19567,0.0006\nCC-MAIN-2020-05,message/rfc822,40017,39866,0.0013\nCC-MAIN-2020-05,text/calendar,1106624,1105904,0.0357\nCC-MAIN-2020-05,text/css,8034,8033,0.0003\nCC-MAIN-2020-05,text/csv,74894,74869,0.0024\nCC-MAIN-2020-05,text/html,2423156742,2400118131,78.1387\nCC-MAIN-2020-05,text/markdown,365,365,0.0000\nCC-MAIN-2020-05,text/plain,2885243,2884079,0.0930\nCC-MAIN-2020-05,text/prs.lines.tag,47658,47653,0.0015\nCC-MAIN-2020-05,text/tab-separated-values,15183,15183,0.0005\nCC-MAIN-2020-05,text/troff,7868,7867,0.0003\nCC-MAIN-2020-05,text/turtle,24559,24558,0.0008\nCC-MAIN-2020-05,text/vtt,12112,12112,0.0004\nCC-MAIN-2020-05,text/x-c++src,8108,8107,0.0003\nCC-MAIN-2020-05,text/x-chdr,30962,30960,0.0010\nCC-MAIN-2020-05,text/x-csrc,53179,53177,0.0017\nCC-MAIN-2020-05,text/x-diff,60026,59974,0.0019\nCC-MAIN-2020-05,text/x-jsp,4896,4894,0.0002\nCC-MAIN-2020-05,text/x-log,73564,73564,0.0024\nCC-MAIN-2020-05,text/x-matlab,54906,54893,0.0018\nCC-MAIN-2020-05,text/x-perl,120764,120745,0.0039\nCC-MAIN-2020-05,text/x-php,107529,106898,0.0035\nCC-MAIN-2020-05,text/x-python,9574,9571,0.0003\nCC-MAIN-2020-05,text/x-vcalendar,19715,19714,0.0006\nCC-MAIN-2020-05,text/x-vcard,118799,118516,0.0038\nCC-MAIN-2020-05,text/x-web-markdown,8963,8963,0.0003\nCC-MAIN-2020-05,text/x-yaml,7251,7251,0.0002\nCC-MAIN-2020-05,video/mp4,37703,37520,0.0012\nCC-MAIN-2020-05,video/quicktime,7437,7408,0.0002\nCC-MAIN-2020-05,video/webm,1981,1975,0.0001\nCC-MAIN-2020-05,video/x-m4v,2002,1995,0.0001\nCC-MAIN-2020-10,<other>,401696,401091,0.0153\nCC-MAIN-2020-10,application/atom+xml,3736945,3736112,0.1421\nCC-MAIN-2020-10,application/epub+zip,57015,56797,0.0022\nCC-MAIN-2020-10,application/gpx+xml,9610,9606,0.0004\nCC-MAIN-2020-10,application/gzip,51903,51745,0.0020\nCC-MAIN-2020-10,application/javascript,38111,38020,0.0014\nCC-MAIN-2020-10,application/json,615896,615551,0.0234\nCC-MAIN-2020-10,application/marc,8579,8579,0.0003\nCC-MAIN-2020
-10,application/mbox,76255,76249,0.0029\nCC-MAIN-2020-10,application/msword,70510,70109,0.0027\nCC-MAIN-2020-10,application/octet-stream,446877,446512,0.0170\nCC-MAIN-2020-10,application/pdf,3790477,3758916,0.1441\nCC-MAIN-2020-10,application/pgp-signature,45319,45318,0.0017\nCC-MAIN-2020-10,application/pkcs7-signature,6635,6631,0.0003\nCC-MAIN-2020-10,application/postscript,4311,4299,0.0002\nCC-MAIN-2020-10,application/rdf+xml,305037,304874,0.0116\nCC-MAIN-2020-10,application/rss+xml,4065161,4056226,0.1546\nCC-MAIN-2020-10,application/rtf,74665,74556,0.0028\nCC-MAIN-2020-10,application/text,15944,15925,0.0006\nCC-MAIN-2020-10,application/vnd.android.package-archive,50329,49866,0.0019\nCC-MAIN-2020-10,application/vnd.google-earth.kml+xml,66758,66736,0.0025\nCC-MAIN-2020-10,application/vnd.google-earth.kmz,13772,13771,0.0005\nCC-MAIN-2020-10,application/vnd.ms-excel,37849,37767,0.0014\nCC-MAIN-2020-10,application/vnd.ms-powerpoint,23090,23064,0.0009\nCC-MAIN-2020-10,application/vnd.oasis.opendocument.spreadsheet,8508,8495,0.0003\nCC-MAIN-2020-10,application/vnd.oasis.opendocument.text,28008,27987,0.0011\nCC-MAIN-2020-10,application/vnd.openxmlformats-officedocument.presentationml.presentation,9635,9598,0.0004\nCC-MAIN-2020-10,application/vnd.openxmlformats-officedocument.spreadsheetml.sheet,36496,36315,0.0014\nCC-MAIN-2020-10,application/vnd.openxmlformats-officedocument.wordprocessingml.document,80239,79971,0.0031\nCC-MAIN-2020-10,application/x-bibtex-text-file,178011,177850,0.0068\nCC-MAIN-2020-10,application/x-bittorrent,14976,14723,0.0006\nCC-MAIN-2020-10,application/x-bzip2,17436,17407,0.0007\nCC-MAIN-2020-10,application/x-dosexec,12847,12474,0.0005\nCC-MAIN-2020-10,application/x-endnote-refer,61394,61385,0.0023\nCC-MAIN-2020-10,application/x-hdf,22545,22545,0.0009\nCC-MAIN-2020-10,application/x-mobipocket-ebook,9885,9853,0.0004\nCC-MAIN-2020-10,application/x-ms-asx,10774,10763,0.0004\nCC-MAIN-2020-10,application/x-msdownload,5274,5237,0.0002\nCC-MAIN-2020-10,ap
plication/x-rar-compressed,17585,17287,0.0007\nCC-MAIN-2020-10,application/x-research-info-systems,5509,5490,0.0002\nCC-MAIN-2020-10,application/x-sh,30822,30804,0.0012\nCC-MAIN-2020-10,application/x-shockwave-flash,16329,16267,0.0006\nCC-MAIN-2020-10,application/x-stata-do,7558,7538,0.0003\nCC-MAIN-2020-10,application/x-tex,5657,5657,0.0002\nCC-MAIN-2020-10,application/x-tex-tfm,7097,7097,0.0003\nCC-MAIN-2020-10,application/x-tika-msoffice,110663,110598,0.0042\nCC-MAIN-2020-10,application/x-tika-ooxml,71929,71874,0.0027\nCC-MAIN-2020-10,application/x-wais-source,7714,7714,0.0003\nCC-MAIN-2020-10,application/x-xz,8407,8405,0.0003\nCC-MAIN-2020-10,application/xhtml+xml,565348157,561714262,21.4964\nCC-MAIN-2020-10,application/xml,2659243,2653628,0.1011\nCC-MAIN-2020-10,application/zip,241310,239181,0.0092\nCC-MAIN-2020-10,application/zlib,5330,5257,0.0002\nCC-MAIN-2020-10,application/zstd,7903,7903,0.0003\nCC-MAIN-2020-10,audio/mp4,45548,44833,0.0017\nCC-MAIN-2020-10,audio/mpeg,183666,179659,0.0070\nCC-MAIN-2020-10,audio/vnd.wave,30576,30253,0.0012\nCC-MAIN-2020-10,audio/x-mpegurl,6315,6313,0.0002\nCC-MAIN-2020-10,image/gif,83648,83132,0.0032\nCC-MAIN-2020-10,image/jpeg,4144514,4134785,0.1576\nCC-MAIN-2020-10,image/png,573387,570654,0.0218\nCC-MAIN-2020-10,image/svg+xml,14559,14541,0.0006\nCC-MAIN-2020-10,image/tiff,12885,12836,0.0005\nCC-MAIN-2020-10,image/vnd.djvu,24847,24838,0.0009\nCC-MAIN-2020-10,image/vnd.dxf; 
format=ascii,15932,15845,0.0006\nCC-MAIN-2020-10,image/webp,25527,25514,0.0010\nCC-MAIN-2020-10,message/rfc822,55034,54842,0.0021\nCC-MAIN-2020-10,text/calendar,1336854,1335882,0.0508\nCC-MAIN-2020-10,text/css,7454,7451,0.0003\nCC-MAIN-2020-10,text/csv,89607,89569,0.0034\nCC-MAIN-2020-10,text/html,2036627827,2018575282,77.4394\nCC-MAIN-2020-10,text/markdown,254,254,0.0000\nCC-MAIN-2020-10,text/plain,2727676,2725732,0.1037\nCC-MAIN-2020-10,text/prs.lines.tag,23833,23830,0.0009\nCC-MAIN-2020-10,text/tab-separated-values,20589,20584,0.0008\nCC-MAIN-2020-10,text/troff,6889,6888,0.0003\nCC-MAIN-2020-10,text/turtle,26344,26331,0.0010\nCC-MAIN-2020-10,text/vtt,14952,14951,0.0006\nCC-MAIN-2020-10,text/x-c++src,10752,10745,0.0004\nCC-MAIN-2020-10,text/x-chdr,31099,31093,0.0012\nCC-MAIN-2020-10,text/x-csrc,53105,53099,0.0020\nCC-MAIN-2020-10,text/x-diff,66374,66181,0.0025\nCC-MAIN-2020-10,text/x-jsp,9766,9763,0.0004\nCC-MAIN-2020-10,text/x-log,103976,103972,0.0040\nCC-MAIN-2020-10,text/x-matlab,62847,62825,0.0024\nCC-MAIN-2020-10,text/x-perl,113108,113012,0.0043\nCC-MAIN-2020-10,text/x-php,98665,98336,0.0038\nCC-MAIN-2020-10,text/x-python,10562,10558,0.0004\nCC-MAIN-2020-10,text/x-vcalendar,29338,29334,0.0011\nCC-MAIN-2020-10,text/x-vcard,140816,140690,0.0054\nCC-MAIN-2020-10,text/x-web-markdown,8679,8678,0.0003\nCC-MAIN-2020-10,text/x-yaml,3607,3607,0.0001\nCC-MAIN-2020-10,video/mp4,45469,45257,0.0017\nCC-MAIN-2020-10,video/quicktime,11846,11808,0.0005\nCC-MAIN-2020-10,video/webm,1708,1704,0.0001\nCC-MAIN-2020-10,video/x-m4v,3043,3034,0.0001\nCC-MAIN-2020-16,<other>,343711,343079,0.0119\nCC-MAIN-2020-16,application/atom+xml,2789340,2788465,0.0966\nCC-MAIN-2020-16,application/epub+zip,46746,46642,0.0016\nCC-MAIN-2020-16,application/gpx+xml,5935,5932,0.0002\nCC-MAIN-2020-16,application/gzip,71690,71397,0.0025\nCC-MAIN-2020-16,application/javascript,30848,30748,0.0011\nCC-MAIN-2020-16,application/json,473252,473036,0.0164\nCC-MAIN-2020-16,application/marc,6043,6043,0.0002\nCC-M
AIN-2020-16,application/mbox,55469,55464,0.0019\nCC-MAIN-2020-16,application/msword,62331,62165,0.0022\nCC-MAIN-2020-16,application/octet-stream,266744,266225,0.0092\nCC-MAIN-2020-16,application/pdf,21430937,21391455,0.7425\nCC-MAIN-2020-16,application/pgp-signature,47600,47600,0.0016\nCC-MAIN-2020-16,application/pkcs7-signature,7906,7906,0.0003\nCC-MAIN-2020-16,application/postscript,3161,3157,0.0001\nCC-MAIN-2020-16,application/rdf+xml,288252,288029,0.0100\nCC-MAIN-2020-16,application/rss+xml,3751025,3742797,0.1300\nCC-MAIN-2020-16,application/rtf,59860,59802,0.0021\nCC-MAIN-2020-16,application/text,14484,14484,0.0005\nCC-MAIN-2020-16,application/vnd.android.package-archive,40598,40234,0.0014\nCC-MAIN-2020-16,application/vnd.google-earth.kml+xml,49353,49268,0.0017\nCC-MAIN-2020-16,application/vnd.google-earth.kmz,8751,8750,0.0003\nCC-MAIN-2020-16,application/vnd.ms-excel,31340,31287,0.0011\nCC-MAIN-2020-16,application/vnd.ms-powerpoint,21938,21925,0.0008\nCC-MAIN-2020-16,application/vnd.oasis.opendocument.spreadsheet,6382,6376,0.0002\nCC-MAIN-2020-16,application/vnd.oasis.opendocument.text,17616,17607,0.0006\nCC-MAIN-2020-16,application/vnd.openxmlformats-officedocument.presentationml.presentation,6805,6790,0.0002\nCC-MAIN-2020-16,application/vnd.openxmlformats-officedocument.spreadsheetml.sheet,27717,27588,0.0010\nCC-MAIN-2020-16,application/vnd.openxmlformats-officedocument.wordprocessingml.document,59408,59195,0.0021\nCC-MAIN-2020-16,application/x-bibtex-text-file,143725,143709,0.0050\nCC-MAIN-2020-16,application/x-bittorrent,9206,8928,0.0003\nCC-MAIN-2020-16,application/x-bzip2,5532,5515,0.0002\nCC-MAIN-2020-16,application/x-dosexec,11294,11074,0.0004\nCC-MAIN-2020-16,application/x-endnote-refer,44433,44415,0.0015\nCC-MAIN-2020-16,application/x-hdf,15680,15633,0.0005\nCC-MAIN-2020-16,application/x-mobipocket-ebook,8204,8204,0.0003\nCC-MAIN-2020-16,application/x-ms-asx,4418,4416,0.0002\nCC-MAIN-2020-16,application/x-msdownload,3557,3540,0.0001\nCC-MAIN-2020-16,
application/x-rar-compressed,15105,14852,0.0005\nCC-MAIN-2020-16,application/x-research-info-systems,5191,5191,0.0002\nCC-MAIN-2020-16,application/x-sh,24763,24735,0.0009\nCC-MAIN-2020-16,application/x-shockwave-flash,9997,9954,0.0003\nCC-MAIN-2020-16,application/x-stata-do,5193,5157,0.0002\nCC-MAIN-2020-16,application/x-tex,4965,4965,0.0002\nCC-MAIN-2020-16,application/x-tex-tfm,2904,2904,0.0001\nCC-MAIN-2020-16,application/x-tika-msoffice,72560,72490,0.0025\nCC-MAIN-2020-16,application/x-tika-ooxml,53994,53911,0.0019\nCC-MAIN-2020-16,application/x-wais-source,4493,4493,0.0002\nCC-MAIN-2020-16,application/x-xz,4433,4431,0.0002\nCC-MAIN-2020-16,application/xhtml+xml,582049557,578093001,20.1664\nCC-MAIN-2020-16,application/xml,2430609,2424854,0.0842\nCC-MAIN-2020-16,application/zip,218967,217528,0.0076\nCC-MAIN-2020-16,application/zlib,5433,5366,0.0002\nCC-MAIN-2020-16,application/zstd,8089,8089,0.0003\nCC-MAIN-2020-16,audio/mp4,43300,42904,0.0015\nCC-MAIN-2020-16,audio/mpeg,162396,158419,0.0056\nCC-MAIN-2020-16,audio/vnd.wave,21918,21858,0.0008\nCC-MAIN-2020-16,audio/x-mpegurl,4084,4084,0.0001\nCC-MAIN-2020-16,image/gif,73021,72586,0.0025\nCC-MAIN-2020-16,image/jpeg,3782159,3774949,0.1310\nCC-MAIN-2020-16,image/png,602941,600567,0.0209\nCC-MAIN-2020-16,image/svg+xml,14877,14834,0.0005\nCC-MAIN-2020-16,image/tiff,8364,8359,0.0003\nCC-MAIN-2020-16,image/vnd.djvu,18526,18524,0.0006\nCC-MAIN-2020-16,image/vnd.dxf; 
format=ascii,8087,8087,0.0003\nCC-MAIN-2020-16,image/webp,25592,25589,0.0009\nCC-MAIN-2020-16,message/rfc822,37135,36933,0.0013\nCC-MAIN-2020-16,text/calendar,945320,944873,0.0328\nCC-MAIN-2020-16,text/css,7769,7729,0.0003\nCC-MAIN-2020-16,text/csv,74006,73992,0.0026\nCC-MAIN-2020-16,text/html,2262409384,2242316677,78.3861\nCC-MAIN-2020-16,text/markdown,312,312,0.0000\nCC-MAIN-2020-16,text/plain,2104520,2103158,0.0729\nCC-MAIN-2020-16,text/prs.lines.tag,30432,30429,0.0011\nCC-MAIN-2020-16,text/tab-separated-values,12385,12385,0.0004\nCC-MAIN-2020-16,text/troff,8151,8151,0.0003\nCC-MAIN-2020-16,text/turtle,25413,25411,0.0009\nCC-MAIN-2020-16,text/vtt,13907,13906,0.0005\nCC-MAIN-2020-16,text/x-c++src,9328,9328,0.0003\nCC-MAIN-2020-16,text/x-chdr,27514,27514,0.0010\nCC-MAIN-2020-16,text/x-csrc,42250,42246,0.0015\nCC-MAIN-2020-16,text/x-diff,53437,53379,0.0019\nCC-MAIN-2020-16,text/x-jsp,4006,4002,0.0001\nCC-MAIN-2020-16,text/x-log,43935,43933,0.0015\nCC-MAIN-2020-16,text/x-matlab,44662,44541,0.0015\nCC-MAIN-2020-16,text/x-perl,88632,88612,0.0031\nCC-MAIN-2020-16,text/x-php,110910,110551,0.0038\nCC-MAIN-2020-16,text/x-python,7376,7374,0.0003\nCC-MAIN-2020-16,text/x-vcalendar,19210,19209,0.0007\nCC-MAIN-2020-16,text/x-vcard,94225,94160,0.0033\nCC-MAIN-2020-16,text/x-web-markdown,7970,7926,0.0003\nCC-MAIN-2020-16,text/x-yaml,5502,5502,0.0002\nCC-MAIN-2020-16,video/mp4,41214,41089,0.0014\nCC-MAIN-2020-16,video/quicktime,10614,10581,0.0004\nCC-MAIN-2020-16,video/webm,1792,1791,0.0001\nCC-MAIN-2020-16,video/x-m4v,2117,2108,0.0001\nCC-MAIN-2020-24,<other>,362187,361746,0.0131\nCC-MAIN-2020-24,application/atom+xml,4482316,4481146,0.1622\nCC-MAIN-2020-24,application/epub+zip,43311,43009,0.0016\nCC-MAIN-2020-24,application/gpx+xml,6693,6689,0.0002\nCC-MAIN-2020-24,application/gzip,82028,81774,0.0030\nCC-MAIN-2020-24,application/javascript,56050,56007,0.0020\nCC-MAIN-2020-24,application/json,568510,568003,0.0206\nCC-MAIN-2020-24,application/marc,7295,7295,0.0003\nCC-MAIN-2020-24,
application/mbox,62266,62254,0.0023\nCC-MAIN-2020-24,application/msword,59213,58972,0.0021\nCC-MAIN-2020-24,application/octet-stream,284826,284308,0.0103\nCC-MAIN-2020-24,application/pdf,3506961,3483840,0.1269\nCC-MAIN-2020-24,application/pgp-signature,32138,32134,0.0012\nCC-MAIN-2020-24,application/pkcs7-signature,10298,10296,0.0004\nCC-MAIN-2020-24,application/postscript,4969,4968,0.0002\nCC-MAIN-2020-24,application/rdf+xml,274524,274309,0.0099\nCC-MAIN-2020-24,application/rss+xml,4258344,4246869,0.1541\nCC-MAIN-2020-24,application/rtf,66487,66435,0.0024\nCC-MAIN-2020-24,application/text,17714,17712,0.0006\nCC-MAIN-2020-24,application/vnd.android.package-archive,35766,32742,0.0013\nCC-MAIN-2020-24,application/vnd.google-earth.kml+xml,63012,62967,0.0023\nCC-MAIN-2020-24,application/vnd.google-earth.kmz,10409,10398,0.0004\nCC-MAIN-2020-24,application/vnd.ms-excel,32985,32908,0.0012\nCC-MAIN-2020-24,application/vnd.ms-powerpoint,25099,25086,0.0009\nCC-MAIN-2020-24,application/vnd.oasis.opendocument.spreadsheet,7693,7667,0.0003\nCC-MAIN-2020-24,application/vnd.oasis.opendocument.text,23172,23162,0.0008\nCC-MAIN-2020-24,application/vnd.openxmlformats-officedocument.presentationml.presentation,6785,6770,0.0002\nCC-MAIN-2020-24,application/vnd.openxmlformats-officedocument.spreadsheetml.sheet,38553,38450,0.0014\nCC-MAIN-2020-24,application/vnd.openxmlformats-officedocument.wordprocessingml.document,72692,72405,0.0026\nCC-MAIN-2020-24,application/x-bibtex-text-file,158356,158280,0.0057\nCC-MAIN-2020-24,application/x-bittorrent,12563,12353,0.0005\nCC-MAIN-2020-24,application/x-bzip2,4148,4109,0.0002\nCC-MAIN-2020-24,application/x-dosexec,9456,9254,0.0003\nCC-MAIN-2020-24,application/x-endnote-refer,56677,56646,0.0021\nCC-MAIN-2020-24,application/x-hdf,3655,3655,0.0001\nCC-MAIN-2020-24,application/x-mobipocket-ebook,7868,7865,0.0003\nCC-MAIN-2020-24,application/x-ms-asx,4244,4241,0.0002\nCC-MAIN-2020-24,application/x-msdownload,3302,3285,0.0001\nCC-MAIN-2020-24,application/
x-rar-compressed,117,117,0.0000\nCC-MAIN-2020-24,application/x-research-info-systems,5944,5936,0.0002\nCC-MAIN-2020-24,application/x-sh,23250,23238,0.0008\nCC-MAIN-2020-24,application/x-shockwave-flash,9572,9521,0.0003\nCC-MAIN-2020-24,application/x-stata-do,13917,13898,0.0005\nCC-MAIN-2020-24,application/x-tex,5008,5008,0.0002\nCC-MAIN-2020-24,application/x-tex-tfm,906,906,0.0000\nCC-MAIN-2020-24,application/x-tika-msoffice,99934,99807,0.0036\nCC-MAIN-2020-24,application/x-tika-ooxml,78089,77971,0.0028\nCC-MAIN-2020-24,application/x-wais-source,3558,3558,0.0001\nCC-MAIN-2020-24,application/x-xz,2164,2163,0.0001\nCC-MAIN-2020-24,application/xhtml+xml,575658420,571953791,20.8330\nCC-MAIN-2020-24,application/xml,2062259,2055230,0.0746\nCC-MAIN-2020-24,application/zip,195765,195161,0.0071\nCC-MAIN-2020-24,application/zlib,6433,6373,0.0002\nCC-MAIN-2020-24,application/zstd,9825,9825,0.0004\nCC-MAIN-2020-24,audio/mp4,41361,40993,0.0015\nCC-MAIN-2020-24,audio/mpeg,142161,138607,0.0051\nCC-MAIN-2020-24,audio/vnd.wave,15272,15064,0.0006\nCC-MAIN-2020-24,audio/x-mpegurl,4657,4656,0.0002\nCC-MAIN-2020-24,image/gif,65615,65028,0.0024\nCC-MAIN-2020-24,image/jpeg,3421666,3411441,0.1238\nCC-MAIN-2020-24,image/png,505537,502801,0.0183\nCC-MAIN-2020-24,image/svg+xml,15140,15127,0.0005\nCC-MAIN-2020-24,image/tiff,14069,14064,0.0005\nCC-MAIN-2020-24,image/vnd.djvu,9183,9178,0.0003\nCC-MAIN-2020-24,image/vnd.dxf; 
format=ascii,9074,9052,0.0003\nCC-MAIN-2020-24,image/webp,36246,36239,0.0013\nCC-MAIN-2020-24,message/rfc822,46356,46333,0.0017\nCC-MAIN-2020-24,text/calendar,1370771,1369496,0.0496\nCC-MAIN-2020-24,text/css,5634,5632,0.0002\nCC-MAIN-2020-24,text/csv,88544,88527,0.0032\nCC-MAIN-2020-24,text/html,2161629720,2141416984,78.2290\nCC-MAIN-2020-24,text/markdown,239,239,0.0000\nCC-MAIN-2020-24,text/plain,2051059,2049601,0.0742\nCC-MAIN-2020-24,text/prs.lines.tag,28151,28083,0.0010\nCC-MAIN-2020-24,text/tab-separated-values,19391,19384,0.0007\nCC-MAIN-2020-24,text/troff,4630,4629,0.0002\nCC-MAIN-2020-24,text/turtle,27839,27827,0.0010\nCC-MAIN-2020-24,text/vtt,14994,14992,0.0005\nCC-MAIN-2020-24,text/x-c++src,10768,10768,0.0004\nCC-MAIN-2020-24,text/x-chdr,26262,26262,0.0010\nCC-MAIN-2020-24,text/x-csrc,42117,42117,0.0015\nCC-MAIN-2020-24,text/x-diff,53393,53378,0.0019\nCC-MAIN-2020-24,text/x-jsp,3523,3520,0.0001\nCC-MAIN-2020-24,text/x-log,35109,35109,0.0013\nCC-MAIN-2020-24,text/x-matlab,61766,61662,0.0022\nCC-MAIN-2020-24,text/x-perl,100838,100806,0.0036\nCC-MAIN-2020-24,text/x-php,137020,136654,0.0050\nCC-MAIN-2020-24,text/x-python,10296,10294,0.0004\nCC-MAIN-2020-24,text/x-vcalendar,28208,28202,0.0010\nCC-MAIN-2020-24,text/x-vcard,120536,120439,0.0044\nCC-MAIN-2020-24,text/x-web-markdown,8795,8794,0.0003\nCC-MAIN-2020-24,text/x-yaml,4307,4307,0.0002\nCC-MAIN-2020-24,video/mp4,40843,40704,0.0015\nCC-MAIN-2020-24,video/quicktime,13059,12971,0.0005\nCC-MAIN-2020-24,video/webm,2104,2101,0.0001\nCC-MAIN-2020-24,video/x-m4v,2783,2778,0.0001\nCC-MAIN-2020-29,<other>,378931,378177,0.0120\nCC-MAIN-2020-29,application/atom+xml,4059098,4057000,0.1291\nCC-MAIN-2020-29,application/epub+zip,42963,42813,0.0014\nCC-MAIN-2020-29,application/gpx+xml,7316,7313,0.0002\nCC-MAIN-2020-29,application/gzip,100207,99304,0.0032\nCC-MAIN-2020-29,application/javascript,43882,43870,0.0014\nCC-MAIN-2020-29,application/json,573511,572990,0.0182\nCC-MAIN-2020-29,application/marc,8303,8303,0.0003\nCC-MA
IN-2020-29,application/mbox,68599,68592,0.0022\nCC-MAIN-2020-29,application/msword,75768,75607,0.0024\nCC-MAIN-2020-29,application/octet-stream,340907,340315,0.0108\nCC-MAIN-2020-29,application/pdf,3122176,3099382,0.0993\nCC-MAIN-2020-29,application/pgp-signature,41356,41356,0.0013\nCC-MAIN-2020-29,application/pkcs7-signature,10264,10253,0.0003\nCC-MAIN-2020-29,application/postscript,5655,5655,0.0002\nCC-MAIN-2020-29,application/rdf+xml,294907,294408,0.0094\nCC-MAIN-2020-29,application/rss+xml,4483902,4468712,0.1426\nCC-MAIN-2020-29,application/rtf,69669,69600,0.0022\nCC-MAIN-2020-29,application/text,19962,19960,0.0006\nCC-MAIN-2020-29,application/vnd.android.package-archive,43633,40292,0.0014\nCC-MAIN-2020-29,application/vnd.google-earth.kml+xml,71063,71014,0.0023\nCC-MAIN-2020-29,application/vnd.google-earth.kmz,8224,8223,0.0003\nCC-MAIN-2020-29,application/vnd.ms-excel,31296,31183,0.0010\nCC-MAIN-2020-29,application/vnd.ms-powerpoint,21254,21244,0.0007\nCC-MAIN-2020-29,application/vnd.oasis.opendocument.spreadsheet,6277,6272,0.0002\nCC-MAIN-2020-29,application/vnd.oasis.opendocument.text,23128,23109,0.0007\nCC-MAIN-2020-29,application/vnd.openxmlformats-officedocument.presentationml.presentation,7529,7456,0.0002\nCC-MAIN-2020-29,application/vnd.openxmlformats-officedocument.spreadsheetml.sheet,35029,34946,0.0011\nCC-MAIN-2020-29,application/vnd.openxmlformats-officedocument.wordprocessingml.document,77249,77033,0.0025\nCC-MAIN-2020-29,application/x-bibtex-text-file,168453,168410,0.0054\nCC-MAIN-2020-29,application/x-bittorrent,13205,13046,0.0004\nCC-MAIN-2020-29,application/x-bzip2,12550,12526,0.0004\nCC-MAIN-2020-29,application/x-dosexec,10728,10440,0.0003\nCC-MAIN-2020-29,application/x-endnote-refer,55332,55319,0.0018\nCC-MAIN-2020-29,application/x-hdf,19506,19506,0.0006\nCC-MAIN-2020-29,application/x-mobipocket-ebook,8289,8252,0.0003\nCC-MAIN-2020-29,application/x-ms-asx,3616,3611,0.0001\nCC-MAIN-2020-29,application/x-msdownload,6767,6731,0.0002\nCC-MAIN-2020-
29,application/x-rar-compressed,487,487,0.0000\nCC-MAIN-2020-29,application/x-research-info-systems,5578,5574,0.0002\nCC-MAIN-2020-29,application/x-sh,20337,20321,0.0006\nCC-MAIN-2020-29,application/x-shockwave-flash,7699,7679,0.0002\nCC-MAIN-2020-29,application/x-stata-do,10639,10575,0.0003\nCC-MAIN-2020-29,application/x-tex,7269,7268,0.0002\nCC-MAIN-2020-29,application/x-tex-tfm,1878,1878,0.0001\nCC-MAIN-2020-29,application/x-tika-msoffice,104269,104208,0.0033\nCC-MAIN-2020-29,application/x-tika-ooxml,86884,86759,0.0028\nCC-MAIN-2020-29,application/x-wais-source,13612,13612,0.0004\nCC-MAIN-2020-29,application/x-xz,3511,3502,0.0001\nCC-MAIN-2020-29,application/xhtml+xml,626446270,622166715,19.9205\nCC-MAIN-2020-29,application/xml,2202379,2194692,0.0700\nCC-MAIN-2020-29,application/zip,195748,194733,0.0062\nCC-MAIN-2020-29,application/zlib,6157,6090,0.0002\nCC-MAIN-2020-29,application/zstd,13462,13460,0.0004\nCC-MAIN-2020-29,audio/mp4,42696,42259,0.0014\nCC-MAIN-2020-29,audio/mpeg,137348,134965,0.0044\nCC-MAIN-2020-29,audio/vnd.wave,14101,13921,0.0004\nCC-MAIN-2020-29,audio/x-mpegurl,5793,5736,0.0002\nCC-MAIN-2020-29,image/gif,67168,66657,0.0021\nCC-MAIN-2020-29,image/jpeg,4029618,4018193,0.1281\nCC-MAIN-2020-29,image/png,621080,617912,0.0197\nCC-MAIN-2020-29,image/svg+xml,14033,13998,0.0004\nCC-MAIN-2020-29,image/tiff,11691,11684,0.0004\nCC-MAIN-2020-29,image/vnd.djvu,7302,7300,0.0002\nCC-MAIN-2020-29,image/vnd.dxf; 
format=ascii,11657,11656,0.0004\nCC-MAIN-2020-29,image/webp,36718,36712,0.0012\nCC-MAIN-2020-29,message/rfc822,50227,50192,0.0016\nCC-MAIN-2020-29,text/calendar,1415486,1413777,0.0450\nCC-MAIN-2020-29,text/css,7922,7920,0.0003\nCC-MAIN-2020-29,text/csv,88650,88509,0.0028\nCC-MAIN-2020-29,text/html,2491605619,2466367067,79.2311\nCC-MAIN-2020-29,text/markdown,253,253,0.0000\nCC-MAIN-2020-29,text/plain,2233469,2231706,0.0710\nCC-MAIN-2020-29,text/prs.lines.tag,34888,34888,0.0011\nCC-MAIN-2020-29,text/tab-separated-values,16960,16959,0.0005\nCC-MAIN-2020-29,text/troff,13650,13649,0.0004\nCC-MAIN-2020-29,text/turtle,26827,26821,0.0009\nCC-MAIN-2020-29,text/vtt,13123,13123,0.0004\nCC-MAIN-2020-29,text/x-c++src,9051,9051,0.0003\nCC-MAIN-2020-29,text/x-chdr,22009,22009,0.0007\nCC-MAIN-2020-29,text/x-csrc,40523,40522,0.0013\nCC-MAIN-2020-29,text/x-diff,61978,61960,0.0020\nCC-MAIN-2020-29,text/x-jsp,4555,4546,0.0001\nCC-MAIN-2020-29,text/x-log,74431,74430,0.0024\nCC-MAIN-2020-29,text/x-matlab,60149,60039,0.0019\nCC-MAIN-2020-29,text/x-perl,107897,107865,0.0034\nCC-MAIN-2020-29,text/x-php,110164,109713,0.0035\nCC-MAIN-2020-29,text/x-python,9915,9915,0.0003\nCC-MAIN-2020-29,text/x-vcalendar,26199,26185,0.0008\nCC-MAIN-2020-29,text/x-vcard,124001,123799,0.0039\nCC-MAIN-2020-29,text/x-web-markdown,8940,8937,0.0003\nCC-MAIN-2020-29,text/x-yaml,6361,6361,0.0002\nCC-MAIN-2020-29,video/mp4,44432,44266,0.0014\nCC-MAIN-2020-29,video/quicktime,15811,15771,0.0005\nCC-MAIN-2020-29,video/webm,2032,2030,0.0001\nCC-MAIN-2020-29,video/x-m4v,2010,2006,0.0001\nCC-MAIN-2020-34,<other>,408982,408430,0.0167\nCC-MAIN-2020-34,application/atom+xml,3716114,3715132,0.1517\nCC-MAIN-2020-34,application/epub+zip,51287,51220,0.0021\nCC-MAIN-2020-34,application/gpx+xml,9273,9270,0.0004\nCC-MAIN-2020-34,application/gzip,81447,81360,0.0033\nCC-MAIN-2020-34,application/javascript,45924,45909,0.0019\nCC-MAIN-2020-34,application/json,604565,604230,0.0247\nCC-MAIN-2020-34,application/marc,8234,8233,0.0003\nCC-MAI
N-2020-34,application/mbox,89868,89842,0.0037\nCC-MAIN-2020-34,application/msword,71678,71377,0.0029\nCC-MAIN-2020-34,application/octet-stream,350210,349796,0.0143\nCC-MAIN-2020-34,application/pdf,3809774,3784722,0.1555\nCC-MAIN-2020-34,application/pgp-signature,59403,59400,0.0024\nCC-MAIN-2020-34,application/pkcs7-signature,12464,12464,0.0005\nCC-MAIN-2020-34,application/postscript,4445,4444,0.0002\nCC-MAIN-2020-34,application/rdf+xml,316962,316797,0.0129\nCC-MAIN-2020-34,application/rss+xml,3863102,3854325,0.1577\nCC-MAIN-2020-34,application/rtf,62241,62185,0.0025\nCC-MAIN-2020-34,application/text,21659,21648,0.0009\nCC-MAIN-2020-34,application/vnd.android.package-archive,50003,48684,0.0020\nCC-MAIN-2020-34,application/vnd.google-earth.kml+xml,56896,56770,0.0023\nCC-MAIN-2020-34,application/vnd.google-earth.kmz,9180,9178,0.0004\nCC-MAIN-2020-34,application/vnd.ms-excel,55697,55602,0.0023\nCC-MAIN-2020-34,application/vnd.ms-powerpoint,21903,21892,0.0009\nCC-MAIN-2020-34,application/vnd.oasis.opendocument.spreadsheet,8333,8324,0.0003\nCC-MAIN-2020-34,application/vnd.oasis.opendocument.text,26417,26384,0.0011\nCC-MAIN-2020-34,application/vnd.openxmlformats-officedocument.presentationml.presentation,8571,8544,0.0003\nCC-MAIN-2020-34,application/vnd.openxmlformats-officedocument.spreadsheetml.sheet,39842,39765,0.0016\nCC-MAIN-2020-34,application/vnd.openxmlformats-officedocument.wordprocessingml.document,126035,125851,0.0051\nCC-MAIN-2020-34,application/x-bibtex-text-file,194281,194080,0.0079\nCC-MAIN-2020-34,application/x-bittorrent,11227,11035,0.0005\nCC-MAIN-2020-34,application/x-bzip2,21456,21415,0.0009\nCC-MAIN-2020-34,application/x-dosexec,12175,11958,0.0005\nCC-MAIN-2020-34,application/x-endnote-refer,67887,67842,0.0028\nCC-MAIN-2020-34,application/x-hdf,5845,5845,0.0002\nCC-MAIN-2020-34,application/x-mobipocket-ebook,9995,9992,0.0004\nCC-MAIN-2020-34,application/x-ms-asx,6334,6302,0.0003\nCC-MAIN-2020-34,application/x-msdownload,3672,3647,0.0001\nCC-MAIN-2020-3
4,application/x-rar-compressed,219,219,0.0000\nCC-MAIN-2020-34,application/x-research-info-systems,6731,6727,0.0003\nCC-MAIN-2020-34,application/x-sh,22688,22604,0.0009\nCC-MAIN-2020-34,application/x-shockwave-flash,12687,12634,0.0005\nCC-MAIN-2020-34,application/x-stata-do,9110,9070,0.0004\nCC-MAIN-2020-34,application/x-tex,6539,6538,0.0003\nCC-MAIN-2020-34,application/x-tex-tfm,3648,3648,0.0001\nCC-MAIN-2020-34,application/x-tika-msoffice,96466,96420,0.0039\nCC-MAIN-2020-34,application/x-tika-ooxml,80621,80472,0.0033\nCC-MAIN-2020-34,application/x-wais-source,7730,7730,0.0003\nCC-MAIN-2020-34,application/x-xz,15977,15977,0.0007\nCC-MAIN-2020-34,application/xhtml+xml,484035358,481070482,19.7579\nCC-MAIN-2020-34,application/xml,2026423,2021584,0.0827\nCC-MAIN-2020-34,application/zip,288855,286739,0.0118\nCC-MAIN-2020-34,application/zlib,4294,4235,0.0002\nCC-MAIN-2020-34,application/zstd,19578,19577,0.0008\nCC-MAIN-2020-34,audio/mp4,43128,42941,0.0018\nCC-MAIN-2020-34,audio/mpeg,153243,150993,0.0063\nCC-MAIN-2020-34,audio/vnd.wave,50413,50318,0.0021\nCC-MAIN-2020-34,audio/x-mpegurl,4414,4413,0.0002\nCC-MAIN-2020-34,image/gif,80870,80379,0.0033\nCC-MAIN-2020-34,image/jpeg,3815135,3806571,0.1557\nCC-MAIN-2020-34,image/png,533131,530131,0.0218\nCC-MAIN-2020-34,image/svg+xml,16092,16080,0.0007\nCC-MAIN-2020-34,image/tiff,12462,12449,0.0005\nCC-MAIN-2020-34,image/vnd.djvu,14464,14460,0.0006\nCC-MAIN-2020-34,image/vnd.dxf; 
format=ascii,10405,10405,0.0004\nCC-MAIN-2020-34,image/webp,41509,41484,0.0017\nCC-MAIN-2020-34,message/rfc822,46516,46381,0.0019\nCC-MAIN-2020-34,text/calendar,1216042,1214842,0.0496\nCC-MAIN-2020-34,text/css,8996,8979,0.0004\nCC-MAIN-2020-34,text/csv,114380,114359,0.0047\nCC-MAIN-2020-34,text/html,1939448052,1922047816,79.1665\nCC-MAIN-2020-34,text/markdown,143,143,0.0000\nCC-MAIN-2020-34,text/plain,2427289,2424759,0.0991\nCC-MAIN-2020-34,text/prs.lines.tag,46714,46698,0.0019\nCC-MAIN-2020-34,text/tab-separated-values,22788,22788,0.0009\nCC-MAIN-2020-34,text/troff,10633,10633,0.0004\nCC-MAIN-2020-34,text/turtle,31572,31570,0.0013\nCC-MAIN-2020-34,text/vtt,16048,16047,0.0007\nCC-MAIN-2020-34,text/x-c++src,9007,9007,0.0004\nCC-MAIN-2020-34,text/x-chdr,22877,22877,0.0009\nCC-MAIN-2020-34,text/x-csrc,44296,44294,0.0018\nCC-MAIN-2020-34,text/x-diff,66492,66483,0.0027\nCC-MAIN-2020-34,text/x-jsp,2878,2877,0.0001\nCC-MAIN-2020-34,text/x-log,75237,75233,0.0031\nCC-MAIN-2020-34,text/x-matlab,71527,71414,0.0029\nCC-MAIN-2020-34,text/x-perl,91846,91779,0.0037\nCC-MAIN-2020-34,text/x-php,77718,77283,0.0032\nCC-MAIN-2020-34,text/x-python,18431,18417,0.0008\nCC-MAIN-2020-34,text/x-vcalendar,22862,22862,0.0009\nCC-MAIN-2020-34,text/x-vcard,120499,120356,0.0049\nCC-MAIN-2020-34,text/x-web-markdown,10170,10168,0.0004\nCC-MAIN-2020-34,text/x-yaml,8475,8475,0.0003\nCC-MAIN-2020-34,video/mp4,47836,47608,0.0020\nCC-MAIN-2020-34,video/quicktime,14497,14455,0.0006\nCC-MAIN-2020-34,video/webm,2522,2467,0.0001\nCC-MAIN-2020-34,video/x-m4v,2325,2318,0.0001\nCC-MAIN-2020-40,<other>,379304,378731,0.0109\nCC-MAIN-2020-40,application/atom+xml,2487258,2485944,0.0716\nCC-MAIN-2020-40,application/epub+zip,44392,44351,0.0013\nCC-MAIN-2020-40,application/gpx+xml,7495,7495,0.0002\nCC-MAIN-2020-40,application/gzip,60636,60255,0.0017\nCC-MAIN-2020-40,application/javascript,38605,38596,0.0011\nCC-MAIN-2020-40,application/json,549490,548604,0.0158\nCC-MAIN-2020-40,application/marc,6936,6936,0.0002\nCC-M
AIN-2020-40,application/mbox,91379,91284,0.0026\nCC-MAIN-2020-40,application/msword,78739,78563,0.0023\nCC-MAIN-2020-40,application/octet-stream,369218,368599,0.0106\nCC-MAIN-2020-40,application/pdf,35100891,35012972,1.0105\nCC-MAIN-2020-40,application/pgp-signature,38753,38751,0.0011\nCC-MAIN-2020-40,application/pkcs7-signature,12862,12856,0.0004\nCC-MAIN-2020-40,application/postscript,3693,3691,0.0001\nCC-MAIN-2020-40,application/rdf+xml,291835,291631,0.0084\nCC-MAIN-2020-40,application/rss+xml,3831141,3821926,0.1103\nCC-MAIN-2020-40,application/rtf,60798,60717,0.0018\nCC-MAIN-2020-40,application/text,20311,20306,0.0006\nCC-MAIN-2020-40,application/vnd.android.package-archive,36545,36239,0.0011\nCC-MAIN-2020-40,application/vnd.google-earth.kml+xml,58662,58656,0.0017\nCC-MAIN-2020-40,application/vnd.google-earth.kmz,23818,23815,0.0007\nCC-MAIN-2020-40,application/vnd.ms-excel,51005,50935,0.0015\nCC-MAIN-2020-40,application/vnd.ms-powerpoint,26088,26075,0.0008\nCC-MAIN-2020-40,application/vnd.oasis.opendocument.spreadsheet,8104,8098,0.0002\nCC-MAIN-2020-40,application/vnd.oasis.opendocument.text,22921,22885,0.0007\nCC-MAIN-2020-40,application/vnd.openxmlformats-officedocument.presentationml.presentation,7188,7178,0.0002\nCC-MAIN-2020-40,application/vnd.openxmlformats-officedocument.spreadsheetml.sheet,34742,34656,0.0010\nCC-MAIN-2020-40,application/vnd.openxmlformats-officedocument.wordprocessingml.document,105701,105479,0.0030\nCC-MAIN-2020-40,application/x-bibtex-text-file,172753,172634,0.0050\nCC-MAIN-2020-40,application/x-bittorrent,9561,9335,0.0003\nCC-MAIN-2020-40,application/x-bzip2,30198,30003,0.0009\nCC-MAIN-2020-40,application/x-dosexec,9753,9476,0.0003\nCC-MAIN-2020-40,application/x-endnote-refer,60076,60040,0.0017\nCC-MAIN-2020-40,application/x-hdf,7032,7032,0.0002\nCC-MAIN-2020-40,application/x-mobipocket-ebook,9271,9269,0.0003\nCC-MAIN-2020-40,application/x-ms-asx,4281,4266,0.0001\nCC-MAIN-2020-40,application/x-msdownload,3948,3920,0.0001\nCC-MAIN-2020
-40,application/x-rar-compressed,351,351,0.0000\nCC-MAIN-2020-40,application/x-research-info-systems,4350,4346,0.0001\nCC-MAIN-2020-40,application/x-sh,24219,24201,0.0007\nCC-MAIN-2020-40,application/x-shockwave-flash,10394,10359,0.0003\nCC-MAIN-2020-40,application/x-stata-do,10919,10830,0.0003\nCC-MAIN-2020-40,application/x-tex,6040,6039,0.0002\nCC-MAIN-2020-40,application/x-tex-tfm,8062,8062,0.0002\nCC-MAIN-2020-40,application/x-tika-msoffice,91899,91846,0.0026\nCC-MAIN-2020-40,application/x-tika-ooxml,78631,78540,0.0023\nCC-MAIN-2020-40,application/x-wais-source,8466,8378,0.0002\nCC-MAIN-2020-40,application/x-xz,7969,7966,0.0002\nCC-MAIN-2020-40,application/xhtml+xml,596904489,593259435,17.1842\nCC-MAIN-2020-40,application/xml,2293596,2288433,0.0660\nCC-MAIN-2020-40,application/zip,260859,259779,0.0075\nCC-MAIN-2020-40,application/zlib,5649,5601,0.0002\nCC-MAIN-2020-40,application/zstd,12379,12379,0.0004\nCC-MAIN-2020-40,audio/mp4,38282,38009,0.0011\nCC-MAIN-2020-40,audio/mpeg,145806,144138,0.0042\nCC-MAIN-2020-40,audio/vnd.wave,46559,46533,0.0013\nCC-MAIN-2020-40,audio/x-mpegurl,4927,4927,0.0001\nCC-MAIN-2020-40,image/gif,107328,106547,0.0031\nCC-MAIN-2020-40,image/jpeg,7111274,7083336,0.2047\nCC-MAIN-2020-40,image/png,1491900,1486222,0.0430\nCC-MAIN-2020-40,image/svg+xml,32258,32212,0.0009\nCC-MAIN-2020-40,image/tiff,16041,16032,0.0005\nCC-MAIN-2020-40,image/vnd.djvu,10502,10485,0.0003\nCC-MAIN-2020-40,image/vnd.dxf; 
format=ascii,6176,6172,0.0002\nCC-MAIN-2020-40,image/webp,39054,39047,0.0011\nCC-MAIN-2020-40,message/rfc822,44639,44568,0.0013\nCC-MAIN-2020-40,text/calendar,1121737,1120767,0.0323\nCC-MAIN-2020-40,text/css,8999,8995,0.0003\nCC-MAIN-2020-40,text/csv,100421,100407,0.0029\nCC-MAIN-2020-40,text/html,2816189978,2792964353,81.0748\nCC-MAIN-2020-40,text/markdown,308,308,0.0000\nCC-MAIN-2020-40,text/plain,2319811,2316827,0.0668\nCC-MAIN-2020-40,text/prs.lines.tag,42913,42887,0.0012\nCC-MAIN-2020-40,text/tab-separated-values,19238,19238,0.0006\nCC-MAIN-2020-40,text/troff,16242,16241,0.0005\nCC-MAIN-2020-40,text/turtle,28769,28766,0.0008\nCC-MAIN-2020-40,text/vtt,15007,15006,0.0004\nCC-MAIN-2020-40,text/x-c++src,10187,10186,0.0003\nCC-MAIN-2020-40,text/x-chdr,21204,21200,0.0006\nCC-MAIN-2020-40,text/x-csrc,38411,38410,0.0011\nCC-MAIN-2020-40,text/x-diff,71675,71630,0.0021\nCC-MAIN-2020-40,text/x-jsp,2574,2571,0.0001\nCC-MAIN-2020-40,text/x-log,59516,59511,0.0017\nCC-MAIN-2020-40,text/x-matlab,59575,59467,0.0017\nCC-MAIN-2020-40,text/x-perl,92221,92178,0.0027\nCC-MAIN-2020-40,text/x-php,106336,106077,0.0031\nCC-MAIN-2020-40,text/x-python,10445,10444,0.0003\nCC-MAIN-2020-40,text/x-vcalendar,21527,21526,0.0006\nCC-MAIN-2020-40,text/x-vcard,109709,109521,0.0032\nCC-MAIN-2020-40,text/x-web-markdown,10292,10290,0.0003\nCC-MAIN-2020-40,text/x-yaml,8403,8402,0.0002\nCC-MAIN-2020-40,video/mp4,85560,85367,0.0025\nCC-MAIN-2020-40,video/quicktime,15554,15483,0.0004\nCC-MAIN-2020-40,video/webm,2676,2668,0.0001\nCC-MAIN-2020-40,video/x-m4v,3517,3514,0.0001\nCC-MAIN-2020-45,<other>,404686,402943,0.0148\nCC-MAIN-2020-45,application/atom+xml,2390993,2390322,0.0875\nCC-MAIN-2020-45,application/epub+zip,52854,52828,0.0019\nCC-MAIN-2020-45,application/gpx+xml,7396,7394,0.0003\nCC-MAIN-2020-45,application/gzip,58031,57825,0.0021\nCC-MAIN-2020-45,application/javascript,27373,27363,0.0010\nCC-MAIN-2020-45,application/json,551949,551337,0.0202\nCC-MAIN-2020-45,application/marc,5267,5267,0.0002\nCC
-MAIN-2020-45,application/mbox,76267,76266,0.0028\nCC-MAIN-2020-45,application/msword,59727,59611,0.0022\nCC-MAIN-2020-45,application/octet-stream,405592,405201,0.0149\nCC-MAIN-2020-45,application/pdf,23346577,23279470,0.8549\nCC-MAIN-2020-45,application/pgp-signature,36241,36240,0.0013\nCC-MAIN-2020-45,application/pkcs7-signature,10833,10833,0.0004\nCC-MAIN-2020-45,application/postscript,2629,2616,0.0001\nCC-MAIN-2020-45,application/rdf+xml,207905,207812,0.0076\nCC-MAIN-2020-45,application/rss+xml,3510527,3505043,0.1285\nCC-MAIN-2020-45,application/rtf,65798,65787,0.0024\nCC-MAIN-2020-45,application/text,19510,19509,0.0007\nCC-MAIN-2020-45,application/vnd.android.package-archive,11844,11699,0.0004\nCC-MAIN-2020-45,application/vnd.google-earth.kml+xml,49378,49378,0.0018\nCC-MAIN-2020-45,application/vnd.google-earth.kmz,8068,8068,0.0003\nCC-MAIN-2020-45,application/vnd.ms-excel,49071,49001,0.0018\nCC-MAIN-2020-45,application/vnd.ms-powerpoint,27801,27783,0.0010\nCC-MAIN-2020-45,application/vnd.oasis.opendocument.spreadsheet,6616,6505,0.0002\nCC-MAIN-2020-45,application/vnd.oasis.opendocument.text,20111,20032,0.0007\nCC-MAIN-2020-45,application/vnd.openxmlformats-officedocument.presentationml.presentation,7892,7877,0.0003\nCC-MAIN-2020-45,application/vnd.openxmlformats-officedocument.spreadsheetml.sheet,33691,33623,0.0012\nCC-MAIN-2020-45,application/vnd.openxmlformats-officedocument.wordprocessingml.document,72196,72032,0.0026\nCC-MAIN-2020-45,application/x-bibtex-text-file,167270,167055,0.0061\nCC-MAIN-2020-45,application/x-bittorrent,8111,7860,0.0003\nCC-MAIN-2020-45,application/x-bzip2,28610,28557,0.0010\nCC-MAIN-2020-45,application/x-dosexec,9545,9304,0.0003\nCC-MAIN-2020-45,application/x-endnote-refer,55793,55786,0.0020\nCC-MAIN-2020-45,application/x-hdf,3771,3771,0.0001\nCC-MAIN-2020-45,application/x-mobipocket-ebook,13957,13955,0.0005\nCC-MAIN-2020-45,application/x-ms-asx,2649,2610,0.0001\nCC-MAIN-2020-45,application/x-msdownload,7651,7068,0.0003\nCC-MAIN-2020
-45,application/x-rar-compressed,148,148,0.0000\nCC-MAIN-2020-45,application/x-research-info-systems,4428,4428,0.0002\nCC-MAIN-2020-45,application/x-sh,26462,26445,0.0010\nCC-MAIN-2020-45,application/x-shockwave-flash,12021,11971,0.0004\nCC-MAIN-2020-45,application/x-stata-do,11739,11721,0.0004\nCC-MAIN-2020-45,application/x-tex,4846,4846,0.0002\nCC-MAIN-2020-45,application/x-tex-tfm,5059,5059,0.0002\nCC-MAIN-2020-45,application/x-tika-msoffice,80558,80446,0.0029\nCC-MAIN-2020-45,application/x-tika-ooxml,62214,62152,0.0023\nCC-MAIN-2020-45,application/x-wais-source,5287,5286,0.0002\nCC-MAIN-2020-45,application/x-xz,3353,3353,0.0001\nCC-MAIN-2020-45,application/xhtml+xml,460652267,457613028,16.8671\nCC-MAIN-2020-45,application/xml,2109240,2105036,0.0772\nCC-MAIN-2020-45,application/zip,242178,240264,0.0089\nCC-MAIN-2020-45,application/zlib,6067,5895,0.0002\nCC-MAIN-2020-45,application/zstd,9805,9804,0.0004\nCC-MAIN-2020-45,audio/mp4,48538,48127,0.0018\nCC-MAIN-2020-45,audio/mpeg,179884,176909,0.0066\nCC-MAIN-2020-45,audio/vnd.wave,24012,23924,0.0009\nCC-MAIN-2020-45,audio/x-mpegurl,3857,3857,0.0001\nCC-MAIN-2020-45,image/gif,95398,94765,0.0035\nCC-MAIN-2020-45,image/jpeg,5716304,5694598,0.2093\nCC-MAIN-2020-45,image/png,971104,966600,0.0356\nCC-MAIN-2020-45,image/svg+xml,22105,22021,0.0008\nCC-MAIN-2020-45,image/tiff,20325,20313,0.0007\nCC-MAIN-2020-45,image/vnd.djvu,10136,10136,0.0004\nCC-MAIN-2020-45,image/vnd.dxf; 
format=ascii,11042,11039,0.0004\nCC-MAIN-2020-45,image/webp,4009,4006,0.0001\nCC-MAIN-2020-45,message/rfc822,39347,39176,0.0014\nCC-MAIN-2020-45,text/calendar,926369,926067,0.0339\nCC-MAIN-2020-45,text/css,9126,9064,0.0003\nCC-MAIN-2020-45,text/csv,94611,94608,0.0035\nCC-MAIN-2020-45,text/html,2224739419,2206664160,81.4606\nCC-MAIN-2020-45,text/markdown,340,340,0.0000\nCC-MAIN-2020-45,text/plain,2252325,2251004,0.0825\nCC-MAIN-2020-45,text/prs.lines.tag,37223,37222,0.0014\nCC-MAIN-2020-45,text/tab-separated-values,16331,16331,0.0006\nCC-MAIN-2020-45,text/troff,11582,11568,0.0004\nCC-MAIN-2020-45,text/turtle,29530,29530,0.0011\nCC-MAIN-2020-45,text/vtt,15795,15795,0.0006\nCC-MAIN-2020-45,text/x-c++src,10777,10777,0.0004\nCC-MAIN-2020-45,text/x-chdr,26308,26308,0.0010\nCC-MAIN-2020-45,text/x-csrc,46846,46846,0.0017\nCC-MAIN-2020-45,text/x-diff,52549,52544,0.0019\nCC-MAIN-2020-45,text/x-jsp,2232,2230,0.0001\nCC-MAIN-2020-45,text/x-log,68690,68690,0.0025\nCC-MAIN-2020-45,text/x-matlab,66321,66206,0.0024\nCC-MAIN-2020-45,text/x-perl,89731,89705,0.0033\nCC-MAIN-2020-45,text/x-php,93015,92718,0.0034\nCC-MAIN-2020-45,text/x-python,14707,14703,0.0005\nCC-MAIN-2020-45,text/x-vcalendar,20283,20282,0.0007\nCC-MAIN-2020-45,text/x-vcard,102405,102364,0.0037\nCC-MAIN-2020-45,text/x-web-markdown,10650,10649,0.0004\nCC-MAIN-2020-45,text/x-yaml,5314,5314,0.0002\nCC-MAIN-2020-45,video/mp4,64400,64263,0.0024\nCC-MAIN-2020-45,video/quicktime,44333,44223,0.0016\nCC-MAIN-2020-45,video/webm,2747,2741,0.0001\nCC-MAIN-2020-45,video/x-m4v,3371,3363,0.0001\nCC-MAIN-2020-50,<other>,366020,365614,0.0139\nCC-MAIN-2020-50,application/atom+xml,1634541,1633886,0.0619\nCC-MAIN-2020-50,application/epub+zip,53166,53132,0.0020\nCC-MAIN-2020-50,application/gpx+xml,6755,6751,0.0003\nCC-MAIN-2020-50,application/gzip,50097,50024,0.0019\nCC-MAIN-2020-50,application/javascript,24086,24068,0.0009\nCC-MAIN-2020-50,application/json,546911,546487,0.0207\nCC-MAIN-2020-50,application/marc,8131,8131,0.0003\nCC-MAIN-
2020-50,application/mbox,91776,91775,0.0035\nCC-MAIN-2020-50,application/msword,53069,52967,0.0020\nCC-MAIN-2020-50,application/octet-stream,334857,334414,0.0127\nCC-MAIN-2020-50,application/pdf,18345598,18294015,0.6943\nCC-MAIN-2020-50,application/pgp-signature,32439,32439,0.0012\nCC-MAIN-2020-50,application/pkcs7-signature,8323,8323,0.0003\nCC-MAIN-2020-50,application/postscript,2887,2887,0.0001\nCC-MAIN-2020-50,application/rdf+xml,211523,211431,0.0080\nCC-MAIN-2020-50,application/rss+xml,3035806,3030593,0.1149\nCC-MAIN-2020-50,application/rtf,56300,56289,0.0021\nCC-MAIN-2020-50,application/text,22579,22578,0.0009\nCC-MAIN-2020-50,application/vnd.android.package-archive,13777,13606,0.0005\nCC-MAIN-2020-50,application/vnd.google-earth.kml+xml,66017,66013,0.0025\nCC-MAIN-2020-50,application/vnd.google-earth.kmz,8420,8418,0.0003\nCC-MAIN-2020-50,application/vnd.ms-excel,46224,46126,0.0017\nCC-MAIN-2020-50,application/vnd.ms-powerpoint,26462,26457,0.0010\nCC-MAIN-2020-50,application/vnd.oasis.opendocument.spreadsheet,5104,5103,0.0002\nCC-MAIN-2020-50,application/vnd.oasis.opendocument.text,16209,16206,0.0006\nCC-MAIN-2020-50,application/vnd.openxmlformats-officedocument.presentationml.presentation,5755,5575,0.0002\nCC-MAIN-2020-50,application/vnd.openxmlformats-officedocument.spreadsheetml.sheet,32062,32038,0.0012\nCC-MAIN-2020-50,application/vnd.openxmlformats-officedocument.wordprocessingml.document,60012,59725,0.0023\nCC-MAIN-2020-50,application/x-bibtex-text-file,161279,161266,0.0061\nCC-MAIN-2020-50,application/x-bittorrent,8797,8608,0.0003\nCC-MAIN-2020-50,application/x-bzip2,13657,13604,0.0005\nCC-MAIN-2020-50,application/x-dosexec,7808,7552,0.0003\nCC-MAIN-2020-50,application/x-endnote-refer,55397,55386,0.0021\nCC-MAIN-2020-50,application/x-hdf,4195,4195,0.0002\nCC-MAIN-2020-50,application/x-mobipocket-ebook,8910,8909,0.0003\nCC-MAIN-2020-50,application/x-ms-asx,2416,2398,0.0001\nCC-MAIN-2020-50,application/x-msdownload,3467,3436,0.0001\nCC-MAIN-2020-50,applic
ation/x-rar-compressed,72,72,0.0000\nCC-MAIN-2020-50,application/x-research-info-systems,6047,6047,0.0002\nCC-MAIN-2020-50,application/x-sh,24106,24097,0.0009\nCC-MAIN-2020-50,application/x-shockwave-flash,9160,9137,0.0003\nCC-MAIN-2020-50,application/x-stata-do,10971,10859,0.0004\nCC-MAIN-2020-50,application/x-tex,5547,5547,0.0002\nCC-MAIN-2020-50,application/x-tex-tfm,6504,6504,0.0002\nCC-MAIN-2020-50,application/x-tika-msoffice,72685,72629,0.0028\nCC-MAIN-2020-50,application/x-tika-ooxml,56200,56106,0.0021\nCC-MAIN-2020-50,application/x-wais-source,4095,4095,0.0002\nCC-MAIN-2020-50,application/x-xz,4600,4600,0.0002\nCC-MAIN-2020-50,application/xhtml+xml,441772587,438961526,16.7182\nCC-MAIN-2020-50,application/xml,1851326,1848058,0.0701\nCC-MAIN-2020-50,application/zip,212567,211499,0.0080\nCC-MAIN-2020-50,application/zlib,5150,5120,0.0002\nCC-MAIN-2020-50,application/zstd,11971,11971,0.0005\nCC-MAIN-2020-50,audio/mp4,43868,43459,0.0017\nCC-MAIN-2020-50,audio/mpeg,158080,155062,0.0060\nCC-MAIN-2020-50,audio/vnd.wave,17886,17871,0.0007\nCC-MAIN-2020-50,audio/x-mpegurl,3592,3591,0.0001\nCC-MAIN-2020-50,image/gif,81031,80459,0.0031\nCC-MAIN-2020-50,image/jpeg,4473735,4452548,0.1693\nCC-MAIN-2020-50,image/png,748243,743003,0.0283\nCC-MAIN-2020-50,image/svg+xml,21076,21007,0.0008\nCC-MAIN-2020-50,image/tiff,17477,17466,0.0007\nCC-MAIN-2020-50,image/vnd.djvu,12850,12840,0.0005\nCC-MAIN-2020-50,image/vnd.dxf; 
format=ascii,8074,8074,0.0003\nCC-MAIN-2020-50,image/webp,3157,3154,0.0001\nCC-MAIN-2020-50,message/rfc822,44633,44534,0.0017\nCC-MAIN-2020-50,text/calendar,746262,746060,0.0282\nCC-MAIN-2020-50,text/css,9611,9484,0.0004\nCC-MAIN-2020-50,text/csv,108105,108092,0.0041\nCC-MAIN-2020-50,text/html,2163700603,2147168131,81.8817\nCC-MAIN-2020-50,text/markdown,232,232,0.0000\nCC-MAIN-2020-50,text/plain,2010787,2009799,0.0761\nCC-MAIN-2020-50,text/prs.lines.tag,35408,35397,0.0013\nCC-MAIN-2020-50,text/tab-separated-values,16379,16379,0.0006\nCC-MAIN-2020-50,text/troff,13170,13169,0.0005\nCC-MAIN-2020-50,text/turtle,31670,31669,0.0012\nCC-MAIN-2020-50,text/vtt,17610,17609,0.0007\nCC-MAIN-2020-50,text/x-c++src,13931,13931,0.0005\nCC-MAIN-2020-50,text/x-chdr,30073,30073,0.0011\nCC-MAIN-2020-50,text/x-csrc,52275,52273,0.0020\nCC-MAIN-2020-50,text/x-diff,63682,63676,0.0024\nCC-MAIN-2020-50,text/x-jsp,1698,1694,0.0001\nCC-MAIN-2020-50,text/x-log,61445,61445,0.0023\nCC-MAIN-2020-50,text/x-matlab,55950,55817,0.0021\nCC-MAIN-2020-50,text/x-perl,91562,91547,0.0035\nCC-MAIN-2020-50,text/x-php,73148,72887,0.0028\nCC-MAIN-2020-50,text/x-python,14233,14233,0.0005\nCC-MAIN-2020-50,text/x-vcalendar,18271,18271,0.0007\nCC-MAIN-2020-50,text/x-vcard,88270,88141,0.0033\nCC-MAIN-2020-50,text/x-web-markdown,10505,10505,0.0004\nCC-MAIN-2020-50,text/x-yaml,7973,7972,0.0003\nCC-MAIN-2020-50,video/mp4,52580,52387,0.0020\nCC-MAIN-2020-50,video/quicktime,23016,22943,0.0009\nCC-MAIN-2020-50,video/webm,2605,2593,0.0001\nCC-MAIN-2020-50,video/x-m4v,2325,2312,0.0001\nCC-MAIN-2021-04,<other>,422782,422363,0.0124\nCC-MAIN-2021-04,application/atom+xml,2265128,2264186,0.0666\nCC-MAIN-2021-04,application/epub+zip,50647,50589,0.0015\nCC-MAIN-2021-04,application/gpx+xml,7961,7961,0.0002\nCC-MAIN-2021-04,application/gzip,50803,50719,0.0015\nCC-MAIN-2021-04,application/javascript,34540,34520,0.0010\nCC-MAIN-2021-04,application/json,590721,590434,0.0174\nCC-MAIN-2021-04,application/marc,6780,6780,0.0002\nCC-MAIN-20
21-04,application/mbox,90972,90970,0.0027\nCC-MAIN-2021-04,application/msword,51814,51663,0.0015\nCC-MAIN-2021-04,application/octet-stream,411592,411040,0.0121\nCC-MAIN-2021-04,application/pdf,26963788,26899892,0.7928\nCC-MAIN-2021-04,application/pgp-signature,38764,38764,0.0011\nCC-MAIN-2021-04,application/pkcs7-signature,10410,10410,0.0003\nCC-MAIN-2021-04,application/postscript,3216,3216,0.0001\nCC-MAIN-2021-04,application/rdf+xml,226171,226010,0.0066\nCC-MAIN-2021-04,application/rss+xml,3607237,3598620,0.1061\nCC-MAIN-2021-04,application/rtf,56866,56843,0.0017\nCC-MAIN-2021-04,application/text,22434,22434,0.0007\nCC-MAIN-2021-04,application/vnd.android.package-archive,12251,11998,0.0004\nCC-MAIN-2021-04,application/vnd.google-earth.kml+xml,49833,49814,0.0015\nCC-MAIN-2021-04,application/vnd.google-earth.kmz,7353,7353,0.0002\nCC-MAIN-2021-04,application/vnd.ms-excel,51694,51587,0.0015\nCC-MAIN-2021-04,application/vnd.ms-powerpoint,24320,24292,0.0007\nCC-MAIN-2021-04,application/vnd.oasis.opendocument.spreadsheet,6006,5997,0.0002\nCC-MAIN-2021-04,application/vnd.oasis.opendocument.text,18348,18325,0.0005\nCC-MAIN-2021-04,application/vnd.openxmlformats-officedocument.presentationml.presentation,6369,6361,0.0002\nCC-MAIN-2021-04,application/vnd.openxmlformats-officedocument.spreadsheetml.sheet,35862,35811,0.0011\nCC-MAIN-2021-04,application/vnd.openxmlformats-officedocument.wordprocessingml.document,63620,63286,0.0019\nCC-MAIN-2021-04,application/x-bibtex-text-file,164066,164047,0.0048\nCC-MAIN-2021-04,application/x-bittorrent,8488,8269,0.0002\nCC-MAIN-2021-04,application/x-bzip2,29596,29566,0.0009\nCC-MAIN-2021-04,application/x-dosexec,8410,8190,0.0002\nCC-MAIN-2021-04,application/x-endnote-refer,55664,55657,0.0016\nCC-MAIN-2021-04,application/x-hdf,2308,2308,0.0001\nCC-MAIN-2021-04,application/x-mobipocket-ebook,10554,10550,0.0003\nCC-MAIN-2021-04,application/x-ms-asx,3248,3239,0.0001\nCC-MAIN-2021-04,application/x-msdownload,4921,4867,0.0001\nCC-MAIN-2021-04,appl
ication/x-rar-compressed,115,115,0.0000\nCC-MAIN-2021-04,application/x-research-info-systems,4974,4974,0.0001\nCC-MAIN-2021-04,application/x-sh,25657,25652,0.0008\nCC-MAIN-2021-04,application/x-shockwave-flash,7891,7852,0.0002\nCC-MAIN-2021-04,application/x-stata-do,22463,22334,0.0007\nCC-MAIN-2021-04,application/x-tex,4209,4209,0.0001\nCC-MAIN-2021-04,application/x-tex-tfm,7182,7182,0.0002\nCC-MAIN-2021-04,application/x-tika-msoffice,74852,74834,0.0022\nCC-MAIN-2021-04,application/x-tika-ooxml,66999,66906,0.0020\nCC-MAIN-2021-04,application/x-wais-source,4329,4329,0.0001\nCC-MAIN-2021-04,application/x-xz,4942,4942,0.0001\nCC-MAIN-2021-04,application/xhtml+xml,549847476,546287972,16.1659\nCC-MAIN-2021-04,application/xml,2244053,2238732,0.0660\nCC-MAIN-2021-04,application/zip,212487,211493,0.0062\nCC-MAIN-2021-04,application/zlib,11519,11183,0.0003\nCC-MAIN-2021-04,application/zstd,16150,16145,0.0005\nCC-MAIN-2021-04,audio/mp4,44442,44148,0.0013\nCC-MAIN-2021-04,audio/mpeg,172651,168238,0.0051\nCC-MAIN-2021-04,audio/vnd.wave,19911,19866,0.0006\nCC-MAIN-2021-04,audio/x-mpegurl,1899,1897,0.0001\nCC-MAIN-2021-04,image/gif,182579,182167,0.0054\nCC-MAIN-2021-04,image/jpeg,4822311,4805190,0.1418\nCC-MAIN-2021-04,image/png,850310,845773,0.0250\nCC-MAIN-2021-04,image/svg+xml,20260,20058,0.0006\nCC-MAIN-2021-04,image/tiff,14899,14893,0.0004\nCC-MAIN-2021-04,image/vnd.djvu,9967,9940,0.0003\nCC-MAIN-2021-04,image/vnd.dxf; 
format=ascii,9070,9070,0.0003\nCC-MAIN-2021-04,image/webp,6814,6806,0.0002\nCC-MAIN-2021-04,message/rfc822,53471,53403,0.0016\nCC-MAIN-2021-04,text/asp,1,1,0.0000\nCC-MAIN-2021-04,text/calendar,850401,849858,0.0250\nCC-MAIN-2021-04,text/css,8957,8917,0.0003\nCC-MAIN-2021-04,text/csv,111021,111010,0.0033\nCC-MAIN-2021-04,text/html,2803269385,2779924949,82.4179\nCC-MAIN-2021-04,text/markdown,705,703,0.0000\nCC-MAIN-2021-04,text/plain,1993011,1991767,0.0586\nCC-MAIN-2021-04,text/prs.lines.tag,37036,37036,0.0011\nCC-MAIN-2021-04,text/tab-separated-values,13797,13797,0.0004\nCC-MAIN-2021-04,text/troff,12254,12254,0.0004\nCC-MAIN-2021-04,text/turtle,31193,31193,0.0009\nCC-MAIN-2021-04,text/vtt,17501,17501,0.0005\nCC-MAIN-2021-04,text/x-c++src,12493,12493,0.0004\nCC-MAIN-2021-04,text/x-chdr,29410,29409,0.0009\nCC-MAIN-2021-04,text/x-csrc,50641,50638,0.0015\nCC-MAIN-2021-04,text/x-diff,59202,59192,0.0017\nCC-MAIN-2021-04,text/x-jsp,2712,2706,0.0001\nCC-MAIN-2021-04,text/x-log,56193,56193,0.0017\nCC-MAIN-2021-04,text/x-matlab,60188,60099,0.0018\nCC-MAIN-2021-04,text/x-perl,95356,95351,0.0028\nCC-MAIN-2021-04,text/x-php,102587,102170,0.0030\nCC-MAIN-2021-04,text/x-python,13360,13360,0.0004\nCC-MAIN-2021-04,text/x-vcalendar,17858,17854,0.0005\nCC-MAIN-2021-04,text/x-vcard,103868,103746,0.0031\nCC-MAIN-2021-04,text/x-web-markdown,10278,10277,0.0003\nCC-MAIN-2021-04,text/x-yaml,6122,6122,0.0002\nCC-MAIN-2021-04,video/mp4,63637,63361,0.0019\nCC-MAIN-2021-04,video/quicktime,12659,12480,0.0004\nCC-MAIN-2021-04,video/webm,2524,2517,0.0001\nCC-MAIN-2021-04,video/x-m4v,2638,2614,0.0001\nCC-MAIN-2021-10,<other>,309719,309319,0.0113\nCC-MAIN-2021-10,application/atom+xml,2214067,2213143,0.0809\nCC-MAIN-2021-10,application/epub+zip,47614,47589,0.0017\nCC-MAIN-2021-10,application/gpx+xml,8768,8768,0.0003\nCC-MAIN-2021-10,application/gzip,48940,48849,0.0018\nCC-MAIN-2021-10,application/javascript,26947,26937,0.0010\nCC-MAIN-2021-10,application/json,499127,498951,0.0182\nCC-MAIN-2021-10,appl
ication/marc,5105,5105,0.0002\nCC-MAIN-2021-10,application/mbox,86680,86675,0.0032\nCC-MAIN-2021-10,application/msword,58544,58202,0.0021\nCC-MAIN-2021-10,application/octet-stream,315472,315086,0.0115\nCC-MAIN-2021-10,application/pdf,16358436,16312468,0.5977\nCC-MAIN-2021-10,application/pgp-signature,34334,34334,0.0013\nCC-MAIN-2021-10,application/pkcs7-signature,9484,9483,0.0003\nCC-MAIN-2021-10,application/postscript,2204,2203,0.0001\nCC-MAIN-2021-10,application/rdf+xml,203926,203827,0.0075\nCC-MAIN-2021-10,application/rss+xml,3189087,3184642,0.1165\nCC-MAIN-2021-10,application/rtf,59495,59483,0.0022\nCC-MAIN-2021-10,application/text,16789,16789,0.0006\nCC-MAIN-2021-10,application/vnd.android.package-archive,10592,10435,0.0004\nCC-MAIN-2021-10,application/vnd.google-earth.kml+xml,44022,44008,0.0016\nCC-MAIN-2021-10,application/vnd.google-earth.kmz,5280,5276,0.0002\nCC-MAIN-2021-10,application/vnd.ms-excel,54202,54131,0.0020\nCC-MAIN-2021-10,application/vnd.ms-powerpoint,24037,24018,0.0009\nCC-MAIN-2021-10,application/vnd.oasis.opendocument.spreadsheet,4740,4724,0.0002\nCC-MAIN-2021-10,application/vnd.oasis.opendocument.text,19065,19035,0.0007\nCC-MAIN-2021-10,application/vnd.openxmlformats-officedocument.presentationml.presentation,10421,10403,0.0004\nCC-MAIN-2021-10,application/vnd.openxmlformats-officedocument.spreadsheetml.sheet,31212,31166,0.0011\nCC-MAIN-2021-10,application/vnd.openxmlformats-officedocument.wordprocessingml.document,70175,69058,0.0026\nCC-MAIN-2021-10,application/x-bibtex-text-file,143844,143805,0.0053\nCC-MAIN-2021-10,application/x-bittorrent,7358,7146,0.0003\nCC-MAIN-2021-10,application/x-bzip2,20410,20399,0.0007\nCC-MAIN-2021-10,application/x-dosexec,8614,8358,0.0003\nCC-MAIN-2021-10,application/x-endnote-refer,49887,49883,0.0018\nCC-MAIN-2021-10,application/x-hdf,3272,3272,0.0001\nCC-MAIN-2021-10,application/x-mobipocket-ebook,11583,11578,0.0004\nCC-MAIN-2021-10,application/x-ms-asx,2797,2792,0.0001\nCC-MAIN-2021-10,application/x-msdownlo
ad,3770,3734,0.0001\nCC-MAIN-2021-10,application/x-rar-compressed,148,148,0.0000\nCC-MAIN-2021-10,application/x-research-info-systems,5092,5092,0.0002\nCC-MAIN-2021-10,application/x-sh,24077,24048,0.0009\nCC-MAIN-2021-10,application/x-shockwave-flash,9472,9444,0.0003\nCC-MAIN-2021-10,application/x-stata-do,20825,20662,0.0008\nCC-MAIN-2021-10,application/x-tex,6716,6716,0.0002\nCC-MAIN-2021-10,application/x-tex-tfm,267,267,0.0000\nCC-MAIN-2021-10,application/x-tika-msoffice,68725,68702,0.0025\nCC-MAIN-2021-10,application/x-tika-ooxml,63946,63826,0.0023\nCC-MAIN-2021-10,application/x-wais-source,5015,5015,0.0002\nCC-MAIN-2021-10,application/x-xz,2669,2668,0.0001\nCC-MAIN-2021-10,application/xhtml+xml,419171194,416585750,15.3164\nCC-MAIN-2021-10,application/xml,1850897,1847812,0.0676\nCC-MAIN-2021-10,application/zip,225280,223830,0.0082\nCC-MAIN-2021-10,application/zlib,11031,11008,0.0004\nCC-MAIN-2021-10,application/zstd,21532,21532,0.0008\nCC-MAIN-2021-10,audio/mp4,1293,1293,0.0000\nCC-MAIN-2021-10,audio/mpeg,154901,151808,0.0057\nCC-MAIN-2021-10,audio/vnd.wave,20210,20205,0.0007\nCC-MAIN-2021-10,audio/x-mpegurl,2257,2249,0.0001\nCC-MAIN-2021-10,image/gif,127286,126909,0.0047\nCC-MAIN-2021-10,image/jpeg,3768537,3757335,0.1377\nCC-MAIN-2021-10,image/png,561335,558887,0.0205\nCC-MAIN-2021-10,image/svg+xml,16012,15993,0.0006\nCC-MAIN-2021-10,image/tiff,11557,11552,0.0004\nCC-MAIN-2021-10,image/vnd.djvu,18607,18606,0.0007\nCC-MAIN-2021-10,image/vnd.dxf; 
format=ascii,8243,8240,0.0003\nCC-MAIN-2021-10,image/webp,4868,4863,0.0002\nCC-MAIN-2021-10,message/rfc822,49328,49188,0.0018\nCC-MAIN-2021-10,text/calendar,804243,804086,0.0294\nCC-MAIN-2021-10,text/css,6750,6749,0.0002\nCC-MAIN-2021-10,text/csv,103071,103064,0.0038\nCC-MAIN-2021-10,text/html,2283030149,2266517870,83.4212\nCC-MAIN-2021-10,text/markdown,511,511,0.0000\nCC-MAIN-2021-10,text/plain,1831224,1829640,0.0669\nCC-MAIN-2021-10,text/prs.lines.tag,32505,32504,0.0012\nCC-MAIN-2021-10,text/tab-separated-values,14790,14790,0.0005\nCC-MAIN-2021-10,text/troff,9905,9905,0.0004\nCC-MAIN-2021-10,text/turtle,28542,28542,0.0010\nCC-MAIN-2021-10,text/vtt,18760,18760,0.0007\nCC-MAIN-2021-10,text/x-c++src,9589,9589,0.0004\nCC-MAIN-2021-10,text/x-chdr,27067,27067,0.0010\nCC-MAIN-2021-10,text/x-csrc,51324,51324,0.0019\nCC-MAIN-2021-10,text/x-diff,58915,58915,0.0022\nCC-MAIN-2021-10,text/x-jsp,1914,1910,0.0001\nCC-MAIN-2021-10,text/x-log,48510,48509,0.0018\nCC-MAIN-2021-10,text/x-matlab,59846,59757,0.0022\nCC-MAIN-2021-10,text/x-perl,70586,70580,0.0026\nCC-MAIN-2021-10,text/x-php,83612,83350,0.0031\nCC-MAIN-2021-10,text/x-python,11845,11845,0.0004\nCC-MAIN-2021-10,text/x-vcalendar,19142,19142,0.0007\nCC-MAIN-2021-10,text/x-vcard,97145,97039,0.0035\nCC-MAIN-2021-10,text/x-web-markdown,8631,8629,0.0003\nCC-MAIN-2021-10,text/x-yaml,7499,7499,0.0003\nCC-MAIN-2021-10,video/mp4,50306,50166,0.0018\nCC-MAIN-2021-10,video/quicktime,7964,7916,0.0003\nCC-MAIN-2021-10,video/webm,2921,2915,0.0001\nCC-MAIN-2021-10,video/x-m4v,1278,1278,0.0000\nCC-MAIN-2021-17,<other>,348813,348244,0.0111\nCC-MAIN-2021-17,application/atom+xml,2329818,2329076,0.0743\nCC-MAIN-2021-17,application/epub+zip,49045,48974,0.0016\nCC-MAIN-2021-17,application/gpx+xml,13026,13024,0.0004\nCC-MAIN-2021-17,application/gzip,53029,52921,0.0017\nCC-MAIN-2021-17,application/javascript,25486,25449,0.0008\nCC-MAIN-2021-17,application/json,531571,531427,0.0170\nCC-MAIN-2021-17,application/marc,7485,7485,0.0002\nCC-MAIN-2021-17,
application/mbox,102869,102839,0.0033\nCC-MAIN-2021-17,application/msword,66297,66187,0.0021\nCC-MAIN-2021-17,application/octet-stream,357159,356780,0.0114\nCC-MAIN-2021-17,application/pdf,14802128,14762903,0.4722\nCC-MAIN-2021-17,application/pgp-signature,63977,63976,0.0020\nCC-MAIN-2021-17,application/pkcs7-signature,10771,10770,0.0003\nCC-MAIN-2021-17,application/postscript,2489,2487,0.0001\nCC-MAIN-2021-17,application/rdf+xml,225621,225537,0.0072\nCC-MAIN-2021-17,application/rss+xml,3533371,3527340,0.1127\nCC-MAIN-2021-17,application/rtf,52507,52497,0.0017\nCC-MAIN-2021-17,application/text,17842,17842,0.0006\nCC-MAIN-2021-17,application/vnd.android.package-archive,11866,11720,0.0004\nCC-MAIN-2021-17,application/vnd.google-earth.kml+xml,51932,51925,0.0017\nCC-MAIN-2021-17,application/vnd.google-earth.kmz,11466,11464,0.0004\nCC-MAIN-2021-17,application/vnd.ms-excel,54177,54120,0.0017\nCC-MAIN-2021-17,application/vnd.ms-powerpoint,23937,23926,0.0008\nCC-MAIN-2021-17,application/vnd.oasis.opendocument.spreadsheet,5594,5586,0.0002\nCC-MAIN-2021-17,application/vnd.oasis.opendocument.text,22959,22950,0.0007\nCC-MAIN-2021-17,application/vnd.openxmlformats-officedocument.presentationml.presentation,10309,10292,0.0003\nCC-MAIN-2021-17,application/vnd.openxmlformats-officedocument.spreadsheetml.sheet,33234,33188,0.0011\nCC-MAIN-2021-17,application/vnd.openxmlformats-officedocument.wordprocessingml.document,72444,72112,0.0023\nCC-MAIN-2021-17,application/x-bibtex-text-file,156021,155990,0.0050\nCC-MAIN-2021-17,application/x-bittorrent,7805,7582,0.0002\nCC-MAIN-2021-17,application/x-bzip2,24393,24381,0.0008\nCC-MAIN-2021-17,application/x-dosexec,11134,10879,0.0004\nCC-MAIN-2021-17,application/x-endnote-refer,53349,53349,0.0017\nCC-MAIN-2021-17,application/x-hdf,18372,18372,0.0006\nCC-MAIN-2021-17,application/x-mobipocket-ebook,14342,14331,0.0005\nCC-MAIN-2021-17,application/x-ms-asx,3529,3523,0.0001\nCC-MAIN-2021-17,application/x-msdownload,4733,4705,0.0002\nCC-MAIN-2021-17,
application/x-rar-compressed,145,145,0.0000\nCC-MAIN-2021-17,application/x-research-info-systems,3850,3850,0.0001\nCC-MAIN-2021-17,application/x-sh,27321,27281,0.0009\nCC-MAIN-2021-17,application/x-shockwave-flash,10255,10220,0.0003\nCC-MAIN-2021-17,application/x-stata-do,23858,23839,0.0008\nCC-MAIN-2021-17,application/x-tex,5825,5825,0.0002\nCC-MAIN-2021-17,application/x-tex-tfm,148,148,0.0000\nCC-MAIN-2021-17,application/x-tika-msoffice,82178,82118,0.0026\nCC-MAIN-2021-17,application/x-tika-ooxml,71904,71779,0.0023\nCC-MAIN-2021-17,application/x-wais-source,5783,5783,0.0002\nCC-MAIN-2021-17,application/x-xz,1833,1833,0.0001\nCC-MAIN-2021-17,application/xhtml+xml,477793901,475176954,15.2434\nCC-MAIN-2021-17,application/xml,2233055,2229677,0.0712\nCC-MAIN-2021-17,application/zip,233809,232270,0.0075\nCC-MAIN-2021-17,application/zlib,21687,21648,0.0007\nCC-MAIN-2021-17,application/zstd,26734,26734,0.0009\nCC-MAIN-2021-17,audio/mp4,2550,2460,0.0001\nCC-MAIN-2021-17,audio/mpeg,161378,158832,0.0051\nCC-MAIN-2021-17,audio/vnd.wave,11890,11850,0.0004\nCC-MAIN-2021-17,audio/x-mpegurl,2620,2618,0.0001\nCC-MAIN-2021-17,image/gif,143476,143121,0.0046\nCC-MAIN-2021-17,image/jpeg,5412932,5402665,0.1727\nCC-MAIN-2021-17,image/png,1034634,1031484,0.0330\nCC-MAIN-2021-17,image/svg+xml,27105,27063,0.0009\nCC-MAIN-2021-17,image/tiff,13495,13491,0.0004\nCC-MAIN-2021-17,image/vnd.djvu,12848,12847,0.0004\nCC-MAIN-2021-17,image/vnd.dxf; 
format=ascii,10020,10020,0.0003\nCC-MAIN-2021-17,image/webp,4223,4219,0.0001\nCC-MAIN-2021-17,message/rfc822,55638,55579,0.0018\nCC-MAIN-2021-17,text/calendar,831587,831246,0.0265\nCC-MAIN-2021-17,text/css,7090,7088,0.0002\nCC-MAIN-2021-17,text/csv,115957,115949,0.0037\nCC-MAIN-2021-17,text/html,2620015323,2604595127,83.5884\nCC-MAIN-2021-17,text/markdown,652,652,0.0000\nCC-MAIN-2021-17,text/plain,2043955,2042717,0.0652\nCC-MAIN-2021-17,text/prs.lines.tag,22283,22283,0.0007\nCC-MAIN-2021-17,text/tab-separated-values,13232,13232,0.0004\nCC-MAIN-2021-17,text/troff,8637,8636,0.0003\nCC-MAIN-2021-17,text/turtle,32892,32891,0.0010\nCC-MAIN-2021-17,text/vtt,18608,18608,0.0006\nCC-MAIN-2021-17,text/x-c++src,11240,11239,0.0004\nCC-MAIN-2021-17,text/x-chdr,26090,26087,0.0008\nCC-MAIN-2021-17,text/x-csrc,51576,51575,0.0016\nCC-MAIN-2021-17,text/x-diff,65381,65374,0.0021\nCC-MAIN-2021-17,text/x-jsp,2367,2364,0.0001\nCC-MAIN-2021-17,text/x-log,54146,54145,0.0017\nCC-MAIN-2021-17,text/x-matlab,62873,62772,0.0020\nCC-MAIN-2021-17,text/x-perl,77168,77113,0.0025\nCC-MAIN-2021-17,text/x-php,107363,107033,0.0034\nCC-MAIN-2021-17,text/x-python,12422,12419,0.0004\nCC-MAIN-2021-17,text/x-vcalendar,15864,15864,0.0005\nCC-MAIN-2021-17,text/x-vcard,107105,107032,0.0034\nCC-MAIN-2021-17,text/x-web-markdown,9165,9165,0.0003\nCC-MAIN-2021-17,text/x-yaml,7416,7416,0.0002\nCC-MAIN-2021-17,video/mp4,71158,70905,0.0023\nCC-MAIN-2021-17,video/quicktime,9160,9142,0.0003\nCC-MAIN-2021-17,video/webm,2819,2814,0.0001\nCC-MAIN-2021-17,video/x-m4v,1282,1275,0.0000\nCC-MAIN-2021-21,<other>,394790,394093,0.0150\nCC-MAIN-2021-21,application/atom+xml,2033614,2032976,0.0773\nCC-MAIN-2021-21,application/epub+zip,47427,47401,0.0018\nCC-MAIN-2021-21,application/gpx+xml,9855,9853,0.0004\nCC-MAIN-2021-21,application/gzip,47973,47905,0.0018\nCC-MAIN-2021-21,application/javascript,23441,23427,0.0009\nCC-MAIN-2021-21,application/json,516663,516392,0.0196\nCC-MAIN-2021-21,application/marc,3948,3948,0.0001\nCC-MAIN-20
21-21,application/mbox,100324,100312,0.0038\nCC-MAIN-2021-21,application/msword,57783,57618,0.0022\nCC-MAIN-2021-21,application/octet-stream,434809,434511,0.0165\nCC-MAIN-2021-21,application/pdf,27808355,27755330,1.0565\nCC-MAIN-2021-21,application/pgp-signature,47703,47703,0.0018\nCC-MAIN-2021-21,application/pkcs7-signature,8988,8988,0.0003\nCC-MAIN-2021-21,application/postscript,2789,2789,0.0001\nCC-MAIN-2021-21,application/rdf+xml,223683,223585,0.0085\nCC-MAIN-2021-21,application/rss+xml,3298724,3293737,0.1253\nCC-MAIN-2021-21,application/rtf,64855,64747,0.0025\nCC-MAIN-2021-21,application/text,14746,14746,0.0006\nCC-MAIN-2021-21,application/vnd.android.package-archive,9592,9487,0.0004\nCC-MAIN-2021-21,application/vnd.google-earth.kml+xml,59183,59173,0.0022\nCC-MAIN-2021-21,application/vnd.google-earth.kmz,9691,9686,0.0004\nCC-MAIN-2021-21,application/vnd.ms-excel,46823,46765,0.0018\nCC-MAIN-2021-21,application/vnd.ms-powerpoint,25270,25265,0.0010\nCC-MAIN-2021-21,application/vnd.oasis.opendocument.spreadsheet,6598,6578,0.0003\nCC-MAIN-2021-21,application/vnd.oasis.opendocument.text,24177,24143,0.0009\nCC-MAIN-2021-21,application/vnd.openxmlformats-officedocument.presentationml.presentation,9211,9179,0.0003\nCC-MAIN-2021-21,application/vnd.openxmlformats-officedocument.spreadsheetml.sheet,33252,33201,0.0013\nCC-MAIN-2021-21,application/vnd.openxmlformats-officedocument.wordprocessingml.document,69238,68657,0.0026\nCC-MAIN-2021-21,application/x-bibtex-text-file,161352,161310,0.0061\nCC-MAIN-2021-21,application/x-bittorrent,7108,7102,0.0003\nCC-MAIN-2021-21,application/x-bzip2,32438,32434,0.0012\nCC-MAIN-2021-21,application/x-dosexec,7473,7049,0.0003\nCC-MAIN-2021-21,application/x-endnote-refer,50919,50915,0.0019\nCC-MAIN-2021-21,application/x-hdf,4176,4176,0.0002\nCC-MAIN-2021-21,application/x-mobipocket-ebook,13938,13920,0.0005\nCC-MAIN-2021-21,application/x-ms-asx,11694,11689,0.0004\nCC-MAIN-2021-21,application/x-msdownload,3752,3719,0.0001\nCC-MAIN-2021-21,appl
ication/x-rar-compressed,257,257,0.0000\nCC-MAIN-2021-21,application/x-research-info-systems,4201,4201,0.0002\nCC-MAIN-2021-21,application/x-sh,26927,26890,0.0010\nCC-MAIN-2021-21,application/x-shockwave-flash,10999,10965,0.0004\nCC-MAIN-2021-21,application/x-stata-do,14028,14003,0.0005\nCC-MAIN-2021-21,application/x-tex,7031,7031,0.0003\nCC-MAIN-2021-21,application/x-tex-tfm,2200,2200,0.0001\nCC-MAIN-2021-21,application/x-tika-msoffice,82695,82621,0.0031\nCC-MAIN-2021-21,application/x-tika-ooxml,56989,56951,0.0022\nCC-MAIN-2021-21,application/x-wais-source,14752,14752,0.0006\nCC-MAIN-2021-21,application/x-xz,2630,2629,0.0001\nCC-MAIN-2021-21,application/xhtml+xml,392359024,390032219,14.9065\nCC-MAIN-2021-21,application/xml,1787123,1782707,0.0679\nCC-MAIN-2021-21,application/zip,195923,194836,0.0074\nCC-MAIN-2021-21,application/zlib,19437,19408,0.0007\nCC-MAIN-2021-21,application/zstd,20903,20903,0.0008\nCC-MAIN-2021-21,audio/mp4,1667,1667,0.0001\nCC-MAIN-2021-21,audio/mpeg,137638,135782,0.0052\nCC-MAIN-2021-21,audio/vnd.wave,9552,9427,0.0004\nCC-MAIN-2021-21,audio/x-mpegurl,2421,2418,0.0001\nCC-MAIN-2021-21,image/gif,120967,120563,0.0046\nCC-MAIN-2021-21,image/jpeg,4177631,4169443,0.1587\nCC-MAIN-2021-21,image/png,719129,716580,0.0273\nCC-MAIN-2021-21,image/svg+xml,18488,18480,0.0007\nCC-MAIN-2021-21,image/tiff,13221,13217,0.0005\nCC-MAIN-2021-21,image/vnd.djvu,5412,5401,0.0002\nCC-MAIN-2021-21,image/vnd.dxf; 
format=ascii,9450,9435,0.0004\nCC-MAIN-2021-21,image/webp,8854,8854,0.0003\nCC-MAIN-2021-21,message/rfc822,80174,80127,0.0030\nCC-MAIN-2021-21,text/calendar,760375,760210,0.0289\nCC-MAIN-2021-21,text/css,10401,10396,0.0004\nCC-MAIN-2021-21,text/csv,108442,108415,0.0041\nCC-MAIN-2021-21,text/html,2192574725,2179133576,83.3000\nCC-MAIN-2021-21,text/markdown,669,669,0.0000\nCC-MAIN-2021-21,text/plain,2219795,2217766,0.0843\nCC-MAIN-2021-21,text/prs.lines.tag,22419,22419,0.0009\nCC-MAIN-2021-21,text/tab-separated-values,16692,16692,0.0006\nCC-MAIN-2021-21,text/troff,9008,9008,0.0003\nCC-MAIN-2021-21,text/turtle,22498,22491,0.0009\nCC-MAIN-2021-21,text/vtt,19831,19831,0.0008\nCC-MAIN-2021-21,text/x-c++src,10495,10495,0.0004\nCC-MAIN-2021-21,text/x-chdr,21724,21722,0.0008\nCC-MAIN-2021-21,text/x-csrc,42951,42938,0.0016\nCC-MAIN-2021-21,text/x-diff,70484,70476,0.0027\nCC-MAIN-2021-21,text/x-jsp,6950,6946,0.0003\nCC-MAIN-2021-21,text/x-log,66398,66395,0.0025\nCC-MAIN-2021-21,text/x-matlab,65030,64814,0.0025\nCC-MAIN-2021-21,text/x-perl,79648,79635,0.0030\nCC-MAIN-2021-21,text/x-php,155611,154765,0.0059\nCC-MAIN-2021-21,text/x-python,15385,15384,0.0006\nCC-MAIN-2021-21,text/x-vcalendar,9704,9703,0.0004\nCC-MAIN-2021-21,text/x-vcard,106064,106038,0.0040\nCC-MAIN-2021-21,text/x-web-markdown,9865,9863,0.0004\nCC-MAIN-2021-21,text/x-yaml,9385,9385,0.0004\nCC-MAIN-2021-21,video/mp4,61412,61006,0.0023\nCC-MAIN-2021-21,video/quicktime,6544,6533,0.0002\nCC-MAIN-2021-21,video/webm,2835,2834,0.0001\nCC-MAIN-2021-21,video/x-m4v,1047,1044,0.0000\nCC-MAIN-2021-25,<other>,328263,327902,0.0134\nCC-MAIN-2021-25,application/atom+xml,1982638,1982115,0.0807\nCC-MAIN-2021-25,application/epub+zip,43746,43676,0.0018\nCC-MAIN-2021-25,application/gpx+xml,8565,8562,0.0003\nCC-MAIN-2021-25,application/gzip,51902,51795,0.0021\nCC-MAIN-2021-25,application/javascript,21279,21269,0.0009\nCC-MAIN-2021-25,application/json,509599,509120,0.0207\nCC-MAIN-2021-25,application/marc,6017,6017,0.0002\nCC-MAIN-2021
-25,application/mbox,85255,85240,0.0035\nCC-MAIN-2021-25,application/msword,47968,47857,0.0020\nCC-MAIN-2021-25,application/octet-stream,432891,432656,0.0176\nCC-MAIN-2021-25,application/pdf,13374869,13347159,0.5442\nCC-MAIN-2021-25,application/pgp-signature,69548,69535,0.0028\nCC-MAIN-2021-25,application/pkcs7-signature,8755,8755,0.0004\nCC-MAIN-2021-25,application/postscript,1649,1649,0.0001\nCC-MAIN-2021-25,application/rdf+xml,193638,193574,0.0079\nCC-MAIN-2021-25,application/rss+xml,2715250,2712029,0.1105\nCC-MAIN-2021-25,application/rtf,46706,46667,0.0019\nCC-MAIN-2021-25,application/text,13369,13369,0.0005\nCC-MAIN-2021-25,application/vnd.android.package-archive,8266,8157,0.0003\nCC-MAIN-2021-25,application/vnd.google-earth.kml+xml,48572,48568,0.0020\nCC-MAIN-2021-25,application/vnd.google-earth.kmz,8163,8161,0.0003\nCC-MAIN-2021-25,application/vnd.ms-excel,51189,51083,0.0021\nCC-MAIN-2021-25,application/vnd.ms-powerpoint,27988,27985,0.0011\nCC-MAIN-2021-25,application/vnd.oasis.opendocument.spreadsheet,5862,5858,0.0002\nCC-MAIN-2021-25,application/vnd.oasis.opendocument.text,18130,18120,0.0007\nCC-MAIN-2021-25,application/vnd.openxmlformats-officedocument.presentationml.presentation,5705,5699,0.0002\nCC-MAIN-2021-25,application/vnd.openxmlformats-officedocument.spreadsheetml.sheet,30527,30192,0.0012\nCC-MAIN-2021-25,application/vnd.openxmlformats-officedocument.wordprocessingml.document,59535,59433,0.0024\nCC-MAIN-2021-25,application/x-bibtex-text-file,167032,166885,0.0068\nCC-MAIN-2021-25,application/x-bittorrent,6454,6448,0.0003\nCC-MAIN-2021-25,application/x-bzip2,21622,21610,0.0009\nCC-MAIN-2021-25,application/x-dosexec,6537,6325,0.0003\nCC-MAIN-2021-25,application/x-endnote-refer,46151,46151,0.0019\nCC-MAIN-2021-25,application/x-hdf,3524,3518,0.0001\nCC-MAIN-2021-25,application/x-mobipocket-ebook,12118,12054,0.0005\nCC-MAIN-2021-25,application/x-ms-asx,6642,6638,0.0003\nCC-MAIN-2021-25,application/x-msdownload,5497,5473,0.0002\nCC-MAIN-2021-25,applicatio
n/x-rar-compressed,84,84,0.0000\nCC-MAIN-2021-25,application/x-research-info-systems,5744,5744,0.0002\nCC-MAIN-2021-25,application/x-sh,24200,24186,0.0010\nCC-MAIN-2021-25,application/x-shockwave-flash,8485,8465,0.0003\nCC-MAIN-2021-25,application/x-stata-do,23169,23111,0.0009\nCC-MAIN-2021-25,application/x-tex,8403,8403,0.0003\nCC-MAIN-2021-25,application/x-tex-tfm,2652,2652,0.0001\nCC-MAIN-2021-25,application/x-tika-msoffice,69153,69130,0.0028\nCC-MAIN-2021-25,application/x-tika-ooxml,61725,61677,0.0025\nCC-MAIN-2021-25,application/x-wais-source,7842,7842,0.0003\nCC-MAIN-2021-25,application/x-xz,3260,3259,0.0001\nCC-MAIN-2021-25,application/xhtml+xml,368242489,366293012,14.9836\nCC-MAIN-2021-25,application/xml,1643256,1641104,0.0669\nCC-MAIN-2021-25,application/zip,207389,206629,0.0084\nCC-MAIN-2021-25,application/zlib,14794,14754,0.0006\nCC-MAIN-2021-25,application/zstd,30982,30982,0.0013\nCC-MAIN-2021-25,audio/mp4,1172,1172,0.0000\nCC-MAIN-2021-25,audio/mpeg,132535,131207,0.0054\nCC-MAIN-2021-25,audio/vnd.wave,12132,12132,0.0005\nCC-MAIN-2021-25,audio/x-mpegurl,1232,1232,0.0001\nCC-MAIN-2021-25,image/gif,112513,112227,0.0046\nCC-MAIN-2021-25,image/jpeg,4638281,4624550,0.1887\nCC-MAIN-2021-25,image/png,909774,905956,0.0370\nCC-MAIN-2021-25,image/svg+xml,21255,21190,0.0009\nCC-MAIN-2021-25,image/tiff,12819,12817,0.0005\nCC-MAIN-2021-25,image/vnd.djvu,13524,13523,0.0006\nCC-MAIN-2021-25,image/vnd.dxf; 
format=ascii,10866,10862,0.0004\nCC-MAIN-2021-25,image/webp,7248,7248,0.0003\nCC-MAIN-2021-25,message/rfc822,64556,64541,0.0026\nCC-MAIN-2021-25,text/calendar,675526,675331,0.0275\nCC-MAIN-2021-25,text/css,6217,6215,0.0003\nCC-MAIN-2021-25,text/csv,96269,96256,0.0039\nCC-MAIN-2021-25,text/html,2057253268,2044807729,83.7088\nCC-MAIN-2021-25,text/markdown,215,215,0.0000\nCC-MAIN-2021-25,text/plain,2108287,2103396,0.0858\nCC-MAIN-2021-25,text/prs.lines.tag,25000,25000,0.0010\nCC-MAIN-2021-25,text/tab-separated-values,12927,12927,0.0005\nCC-MAIN-2021-25,text/troff,9135,9135,0.0004\nCC-MAIN-2021-25,text/turtle,26261,26258,0.0011\nCC-MAIN-2021-25,text/vtt,19402,19402,0.0008\nCC-MAIN-2021-25,text/x-c++src,8164,8164,0.0003\nCC-MAIN-2021-25,text/x-chdr,23230,23219,0.0009\nCC-MAIN-2021-25,text/x-csrc,54129,54119,0.0022\nCC-MAIN-2021-25,text/x-diff,65718,65711,0.0027\nCC-MAIN-2021-25,text/x-jsp,3527,3521,0.0001\nCC-MAIN-2021-25,text/x-log,57948,57948,0.0024\nCC-MAIN-2021-25,text/x-matlab,64164,64151,0.0026\nCC-MAIN-2021-25,text/x-perl,66995,66977,0.0027\nCC-MAIN-2021-25,text/x-php,88826,88564,0.0036\nCC-MAIN-2021-25,text/x-python,11590,11590,0.0005\nCC-MAIN-2021-25,text/x-vcalendar,9034,9034,0.0004\nCC-MAIN-2021-25,text/x-vcard,78177,78119,0.0032\nCC-MAIN-2021-25,text/x-web-markdown,8922,8919,0.0004\nCC-MAIN-2021-25,text/x-yaml,8426,8426,0.0003\nCC-MAIN-2021-25,video/mp4,65742,65596,0.0027\nCC-MAIN-2021-25,video/quicktime,7904,7886,0.0003\nCC-MAIN-2021-25,video/webm,2672,2667,0.0001\nCC-MAIN-2021-25,video/x-m4v,1126,1124,0.0000\nCC-MAIN-2021-31,<other>,289907,289439,0.0092\nCC-MAIN-2021-31,application/atom+xml,2174270,2173705,0.0687\nCC-MAIN-2021-31,application/epub+zip,35660,35649,0.0011\nCC-MAIN-2021-31,application/gpx+xml,7989,7989,0.0003\nCC-MAIN-2021-31,application/gzip,43555,43462,0.0014\nCC-MAIN-2021-31,application/javascript,18381,18376,0.0006\nCC-MAIN-2021-31,application/json,497438,496932,0.0157\nCC-MAIN-2021-31,application/marc,4674,4674,0.0001\nCC-MAIN-2021-31,appl
ication/mbox,84160,84150,0.0027\nCC-MAIN-2021-31,application/msword,42267,42129,0.0013\nCC-MAIN-2021-31,application/octet-stream,473026,472309,0.0149\nCC-MAIN-2021-31,application/pdf,8389141,8368352,0.2651\nCC-MAIN-2021-31,application/pgp-signature,33500,33476,0.0011\nCC-MAIN-2021-31,application/pkcs7-signature,5746,5745,0.0002\nCC-MAIN-2021-31,application/postscript,2289,2289,0.0001\nCC-MAIN-2021-31,application/rdf+xml,190021,189967,0.0060\nCC-MAIN-2021-31,application/rss+xml,2853435,2849801,0.0902\nCC-MAIN-2021-31,application/rtf,54020,54010,0.0017\nCC-MAIN-2021-31,application/text,14324,14323,0.0005\nCC-MAIN-2021-31,application/vnd.android.package-archive,7775,7679,0.0002\nCC-MAIN-2021-31,application/vnd.google-earth.kml+xml,48701,48695,0.0015\nCC-MAIN-2021-31,application/vnd.google-earth.kmz,10337,10337,0.0003\nCC-MAIN-2021-31,application/vnd.ms-excel,26323,26301,0.0008\nCC-MAIN-2021-31,application/vnd.ms-powerpoint,23301,23300,0.0007\nCC-MAIN-2021-31,application/vnd.oasis.opendocument.spreadsheet,4508,4505,0.0001\nCC-MAIN-2021-31,application/vnd.oasis.opendocument.text,12512,12508,0.0004\nCC-MAIN-2021-31,application/vnd.openxmlformats-officedocument.presentationml.presentation,5922,5911,0.0002\nCC-MAIN-2021-31,application/vnd.openxmlformats-officedocument.spreadsheetml.sheet,30096,30078,0.0010\nCC-MAIN-2021-31,application/vnd.openxmlformats-officedocument.wordprocessingml.document,53217,53115,0.0017\nCC-MAIN-2021-31,application/x-bibtex-text-file,163621,163472,0.0052\nCC-MAIN-2021-31,application/x-bittorrent,6461,6442,0.0002\nCC-MAIN-2021-31,application/x-bzip2,54284,54278,0.0017\nCC-MAIN-2021-31,application/x-dosexec,6175,5854,0.0002\nCC-MAIN-2021-31,application/x-endnote-refer,38364,38363,0.0012\nCC-MAIN-2021-31,application/x-hdf,5530,5530,0.0002\nCC-MAIN-2021-31,application/x-mobipocket-ebook,7944,7941,0.0003\nCC-MAIN-2021-31,application/x-ms-asx,4874,4873,0.0002\nCC-MAIN-2021-31,application/x-msdownload,3271,3237,0.0001\nCC-MAIN-2021-31,application/x-rar-co
mpressed,108,108,0.0000\nCC-MAIN-2021-31,application/x-research-info-systems,6702,6699,0.0002\nCC-MAIN-2021-31,application/x-sh,30053,30042,0.0009\nCC-MAIN-2021-31,application/x-shockwave-flash,6422,6398,0.0002\nCC-MAIN-2021-31,application/x-stata-do,18175,18175,0.0006\nCC-MAIN-2021-31,application/x-tex,5999,5999,0.0002\nCC-MAIN-2021-31,application/x-tex-tfm,2153,2153,0.0001\nCC-MAIN-2021-31,application/x-tika-msoffice,60474,60454,0.0019\nCC-MAIN-2021-31,application/x-tika-ooxml,49211,49199,0.0016\nCC-MAIN-2021-31,application/x-wais-source,5289,5289,0.0002\nCC-MAIN-2021-31,application/x-xz,9291,9291,0.0003\nCC-MAIN-2021-31,application/xhtml+xml,425050367,422982150,13.4293\nCC-MAIN-2021-31,application/xml,1670174,1667826,0.0528\nCC-MAIN-2021-31,application/zip,166182,165374,0.0053\nCC-MAIN-2021-31,application/zlib,10632,10595,0.0003\nCC-MAIN-2021-31,application/zstd,15436,15436,0.0005\nCC-MAIN-2021-31,audio/mp4,1050,1050,0.0000\nCC-MAIN-2021-31,audio/mpeg,103813,102538,0.0033\nCC-MAIN-2021-31,audio/vnd.wave,8740,8740,0.0003\nCC-MAIN-2021-31,audio/x-mpegurl,648,648,0.0000\nCC-MAIN-2021-31,image/gif,108298,107897,0.0034\nCC-MAIN-2021-31,image/jpeg,4731753,4719232,0.1495\nCC-MAIN-2021-31,image/png,1012785,1010605,0.0320\nCC-MAIN-2021-31,image/svg+xml,22796,22742,0.0007\nCC-MAIN-2021-31,image/tiff,11113,11110,0.0004\nCC-MAIN-2021-31,image/vnd.djvu,3570,3568,0.0001\nCC-MAIN-2021-31,image/vnd.dxf; 
format=ascii,9384,9384,0.0003\nCC-MAIN-2021-31,image/webp,3373,3372,0.0001\nCC-MAIN-2021-31,message/rfc822,51148,51116,0.0016\nCC-MAIN-2021-31,text/calendar,666054,665918,0.0210\nCC-MAIN-2021-31,text/css,8569,8564,0.0003\nCC-MAIN-2021-31,text/csv,94810,94784,0.0030\nCC-MAIN-2021-31,text/html,2712790424,2698103847,85.7097\nCC-MAIN-2021-31,text/markdown,249,249,0.0000\nCC-MAIN-2021-31,text/plain,1932007,1930385,0.0610\nCC-MAIN-2021-31,text/prs.lines.tag,22890,22889,0.0007\nCC-MAIN-2021-31,text/tab-separated-values,9604,9604,0.0003\nCC-MAIN-2021-31,text/troff,10958,10958,0.0003\nCC-MAIN-2021-31,text/turtle,27746,27745,0.0009\nCC-MAIN-2021-31,text/vtt,20469,20467,0.0006\nCC-MAIN-2021-31,text/x-c++src,9335,9334,0.0003\nCC-MAIN-2021-31,text/x-chdr,26270,26270,0.0008\nCC-MAIN-2021-31,text/x-csrc,49885,49882,0.0016\nCC-MAIN-2021-31,text/x-diff,49064,49062,0.0016\nCC-MAIN-2021-31,text/x-jsp,2200,2196,0.0001\nCC-MAIN-2021-31,text/x-log,72150,72147,0.0023\nCC-MAIN-2021-31,text/x-matlab,50156,50111,0.0016\nCC-MAIN-2021-31,text/x-perl,60883,60875,0.0019\nCC-MAIN-2021-31,text/x-php,96094,95826,0.0030\nCC-MAIN-2021-31,text/x-python,11301,11300,0.0004\nCC-MAIN-2021-31,text/x-vcalendar,7923,7923,0.0003\nCC-MAIN-2021-31,text/x-vcard,79116,79066,0.0025\nCC-MAIN-2021-31,text/x-web-markdown,7279,7279,0.0002\nCC-MAIN-2021-31,text/x-yaml,11086,11086,0.0004\nCC-MAIN-2021-31,video/mp4,61319,61245,0.0019\nCC-MAIN-2021-31,video/quicktime,6464,6463,0.0002\nCC-MAIN-2021-31,video/webm,2244,2242,0.0001\nCC-MAIN-2021-31,video/x-m4v,1148,1147,0.0000\nCC-MAIN-2021-39,<other>,425071,424538,0.0144\nCC-MAIN-2021-39,application/atom+xml,3696333,3695892,0.1249\nCC-MAIN-2021-39,application/epub+zip,63288,63247,0.0021\nCC-MAIN-2021-39,application/gpx+xml,13163,13162,0.0004\nCC-MAIN-2021-39,application/gzip,53582,53459,0.0018\nCC-MAIN-2021-39,application/javascript,25289,25236,0.0009\nCC-MAIN-2021-39,application/json,691088,690741,0.0233\nCC-MAIN-2021-39,application/marc,6127,6127,0.0002\nCC-MAIN-2021-39,ap
plication/mbox,125652,125649,0.0042\nCC-MAIN-2021-39,application/msword,79219,79073,0.0027\nCC-MAIN-2021-39,application/octet-stream,630811,630414,0.0213\nCC-MAIN-2021-39,application/pdf,27436510,27356768,0.9269\nCC-MAIN-2021-39,application/pgp-signature,63330,63329,0.0021\nCC-MAIN-2021-39,application/pkcs7-signature,10250,10246,0.0003\nCC-MAIN-2021-39,application/postscript,4630,4630,0.0002\nCC-MAIN-2021-39,application/rdf+xml,268341,268274,0.0091\nCC-MAIN-2021-39,application/rss+xml,4017235,4012997,0.1357\nCC-MAIN-2021-39,application/rtf,60882,60835,0.0021\nCC-MAIN-2021-39,application/text,21383,21383,0.0007\nCC-MAIN-2021-39,application/vnd.android.package-archive,9751,9616,0.0003\nCC-MAIN-2021-39,application/vnd.google-earth.kml+xml,68162,68151,0.0023\nCC-MAIN-2021-39,application/vnd.google-earth.kmz,12855,12854,0.0004\nCC-MAIN-2021-39,application/vnd.ms-excel,45795,45661,0.0015\nCC-MAIN-2021-39,application/vnd.ms-powerpoint,33038,33032,0.0011\nCC-MAIN-2021-39,application/vnd.oasis.opendocument.spreadsheet,8151,8137,0.0003\nCC-MAIN-2021-39,application/vnd.oasis.opendocument.text,26814,26801,0.0009\nCC-MAIN-2021-39,application/vnd.openxmlformats-officedocument.presentationml.presentation,10615,10592,0.0004\nCC-MAIN-2021-39,application/vnd.openxmlformats-officedocument.spreadsheetml.sheet,47415,47339,0.0016\nCC-MAIN-2021-39,application/vnd.openxmlformats-officedocument.wordprocessingml.document,89710,89303,0.0030\nCC-MAIN-2021-39,application/x-bibtex-text-file,258946,258910,0.0087\nCC-MAIN-2021-39,application/x-bittorrent,8641,8622,0.0003\nCC-MAIN-2021-39,application/x-bzip2,10997,10991,0.0004\nCC-MAIN-2021-39,application/x-dosexec,9582,9225,0.0003\nCC-MAIN-2021-39,application/x-endnote-refer,56140,56140,0.0019\nCC-MAIN-2021-39,application/x-hdf,22137,22137,0.0007\nCC-MAIN-2021-39,application/x-mobipocket-ebook,15081,15076,0.0005\nCC-MAIN-2021-39,application/x-ms-asx,9169,9160,0.0003\nCC-MAIN-2021-39,application/x-msdownload,4777,4709,0.0002\nCC-MAIN-2021-39,applic
ation/x-rar-compressed,216,216,0.0000\nCC-MAIN-2021-39,application/x-research-info-systems,10669,10669,0.0004\nCC-MAIN-2021-39,application/x-sh,34089,34062,0.0012\nCC-MAIN-2021-39,application/x-shockwave-flash,12160,12101,0.0004\nCC-MAIN-2021-39,application/x-stata-do,37337,37328,0.0013\nCC-MAIN-2021-39,application/x-tex,11613,11600,0.0004\nCC-MAIN-2021-39,application/x-tex-tfm,1403,1403,0.0000\nCC-MAIN-2021-39,application/x-tika-msoffice,106991,106952,0.0036\nCC-MAIN-2021-39,application/x-tika-ooxml,95678,95662,0.0032\nCC-MAIN-2021-39,application/x-wais-source,6571,6571,0.0002\nCC-MAIN-2021-39,application/x-xz,8162,8162,0.0003\nCC-MAIN-2021-39,application/xhtml+xml,431175186,428942570,14.5672\nCC-MAIN-2021-39,application/xml,2116672,2112665,0.0715\nCC-MAIN-2021-39,application/zip,272926,271474,0.0092\nCC-MAIN-2021-39,application/zlib,4290,4219,0.0001\nCC-MAIN-2021-39,application/zstd,23647,23646,0.0008\nCC-MAIN-2021-39,audio/mp4,1765,1764,0.0001\nCC-MAIN-2021-39,audio/mpeg,184241,182434,0.0062\nCC-MAIN-2021-39,audio/vnd.wave,16261,16252,0.0005\nCC-MAIN-2021-39,audio/x-mpegurl,1806,1806,0.0001\nCC-MAIN-2021-39,image/gif,144574,143979,0.0049\nCC-MAIN-2021-39,image/jpeg,5680600,5668144,0.1919\nCC-MAIN-2021-39,image/png,943849,941377,0.0319\nCC-MAIN-2021-39,image/svg+xml,28196,28073,0.0010\nCC-MAIN-2021-39,image/tiff,20254,20249,0.0007\nCC-MAIN-2021-39,image/vnd.djvu,12521,12481,0.0004\nCC-MAIN-2021-39,image/vnd.dxf; 
format=ascii,12015,12012,0.0004\nCC-MAIN-2021-39,image/webp,8928,8882,0.0003\nCC-MAIN-2021-39,message/rfc822,79512,79469,0.0027\nCC-MAIN-2021-39,text/asp,1,1,0.0000\nCC-MAIN-2021-39,text/calendar,1188775,1188472,0.0402\nCC-MAIN-2021-39,text/css,12693,12686,0.0004\nCC-MAIN-2021-39,text/csv,142256,142224,0.0048\nCC-MAIN-2021-39,text/html,2475190266,2460006144,83.6240\nCC-MAIN-2021-39,text/markdown,223,223,0.0000\nCC-MAIN-2021-39,text/plain,2899626,2897312,0.0980\nCC-MAIN-2021-39,text/prs.lines.tag,61028,61028,0.0021\nCC-MAIN-2021-39,text/tab-separated-values,21652,21652,0.0007\nCC-MAIN-2021-39,text/troff,13487,13487,0.0005\nCC-MAIN-2021-39,text/turtle,34680,34670,0.0012\nCC-MAIN-2021-39,text/vtt,31256,31256,0.0011\nCC-MAIN-2021-39,text/x-c++src,14533,14530,0.0005\nCC-MAIN-2021-39,text/x-chdr,31088,31086,0.0011\nCC-MAIN-2021-39,text/x-csrc,59027,59024,0.0020\nCC-MAIN-2021-39,text/x-diff,67309,67290,0.0023\nCC-MAIN-2021-39,text/x-jsp,2954,2947,0.0001\nCC-MAIN-2021-39,text/x-log,74019,74017,0.0025\nCC-MAIN-2021-39,text/x-matlab,79234,79155,0.0027\nCC-MAIN-2021-39,text/x-perl,86800,86781,0.0029\nCC-MAIN-2021-39,text/x-php,104132,103815,0.0035\nCC-MAIN-2021-39,text/x-python,16640,16637,0.0006\nCC-MAIN-2021-39,text/x-vcalendar,13809,13808,0.0005\nCC-MAIN-2021-39,text/x-vcard,146189,146093,0.0049\nCC-MAIN-2021-39,text/x-web-markdown,9841,9839,0.0003\nCC-MAIN-2021-39,text/x-yaml,14782,14781,0.0005\nCC-MAIN-2021-39,video/mp4,79704,79588,0.0027\nCC-MAIN-2021-39,video/quicktime,10111,10101,0.0003\nCC-MAIN-2021-39,video/webm,4017,4005,0.0001\nCC-MAIN-2021-39,video/x-m4v,1555,1551,0.0001\nCC-MAIN-2021-43,<other>,472348,471797,0.0141\nCC-MAIN-2021-43,application/atom+xml,3033553,3033206,0.0906\nCC-MAIN-2021-43,application/epub+zip,61275,61241,0.0018\nCC-MAIN-2021-43,application/gpx+xml,14915,14915,0.0004\nCC-MAIN-2021-43,application/gzip,64406,64278,0.0019\nCC-MAIN-2021-43,application/javascript,23544,23526,0.0007\nCC-MAIN-2021-43,application/json,733400,733206,0.0219\nCC-MAIN-2021
-43,application/marc,12767,12767,0.0004\nCC-MAIN-2021-43,application/mbox,124633,124628,0.0037\nCC-MAIN-2021-43,application/msword,85942,85738,0.0026\nCC-MAIN-2021-43,application/octet-stream,728878,728530,0.0218\nCC-MAIN-2021-43,application/pdf,34368722,34302165,1.0262\nCC-MAIN-2021-43,application/pgp-signature,82685,82621,0.0025\nCC-MAIN-2021-43,application/pkcs7-signature,13723,13722,0.0004\nCC-MAIN-2021-43,application/postscript,4920,4920,0.0001\nCC-MAIN-2021-43,application/rdf+xml,288522,288402,0.0086\nCC-MAIN-2021-43,application/rss+xml,3867584,3864053,0.1155\nCC-MAIN-2021-43,application/rtf,61134,61121,0.0018\nCC-MAIN-2021-43,application/text,23922,23922,0.0007\nCC-MAIN-2021-43,application/vnd.android.package-archive,11414,11286,0.0003\nCC-MAIN-2021-43,application/vnd.google-earth.kml+xml,68948,68930,0.0021\nCC-MAIN-2021-43,application/vnd.google-earth.kmz,11031,11031,0.0003\nCC-MAIN-2021-43,application/vnd.ms-excel,56013,55858,0.0017\nCC-MAIN-2021-43,application/vnd.ms-powerpoint,38616,38591,0.0012\nCC-MAIN-2021-43,application/vnd.oasis.opendocument.spreadsheet,14928,14899,0.0004\nCC-MAIN-2021-43,application/vnd.oasis.opendocument.text,29580,29567,0.0009\nCC-MAIN-2021-43,application/vnd.openxmlformats-officedocument.presentationml.presentation,9657,9635,0.0003\nCC-MAIN-2021-43,application/vnd.openxmlformats-officedocument.spreadsheetml.sheet,46570,46459,0.0014\nCC-MAIN-2021-43,application/vnd.openxmlformats-officedocument.wordprocessingml.document,105205,104829,0.0031\nCC-MAIN-2021-43,application/x-bibtex-text-file,246788,246772,0.0074\nCC-MAIN-2021-43,application/x-bittorrent,11951,11908,0.0004\nCC-MAIN-2021-43,application/x-bzip2,44548,44532,0.0013\nCC-MAIN-2021-43,application/x-dosexec,9288,8830,0.0003\nCC-MAIN-2021-43,application/x-endnote-refer,66481,66481,0.0020\nCC-MAIN-2021-43,application/x-hdf,12186,12186,0.0004\nCC-MAIN-2021-43,application/x-mobipocket-ebook,12903,12897,0.0004\nCC-MAIN-2021-43,application/x-ms-asx,7164,7163,0.0002\nCC-MAIN-2021-43,
application/x-msdownload,5402,5315,0.0002\nCC-MAIN-2021-43,application/x-rar-compressed,384,384,0.0000\nCC-MAIN-2021-43,application/x-research-info-systems,8588,8588,0.0003\nCC-MAIN-2021-43,application/x-sh,37017,36997,0.0011\nCC-MAIN-2021-43,application/x-shockwave-flash,11735,11695,0.0004\nCC-MAIN-2021-43,application/x-stata-do,31690,31668,0.0009\nCC-MAIN-2021-43,application/x-tex,11196,11196,0.0003\nCC-MAIN-2021-43,application/x-tex-tfm,7783,7783,0.0002\nCC-MAIN-2021-43,application/x-tika-msoffice,104029,104007,0.0031\nCC-MAIN-2021-43,application/x-tika-ooxml,93537,93502,0.0028\nCC-MAIN-2021-43,application/x-wais-source,7513,7513,0.0002\nCC-MAIN-2021-43,application/x-xz,15942,15940,0.0005\nCC-MAIN-2021-43,application/xhtml+xml,471022080,468725372,14.0638\nCC-MAIN-2021-43,application/xml,2156307,2152906,0.0644\nCC-MAIN-2021-43,application/zip,321328,318718,0.0096\nCC-MAIN-2021-43,application/zlib,4768,4708,0.0001\nCC-MAIN-2021-43,application/zstd,34194,34140,0.0010\nCC-MAIN-2021-43,audio/mp4,1771,1770,0.0001\nCC-MAIN-2021-43,audio/mpeg,174814,173095,0.0052\nCC-MAIN-2021-43,audio/vnd.wave,17660,17597,0.0005\nCC-MAIN-2021-43,audio/x-mpegurl,4970,4970,0.0001\nCC-MAIN-2021-43,image/gif,140546,139761,0.0042\nCC-MAIN-2021-43,image/jpeg,5628783,5612367,0.1681\nCC-MAIN-2021-43,image/png,902089,897238,0.0269\nCC-MAIN-2021-43,image/svg+xml,28818,28717,0.0009\nCC-MAIN-2021-43,image/tiff,22324,22166,0.0007\nCC-MAIN-2021-43,image/vnd.djvu,18170,18138,0.0005\nCC-MAIN-2021-43,image/vnd.dxf; 
format=ascii,11477,11475,0.0003\nCC-MAIN-2021-43,image/webp,11294,11276,0.0003\nCC-MAIN-2021-43,message/rfc822,83098,83042,0.0025\nCC-MAIN-2021-43,text/asp,1,1,0.0000\nCC-MAIN-2021-43,text/calendar,1203673,1203198,0.0359\nCC-MAIN-2021-43,text/css,11266,11255,0.0003\nCC-MAIN-2021-43,text/csv,163175,163126,0.0049\nCC-MAIN-2021-43,text/html,2817607848,2803110474,84.1283\nCC-MAIN-2021-43,text/markdown,573,573,0.0000\nCC-MAIN-2021-43,text/plain,3318608,3317099,0.0991\nCC-MAIN-2021-43,text/prs.lines.tag,70908,70908,0.0021\nCC-MAIN-2021-43,text/tab-separated-values,22271,22270,0.0007\nCC-MAIN-2021-43,text/troff,20200,20198,0.0006\nCC-MAIN-2021-43,text/turtle,38431,38428,0.0011\nCC-MAIN-2021-43,text/vtt,31688,31688,0.0009\nCC-MAIN-2021-43,text/x-c++src,13680,13680,0.0004\nCC-MAIN-2021-43,text/x-chdr,34235,34232,0.0010\nCC-MAIN-2021-43,text/x-csrc,64917,64915,0.0019\nCC-MAIN-2021-43,text/x-diff,77579,77570,0.0023\nCC-MAIN-2021-43,text/x-jsp,3725,3715,0.0001\nCC-MAIN-2021-43,text/x-log,67509,67507,0.0020\nCC-MAIN-2021-43,text/x-matlab,89957,89909,0.0027\nCC-MAIN-2021-43,text/x-perl,84655,84603,0.0025\nCC-MAIN-2021-43,text/x-php,167759,167120,0.0050\nCC-MAIN-2021-43,text/x-python,22095,22094,0.0007\nCC-MAIN-2021-43,text/x-vcalendar,14350,14348,0.0004\nCC-MAIN-2021-43,text/x-vcard,142820,142804,0.0043\nCC-MAIN-2021-43,text/x-web-markdown,14539,14532,0.0004\nCC-MAIN-2021-43,text/x-yaml,12097,12097,0.0004\nCC-MAIN-2021-43,video/mp4,76488,75954,0.0023\nCC-MAIN-2021-43,video/quicktime,8096,8089,0.0002\nCC-MAIN-2021-43,video/webm,4066,4065,0.0001\nCC-MAIN-2021-43,video/x-m4v,1355,1355,0.0000\nCC-MAIN-2021-49,<other>,520530,519881,0.0206\nCC-MAIN-2021-49,application/atom+xml,3264036,3263615,0.1292\nCC-MAIN-2021-49,application/epub+zip,68476,68433,0.0027\nCC-MAIN-2021-49,application/gpx+xml,16868,16866,0.0007\nCC-MAIN-2021-49,application/gzip,79763,79622,0.0032\nCC-MAIN-2021-49,application/javascript,37090,37010,0.0015\nCC-MAIN-2021-49,application/json,816804,816492,0.0323\nCC-MAIN-20
21-49,application/marc,11724,11724,0.0005\nCC-MAIN-2021-49,application/mbox,146734,146704,0.0058\nCC-MAIN-2021-49,application/msword,92942,92518,0.0037\nCC-MAIN-2021-49,application/octet-stream,793113,792633,0.0314\nCC-MAIN-2021-49,application/pdf,35652626,35567433,1.4108\nCC-MAIN-2021-49,application/pgp-signature,85744,85743,0.0034\nCC-MAIN-2021-49,application/pkcs7-signature,13167,13163,0.0005\nCC-MAIN-2021-49,application/postscript,6656,6651,0.0003\nCC-MAIN-2021-49,application/rdf+xml,306493,306393,0.0121\nCC-MAIN-2021-49,application/rss+xml,3716385,3713030,0.1471\nCC-MAIN-2021-49,application/rtf,68467,68407,0.0027\nCC-MAIN-2021-49,application/text,20265,20265,0.0008\nCC-MAIN-2021-49,application/vnd.android.package-archive,8111,7965,0.0003\nCC-MAIN-2021-49,application/vnd.google-earth.kml+xml,73821,73777,0.0029\nCC-MAIN-2021-49,application/vnd.google-earth.kmz,11859,11856,0.0005\nCC-MAIN-2021-49,application/vnd.ms-excel,60934,60745,0.0024\nCC-MAIN-2021-49,application/vnd.ms-powerpoint,36372,36362,0.0014\nCC-MAIN-2021-49,application/vnd.oasis.opendocument.spreadsheet,12862,12850,0.0005\nCC-MAIN-2021-49,application/vnd.oasis.opendocument.text,33823,33793,0.0013\nCC-MAIN-2021-49,application/vnd.openxmlformats-officedocument.presentationml.presentation,11321,11244,0.0004\nCC-MAIN-2021-49,application/vnd.openxmlformats-officedocument.spreadsheetml.sheet,59281,58976,0.0023\nCC-MAIN-2021-49,application/vnd.openxmlformats-officedocument.wordprocessingml.document,103725,103316,0.0041\nCC-MAIN-2021-49,application/x-bibtex-text-file,267161,267126,0.0106\nCC-MAIN-2021-49,application/x-bittorrent,10564,10557,0.0004\nCC-MAIN-2021-49,application/x-bzip2,32965,32949,0.0013\nCC-MAIN-2021-49,application/x-dosexec,8721,8373,0.0003\nCC-MAIN-2021-49,application/x-endnote-refer,77426,77426,0.0031\nCC-MAIN-2021-49,application/x-hdf,64854,64854,0.0026\nCC-MAIN-2021-49,application/x-mobipocket-ebook,13440,13408,0.0005\nCC-MAIN-2021-49,application/x-ms-asx,7005,7004,0.0003\nCC-MAIN-2021-4
9,application/x-msdownload,5397,5308,0.0002\nCC-MAIN-2021-49,application/x-rar-compressed,272,272,0.0000\nCC-MAIN-2021-49,application/x-research-info-systems,7711,7711,0.0003\nCC-MAIN-2021-49,application/x-sh,39690,39674,0.0016\nCC-MAIN-2021-49,application/x-shockwave-flash,13197,13166,0.0005\nCC-MAIN-2021-49,application/x-stata-do,29579,29541,0.0012\nCC-MAIN-2021-49,application/x-tex,11765,11758,0.0005\nCC-MAIN-2021-49,application/x-tex-tfm,11259,11259,0.0004\nCC-MAIN-2021-49,application/x-tika-msoffice,117049,116995,0.0046\nCC-MAIN-2021-49,application/x-tika-ooxml,109506,109458,0.0043\nCC-MAIN-2021-49,application/x-wais-source,11088,11088,0.0004\nCC-MAIN-2021-49,application/x-xz,15299,15298,0.0006\nCC-MAIN-2021-49,application/xhtml+xml,369701083,367371422,14.6296\nCC-MAIN-2021-49,application/xml,2064894,2062305,0.0817\nCC-MAIN-2021-49,application/zip,334611,332721,0.0132\nCC-MAIN-2021-49,application/zlib,5568,5505,0.0002\nCC-MAIN-2021-49,application/zstd,35405,35404,0.0014\nCC-MAIN-2021-49,audio/mp4,2331,2328,0.0001\nCC-MAIN-2021-49,audio/mpeg,200960,198962,0.0080\nCC-MAIN-2021-49,audio/vnd.wave,20677,20580,0.0008\nCC-MAIN-2021-49,audio/x-mpegurl,7484,7484,0.0003\nCC-MAIN-2021-49,image/gif,163519,162996,0.0065\nCC-MAIN-2021-49,image/jpeg,6117165,6104558,0.2421\nCC-MAIN-2021-49,image/png,992984,990247,0.0393\nCC-MAIN-2021-49,image/svg+xml,32185,32156,0.0013\nCC-MAIN-2021-49,image/tiff,27827,27824,0.0011\nCC-MAIN-2021-49,image/vnd.djvu,24552,24551,0.0010\nCC-MAIN-2021-49,image/vnd.dxf; 
format=ascii,14973,14971,0.0006\nCC-MAIN-2021-49,image/webp,19736,19705,0.0008\nCC-MAIN-2021-49,message/rfc822,99414,98557,0.0039\nCC-MAIN-2021-49,text/calendar,1291503,1291258,0.0511\nCC-MAIN-2021-49,text/css,11691,11632,0.0005\nCC-MAIN-2021-49,text/csv,164445,164391,0.0065\nCC-MAIN-2021-49,text/html,2093818470,2079835824,82.8554\nCC-MAIN-2021-49,text/markdown,1071,1071,0.0000\nCC-MAIN-2021-49,text/plain,3655076,3652190,0.1446\nCC-MAIN-2021-49,text/prs.lines.tag,133369,133369,0.0053\nCC-MAIN-2021-49,text/tab-separated-values,30255,30255,0.0012\nCC-MAIN-2021-49,text/troff,18645,18644,0.0007\nCC-MAIN-2021-49,text/turtle,49474,49473,0.0020\nCC-MAIN-2021-49,text/vtt,29766,29766,0.0012\nCC-MAIN-2021-49,text/x-c++src,22800,22800,0.0009\nCC-MAIN-2021-49,text/x-chdr,51147,51145,0.0020\nCC-MAIN-2021-49,text/x-csrc,78016,78011,0.0031\nCC-MAIN-2021-49,text/x-diff,74089,74020,0.0029\nCC-MAIN-2021-49,text/x-jsp,4507,4502,0.0002\nCC-MAIN-2021-49,text/x-log,125293,125291,0.0050\nCC-MAIN-2021-49,text/x-matlab,94650,94642,0.0037\nCC-MAIN-2021-49,text/x-perl,97657,97620,0.0039\nCC-MAIN-2021-49,text/x-php,137631,137228,0.0054\nCC-MAIN-2021-49,text/x-python,26042,26039,0.0010\nCC-MAIN-2021-49,text/x-vcalendar,22395,22393,0.0009\nCC-MAIN-2021-49,text/x-vcard,152286,152247,0.0060\nCC-MAIN-2021-49,text/x-web-markdown,15685,15679,0.0006\nCC-MAIN-2021-49,text/x-yaml,14366,14365,0.0006\nCC-MAIN-2021-49,video/mp4,89817,89009,0.0036\nCC-MAIN-2021-49,video/quicktime,10846,10840,0.0004\nCC-MAIN-2021-49,video/webm,3692,3692,0.0001\nCC-MAIN-2021-49,video/x-m4v,1807,1803,0.0001\nCC-MAIN-2022-05,<other>,465857,465234,0.0156\nCC-MAIN-2022-05,application/atom+xml,2593808,2593458,0.0869\nCC-MAIN-2022-05,application/epub+zip,74019,73984,0.0025\nCC-MAIN-2022-05,application/gpx+xml,11981,11981,0.0004\nCC-MAIN-2022-05,application/gzip,82373,82262,0.0028\nCC-MAIN-2022-05,application/javascript,23662,23571,0.0008\nCC-MAIN-2022-05,application/json,809975,809754,0.0271\nCC-MAIN-2022-05,application/marc,51701,
51701,0.0017\nCC-MAIN-2022-05,application/mbox,129493,129457,0.0043\nCC-MAIN-2022-05,application/msword,73117,72925,0.0024\nCC-MAIN-2022-05,application/octet-stream,746239,745535,0.0250\nCC-MAIN-2022-05,application/pdf,25454705,25396339,0.8524\nCC-MAIN-2022-05,application/pgp-signature,85984,85982,0.0029\nCC-MAIN-2022-05,application/pkcs7-signature,10426,10425,0.0003\nCC-MAIN-2022-05,application/postscript,3942,3941,0.0001\nCC-MAIN-2022-05,application/rdf+xml,343004,342941,0.0115\nCC-MAIN-2022-05,application/rss+xml,3562381,3558754,0.1193\nCC-MAIN-2022-05,application/rtf,59023,59021,0.0020\nCC-MAIN-2022-05,application/text,12077,12077,0.0004\nCC-MAIN-2022-05,application/vnd.android.package-archive,7267,7152,0.0002\nCC-MAIN-2022-05,application/vnd.google-earth.kml+xml,74375,74348,0.0025\nCC-MAIN-2022-05,application/vnd.google-earth.kmz,24690,24688,0.0008\nCC-MAIN-2022-05,application/vnd.ms-excel,47428,47267,0.0016\nCC-MAIN-2022-05,application/vnd.ms-powerpoint,20219,20216,0.0007\nCC-MAIN-2022-05,application/vnd.oasis.opendocument.spreadsheet,10718,10698,0.0004\nCC-MAIN-2022-05,application/vnd.oasis.opendocument.text,32667,32661,0.0011\nCC-MAIN-2022-05,application/vnd.openxmlformats-officedocument.presentationml.presentation,7907,7832,0.0003\nCC-MAIN-2022-05,application/vnd.openxmlformats-officedocument.spreadsheetml.sheet,51197,51053,0.0017\nCC-MAIN-2022-05,application/vnd.openxmlformats-officedocument.wordprocessingml.document,76264,76047,0.0026\nCC-MAIN-2022-05,application/x-bibtex-text-file,256154,256148,0.0086\nCC-MAIN-2022-05,application/x-bittorrent,9317,9309,0.0003\nCC-MAIN-2022-05,application/x-bzip2,22120,22113,0.0007\nCC-MAIN-2022-05,application/x-dosexec,6501,6241,0.0002\nCC-MAIN-2022-05,application/x-endnote-refer,73599,73599,0.0025\nCC-MAIN-2022-05,application/x-hdf,14558,14558,0.0005\nCC-MAIN-2022-05,application/x-mobipocket-ebook,14145,14139,0.0005\nCC-MAIN-2022-05,application/x-ms-asx,5687,5686,0.0002\nCC-MAIN-2022-05,application/x-msdownload,4290,422
6,0.0001\nCC-MAIN-2022-05,application/x-rar-compressed,360,360,0.0000\nCC-MAIN-2022-05,application/x-research-info-systems,7411,7411,0.0002\nCC-MAIN-2022-05,application/x-sh,45421,45403,0.0015\nCC-MAIN-2022-05,application/x-shockwave-flash,10013,9986,0.0003\nCC-MAIN-2022-05,application/x-stata-do,38614,38613,0.0013\nCC-MAIN-2022-05,application/x-tex,15237,15234,0.0005\nCC-MAIN-2022-05,application/x-tex-tfm,16059,16059,0.0005\nCC-MAIN-2022-05,application/x-tika-msoffice,98580,98562,0.0033\nCC-MAIN-2022-05,application/x-tika-ooxml,87054,87025,0.0029\nCC-MAIN-2022-05,application/x-wais-source,7670,7670,0.0003\nCC-MAIN-2022-05,application/x-xz,22062,22061,0.0007\nCC-MAIN-2022-05,application/xhtml+xml,419969054,417838306,14.0628\nCC-MAIN-2022-05,application/xml,2323465,2321012,0.0778\nCC-MAIN-2022-05,application/zip,323605,321883,0.0108\nCC-MAIN-2022-05,application/zlib,6432,6403,0.0002\nCC-MAIN-2022-05,application/zstd,54351,54349,0.0018\nCC-MAIN-2022-05,audio/mp4,1806,1792,0.0001\nCC-MAIN-2022-05,audio/mpeg,159944,158095,0.0054\nCC-MAIN-2022-05,audio/vnd.wave,20192,20083,0.0007\nCC-MAIN-2022-05,audio/x-mpegurl,7890,7888,0.0003\nCC-MAIN-2022-05,image/gif,145430,145063,0.0049\nCC-MAIN-2022-05,image/jpeg,4856181,4848026,0.1626\nCC-MAIN-2022-05,image/png,744267,742253,0.0249\nCC-MAIN-2022-05,image/svg+xml,29708,29690,0.0010\nCC-MAIN-2022-05,image/tiff,52423,52422,0.0018\nCC-MAIN-2022-05,image/vnd.djvu,19428,19426,0.0007\nCC-MAIN-2022-05,image/vnd.dxf; 
format=ascii,11740,11740,0.0004\nCC-MAIN-2022-05,image/webp,12985,12879,0.0004\nCC-MAIN-2022-05,message/rfc822,92925,92895,0.0031\nCC-MAIN-2022-05,text/calendar,1094160,1093999,0.0366\nCC-MAIN-2022-05,text/css,11891,11859,0.0004\nCC-MAIN-2022-05,text/csv,148532,148479,0.0050\nCC-MAIN-2022-05,text/html,2515948973,2502857817,84.2471\nCC-MAIN-2022-05,text/markdown,1653,1653,0.0001\nCC-MAIN-2022-05,text/plain,3558432,3557096,0.1192\nCC-MAIN-2022-05,text/prs.lines.tag,104115,104114,0.0035\nCC-MAIN-2022-05,text/tab-separated-values,25510,25510,0.0009\nCC-MAIN-2022-05,text/troff,20589,20589,0.0007\nCC-MAIN-2022-05,text/turtle,48277,48274,0.0016\nCC-MAIN-2022-05,text/vtt,19911,19908,0.0007\nCC-MAIN-2022-05,text/x-c++src,20959,20959,0.0007\nCC-MAIN-2022-05,text/x-chdr,49225,49225,0.0016\nCC-MAIN-2022-05,text/x-csrc,76451,76449,0.0026\nCC-MAIN-2022-05,text/x-diff,67682,67651,0.0023\nCC-MAIN-2022-05,text/x-jsp,4286,4279,0.0001\nCC-MAIN-2022-05,text/x-log,82203,82201,0.0028\nCC-MAIN-2022-05,text/x-matlab,99150,99149,0.0033\nCC-MAIN-2022-05,text/x-perl,80967,80963,0.0027\nCC-MAIN-2022-05,text/x-php,108246,107825,0.0036\nCC-MAIN-2022-05,text/x-python,30195,30195,0.0010\nCC-MAIN-2022-05,text/x-vcalendar,15639,15639,0.0005\nCC-MAIN-2022-05,text/x-vcard,125851,125817,0.0042\nCC-MAIN-2022-05,text/x-web-markdown,17789,17787,0.0006\nCC-MAIN-2022-05,text/x-yaml,19483,19483,0.0007\nCC-MAIN-2022-05,video/mp4,65279,65026,0.0022\nCC-MAIN-2022-05,video/quicktime,8592,8589,0.0003\nCC-MAIN-2022-05,video/webm,3209,3209,0.0001\nCC-MAIN-2022-05,video/x-m4v,1604,1603,0.0001\nCC-MAIN-2022-21,<other>,448699,447891,0.0130\nCC-MAIN-2022-21,application/atom+xml,3173081,3172605,0.0920\nCC-MAIN-2022-21,application/epub+zip,52563,52513,0.0015\nCC-MAIN-2022-21,application/gpx+xml,13342,13340,0.0004\nCC-MAIN-2022-21,application/gzip,82073,81980,0.0024\nCC-MAIN-2022-21,application/javascript,30640,30526,0.0009\nCC-MAIN-2022-21,application/json,769453,769200,0.0223\nCC-MAIN-2022-21,application/marc,49397,4939
2,0.0014\nCC-MAIN-2022-21,application/mbox,108925,108909,0.0032\nCC-MAIN-2022-21,application/msword,69769,69614,0.0020\nCC-MAIN-2022-21,application/octet-stream,833027,831795,0.0241\nCC-MAIN-2022-21,application/pdf,27066880,27006316,0.7846\nCC-MAIN-2022-21,application/pgp-signature,67933,67924,0.0020\nCC-MAIN-2022-21,application/pkcs7-signature,12421,12420,0.0004\nCC-MAIN-2022-21,application/postscript,3465,3465,0.0001\nCC-MAIN-2022-21,application/rdf+xml,287886,287763,0.0083\nCC-MAIN-2022-21,application/rss+xml,3479914,3474437,0.1009\nCC-MAIN-2022-21,application/rtf,66373,66344,0.0019\nCC-MAIN-2022-21,application/text,12268,12268,0.0004\nCC-MAIN-2022-21,application/vnd.android.package-archive,7666,7531,0.0002\nCC-MAIN-2022-21,application/vnd.google-earth.kml+xml,78327,78305,0.0023\nCC-MAIN-2022-21,application/vnd.google-earth.kmz,10663,10659,0.0003\nCC-MAIN-2022-21,application/vnd.ms-excel,42006,41943,0.0012\nCC-MAIN-2022-21,application/vnd.ms-powerpoint,12337,12337,0.0004\nCC-MAIN-2022-21,application/vnd.oasis.opendocument.spreadsheet,8192,8163,0.0002\nCC-MAIN-2022-21,application/vnd.oasis.opendocument.text,27390,27345,0.0008\nCC-MAIN-2022-21,application/vnd.openxmlformats-officedocument.presentationml.presentation,7557,7509,0.0002\nCC-MAIN-2022-21,application/vnd.openxmlformats-officedocument.spreadsheetml.sheet,49409,49358,0.0014\nCC-MAIN-2022-21,application/vnd.openxmlformats-officedocument.wordprocessingml.document,73540,73287,0.0021\nCC-MAIN-2022-21,application/x-bibtex-text-file,219181,219154,0.0064\nCC-MAIN-2022-21,application/x-bittorrent,10135,10121,0.0003\nCC-MAIN-2022-21,application/x-bzip2,15656,15643,0.0005\nCC-MAIN-2022-21,application/x-dosexec,8312,8024,0.0002\nCC-MAIN-2022-21,application/x-endnote-refer,57050,57049,0.0017\nCC-MAIN-2022-21,application/x-hdf,23307,23307,0.0007\nCC-MAIN-2022-21,application/x-mobipocket-ebook,11267,11257,0.0003\nCC-MAIN-2022-21,application/x-ms-asx,5796,5793,0.0002\nCC-MAIN-2022-21,application/x-msdownload,5678,5646,0.
0002\nCC-MAIN-2022-21,application/x-rar-compressed,220,220,0.0000\nCC-MAIN-2022-21,application/x-research-info-systems,5394,5393,0.0002\nCC-MAIN-2022-21,application/x-sh,44133,44119,0.0013\nCC-MAIN-2022-21,application/x-shockwave-flash,9168,9159,0.0003\nCC-MAIN-2022-21,application/x-stata-do,49465,49438,0.0014\nCC-MAIN-2022-21,application/x-tex,9549,9548,0.0003\nCC-MAIN-2022-21,application/x-tex-tfm,4661,4661,0.0001\nCC-MAIN-2022-21,application/x-tika-msoffice,88772,88768,0.0026\nCC-MAIN-2022-21,application/x-tika-ooxml,90871,90831,0.0026\nCC-MAIN-2022-21,application/x-wais-source,7723,7723,0.0002\nCC-MAIN-2022-21,application/x-xz,7640,7636,0.0002\nCC-MAIN-2022-21,application/xhtml+xml,433116328,430797763,12.5547\nCC-MAIN-2022-21,application/xml,2270078,2265803,0.0658\nCC-MAIN-2022-21,application/zip,280205,278839,0.0081\nCC-MAIN-2022-21,application/zlib,12492,12282,0.0004\nCC-MAIN-2022-21,application/zstd,25926,25844,0.0008\nCC-MAIN-2022-21,audio/mp4,1657,1656,0.0000\nCC-MAIN-2022-21,audio/mpeg,159705,158385,0.0046\nCC-MAIN-2022-21,audio/vnd.wave,15462,15288,0.0004\nCC-MAIN-2022-21,audio/x-mpegurl,1707,1707,0.0000\nCC-MAIN-2022-21,image/gif,171088,170693,0.0050\nCC-MAIN-2022-21,image/jpeg,6576377,6562659,0.1906\nCC-MAIN-2022-21,image/png,1435241,1431702,0.0416\nCC-MAIN-2022-21,image/svg+xml,50985,50929,0.0015\nCC-MAIN-2022-21,image/tiff,17062,17038,0.0005\nCC-MAIN-2022-21,image/vnd.djvu,15244,15242,0.0004\nCC-MAIN-2022-21,image/vnd.dxf; 
format=ascii,11662,11660,0.0003\nCC-MAIN-2022-21,image/webp,24049,23994,0.0007\nCC-MAIN-2022-21,message/rfc822,95028,95000,0.0028\nCC-MAIN-2022-21,text/calendar,1057042,1056635,0.0306\nCC-MAIN-2022-21,text/css,13098,13074,0.0004\nCC-MAIN-2022-21,text/csv,152902,152854,0.0044\nCC-MAIN-2022-21,text/html,2962647666,2943040859,85.8782\nCC-MAIN-2022-21,text/markdown,1742,1742,0.0001\nCC-MAIN-2022-21,text/plain,2999790,2998151,0.0870\nCC-MAIN-2022-21,text/prs.lines.tag,88800,88797,0.0026\nCC-MAIN-2022-21,text/tab-separated-values,26244,26225,0.0008\nCC-MAIN-2022-21,text/troff,19199,19197,0.0006\nCC-MAIN-2022-21,text/turtle,39963,39944,0.0012\nCC-MAIN-2022-21,text/vtt,17392,17392,0.0005\nCC-MAIN-2022-21,text/x-c++src,16045,16045,0.0005\nCC-MAIN-2022-21,text/x-chdr,36918,36917,0.0011\nCC-MAIN-2022-21,text/x-csrc,65223,65221,0.0019\nCC-MAIN-2022-21,text/x-diff,53700,53665,0.0016\nCC-MAIN-2022-21,text/x-jsp,3514,3509,0.0001\nCC-MAIN-2022-21,text/x-log,62323,62319,0.0018\nCC-MAIN-2022-21,text/x-matlab,82522,82501,0.0024\nCC-MAIN-2022-21,text/x-perl,88537,88532,0.0026\nCC-MAIN-2022-21,text/x-php,137238,136717,0.0040\nCC-MAIN-2022-21,text/x-python,28640,28634,0.0008\nCC-MAIN-2022-21,text/x-vcalendar,18475,18475,0.0005\nCC-MAIN-2022-21,text/x-vcard,127291,127238,0.0037\nCC-MAIN-2022-21,text/x-web-markdown,16818,16816,0.0005\nCC-MAIN-2022-21,text/x-yaml,12754,12753,0.0004\nCC-MAIN-2022-21,video/mp4,91156,91037,0.0026\nCC-MAIN-2022-21,video/quicktime,14349,14336,0.0004\nCC-MAIN-2022-21,video/webm,3419,3418,0.0001\nCC-MAIN-2022-21,video/x-m4v,1985,1983,0.0001\nCC-MAIN-2022-27,<other>,469619,468806,0.0151\nCC-MAIN-2022-27,application/atom+xml,3531417,3531080,0.1136\nCC-MAIN-2022-27,application/epub+zip,58008,57951,0.0019\nCC-MAIN-2022-27,application/gpx+xml,14462,14462,0.0005\nCC-MAIN-2022-27,application/gzip,79233,79076,0.0025\nCC-MAIN-2022-27,application/javascript,25150,25062,0.0008\nCC-MAIN-2022-27,application/json,765651,765427,0.0246\nCC-MAIN-2022-27,application/marc,45519,4551
7,0.0015\nCC-MAIN-2022-27,application/mbox,121009,120963,0.0039\nCC-MAIN-2022-27,application/msword,77433,77331,0.0025\nCC-MAIN-2022-27,application/octet-stream,642917,642105,0.0207\nCC-MAIN-2022-27,application/pdf,31445930,31368995,1.0113\nCC-MAIN-2022-27,application/pgp-signature,89367,89366,0.0029\nCC-MAIN-2022-27,application/pkcs7-signature,16320,16319,0.0005\nCC-MAIN-2022-27,application/postscript,4211,4208,0.0001\nCC-MAIN-2022-27,application/rdf+xml,308718,308606,0.0099\nCC-MAIN-2022-27,application/rss+xml,3594536,3590589,0.1156\nCC-MAIN-2022-27,application/rtf,55525,55514,0.0018\nCC-MAIN-2022-27,application/text,13794,13794,0.0004\nCC-MAIN-2022-27,application/vnd.android.package-archive,8652,8492,0.0003\nCC-MAIN-2022-27,application/vnd.google-earth.kml+xml,74708,74669,0.0024\nCC-MAIN-2022-27,application/vnd.google-earth.kmz,9502,9499,0.0003\nCC-MAIN-2022-27,application/vnd.ms-excel,56106,56022,0.0018\nCC-MAIN-2022-27,application/vnd.ms-powerpoint,14033,14022,0.0005\nCC-MAIN-2022-27,application/vnd.oasis.opendocument.spreadsheet,11634,11621,0.0004\nCC-MAIN-2022-27,application/vnd.oasis.opendocument.text,38899,38881,0.0013\nCC-MAIN-2022-27,application/vnd.openxmlformats-officedocument.presentationml.presentation,12931,12892,0.0004\nCC-MAIN-2022-27,application/vnd.openxmlformats-officedocument.spreadsheetml.sheet,55438,55225,0.0018\nCC-MAIN-2022-27,application/vnd.openxmlformats-officedocument.wordprocessingml.document,93225,93012,0.0030\nCC-MAIN-2022-27,application/x-bibtex-text-file,195793,195763,0.0063\nCC-MAIN-2022-27,application/x-bittorrent,10251,10247,0.0003\nCC-MAIN-2022-27,application/x-bzip2,43915,43898,0.0014\nCC-MAIN-2022-27,application/x-dosexec,9398,8614,0.0003\nCC-MAIN-2022-27,application/x-endnote-refer,61894,61879,0.0020\nCC-MAIN-2022-27,application/x-hdf,46399,46398,0.0015\nCC-MAIN-2022-27,application/x-mobipocket-ebook,11443,11406,0.0004\nCC-MAIN-2022-27,application/x-ms-asx,4840,4838,0.0002\nCC-MAIN-2022-27,application/x-msdownload,5879,5853,
0.0002\nCC-MAIN-2022-27,application/x-rar-compressed,320,320,0.0000\nCC-MAIN-2022-27,application/x-research-info-systems,5374,5374,0.0002\nCC-MAIN-2022-27,application/x-sh,39257,39235,0.0013\nCC-MAIN-2022-27,application/x-shockwave-flash,8726,8718,0.0003\nCC-MAIN-2022-27,application/x-stata-do,38025,38003,0.0012\nCC-MAIN-2022-27,application/x-tex,8020,8020,0.0003\nCC-MAIN-2022-27,application/x-tex-tfm,12200,12200,0.0004\nCC-MAIN-2022-27,application/x-tika-msoffice,102461,102449,0.0033\nCC-MAIN-2022-27,application/x-tika-ooxml,109880,109852,0.0035\nCC-MAIN-2022-27,application/x-wais-source,7890,7890,0.0003\nCC-MAIN-2022-27,application/x-xz,13016,13014,0.0004\nCC-MAIN-2022-27,application/xhtml+xml,396656788,394611368,12.7558\nCC-MAIN-2022-27,application/xml,2242871,2240165,0.0721\nCC-MAIN-2022-27,application/zip,325308,324041,0.0105\nCC-MAIN-2022-27,application/zlib,8407,8351,0.0003\nCC-MAIN-2022-27,application/zstd,32260,32260,0.0010\nCC-MAIN-2022-27,audio/mp4,1378,1376,0.0000\nCC-MAIN-2022-27,audio/mpeg,193117,191782,0.0062\nCC-MAIN-2022-27,audio/vnd.wave,19040,18920,0.0006\nCC-MAIN-2022-27,audio/x-mpegurl,3293,3292,0.0001\nCC-MAIN-2022-27,image/gif,124710,124336,0.0040\nCC-MAIN-2022-27,image/jpeg,5856316,5846113,0.1883\nCC-MAIN-2022-27,image/png,1085233,1080925,0.0349\nCC-MAIN-2022-27,image/svg+xml,47131,47104,0.0015\nCC-MAIN-2022-27,image/tiff,34714,34714,0.0011\nCC-MAIN-2022-27,image/vnd.djvu,12959,12959,0.0004\nCC-MAIN-2022-27,image/vnd.dxf; 
format=ascii,16404,16402,0.0005\nCC-MAIN-2022-27,image/webp,25665,25639,0.0008\nCC-MAIN-2022-27,message/rfc822,88315,88306,0.0028\nCC-MAIN-2022-27,text/asp,1,1,0.0000\nCC-MAIN-2022-27,text/calendar,1233460,1232959,0.0397\nCC-MAIN-2022-27,text/css,14270,14249,0.0005\nCC-MAIN-2022-27,text/csv,153938,153883,0.0050\nCC-MAIN-2022-27,text/html,2654603477,2638947512,85.3677\nCC-MAIN-2022-27,text/markdown,1505,1505,0.0000\nCC-MAIN-2022-27,text/plain,3311856,3309500,0.1065\nCC-MAIN-2022-27,text/prs.lines.tag,108933,108933,0.0035\nCC-MAIN-2022-27,text/tab-separated-values,26537,26537,0.0009\nCC-MAIN-2022-27,text/troff,18193,18193,0.0006\nCC-MAIN-2022-27,text/turtle,38069,38037,0.0012\nCC-MAIN-2022-27,text/vtt,22350,22350,0.0007\nCC-MAIN-2022-27,text/x-c++src,12108,12108,0.0004\nCC-MAIN-2022-27,text/x-chdr,33984,33984,0.0011\nCC-MAIN-2022-27,text/x-csrc,52655,52654,0.0017\nCC-MAIN-2022-27,text/x-diff,46852,46842,0.0015\nCC-MAIN-2022-27,text/x-jsp,3784,3776,0.0001\nCC-MAIN-2022-27,text/x-log,75170,75170,0.0024\nCC-MAIN-2022-27,text/x-matlab,102773,102768,0.0033\nCC-MAIN-2022-27,text/x-perl,75143,75126,0.0024\nCC-MAIN-2022-27,text/x-php,138426,137960,0.0045\nCC-MAIN-2022-27,text/x-python,21974,21969,0.0007\nCC-MAIN-2022-27,text/x-vcalendar,16055,16055,0.0005\nCC-MAIN-2022-27,text/x-vcard,134028,133918,0.0043\nCC-MAIN-2022-27,text/x-web-markdown,13542,13539,0.0004\nCC-MAIN-2022-27,text/x-yaml,15463,15461,0.0005\nCC-MAIN-2022-27,video/mp4,73520,73318,0.0024\nCC-MAIN-2022-27,video/quicktime,10467,10458,0.0003\nCC-MAIN-2022-27,video/webm,6566,6560,0.0002\nCC-MAIN-2022-27,video/x-m4v,1736,1720,0.0001\nCC-MAIN-2022-33,<other>,473731,472861,0.0183\nCC-MAIN-2022-33,application/atom+xml,2962545,2961907,0.1144\nCC-MAIN-2022-33,application/epub+zip,70153,70133,0.0027\nCC-MAIN-2022-33,application/gpx+xml,13901,13901,0.0005\nCC-MAIN-2022-33,application/gzip,108410,108111,0.0042\nCC-MAIN-2022-33,application/javascript,35183,35076,0.0014\nCC-MAIN-2022-33,application/json,789230,789043,0.0305\n
CC-MAIN-2022-33,application/marc,43391,43381,0.0017\nCC-MAIN-2022-33,application/mbox,134753,134597,0.0052\nCC-MAIN-2022-33,application/msword,81301,80994,0.0031\nCC-MAIN-2022-33,application/octet-stream,708661,707938,0.0274\nCC-MAIN-2022-33,application/pdf,28912943,28852156,1.1169\nCC-MAIN-2022-33,application/pgp-signature,72568,72565,0.0028\nCC-MAIN-2022-33,application/pkcs7-signature,11810,11808,0.0005\nCC-MAIN-2022-33,application/postscript,4644,4622,0.0002\nCC-MAIN-2022-33,application/rdf+xml,301584,301490,0.0117\nCC-MAIN-2022-33,application/rss+xml,3330566,3326141,0.1287\nCC-MAIN-2022-33,application/rtf,65718,65685,0.0025\nCC-MAIN-2022-33,application/text,14101,14101,0.0005\nCC-MAIN-2022-33,application/vnd.android.package-archive,7658,7519,0.0003\nCC-MAIN-2022-33,application/vnd.google-earth.kml+xml,63032,63018,0.0024\nCC-MAIN-2022-33,application/vnd.google-earth.kmz,10222,10219,0.0004\nCC-MAIN-2022-33,application/vnd.ms-excel,52107,51953,0.0020\nCC-MAIN-2022-33,application/vnd.ms-powerpoint,14401,14388,0.0006\nCC-MAIN-2022-33,application/vnd.oasis.opendocument.spreadsheet,13632,13606,0.0005\nCC-MAIN-2022-33,application/vnd.oasis.opendocument.text,33837,33808,0.0013\nCC-MAIN-2022-33,application/vnd.openxmlformats-officedocument.presentationml.presentation,10702,10621,0.0004\nCC-MAIN-2022-33,application/vnd.openxmlformats-officedocument.spreadsheetml.sheet,58524,58245,0.0023\nCC-MAIN-2022-33,application/vnd.openxmlformats-officedocument.wordprocessingml.document,99497,99219,0.0038\nCC-MAIN-2022-33,application/x-bibtex-text-file,226317,226283,0.0087\nCC-MAIN-2022-33,application/x-bittorrent,11638,11623,0.0004\nCC-MAIN-2022-33,application/x-bzip2,8596,8590,0.0003\nCC-MAIN-2022-33,application/x-dosexec,9083,8720,0.0004\nCC-MAIN-2022-33,application/x-endnote-refer,63295,63287,0.0024\nCC-MAIN-2022-33,application/x-hdf,52413,52412,0.0020\nCC-MAIN-2022-33,application/x-mobipocket-ebook,12423,12422,0.0005\nCC-MAIN-2022-33,application/x-ms-asx,4072,4070,0.0002\nCC-MAIN-
2022-33,application/x-msdownload,5148,5090,0.0002\nCC-MAIN-2022-33,application/x-rar-compressed,441,441,0.0000\nCC-MAIN-2022-33,application/x-research-info-systems,3814,3814,0.0001\nCC-MAIN-2022-33,application/x-sh,38322,38307,0.0015\nCC-MAIN-2022-33,application/x-shockwave-flash,9057,9048,0.0003\nCC-MAIN-2022-33,application/x-stata-do,33208,33206,0.0013\nCC-MAIN-2022-33,application/x-tex,9482,9482,0.0004\nCC-MAIN-2022-33,application/x-tex-tfm,11763,11763,0.0005\nCC-MAIN-2022-33,application/x-tika-msoffice,113806,113762,0.0044\nCC-MAIN-2022-33,application/x-tika-ooxml,99398,99324,0.0038\nCC-MAIN-2022-33,application/x-wais-source,6528,6528,0.0003\nCC-MAIN-2022-33,application/x-xz,30068,30067,0.0012\nCC-MAIN-2022-33,application/xhtml+xml,343516153,341402831,13.2699\nCC-MAIN-2022-33,application/xml,2010451,2006682,0.0777\nCC-MAIN-2022-33,application/zip,353216,351598,0.0136\nCC-MAIN-2022-33,application/zlib,7999,7928,0.0003\nCC-MAIN-2022-33,application/zstd,37283,37283,0.0014\nCC-MAIN-2022-33,audio/mp4,2085,2047,0.0001\nCC-MAIN-2022-33,audio/mpeg,194312,192994,0.0075\nCC-MAIN-2022-33,audio/vnd.wave,18190,18130,0.0007\nCC-MAIN-2022-33,audio/x-mpegurl,5276,5276,0.0002\nCC-MAIN-2022-33,image/gif,144326,143912,0.0056\nCC-MAIN-2022-33,image/jpeg,6806608,6786818,0.2629\nCC-MAIN-2022-33,image/png,1236888,1232215,0.0478\nCC-MAIN-2022-33,image/svg+xml,52630,52542,0.0020\nCC-MAIN-2022-33,image/tiff,44775,44774,0.0017\nCC-MAIN-2022-33,image/vnd.djvu,20252,20240,0.0008\nCC-MAIN-2022-33,image/vnd.dxf; 
format=ascii,14095,13996,0.0005\nCC-MAIN-2022-33,image/webp,26754,26653,0.0010\nCC-MAIN-2022-33,message/rfc822,108765,108752,0.0042\nCC-MAIN-2022-33,text/calendar,1377234,1376929,0.0532\nCC-MAIN-2022-33,text/css,9269,9244,0.0004\nCC-MAIN-2022-33,text/csv,150473,150433,0.0058\nCC-MAIN-2022-33,text/html,2189008938,2172653548,84.5605\nCC-MAIN-2022-33,text/markdown,2338,2338,0.0001\nCC-MAIN-2022-33,text/plain,3221665,3218105,0.1245\nCC-MAIN-2022-33,text/prs.lines.tag,122701,122681,0.0047\nCC-MAIN-2022-33,text/tab-separated-values,27127,27111,0.0010\nCC-MAIN-2022-33,text/troff,20169,20167,0.0008\nCC-MAIN-2022-33,text/turtle,40020,40012,0.0015\nCC-MAIN-2022-33,text/vtt,21990,21990,0.0008\nCC-MAIN-2022-33,text/x-c++src,13218,13217,0.0005\nCC-MAIN-2022-33,text/x-chdr,30195,30191,0.0012\nCC-MAIN-2022-33,text/x-csrc,54704,54684,0.0021\nCC-MAIN-2022-33,text/x-diff,53536,53499,0.0021\nCC-MAIN-2022-33,text/x-jsp,3783,3781,0.0001\nCC-MAIN-2022-33,text/x-log,100084,100060,0.0039\nCC-MAIN-2022-33,text/x-matlab,83071,83058,0.0032\nCC-MAIN-2022-33,text/x-perl,88733,88727,0.0034\nCC-MAIN-2022-33,text/x-php,125787,125253,0.0049\nCC-MAIN-2022-33,text/x-python,25067,25061,0.0010\nCC-MAIN-2022-33,text/x-vcalendar,16492,16488,0.0006\nCC-MAIN-2022-33,text/x-vcard,128567,128494,0.0050\nCC-MAIN-2022-33,text/x-web-markdown,14807,14802,0.0006\nCC-MAIN-2022-33,text/x-yaml,15971,15967,0.0006\nCC-MAIN-2022-33,video/mp4,69059,68836,0.0027\nCC-MAIN-2022-33,video/quicktime,11757,11742,0.0005\nCC-MAIN-2022-33,video/webm,3964,3946,0.0002\nCC-MAIN-2022-33,video/x-m4v,1796,1782,0.0001\nCC-MAIN-2022-40,<other>,455396,454856,0.0143\nCC-MAIN-2022-40,application/atom+xml,2394070,2393693,0.0754\nCC-MAIN-2022-40,application/epub+zip,47453,47446,0.0015\nCC-MAIN-2022-40,application/gpx+xml,10598,10588,0.0003\nCC-MAIN-2022-40,application/gzip,100725,100609,0.0032\nCC-MAIN-2022-40,application/javascript,22206,22192,0.0007\nCC-MAIN-2022-40,application/json,748890,748685,0.0236\nCC-MAIN-2022-40,application/marc,4298
5,42984,0.0014\nCC-MAIN-2022-40,application/mbox,113909,113881,0.0036\nCC-MAIN-2022-40,application/msword,59700,59591,0.0019\nCC-MAIN-2022-40,application/octet-stream,844319,843742,0.0266\nCC-MAIN-2022-40,application/pdf,22666367,22613239,0.7135\nCC-MAIN-2022-40,application/pgp-signature,89625,89621,0.0028\nCC-MAIN-2022-40,application/pkcs7-signature,10648,10646,0.0003\nCC-MAIN-2022-40,application/postscript,3132,3132,0.0001\nCC-MAIN-2022-40,application/rdf+xml,288888,288530,0.0091\nCC-MAIN-2022-40,application/rss+xml,3089807,3086109,0.0973\nCC-MAIN-2022-40,application/rtf,59225,59213,0.0019\nCC-MAIN-2022-40,application/text,15109,15109,0.0005\nCC-MAIN-2022-40,application/vnd.android.package-archive,6737,6561,0.0002\nCC-MAIN-2022-40,application/vnd.google-earth.kml+xml,80164,80106,0.0025\nCC-MAIN-2022-40,application/vnd.google-earth.kmz,10547,10546,0.0003\nCC-MAIN-2022-40,application/vnd.ms-excel,42552,42471,0.0013\nCC-MAIN-2022-40,application/vnd.ms-powerpoint,7700,7695,0.0002\nCC-MAIN-2022-40,application/vnd.oasis.opendocument.spreadsheet,11619,11597,0.0004\nCC-MAIN-2022-40,application/vnd.oasis.opendocument.text,25841,25822,0.0008\nCC-MAIN-2022-40,application/vnd.openxmlformats-officedocument.presentationml.presentation,6186,6160,0.0002\nCC-MAIN-2022-40,application/vnd.openxmlformats-officedocument.spreadsheetml.sheet,51620,51479,0.0016\nCC-MAIN-2022-40,application/vnd.openxmlformats-officedocument.wordprocessingml.document,72264,72028,0.0023\nCC-MAIN-2022-40,application/x-bibtex-text-file,217726,217706,0.0069\nCC-MAIN-2022-40,application/x-bittorrent,10466,10434,0.0003\nCC-MAIN-2022-40,application/x-bzip2,48079,48076,0.0015\nCC-MAIN-2022-40,application/x-dosexec,5719,5534,0.0002\nCC-MAIN-2022-40,application/x-endnote-refer,59819,59815,0.0019\nCC-MAIN-2022-40,application/x-hdf,43026,43026,0.0014\nCC-MAIN-2022-40,application/x-mobipocket-ebook,10980,10978,0.0003\nCC-MAIN-2022-40,application/x-ms-asx,3633,3632,0.0001\nCC-MAIN-2022-40,application/x-msdownload,5690,5
677,0.0002\nCC-MAIN-2022-40,application/x-rar-compressed,423,423,0.0000\nCC-MAIN-2022-40,application/x-research-info-systems,7059,7059,0.0002\nCC-MAIN-2022-40,application/x-sh,39404,39382,0.0012\nCC-MAIN-2022-40,application/x-shockwave-flash,5961,5952,0.0002\nCC-MAIN-2022-40,application/x-stata-do,57306,57303,0.0018\nCC-MAIN-2022-40,application/x-tex,11286,11276,0.0004\nCC-MAIN-2022-40,application/x-tex-tfm,7046,7046,0.0002\nCC-MAIN-2022-40,application/x-tika-msoffice,86138,86114,0.0027\nCC-MAIN-2022-40,application/x-tika-ooxml,84820,84804,0.0027\nCC-MAIN-2022-40,application/x-wais-source,8272,8272,0.0003\nCC-MAIN-2022-40,application/x-xz,10894,10894,0.0003\nCC-MAIN-2022-40,application/xhtml+xml,382330979,380518489,12.0352\nCC-MAIN-2022-40,application/xml,2148529,2145373,0.0676\nCC-MAIN-2022-40,application/zip,315348,312785,0.0099\nCC-MAIN-2022-40,application/zlib,5732,5679,0.0002\nCC-MAIN-2022-40,application/zstd,48494,48493,0.0015\nCC-MAIN-2022-40,audio/mp4,1608,1540,0.0001\nCC-MAIN-2022-40,audio/mpeg,154805,153674,0.0049\nCC-MAIN-2022-40,audio/vnd.wave,19452,19450,0.0006\nCC-MAIN-2022-40,audio/x-mpegurl,6285,6285,0.0002\nCC-MAIN-2022-40,image/gif,116991,116682,0.0037\nCC-MAIN-2022-40,image/jpeg,5225030,5213889,0.1645\nCC-MAIN-2022-40,image/png,981336,978400,0.0309\nCC-MAIN-2022-40,image/svg+xml,39712,39665,0.0013\nCC-MAIN-2022-40,image/tiff,19166,19154,0.0006\nCC-MAIN-2022-40,image/vnd.djvu,16660,16660,0.0005\nCC-MAIN-2022-40,image/vnd.dxf; 
format=ascii,9016,9015,0.0003\nCC-MAIN-2022-40,image/webp,38892,38810,0.0012\nCC-MAIN-2022-40,message/rfc822,90201,90185,0.0028\nCC-MAIN-2022-40,text/calendar,1179010,1178637,0.0371\nCC-MAIN-2022-40,text/css,14821,14795,0.0005\nCC-MAIN-2022-40,text/csv,128271,128228,0.0040\nCC-MAIN-2022-40,text/html,2747427054,2732710242,86.4851\nCC-MAIN-2022-40,text/markdown,1768,1768,0.0001\nCC-MAIN-2022-40,text/plain,3340763,3338821,0.1052\nCC-MAIN-2022-40,text/prs.lines.tag,129085,129084,0.0041\nCC-MAIN-2022-40,text/tab-separated-values,22039,22039,0.0007\nCC-MAIN-2022-40,text/troff,20485,20484,0.0006\nCC-MAIN-2022-40,text/turtle,45435,45149,0.0014\nCC-MAIN-2022-40,text/vtt,19146,19146,0.0006\nCC-MAIN-2022-40,text/x-c++src,10002,10002,0.0003\nCC-MAIN-2022-40,text/x-chdr,30017,30017,0.0009\nCC-MAIN-2022-40,text/x-csrc,53972,53970,0.0017\nCC-MAIN-2022-40,text/x-diff,56706,56702,0.0018\nCC-MAIN-2022-40,text/x-jsp,3689,3675,0.0001\nCC-MAIN-2022-40,text/x-log,67607,67606,0.0021\nCC-MAIN-2022-40,text/x-matlab,77143,76976,0.0024\nCC-MAIN-2022-40,text/x-perl,95456,95448,0.0030\nCC-MAIN-2022-40,text/x-php,116466,116037,0.0037\nCC-MAIN-2022-40,text/x-python,22946,22942,0.0007\nCC-MAIN-2022-40,text/x-vcalendar,16003,16003,0.0005\nCC-MAIN-2022-40,text/x-vcard,105207,105179,0.0033\nCC-MAIN-2022-40,text/x-web-markdown,14029,14023,0.0004\nCC-MAIN-2022-40,text/x-yaml,13282,13282,0.0004\nCC-MAIN-2022-40,video/mp4,66971,66820,0.0021\nCC-MAIN-2022-40,video/quicktime,11278,11278,0.0004\nCC-MAIN-2022-40,video/webm,2637,2636,0.0001\nCC-MAIN-2022-40,video/x-m4v,1495,1489,0.0000\nCC-MAIN-2022-49,<other>,503901,503218,0.0149\nCC-MAIN-2022-49,application/atom+xml,3263894,3263450,0.0965\nCC-MAIN-2022-49,application/epub+zip,52365,52345,0.0015\nCC-MAIN-2022-49,application/gpx+xml,14962,14958,0.0004\nCC-MAIN-2022-49,application/gzip,80266,80042,0.0024\nCC-MAIN-2022-49,application/javascript,26011,26008,0.0008\nCC-MAIN-2022-49,application/json,825768,825553,0.0244\nCC-MAIN-2022-49,application/marc,46758,4675
1,0.0014\nCC-MAIN-2022-49,application/mbox,104482,104469,0.0031\nCC-MAIN-2022-49,application/msword,69165,69040,0.0020\nCC-MAIN-2022-49,application/octet-stream,841470,840926,0.0249\nCC-MAIN-2022-49,application/pdf,27598086,27531685,0.8161\nCC-MAIN-2022-49,application/pgp-signature,109017,109016,0.0032\nCC-MAIN-2022-49,application/pkcs7-signature,14676,14672,0.0004\nCC-MAIN-2022-49,application/postscript,4045,4045,0.0001\nCC-MAIN-2022-49,application/rdf+xml,291881,291773,0.0086\nCC-MAIN-2022-49,application/rss+xml,3593410,3588641,0.1063\nCC-MAIN-2022-49,application/rtf,62272,62249,0.0018\nCC-MAIN-2022-49,application/text,14073,14073,0.0004\nCC-MAIN-2022-49,application/vnd.android.package-archive,7208,6982,0.0002\nCC-MAIN-2022-49,application/vnd.google-earth.kml+xml,86833,86805,0.0026\nCC-MAIN-2022-49,application/vnd.google-earth.kmz,8895,8893,0.0003\nCC-MAIN-2022-49,application/vnd.ms-excel,45441,45392,0.0013\nCC-MAIN-2022-49,application/vnd.ms-powerpoint,8087,8073,0.0002\nCC-MAIN-2022-49,application/vnd.oasis.opendocument.spreadsheet,11442,11421,0.0003\nCC-MAIN-2022-49,application/vnd.oasis.opendocument.text,33301,33286,0.0010\nCC-MAIN-2022-49,application/vnd.openxmlformats-officedocument.presentationml.presentation,8751,8720,0.0003\nCC-MAIN-2022-49,application/vnd.openxmlformats-officedocument.spreadsheetml.sheet,58035,57813,0.0017\nCC-MAIN-2022-49,application/vnd.openxmlformats-officedocument.wordprocessingml.document,87081,86746,0.0026\nCC-MAIN-2022-49,application/x-bibtex-text-file,233502,233498,0.0069\nCC-MAIN-2022-49,application/x-bittorrent,10596,10583,0.0003\nCC-MAIN-2022-49,application/x-bzip2,34073,34066,0.0010\nCC-MAIN-2022-49,application/x-dosexec,7144,6872,0.0002\nCC-MAIN-2022-49,application/x-endnote-refer,62154,62153,0.0018\nCC-MAIN-2022-49,application/x-hdf,104645,104645,0.0031\nCC-MAIN-2022-49,application/x-mobipocket-ebook,10998,10980,0.0003\nCC-MAIN-2022-49,application/x-ms-asx,2524,2520,0.0001\nCC-MAIN-2022-49,application/x-msdownload,5899,5870,
0.0002\nCC-MAIN-2022-49,application/x-rar-compressed,361,361,0.0000\nCC-MAIN-2022-49,application/x-research-info-systems,5073,5073,0.0002\nCC-MAIN-2022-49,application/x-sh,38560,38538,0.0011\nCC-MAIN-2022-49,application/x-shockwave-flash,8858,8845,0.0003\nCC-MAIN-2022-49,application/x-stata-do,53861,53859,0.0016\nCC-MAIN-2022-49,application/x-tex,12398,12397,0.0004\nCC-MAIN-2022-49,application/x-tex-tfm,17641,17641,0.0005\nCC-MAIN-2022-49,application/x-tika-msoffice,101549,101519,0.0030\nCC-MAIN-2022-49,application/x-tika-ooxml,100607,100547,0.0030\nCC-MAIN-2022-49,application/x-wais-source,8031,8031,0.0002\nCC-MAIN-2022-49,application/x-xz,28380,28343,0.0008\nCC-MAIN-2022-49,application/xhtml+xml,394836398,392823109,11.6760\nCC-MAIN-2022-49,application/xml,1989704,1986479,0.0588\nCC-MAIN-2022-49,application/zip,308798,306638,0.0091\nCC-MAIN-2022-49,application/zlib,3989,3949,0.0001\nCC-MAIN-2022-49,application/zstd,53783,53779,0.0016\nCC-MAIN-2022-49,audio/mp4,1826,1811,0.0001\nCC-MAIN-2022-49,audio/mpeg,176471,175410,0.0052\nCC-MAIN-2022-49,audio/vnd.wave,18450,18449,0.0005\nCC-MAIN-2022-49,audio/x-mpegurl,5259,5259,0.0002\nCC-MAIN-2022-49,image/gif,124062,123722,0.0037\nCC-MAIN-2022-49,image/jpeg,5353210,5341713,0.1583\nCC-MAIN-2022-49,image/png,881415,878643,0.0261\nCC-MAIN-2022-49,image/svg+xml,36738,36686,0.0011\nCC-MAIN-2022-49,image/tiff,41193,41188,0.0012\nCC-MAIN-2022-49,image/vnd.djvu,11807,11806,0.0003\nCC-MAIN-2022-49,image/vnd.dxf; 
format=ascii,11105,11104,0.0003\nCC-MAIN-2022-49,image/webp,43810,43649,0.0013\nCC-MAIN-2022-49,message/rfc822,93059,93048,0.0028\nCC-MAIN-2022-49,text/calendar,1331605,1331288,0.0394\nCC-MAIN-2022-49,text/css,15679,15676,0.0005\nCC-MAIN-2022-49,text/csv,132845,132804,0.0039\nCC-MAIN-2022-49,text/html,2932905363,2914099794,86.7310\nCC-MAIN-2022-49,text/markdown,1537,1537,0.0000\nCC-MAIN-2022-49,text/plain,3535044,3532215,0.1045\nCC-MAIN-2022-49,text/prs.lines.tag,105941,105941,0.0031\nCC-MAIN-2022-49,text/tab-separated-values,32339,32338,0.0010\nCC-MAIN-2022-49,text/troff,23057,23057,0.0007\nCC-MAIN-2022-49,text/turtle,41065,41045,0.0012\nCC-MAIN-2022-49,text/vtt,21740,21733,0.0006\nCC-MAIN-2022-49,text/x-c++src,9217,9216,0.0003\nCC-MAIN-2022-49,text/x-chdr,25945,25943,0.0008\nCC-MAIN-2022-49,text/x-csrc,49416,49413,0.0015\nCC-MAIN-2022-49,text/x-diff,52921,52893,0.0016\nCC-MAIN-2022-49,text/x-jsp,3204,3199,0.0001\nCC-MAIN-2022-49,text/x-log,82307,82299,0.0024\nCC-MAIN-2022-49,text/x-matlab,82311,82300,0.0024\nCC-MAIN-2022-49,text/x-perl,68811,68768,0.0020\nCC-MAIN-2022-49,text/x-php,104980,104505,0.0031\nCC-MAIN-2022-49,text/x-python,17915,17911,0.0005\nCC-MAIN-2022-49,text/x-vcalendar,18587,18583,0.0005\nCC-MAIN-2022-49,text/x-vcard,134936,134907,0.0040\nCC-MAIN-2022-49,text/x-web-markdown,11189,11186,0.0003\nCC-MAIN-2022-49,text/x-yaml,11148,11148,0.0003\nCC-MAIN-2022-49,video/mp4,69105,68808,0.0020\nCC-MAIN-2022-49,video/quicktime,10588,10578,0.0003\nCC-MAIN-2022-49,video/webm,3112,3110,0.0001\nCC-MAIN-2022-49,video/x-m4v,1474,1471,0.0000\nCC-MAIN-2023-06,<other>,453030,452465,0.0142\nCC-MAIN-2023-06,application/atom+xml,3077932,3077671,0.0965\nCC-MAIN-2023-06,application/epub+zip,46095,46081,0.0014\nCC-MAIN-2023-06,application/gpx+xml,13830,13830,0.0004\nCC-MAIN-2023-06,application/gzip,58387,58225,0.0018\nCC-MAIN-2023-06,application/javascript,15380,15375,0.0005\nCC-MAIN-2023-06,application/json,730509,730011,0.0229\nCC-MAIN-2023-06,application/marc,41119,4111
8,0.0013\nCC-MAIN-2023-06,application/mbox,67758,67588,0.0021\nCC-MAIN-2023-06,application/msword,64986,64797,0.0020\nCC-MAIN-2023-06,application/octet-stream,597710,596293,0.0187\nCC-MAIN-2023-06,application/pdf,25239471,25167546,0.7913\nCC-MAIN-2023-06,application/pgp-signature,92887,92804,0.0029\nCC-MAIN-2023-06,application/pkcs7-signature,13402,13395,0.0004\nCC-MAIN-2023-06,application/postscript,3577,3577,0.0001\nCC-MAIN-2023-06,application/rdf+xml,278818,278668,0.0087\nCC-MAIN-2023-06,application/rss+xml,3222915,3219522,0.1010\nCC-MAIN-2023-06,application/rtf,42178,42160,0.0013\nCC-MAIN-2023-06,application/text,4145,4145,0.0001\nCC-MAIN-2023-06,application/vnd.android.package-archive,5095,4935,0.0002\nCC-MAIN-2023-06,application/vnd.google-earth.kml+xml,112940,112926,0.0035\nCC-MAIN-2023-06,application/vnd.google-earth.kmz,11120,11120,0.0003\nCC-MAIN-2023-06,application/vnd.ms-excel,41769,41713,0.0013\nCC-MAIN-2023-06,application/vnd.ms-powerpoint,9543,9539,0.0003\nCC-MAIN-2023-06,application/vnd.oasis.opendocument.spreadsheet,12474,12458,0.0004\nCC-MAIN-2023-06,application/vnd.oasis.opendocument.text,31391,31371,0.0010\nCC-MAIN-2023-06,application/vnd.openxmlformats-officedocument.presentationml.presentation,7835,7802,0.0002\nCC-MAIN-2023-06,application/vnd.openxmlformats-officedocument.spreadsheetml.sheet,48976,48752,0.0015\nCC-MAIN-2023-06,application/vnd.openxmlformats-officedocument.wordprocessingml.document,78946,78711,0.0025\nCC-MAIN-2023-06,application/x-bibtex-text-file,226914,226896,0.0071\nCC-MAIN-2023-06,application/x-bittorrent,7664,7663,0.0002\nCC-MAIN-2023-06,application/x-bzip2,23396,23381,0.0007\nCC-MAIN-2023-06,application/x-dosexec,6758,6545,0.0002\nCC-MAIN-2023-06,application/x-endnote-refer,45581,45581,0.0014\nCC-MAIN-2023-06,application/x-hdf,92778,92778,0.0029\nCC-MAIN-2023-06,application/x-mobipocket-ebook,8942,8936,0.0003\nCC-MAIN-2023-06,application/x-ms-asx,2880,2877,0.0001\nCC-MAIN-2023-06,application/x-msdownload,5183,5164,0.0002\n
CC-MAIN-2023-06,application/x-rar-compressed,153,153,0.0000\nCC-MAIN-2023-06,application/x-research-info-systems,6747,6747,0.0002\nCC-MAIN-2023-06,application/x-sh,33045,33027,0.0010\nCC-MAIN-2023-06,application/x-shockwave-flash,7691,7676,0.0002\nCC-MAIN-2023-06,application/x-stata-do,33009,32979,0.0010\nCC-MAIN-2023-06,application/x-tex,7379,7377,0.0002\nCC-MAIN-2023-06,application/x-tex-tfm,13794,13794,0.0004\nCC-MAIN-2023-06,application/x-tika-msoffice,95045,94996,0.0030\nCC-MAIN-2023-06,application/x-tika-ooxml,91989,91939,0.0029\nCC-MAIN-2023-06,application/x-wais-source,6355,6355,0.0002\nCC-MAIN-2023-06,application/x-xz,24177,24174,0.0008\nCC-MAIN-2023-06,application/xhtml+xml,361413366,359699524,11.3311\nCC-MAIN-2023-06,application/xml,1973009,1969963,0.0619\nCC-MAIN-2023-06,application/zip,263333,260840,0.0083\nCC-MAIN-2023-06,application/zlib,5283,5231,0.0002\nCC-MAIN-2023-06,application/zstd,45943,45857,0.0014\nCC-MAIN-2023-06,audio/mp4,1601,1596,0.0001\nCC-MAIN-2023-06,audio/mpeg,167057,166228,0.0052\nCC-MAIN-2023-06,audio/vnd.wave,13194,13192,0.0004\nCC-MAIN-2023-06,audio/x-mpegurl,4766,4766,0.0001\nCC-MAIN-2023-06,image/gif,110393,110073,0.0035\nCC-MAIN-2023-06,image/jpeg,4442636,4434110,0.1393\nCC-MAIN-2023-06,image/png,671427,669339,0.0211\nCC-MAIN-2023-06,image/svg+xml,24682,24614,0.0008\nCC-MAIN-2023-06,image/tiff,22557,22556,0.0007\nCC-MAIN-2023-06,image/vnd.djvu,17116,17115,0.0005\nCC-MAIN-2023-06,image/vnd.dxf; 
format=ascii,8199,8199,0.0003\nCC-MAIN-2023-06,image/webp,69128,68998,0.0022\nCC-MAIN-2023-06,message/rfc822,56757,56748,0.0018\nCC-MAIN-2023-06,text/asp,1,1,0.0000\nCC-MAIN-2023-06,text/calendar,1061265,1060565,0.0333\nCC-MAIN-2023-06,text/css,14549,14546,0.0005\nCC-MAIN-2023-06,text/csv,105661,105637,0.0033\nCC-MAIN-2023-06,text/html,2779705013,2763405977,87.1496\nCC-MAIN-2023-06,text/markdown,144,144,0.0000\nCC-MAIN-2023-06,text/plain,3286745,3284707,0.1030\nCC-MAIN-2023-06,text/prs.lines.tag,175133,175132,0.0055\nCC-MAIN-2023-06,text/tab-separated-values,7169,7169,0.0002\nCC-MAIN-2023-06,text/troff,17574,17574,0.0006\nCC-MAIN-2023-06,text/turtle,38260,38221,0.0012\nCC-MAIN-2023-06,text/vtt,21120,21118,0.0007\nCC-MAIN-2023-06,text/x-c++src,9756,9756,0.0003\nCC-MAIN-2023-06,text/x-chdr,25473,25472,0.0008\nCC-MAIN-2023-06,text/x-csrc,40411,40410,0.0013\nCC-MAIN-2023-06,text/x-diff,41680,41615,0.0013\nCC-MAIN-2023-06,text/x-jsp,2879,2872,0.0001\nCC-MAIN-2023-06,text/x-log,90584,90584,0.0028\nCC-MAIN-2023-06,text/x-matlab,69720,69716,0.0022\nCC-MAIN-2023-06,text/x-perl,61597,61471,0.0019\nCC-MAIN-2023-06,text/x-php,98476,98135,0.0031\nCC-MAIN-2023-06,text/x-python,12569,12566,0.0004\nCC-MAIN-2023-06,text/x-vcalendar,19108,19106,0.0006\nCC-MAIN-2023-06,text/x-vcard,109136,108999,0.0034\nCC-MAIN-2023-06,text/x-web-markdown,11386,11385,0.0004\nCC-MAIN-2023-06,text/x-yaml,13341,13341,0.0004\nCC-MAIN-2023-06,video/mp4,52741,52509,0.0017\nCC-MAIN-2023-06,video/quicktime,8733,8724,0.0003\nCC-MAIN-2023-06,video/webm,2659,2659,0.0001\nCC-MAIN-2023-06,video/x-m4v,1179,1177,0.0000\nCC-MAIN-2023-14,<other>,461631,461073,0.0148\nCC-MAIN-2023-14,application/atom+xml,3489076,3488702,0.1119\nCC-MAIN-2023-14,application/epub+zip,55226,55213,0.0018\nCC-MAIN-2023-14,application/gpx+xml,14636,14560,0.0005\nCC-MAIN-2023-14,application/gzip,65058,64847,0.0021\nCC-MAIN-2023-14,application/javascript,19229,19205,0.0006\nCC-MAIN-2023-14,application/json,709624,709454,0.0228\nCC-MAIN-2023-14,
application/marc,34377,34377,0.0011\nCC-MAIN-2023-14,application/mbox,65873,65866,0.0021\nCC-MAIN-2023-14,application/msword,69965,69827,0.0022\nCC-MAIN-2023-14,application/octet-stream,666037,665758,0.0214\nCC-MAIN-2023-14,application/pdf,28802446,28734343,0.9236\nCC-MAIN-2023-14,application/pgp-signature,102642,102640,0.0033\nCC-MAIN-2023-14,application/pkcs7-signature,12662,12661,0.0004\nCC-MAIN-2023-14,application/postscript,4378,4374,0.0001\nCC-MAIN-2023-14,application/rdf+xml,277837,277675,0.0089\nCC-MAIN-2023-14,application/rss+xml,3158396,3155047,0.1013\nCC-MAIN-2023-14,application/rtf,40439,40436,0.0013\nCC-MAIN-2023-14,application/text,4535,4535,0.0001\nCC-MAIN-2023-14,application/vnd.android.package-archive,3611,3554,0.0001\nCC-MAIN-2023-14,application/vnd.google-earth.kml+xml,105916,105876,0.0034\nCC-MAIN-2023-14,application/vnd.google-earth.kmz,16357,16353,0.0005\nCC-MAIN-2023-14,application/vnd.ms-excel,44052,44004,0.0014\nCC-MAIN-2023-14,application/vnd.ms-powerpoint,10916,10909,0.0004\nCC-MAIN-2023-14,application/vnd.oasis.opendocument.spreadsheet,12664,12579,0.0004\nCC-MAIN-2023-14,application/vnd.oasis.opendocument.text,31939,31928,0.0010\nCC-MAIN-2023-14,application/vnd.openxmlformats-officedocument.presentationml.presentation,9683,9654,0.0003\nCC-MAIN-2023-14,application/vnd.openxmlformats-officedocument.spreadsheetml.sheet,57497,57286,0.0018\nCC-MAIN-2023-14,application/vnd.openxmlformats-officedocument.wordprocessingml.document,86286,85889,0.0028\nCC-MAIN-2023-14,application/x-bibtex-text-file,249879,249870,0.0080\nCC-MAIN-2023-14,application/x-bittorrent,7452,7447,0.0002\nCC-MAIN-2023-14,application/x-bzip2,26667,26665,0.0009\nCC-MAIN-2023-14,application/x-dosexec,4295,4185,0.0001\nCC-MAIN-2023-14,application/x-endnote-refer,44821,44821,0.0014\nCC-MAIN-2023-14,application/x-hdf,32405,32405,0.0010\nCC-MAIN-2023-14,application/x-mobipocket-ebook,13739,13735,0.0004\nCC-MAIN-2023-14,application/x-ms-asx,3994,3992,0.0001\nCC-MAIN-2023-14,applicatio
n/x-msdownload,6886,6868,0.0002\nCC-MAIN-2023-14,application/x-rar-compressed,198,198,0.0000\nCC-MAIN-2023-14,application/x-research-info-systems,6384,6384,0.0002\nCC-MAIN-2023-14,application/x-sh,27644,27630,0.0009\nCC-MAIN-2023-14,application/x-shockwave-flash,7175,7166,0.0002\nCC-MAIN-2023-14,application/x-stata-do,34790,34790,0.0011\nCC-MAIN-2023-14,application/x-tex,8845,8845,0.0003\nCC-MAIN-2023-14,application/x-tex-tfm,6528,6528,0.0002\nCC-MAIN-2023-14,application/x-tika-msoffice,92472,92429,0.0030\nCC-MAIN-2023-14,application/x-tika-ooxml,99857,99827,0.0032\nCC-MAIN-2023-14,application/x-wais-source,8408,8408,0.0003\nCC-MAIN-2023-14,application/x-xz,11465,11463,0.0004\nCC-MAIN-2023-14,application/xhtml+xml,344534539,342846762,11.0476\nCC-MAIN-2023-14,application/xml,1928521,1926084,0.0618\nCC-MAIN-2023-14,application/zip,208043,206550,0.0067\nCC-MAIN-2023-14,application/zlib,3679,3648,0.0001\nCC-MAIN-2023-14,application/zstd,39707,39705,0.0013\nCC-MAIN-2023-14,audio/mp4,1013,1013,0.0000\nCC-MAIN-2023-14,audio/mpeg,115560,115008,0.0037\nCC-MAIN-2023-14,audio/vnd.wave,11244,11244,0.0004\nCC-MAIN-2023-14,audio/x-mpegurl,5426,5426,0.0002\nCC-MAIN-2023-14,image/gif,111654,111341,0.0036\nCC-MAIN-2023-14,image/jpeg,4865002,4856440,0.1560\nCC-MAIN-2023-14,image/png,897118,894474,0.0288\nCC-MAIN-2023-14,image/svg+xml,31840,31766,0.0010\nCC-MAIN-2023-14,image/tiff,16794,16794,0.0005\nCC-MAIN-2023-14,image/vnd.djvu,11219,11219,0.0004\nCC-MAIN-2023-14,image/vnd.dxf; 
format=ascii,7605,7605,0.0002\nCC-MAIN-2023-14,image/webp,71038,70858,0.0023\nCC-MAIN-2023-14,message/rfc822,45095,45088,0.0014\nCC-MAIN-2023-14,text/asp,2,1,0.0000\nCC-MAIN-2023-14,text/aspdotnet,6,6,0.0000\nCC-MAIN-2023-14,text/calendar,1039760,1039622,0.0333\nCC-MAIN-2023-14,text/css,16791,16787,0.0005\nCC-MAIN-2023-14,text/csv,107446,107394,0.0034\nCC-MAIN-2023-14,text/html,2721070426,2704660311,87.2520\nCC-MAIN-2023-14,text/markdown,204,204,0.0000\nCC-MAIN-2023-14,text/plain,3431960,3428758,0.1100\nCC-MAIN-2023-14,text/prs.lines.tag,131889,131889,0.0042\nCC-MAIN-2023-14,text/tab-separated-values,10043,10043,0.0003\nCC-MAIN-2023-14,text/troff,19756,19756,0.0006\nCC-MAIN-2023-14,text/turtle,43963,43885,0.0014\nCC-MAIN-2023-14,text/vtt,20322,20319,0.0007\nCC-MAIN-2023-14,text/x-c++src,8711,8711,0.0003\nCC-MAIN-2023-14,text/x-chdr,37567,37562,0.0012\nCC-MAIN-2023-14,text/x-csrc,56548,56535,0.0018\nCC-MAIN-2023-14,text/x-diff,32273,32255,0.0010\nCC-MAIN-2023-14,text/x-jsp,4176,4170,0.0001\nCC-MAIN-2023-14,text/x-log,116897,116895,0.0037\nCC-MAIN-2023-14,text/x-matlab,57552,57546,0.0018\nCC-MAIN-2023-14,text/x-perl,56288,56249,0.0018\nCC-MAIN-2023-14,text/x-php,118842,118454,0.0038\nCC-MAIN-2023-14,text/x-python,9684,9658,0.0003\nCC-MAIN-2023-14,text/x-vcalendar,18085,18081,0.0006\nCC-MAIN-2023-14,text/x-vcard,117282,117265,0.0038\nCC-MAIN-2023-14,text/x-web-markdown,12146,12140,0.0004\nCC-MAIN-2023-14,text/x-yaml,10727,10727,0.0003\nCC-MAIN-2023-14,video/mp4,42449,42365,0.0014\nCC-MAIN-2023-14,video/quicktime,7064,7062,0.0002\nCC-MAIN-2023-14,video/webm,1836,1836,0.0001\nCC-MAIN-2023-14,video/x-m4v,729,729,0.0000\nCC-MAIN-2023-23,<other>,378640,378192,0.0121\nCC-MAIN-2023-23,application/atom+xml,3030744,3030358,0.0965\nCC-MAIN-2023-23,application/epub+zip,48863,48414,0.0016\nCC-MAIN-2023-23,application/gpx+xml,12527,12527,0.0004\nCC-MAIN-2023-23,application/gzip,56563,56488,0.0018\nCC-MAIN-2023-23,application/javascript,15178,15173,0.0005\nCC-MAIN-2023-23,applicatio
n/json,725406,725158,0.0231\nCC-MAIN-2023-23,application/marc,49657,49654,0.0016\nCC-MAIN-2023-23,application/mbox,58828,58804,0.0019\nCC-MAIN-2023-23,application/msword,71538,71301,0.0023\nCC-MAIN-2023-23,application/octet-stream,719023,718344,0.0229\nCC-MAIN-2023-23,application/pdf,27187296,27125758,0.8657\nCC-MAIN-2023-23,application/pgp-signature,109920,109919,0.0035\nCC-MAIN-2023-23,application/pkcs7-signature,13023,13023,0.0004\nCC-MAIN-2023-23,application/postscript,3887,3883,0.0001\nCC-MAIN-2023-23,application/rdf+xml,300591,300448,0.0096\nCC-MAIN-2023-23,application/rss+xml,3189130,3184866,0.1015\nCC-MAIN-2023-23,application/rtf,47249,47238,0.0015\nCC-MAIN-2023-23,application/text,4718,4718,0.0002\nCC-MAIN-2023-23,application/vnd.android.package-archive,2214,2195,0.0001\nCC-MAIN-2023-23,application/vnd.google-earth.kml+xml,86385,86361,0.0028\nCC-MAIN-2023-23,application/vnd.google-earth.kmz,12580,12577,0.0004\nCC-MAIN-2023-23,application/vnd.ms-excel,46376,46006,0.0015\nCC-MAIN-2023-23,application/vnd.ms-powerpoint,9625,9619,0.0003\nCC-MAIN-2023-23,application/vnd.oasis.opendocument.spreadsheet,10453,10428,0.0003\nCC-MAIN-2023-23,application/vnd.oasis.opendocument.text,26800,26782,0.0009\nCC-MAIN-2023-23,application/vnd.openxmlformats-officedocument.presentationml.presentation,8527,8504,0.0003\nCC-MAIN-2023-23,application/vnd.openxmlformats-officedocument.spreadsheetml.sheet,48659,48289,0.0015\nCC-MAIN-2023-23,application/vnd.openxmlformats-officedocument.wordprocessingml.document,69850,69400,0.0022\nCC-MAIN-2023-23,application/x-bibtex-text-file,259334,259236,0.0083\nCC-MAIN-2023-23,application/x-bittorrent,6451,6446,0.0002\nCC-MAIN-2023-23,application/x-bzip2,1110,1109,0.0000\nCC-MAIN-2023-23,application/x-dosexec,2721,2646,0.0001\nCC-MAIN-2023-23,application/x-endnote-refer,46647,46646,0.0015\nCC-MAIN-2023-23,application/x-hdf,23866,23866,0.0008\nCC-MAIN-2023-23,application/x-mobipocket-ebook,10385,10365,0.0003\nCC-MAIN-2023-23,application/x-ms-asx,3770,
3769,0.0001\nCC-MAIN-2023-23,application/x-msdownload,2418,2412,0.0001\nCC-MAIN-2023-23,application/x-rar-compressed,190,190,0.0000\nCC-MAIN-2023-23,application/x-research-info-systems,5502,5502,0.0002\nCC-MAIN-2023-23,application/x-sh,30895,30881,0.0010\nCC-MAIN-2023-23,application/x-shockwave-flash,8143,8140,0.0003\nCC-MAIN-2023-23,application/x-stata-do,22784,22772,0.0007\nCC-MAIN-2023-23,application/x-tex,10471,10468,0.0003\nCC-MAIN-2023-23,application/x-tex-tfm,4369,4369,0.0001\nCC-MAIN-2023-23,application/x-tika-msoffice,67664,67632,0.0022\nCC-MAIN-2023-23,application/x-tika-ooxml,88199,88187,0.0028\nCC-MAIN-2023-23,application/x-wais-source,8655,8655,0.0003\nCC-MAIN-2023-23,application/x-xz,21222,21222,0.0007\nCC-MAIN-2023-23,application/xhtml+xml,344814535,343099038,10.9793\nCC-MAIN-2023-23,application/xml,1858741,1855997,0.0592\nCC-MAIN-2023-23,application/zip,168040,167481,0.0054\nCC-MAIN-2023-23,application/zlib,5581,5451,0.0002\nCC-MAIN-2023-23,application/zstd,882,880,0.0000\nCC-MAIN-2023-23,audio/mp4,569,569,0.0000\nCC-MAIN-2023-23,audio/mpeg,79279,79095,0.0025\nCC-MAIN-2023-23,audio/vnd.wave,11190,11190,0.0004\nCC-MAIN-2023-23,audio/x-mpegurl,5732,5731,0.0002\nCC-MAIN-2023-23,image/gif,113653,113367,0.0036\nCC-MAIN-2023-23,image/jpeg,5167182,5157615,0.1645\nCC-MAIN-2023-23,image/png,987244,984018,0.0314\nCC-MAIN-2023-23,image/svg+xml,30781,30712,0.0010\nCC-MAIN-2023-23,image/tiff,8433,8385,0.0003\nCC-MAIN-2023-23,image/vnd.djvu,12433,12433,0.0004\nCC-MAIN-2023-23,image/vnd.dxf; 
format=ascii,6532,6532,0.0002\nCC-MAIN-2023-23,image/webp,71633,71516,0.0023\nCC-MAIN-2023-23,message/rfc822,70825,70813,0.0023\nCC-MAIN-2023-23,text/asp,7,6,0.0000\nCC-MAIN-2023-23,text/aspdotnet,10,10,0.0000\nCC-MAIN-2023-23,text/calendar,1107423,1106907,0.0353\nCC-MAIN-2023-23,text/css,15686,15684,0.0005\nCC-MAIN-2023-23,text/csv,106584,106489,0.0034\nCC-MAIN-2023-23,text/html,2744692249,2727842718,87.3946\nCC-MAIN-2023-23,text/markdown,83,83,0.0000\nCC-MAIN-2023-23,text/plain,3405763,3403183,0.1084\nCC-MAIN-2023-23,text/prs.lines.tag,142094,142080,0.0045\nCC-MAIN-2023-23,text/tab-separated-values,7970,7965,0.0003\nCC-MAIN-2023-23,text/troff,21866,21866,0.0007\nCC-MAIN-2023-23,text/turtle,44949,44944,0.0014\nCC-MAIN-2023-23,text/vtt,25014,25012,0.0008\nCC-MAIN-2023-23,text/x-c++src,8353,8350,0.0003\nCC-MAIN-2023-23,text/x-chdr,21310,21308,0.0007\nCC-MAIN-2023-23,text/x-csrc,38787,38782,0.0012\nCC-MAIN-2023-23,text/x-diff,43555,43531,0.0014\nCC-MAIN-2023-23,text/x-jsp,4735,4682,0.0002\nCC-MAIN-2023-23,text/x-log,59154,59153,0.0019\nCC-MAIN-2023-23,text/x-matlab,77616,77591,0.0025\nCC-MAIN-2023-23,text/x-perl,61085,61030,0.0019\nCC-MAIN-2023-23,text/x-php,102339,101869,0.0033\nCC-MAIN-2023-23,text/x-python,9456,9450,0.0003\nCC-MAIN-2023-23,text/x-vcalendar,18274,18270,0.0006\nCC-MAIN-2023-23,text/x-vcard,120148,120072,0.0038\nCC-MAIN-2023-23,text/x-web-markdown,11213,11211,0.0004\nCC-MAIN-2023-23,text/x-yaml,16409,16408,0.0005\nCC-MAIN-2023-23,video/mp4,23965,23914,0.0008\nCC-MAIN-2023-23,video/quicktime,3662,3662,0.0001\nCC-MAIN-2023-23,video/webm,1327,1327,0.0000\nCC-MAIN-2023-23,video/x-m4v,571,571,0.0000\nCC-MAIN-2023-40,<other>,419769,419341,0.0122\nCC-MAIN-2023-40,application/atom+xml,3506789,3506193,0.1018\nCC-MAIN-2023-40,application/epub+zip,41352,41304,0.0012\nCC-MAIN-2023-40,application/gpx+xml,14943,14942,0.0004\nCC-MAIN-2023-40,application/gzip,49475,49366,0.0014\nCC-MAIN-2023-40,application/javascript,19564,19547,0.0006\nCC-MAIN-2023-40,application/js
on,694720,694449,0.0202\nCC-MAIN-2023-40,application/marc,35014,35014,0.0010\nCC-MAIN-2023-40,application/mbox,70308,70163,0.0020\nCC-MAIN-2023-40,application/msword,77034,76699,0.0022\nCC-MAIN-2023-40,application/octet-stream,1105482,1104314,0.0321\nCC-MAIN-2023-40,application/pdf,29691380,29623727,0.8619\nCC-MAIN-2023-40,application/pgp-signature,99846,99834,0.0029\nCC-MAIN-2023-40,application/pkcs7-signature,15799,15765,0.0005\nCC-MAIN-2023-40,application/postscript,5869,5867,0.0002\nCC-MAIN-2023-40,application/rdf+xml,290503,290320,0.0084\nCC-MAIN-2023-40,application/rss+xml,3040435,3034082,0.0883\nCC-MAIN-2023-40,application/rtf,43884,43845,0.0013\nCC-MAIN-2023-40,application/text,4257,4257,0.0001\nCC-MAIN-2023-40,application/vnd.android.package-archive,2248,2227,0.0001\nCC-MAIN-2023-40,application/vnd.google-earth.kml+xml,126184,125823,0.0037\nCC-MAIN-2023-40,application/vnd.google-earth.kmz,16492,16486,0.0005\nCC-MAIN-2023-40,application/vnd.ms-excel,47184,47074,0.0014\nCC-MAIN-2023-40,application/vnd.ms-powerpoint,9895,9890,0.0003\nCC-MAIN-2023-40,application/vnd.oasis.opendocument.spreadsheet,9537,9462,0.0003\nCC-MAIN-2023-40,application/vnd.oasis.opendocument.text,30260,30254,0.0009\nCC-MAIN-2023-40,application/vnd.openxmlformats-officedocument.presentationml.presentation,8016,7922,0.0002\nCC-MAIN-2023-40,application/vnd.openxmlformats-officedocument.spreadsheetml.sheet,47238,47025,0.0014\nCC-MAIN-2023-40,application/vnd.openxmlformats-officedocument.wordprocessingml.document,77845,77578,0.0023\nCC-MAIN-2023-40,application/x-bibtex-text-file,306993,306881,0.0089\nCC-MAIN-2023-40,application/x-bittorrent,6514,6508,0.0002\nCC-MAIN-2023-40,application/x-bzip2,990,989,0.0000\nCC-MAIN-2023-40,application/x-dosexec,3260,3229,0.0001\nCC-MAIN-2023-40,application/x-endnote-refer,46437,46397,0.0013\nCC-MAIN-2023-40,application/x-hdf,20866,20866,0.0006\nCC-MAIN-2023-40,application/x-mobipocket-ebook,10274,10258,0.0003\nCC-MAIN-2023-40,application/x-ms-asx,4640,4640,0
.0001\nCC-MAIN-2023-40,application/x-msdownload,3361,3354,0.0001\nCC-MAIN-2023-40,application/x-rar-compressed,184,184,0.0000\nCC-MAIN-2023-40,application/x-research-info-systems,5173,5173,0.0002\nCC-MAIN-2023-40,application/x-sh,38397,38384,0.0011\nCC-MAIN-2023-40,application/x-shockwave-flash,6902,6896,0.0002\nCC-MAIN-2023-40,application/x-stata-do,16693,16686,0.0005\nCC-MAIN-2023-40,application/x-tex,9386,9384,0.0003\nCC-MAIN-2023-40,application/x-tex-tfm,12222,12222,0.0004\nCC-MAIN-2023-40,application/x-tika-msoffice,76195,76139,0.0022\nCC-MAIN-2023-40,application/x-tika-ooxml,89894,89852,0.0026\nCC-MAIN-2023-40,application/x-wais-source,8333,8333,0.0002\nCC-MAIN-2023-40,application/x-xz,8868,8847,0.0003\nCC-MAIN-2023-40,application/xhtml+xml,342637691,340599167,9.9459\nCC-MAIN-2023-40,application/xml,1987307,1984028,0.0577\nCC-MAIN-2023-40,application/zip,165756,164917,0.0048\nCC-MAIN-2023-40,application/zlib,4498,4464,0.0001\nCC-MAIN-2023-40,application/zstd,81,81,0.0000\nCC-MAIN-2023-40,audio/mp4,583,583,0.0000\nCC-MAIN-2023-40,audio/mpeg,70887,70494,0.0021\nCC-MAIN-2023-40,audio/vnd.wave,10061,10061,0.0003\nCC-MAIN-2023-40,audio/x-mpegurl,4867,4867,0.0001\nCC-MAIN-2023-40,image/gif,99820,99502,0.0029\nCC-MAIN-2023-40,image/jpeg,5490775,5478444,0.1594\nCC-MAIN-2023-40,image/png,1038036,1034680,0.0301\nCC-MAIN-2023-40,image/svg+xml,33194,33102,0.0010\nCC-MAIN-2023-40,image/tiff,10009,10008,0.0003\nCC-MAIN-2023-40,image/vnd.djvu,12682,12681,0.0004\nCC-MAIN-2023-40,image/vnd.dxf; 
format=ascii,6585,6583,0.0002\nCC-MAIN-2023-40,image/webp,84302,84064,0.0024\nCC-MAIN-2023-40,message/rfc822,70278,70268,0.0020\nCC-MAIN-2023-40,text/asp,38,38,0.0000\nCC-MAIN-2023-40,text/aspdotnet,8,7,0.0000\nCC-MAIN-2023-40,text/calendar,1153948,1153446,0.0335\nCC-MAIN-2023-40,text/css,18546,18546,0.0005\nCC-MAIN-2023-40,text/csv,106882,106838,0.0031\nCC-MAIN-2023-40,text/html,3047167855,3023298886,88.4515\nCC-MAIN-2023-40,text/markdown,152,152,0.0000\nCC-MAIN-2023-40,text/plain,3660520,3656244,0.1063\nCC-MAIN-2023-40,text/prs.lines.tag,152472,152470,0.0044\nCC-MAIN-2023-40,text/tab-separated-values,6313,6298,0.0002\nCC-MAIN-2023-40,text/troff,17193,17193,0.0005\nCC-MAIN-2023-40,text/turtle,44300,44262,0.0013\nCC-MAIN-2023-40,text/vtt,25265,25221,0.0007\nCC-MAIN-2023-40,text/x-c++src,7694,7694,0.0002\nCC-MAIN-2023-40,text/x-chdr,21027,21026,0.0006\nCC-MAIN-2023-40,text/x-csrc,34272,34261,0.0010\nCC-MAIN-2023-40,text/x-diff,43776,43723,0.0013\nCC-MAIN-2023-40,text/x-jsp,3626,3620,0.0001\nCC-MAIN-2023-40,text/x-log,115442,115442,0.0034\nCC-MAIN-2023-40,text/x-matlab,71243,71199,0.0021\nCC-MAIN-2023-40,text/x-perl,68259,68197,0.0020\nCC-MAIN-2023-40,text/x-php,103198,102544,0.0030\nCC-MAIN-2023-40,text/x-python,11583,11579,0.0003\nCC-MAIN-2023-40,text/x-vcalendar,16237,16232,0.0005\nCC-MAIN-2023-40,text/x-vcard,109672,109613,0.0032\nCC-MAIN-2023-40,text/x-web-markdown,11128,11124,0.0003\nCC-MAIN-2023-40,text/x-yaml,7821,7821,0.0002\nCC-MAIN-2023-40,video/mp4,26519,26483,0.0008\nCC-MAIN-2023-40,video/quicktime,3734,3734,0.0001\nCC-MAIN-2023-40,video/webm,1494,1493,0.0000\nCC-MAIN-2023-40,video/x-m4v,504,504,0.0000\nCC-MAIN-2023-50,<other>,513046,512378,0.0153\nCC-MAIN-2023-50,application/atom+xml,3289037,3288320,0.0981\nCC-MAIN-2023-50,application/epub+zip,53094,52979,0.0016\nCC-MAIN-2023-50,application/gpx+xml,20898,20851,0.0006\nCC-MAIN-2023-50,application/gzip,55480,55173,0.0017\nCC-MAIN-2023-50,application/javascript,23851,23747,0.0007\nCC-MAIN-2023-50,applicatio
n/json,750947,750579,0.0224\nCC-MAIN-2023-50,application/marc,35352,35352,0.0011\nCC-MAIN-2023-50,application/mbox,62012,61989,0.0018\nCC-MAIN-2023-50,application/msword,79612,79337,0.0024\nCC-MAIN-2023-50,application/octet-stream,382118,381226,0.0114\nCC-MAIN-2023-50,application/pdf,34351241,34267536,1.0242\nCC-MAIN-2023-50,application/pgp-signature,86954,86953,0.0026\nCC-MAIN-2023-50,application/pkcs7-signature,18635,18632,0.0006\nCC-MAIN-2023-50,application/postscript,6412,6403,0.0002\nCC-MAIN-2023-50,application/rdf+xml,263515,263212,0.0079\nCC-MAIN-2023-50,application/rss+xml,2966180,2961063,0.0884\nCC-MAIN-2023-50,application/rtf,35148,35132,0.0010\nCC-MAIN-2023-50,application/text,3999,3999,0.0001\nCC-MAIN-2023-50,application/vnd.android.package-archive,2659,2626,0.0001\nCC-MAIN-2023-50,application/vnd.google-earth.kml+xml,86064,85985,0.0026\nCC-MAIN-2023-50,application/vnd.google-earth.kmz,20076,20069,0.0006\nCC-MAIN-2023-50,application/vnd.ms-excel,51895,51816,0.0015\nCC-MAIN-2023-50,application/vnd.ms-powerpoint,9419,9403,0.0003\nCC-MAIN-2023-50,application/vnd.oasis.opendocument.spreadsheet,11960,11913,0.0004\nCC-MAIN-2023-50,application/vnd.oasis.opendocument.text,28999,28956,0.0009\nCC-MAIN-2023-50,application/vnd.openxmlformats-officedocument.presentationml.presentation,8612,8421,0.0003\nCC-MAIN-2023-50,application/vnd.openxmlformats-officedocument.spreadsheetml.sheet,55045,54754,0.0016\nCC-MAIN-2023-50,application/vnd.openxmlformats-officedocument.wordprocessingml.document,84341,83841,0.0025\nCC-MAIN-2023-50,application/x-bibtex-text-file,265564,265477,0.0079\nCC-MAIN-2023-50,application/x-bittorrent,7377,7375,0.0002\nCC-MAIN-2023-50,application/x-bzip2,21619,21618,0.0006\nCC-MAIN-2023-50,application/x-dosexec,2366,2333,0.0001\nCC-MAIN-2023-50,application/x-endnote-refer,44405,44382,0.0013\nCC-MAIN-2023-50,application/x-hdf,22732,22732,0.0007\nCC-MAIN-2023-50,application/x-mobipocket-ebook,16762,16726,0.0005\nCC-MAIN-2023-50,application/x-ms-asx,8592,
8570,0.0003\nCC-MAIN-2023-50,application/x-msdownload,3027,3008,0.0001\nCC-MAIN-2023-50,application/x-pds,29251,29245,0.0009\nCC-MAIN-2023-50,application/x-rar-compressed,132,132,0.0000\nCC-MAIN-2023-50,application/x-research-info-systems,4370,4370,0.0001\nCC-MAIN-2023-50,application/x-sh,34589,34557,0.0010\nCC-MAIN-2023-50,application/x-shockwave-flash,7381,7376,0.0002\nCC-MAIN-2023-50,application/x-stata-do,12401,12400,0.0004\nCC-MAIN-2023-50,application/x-tex,8686,8683,0.0003\nCC-MAIN-2023-50,application/x-tex-tfm,12767,12767,0.0004\nCC-MAIN-2023-50,application/x-tika-msoffice,69424,69399,0.0021\nCC-MAIN-2023-50,application/x-tika-ooxml,93028,93009,0.0028\nCC-MAIN-2023-50,application/x-wais-source,8135,8135,0.0002\nCC-MAIN-2023-50,application/x-xz,6478,6477,0.0002\nCC-MAIN-2023-50,application/xhtml+xml,340326479,337782129,10.1468\nCC-MAIN-2023-50,application/xml,2061713,2056999,0.0615\nCC-MAIN-2023-50,application/zip,173584,172339,0.0052\nCC-MAIN-2023-50,application/zlib,4070,4023,0.0001\nCC-MAIN-2023-50,application/zstd,65,65,0.0000\nCC-MAIN-2023-50,audio/mp4,674,674,0.0000\nCC-MAIN-2023-50,audio/mpeg,62989,62711,0.0019\nCC-MAIN-2023-50,audio/vnd.wave,9585,9585,0.0003\nCC-MAIN-2023-50,audio/x-mpegurl,4967,4967,0.0001\nCC-MAIN-2023-50,image/gif,90000,89648,0.0027\nCC-MAIN-2023-50,image/jpeg,5484562,5474047,0.1635\nCC-MAIN-2023-50,image/png,1026298,1022453,0.0306\nCC-MAIN-2023-50,image/svg+xml,36103,35980,0.0011\nCC-MAIN-2023-50,image/tiff,14608,14604,0.0004\nCC-MAIN-2023-50,image/vnd.djvu,15511,15511,0.0005\nCC-MAIN-2023-50,image/vnd.dxf; 
format=ascii,8987,8986,0.0003\nCC-MAIN-2023-50,image/webp,101142,100813,0.0030\nCC-MAIN-2023-50,message/rfc822,34298,34293,0.0010\nCC-MAIN-2023-50,text/asp,54,54,0.0000\nCC-MAIN-2023-50,text/aspdotnet,13,13,0.0000\nCC-MAIN-2023-50,text/calendar,1175997,1175011,0.0351\nCC-MAIN-2023-50,text/css,17479,17473,0.0005\nCC-MAIN-2023-50,text/csv,111688,111360,0.0033\nCC-MAIN-2023-50,text/html,2955234029,2931729258,88.1096\nCC-MAIN-2023-50,text/markdown,43,43,0.0000\nCC-MAIN-2023-50,text/plain,3081301,3079469,0.0919\nCC-MAIN-2023-50,text/prs.lines.tag,215764,215764,0.0064\nCC-MAIN-2023-50,text/tab-separated-values,11437,11437,0.0003\nCC-MAIN-2023-50,text/troff,19706,19704,0.0006\nCC-MAIN-2023-50,text/turtle,43045,42972,0.0013\nCC-MAIN-2023-50,text/vtt,22106,22105,0.0007\nCC-MAIN-2023-50,text/x-c++src,5765,5762,0.0002\nCC-MAIN-2023-50,text/x-chdr,16776,16776,0.0005\nCC-MAIN-2023-50,text/x-csrc,38930,38914,0.0012\nCC-MAIN-2023-50,text/x-diff,38250,38178,0.0011\nCC-MAIN-2023-50,text/x-jsp,4670,4660,0.0001\nCC-MAIN-2023-50,text/x-log,55939,55932,0.0017\nCC-MAIN-2023-50,text/x-matlab,84816,84783,0.0025\nCC-MAIN-2023-50,text/x-perl,57152,57110,0.0017\nCC-MAIN-2023-50,text/x-php,104354,103914,0.0031\nCC-MAIN-2023-50,text/x-python,12523,12521,0.0004\nCC-MAIN-2023-50,text/x-vcalendar,12873,12871,0.0004\nCC-MAIN-2023-50,text/x-vcard,120302,120231,0.0036\nCC-MAIN-2023-50,text/x-web-markdown,15415,15410,0.0005\nCC-MAIN-2023-50,text/x-yaml,17880,17880,0.0005\nCC-MAIN-2023-50,video/mp4,26206,26146,0.0008\nCC-MAIN-2023-50,video/quicktime,3595,3594,0.0001\nCC-MAIN-2023-50,video/webm,2232,2232,0.0001\nCC-MAIN-2023-50,video/x-m4v,462,462,0.0000\nCC-MAIN-2024-10,<other>,346639,346299,0.0112\nCC-MAIN-2024-10,application/atom+xml,3125723,3125247,0.1006\nCC-MAIN-2024-10,application/epub+zip,51745,51646,0.0017\nCC-MAIN-2024-10,application/gpx+xml,16951,16947,0.0005\nCC-MAIN-2024-10,application/gzip,85,85,0.0000\nCC-MAIN-2024-10,application/javascript,38477,38462,0.0012\nCC-MAIN-2024-10,application/
json,721055,720562,0.0232\nCC-MAIN-2024-10,application/marc,32562,32539,0.0010\nCC-MAIN-2024-10,application/mbox,55220,55140,0.0018\nCC-MAIN-2024-10,application/msword,75372,75188,0.0024\nCC-MAIN-2024-10,application/octet-stream,333740,333350,0.0107\nCC-MAIN-2024-10,application/pdf,29004460,28930825,0.9337\nCC-MAIN-2024-10,application/pgp-signature,85723,85723,0.0028\nCC-MAIN-2024-10,application/pkcs7-signature,13185,13167,0.0004\nCC-MAIN-2024-10,application/postscript,4107,4105,0.0001\nCC-MAIN-2024-10,application/rdf+xml,263760,263565,0.0085\nCC-MAIN-2024-10,application/rss+xml,2729479,2724993,0.0879\nCC-MAIN-2024-10,application/rtf,33948,33925,0.0011\nCC-MAIN-2024-10,application/text,1616,1616,0.0001\nCC-MAIN-2024-10,application/vnd.android.package-archive,20,20,0.0000\nCC-MAIN-2024-10,application/vnd.google-earth.kml+xml,108563,108456,0.0035\nCC-MAIN-2024-10,application/vnd.google-earth.kmz,12124,12097,0.0004\nCC-MAIN-2024-10,application/vnd.ms-excel,48243,48176,0.0016\nCC-MAIN-2024-10,application/vnd.ms-powerpoint,9165,9150,0.0003\nCC-MAIN-2024-10,application/vnd.oasis.opendocument.spreadsheet,11121,11095,0.0004\nCC-MAIN-2024-10,application/vnd.oasis.opendocument.text,26811,26795,0.0009\nCC-MAIN-2024-10,application/vnd.openxmlformats-officedocument.presentationml.presentation,8616,8549,0.0003\nCC-MAIN-2024-10,application/vnd.openxmlformats-officedocument.spreadsheetml.sheet,45668,45394,0.0015\nCC-MAIN-2024-10,application/vnd.openxmlformats-officedocument.wordprocessingml.document,82181,81732,0.0026\nCC-MAIN-2024-10,application/x-bibtex-text-file,273284,273217,0.0088\nCC-MAIN-2024-10,application/x-bittorrent,5524,5521,0.0002\nCC-MAIN-2024-10,application/x-bzip2,1,1,0.0000\nCC-MAIN-2024-10,application/x-dosexec,2,2,0.0000\nCC-MAIN-2024-10,application/x-endnote-refer,37111,37095,0.0012\nCC-MAIN-2024-10,application/x-mobipocket-ebook,15472,15443,0.0005\nCC-MAIN-2024-10,application/x-ms-asx,5222,5215,0.0002\nCC-MAIN-2024-10,application/x-msdownload,133,129,0.0000\nCC
-MAIN-2024-10,application/x-pds,32723,32723,0.0011\nCC-MAIN-2024-10,application/x-rar-compressed,9,9,0.0000\nCC-MAIN-2024-10,application/x-research-info-systems,4901,4901,0.0002\nCC-MAIN-2024-10,application/x-sh,29974,29955,0.0010\nCC-MAIN-2024-10,application/x-shockwave-flash,8250,8244,0.0003\nCC-MAIN-2024-10,application/x-stata-do,10755,10754,0.0003\nCC-MAIN-2024-10,application/x-tex,9452,9439,0.0003\nCC-MAIN-2024-10,application/x-tex-tfm,10180,10180,0.0003\nCC-MAIN-2024-10,application/x-tika-msoffice,65896,65827,0.0021\nCC-MAIN-2024-10,application/x-tika-ooxml,88358,88324,0.0028\nCC-MAIN-2024-10,application/x-wais-source,5889,5889,0.0002\nCC-MAIN-2024-10,application/x-xz,87,87,0.0000\nCC-MAIN-2024-10,application/xhtml+xml,289948688,288140302,9.3335\nCC-MAIN-2024-10,application/xml,1744767,1740824,0.0562\nCC-MAIN-2024-10,application/zip,333,333,0.0000\nCC-MAIN-2024-10,application/zlib,3475,3428,0.0001\nCC-MAIN-2024-10,audio/mpeg,474,474,0.0000\nCC-MAIN-2024-10,audio/vnd.wave,51,51,0.0000\nCC-MAIN-2024-10,audio/x-mpegurl,19,19,0.0000\nCC-MAIN-2024-10,image/gif,165,165,0.0000\nCC-MAIN-2024-10,image/jpeg,6383,6317,0.0002\nCC-MAIN-2024-10,image/png,929,914,0.0000\nCC-MAIN-2024-10,image/svg+xml,44,44,0.0000\nCC-MAIN-2024-10,image/tiff,2,2,0.0000\nCC-MAIN-2024-10,image/webp,43,43,0.0000\nCC-MAIN-2024-10,message/rfc822,22925,22923,0.0007\nCC-MAIN-2024-10,text/asp,23,21,0.0000\nCC-MAIN-2024-10,text/aspdotnet,11,11,0.0000\nCC-MAIN-2024-10,text/calendar,1082932,1082407,0.0349\nCC-MAIN-2024-10,text/css,20439,20437,0.0007\nCC-MAIN-2024-10,text/csv,99177,99078,0.0032\nCC-MAIN-2024-10,text/html,2771905808,2748494425,89.2285\nCC-MAIN-2024-10,text/markdown,36,36,0.0000\nCC-MAIN-2024-10,text/plain,3001118,2998824,0.0966\nCC-MAIN-2024-10,text/prs.lines.tag,186439,186439,0.0060\nCC-MAIN-2024-10,text/tab-separated-values,7550,7549,0.0002\nCC-MAIN-2024-10,text/troff,18831,18831,0.0006\nCC-MAIN-2024-10,text/turtle,49507,49409,0.0016\nCC-MAIN-2024-10,text/vtt,25093,24893,0.0008\nCC-MAIN
-2024-10,text/x-c++src,6200,6196,0.0002\nCC-MAIN-2024-10,text/x-chdr,15402,15401,0.0005\nCC-MAIN-2024-10,text/x-csrc,29273,29266,0.0009\nCC-MAIN-2024-10,text/x-diff,36248,36194,0.0012\nCC-MAIN-2024-10,text/x-jsp,3714,3708,0.0001\nCC-MAIN-2024-10,text/x-log,58604,58604,0.0019\nCC-MAIN-2024-10,text/x-matlab,66868,66809,0.0022\nCC-MAIN-2024-10,text/x-perl,50235,50198,0.0016\nCC-MAIN-2024-10,text/x-php,89119,88679,0.0029\nCC-MAIN-2024-10,text/x-python,11500,11489,0.0004\nCC-MAIN-2024-10,text/x-vcalendar,14942,14935,0.0005\nCC-MAIN-2024-10,text/x-vcard,107433,107373,0.0035\nCC-MAIN-2024-10,text/x-web-markdown,10830,10824,0.0003\nCC-MAIN-2024-10,text/x-yaml,10259,10259,0.0003\nCC-MAIN-2024-10,video/mp4,95,95,0.0000\nCC-MAIN-2024-18,<other>,321353,321142,0.0115\nCC-MAIN-2024-18,application/atom+xml,2812994,2812622,0.1009\nCC-MAIN-2024-18,application/epub+zip,46149,46097,0.0017\nCC-MAIN-2024-18,application/gpx+xml,13919,13919,0.0005\nCC-MAIN-2024-18,application/gzip,60,60,0.0000\nCC-MAIN-2024-18,application/javascript,34218,34189,0.0012\nCC-MAIN-2024-18,application/json,724875,724346,0.0260\nCC-MAIN-2024-18,application/marc,34489,34477,0.0012\nCC-MAIN-2024-18,application/mbox,54472,54458,0.0020\nCC-MAIN-2024-18,application/msword,65063,64913,0.0023\nCC-MAIN-2024-18,application/octet-stream,319705,319406,0.0115\nCC-MAIN-2024-18,application/pdf,25489356,25427012,0.9146\nCC-MAIN-2024-18,application/pgp-signature,78329,78325,0.0028\nCC-MAIN-2024-18,application/pkcs7-signature,11249,11244,0.0004\nCC-MAIN-2024-18,application/postscript,3286,3282,0.0001\nCC-MAIN-2024-18,application/rdf+xml,253871,253651,0.0091\nCC-MAIN-2024-18,application/rss+xml,2446994,2443837,0.0878\nCC-MAIN-2024-18,application/rtf,30427,30410,0.0011\nCC-MAIN-2024-18,application/text,909,909,0.0000\nCC-MAIN-2024-18,application/vnd.android.package-archive,7,7,0.0000\nCC-MAIN-2024-18,application/vnd.google-earth.kml+xml,97169,96796,0.0035\nCC-MAIN-2024-18,application/vnd.google-earth.kmz,11591,11582,0.0004\nCC-MA
IN-2024-18,application/vnd.ms-excel,47949,47872,0.0017\nCC-MAIN-2024-18,application/vnd.ms-powerpoint,8004,7999,0.0003\nCC-MAIN-2024-18,application/vnd.oasis.opendocument.spreadsheet,11497,11467,0.0004\nCC-MAIN-2024-18,application/vnd.oasis.opendocument.text,23460,23447,0.0008\nCC-MAIN-2024-18,application/vnd.openxmlformats-officedocument.presentationml.presentation,6084,6063,0.0002\nCC-MAIN-2024-18,application/vnd.openxmlformats-officedocument.spreadsheetml.sheet,43683,42987,0.0016\nCC-MAIN-2024-18,application/vnd.openxmlformats-officedocument.wordprocessingml.document,70472,70139,0.0025\nCC-MAIN-2024-18,application/x-bibtex-text-file,286914,286616,0.0103\nCC-MAIN-2024-18,application/x-bittorrent,5286,5283,0.0002\nCC-MAIN-2024-18,application/x-dosexec,2,2,0.0000\nCC-MAIN-2024-18,application/x-endnote-refer,43505,43476,0.0016\nCC-MAIN-2024-18,application/x-mobipocket-ebook,14496,14475,0.0005\nCC-MAIN-2024-18,application/x-ms-asx,3664,3662,0.0001\nCC-MAIN-2024-18,application/x-msdownload,95,86,0.0000\nCC-MAIN-2024-18,application/x-pds,50682,50678,0.0018\nCC-MAIN-2024-18,application/x-rar-compressed,1,1,0.0000\nCC-MAIN-2024-18,application/x-research-info-systems,4778,4778,0.0002\nCC-MAIN-2024-18,application/x-sh,28914,28893,0.0010\nCC-MAIN-2024-18,application/x-shockwave-flash,8246,8239,0.0003\nCC-MAIN-2024-18,application/x-stata-do,15203,15202,0.0005\nCC-MAIN-2024-18,application/x-tex,8793,8792,0.0003\nCC-MAIN-2024-18,application/x-tex-tfm,15540,15540,0.0006\nCC-MAIN-2024-18,application/x-tika-msoffice,65878,65825,0.0024\nCC-MAIN-2024-18,application/x-tika-ooxml,81795,81766,0.0029\nCC-MAIN-2024-18,application/x-wais-source,5558,5558,0.0002\nCC-MAIN-2024-18,application/xhtml+xml,261613118,260206969,9.3876\nCC-MAIN-2024-18,application/xml,1688428,1685522,0.0606\nCC-MAIN-2024-18,application/zip,453,453,0.0000\nCC-MAIN-2024-18,application/zlib,3274,3218,0.0001\nCC-MAIN-2024-18,audio/mpeg,571,571,0.0000\nCC-MAIN-2024-18,audio/vnd.wave,14,14,0.0000\nCC-MAIN-2024-18,audio/x
-mpegurl,12,12,0.0000\nCC-MAIN-2024-18,image/gif,92,92,0.0000\nCC-MAIN-2024-18,image/jpeg,4889,4877,0.0002\nCC-MAIN-2024-18,image/png,515,512,0.0000\nCC-MAIN-2024-18,image/svg+xml,50,50,0.0000\nCC-MAIN-2024-18,image/tiff,2,2,0.0000\nCC-MAIN-2024-18,image/vnd.djvu,2,2,0.0000\nCC-MAIN-2024-18,image/webp,31,31,0.0000\nCC-MAIN-2024-18,message/rfc822,14859,14855,0.0005\nCC-MAIN-2024-18,text/asp,13,13,0.0000\nCC-MAIN-2024-18,text/aspdotnet,13,13,0.0000\nCC-MAIN-2024-18,text/calendar,979896,979497,0.0352\nCC-MAIN-2024-18,text/css,19426,19423,0.0007\nCC-MAIN-2024-18,text/csv,88427,87952,0.0032\nCC-MAIN-2024-18,text/html,2484829166,2468098124,89.1642\nCC-MAIN-2024-18,text/markdown,53,53,0.0000\nCC-MAIN-2024-18,text/plain,3015975,3014143,0.1082\nCC-MAIN-2024-18,text/prs.lines.tag,234562,234554,0.0084\nCC-MAIN-2024-18,text/tab-separated-values,6670,6662,0.0002\nCC-MAIN-2024-18,text/troff,25167,25165,0.0009\nCC-MAIN-2024-18,text/turtle,45444,45351,0.0016\nCC-MAIN-2024-18,text/vtt,22580,22563,0.0008\nCC-MAIN-2024-18,text/x-c++src,4899,4895,0.0002\nCC-MAIN-2024-18,text/x-chdr,15170,15163,0.0005\nCC-MAIN-2024-18,text/x-csrc,30196,30171,0.0011\nCC-MAIN-2024-18,text/x-diff,36675,36657,0.0013\nCC-MAIN-2024-18,text/x-jsp,2810,2804,0.0001\nCC-MAIN-2024-18,text/x-log,59015,59014,0.0021\nCC-MAIN-2024-18,text/x-matlab,61670,61644,0.0022\nCC-MAIN-2024-18,text/x-perl,47916,47866,0.0017\nCC-MAIN-2024-18,text/x-php,96507,96222,0.0035\nCC-MAIN-2024-18,text/x-python,14452,14449,0.0005\nCC-MAIN-2024-18,text/x-vcalendar,12496,12495,0.0004\nCC-MAIN-2024-18,text/x-vcard,102147,102117,0.0037\nCC-MAIN-2024-18,text/x-web-markdown,9911,9910,0.0004\nCC-MAIN-2024-18,text/x-yaml,11385,11384,0.0004\nCC-MAIN-2024-18,video/mp4,118,118,0.0000\nCC-MAIN-2024-18,video/webm,4,4,0.0000\nCC-MAIN-2024-22,<other>,314059,313801,0.0116\nCC-MAIN-2024-22,application/atom+xml,2742522,2742205,0.1012\nCC-MAIN-2024-22,application/epub+zip,56138,55958,0.0021\nCC-MAIN-2024-22,application/gpx+xml,13903,13903,0.0005\nCC-MAIN-202
4-22,application/gzip,105,105,0.0000\nCC-MAIN-2024-22,application/javascript,30561,30546,0.0011\nCC-MAIN-2024-22,application/json,684559,684071,0.0253\nCC-MAIN-2024-22,application/marc,33935,33931,0.0013\nCC-MAIN-2024-22,application/mbox,48862,48776,0.0018\nCC-MAIN-2024-22,application/msword,59996,59861,0.0022\nCC-MAIN-2024-22,application/octet-stream,309689,309301,0.0114\nCC-MAIN-2024-22,application/pdf,20978860,20927617,0.7742\nCC-MAIN-2024-22,application/pgp-signature,75101,75101,0.0028\nCC-MAIN-2024-22,application/pkcs7-signature,13193,13191,0.0005\nCC-MAIN-2024-22,application/postscript,5829,5829,0.0002\nCC-MAIN-2024-22,application/rdf+xml,259530,259368,0.0096\nCC-MAIN-2024-22,application/rss+xml,2282800,2279419,0.0842\nCC-MAIN-2024-22,application/rtf,34850,34835,0.0013\nCC-MAIN-2024-22,application/text,232,232,0.0000\nCC-MAIN-2024-22,application/vnd.android.package-archive,6,6,0.0000\nCC-MAIN-2024-22,application/vnd.google-earth.kml+xml,108563,108191,0.0040\nCC-MAIN-2024-22,application/vnd.google-earth.kmz,41341,41340,0.0015\nCC-MAIN-2024-22,application/vnd.ms-excel,37079,36976,0.0014\nCC-MAIN-2024-22,application/vnd.ms-powerpoint,8495,8484,0.0003\nCC-MAIN-2024-22,application/vnd.oasis.opendocument.spreadsheet,11290,11279,0.0004\nCC-MAIN-2024-22,application/vnd.oasis.opendocument.text,21510,21498,0.0008\nCC-MAIN-2024-22,application/vnd.openxmlformats-officedocument.presentationml.presentation,4803,4773,0.0002\nCC-MAIN-2024-22,application/vnd.openxmlformats-officedocument.spreadsheetml.sheet,34974,34791,0.0013\nCC-MAIN-2024-22,application/vnd.openxmlformats-officedocument.wordprocessingml.document,60427,60138,0.0022\nCC-MAIN-2024-22,application/x-bibtex-text-file,263606,263565,0.0097\nCC-MAIN-2024-22,application/x-bittorrent,4787,4787,0.0002\nCC-MAIN-2024-22,application/x-bzip2,45,45,0.0000\nCC-MAIN-2024-22,application/x-endnote-refer,38801,38791,0.0014\nCC-MAIN-2024-22,application/x-mobipocket-ebook,21223,21079,0.0008\nCC-MAIN-2024-22,application/x-ms-asx,2260
,2257,0.0001\nCC-MAIN-2024-22,application/x-msdownload,93,84,0.0000\nCC-MAIN-2024-22,application/x-pds,20397,20393,0.0008\nCC-MAIN-2024-22,application/x-rar-compressed,2,2,0.0000\nCC-MAIN-2024-22,application/x-research-info-systems,5653,5653,0.0002\nCC-MAIN-2024-22,application/x-sh,32597,32587,0.0012\nCC-MAIN-2024-22,application/x-shockwave-flash,7922,7919,0.0003\nCC-MAIN-2024-22,application/x-stata-do,13856,13853,0.0005\nCC-MAIN-2024-22,application/x-tex,10398,10355,0.0004\nCC-MAIN-2024-22,application/x-tex-tfm,8089,8089,0.0003\nCC-MAIN-2024-22,application/x-tika-msoffice,63367,63339,0.0023\nCC-MAIN-2024-22,application/x-tika-ooxml,73528,73511,0.0027\nCC-MAIN-2024-22,application/x-wais-source,5334,5334,0.0002\nCC-MAIN-2024-22,application/x-xz,2,2,0.0000\nCC-MAIN-2024-22,application/xhtml+xml,246672291,245385255,9.1027\nCC-MAIN-2024-22,application/xml,1578558,1576114,0.0583\nCC-MAIN-2024-22,application/zip,1766,1766,0.0001\nCC-MAIN-2024-22,application/zlib,4468,4449,0.0002\nCC-MAIN-2024-22,audio/mpeg,178,178,0.0000\nCC-MAIN-2024-22,audio/vnd.wave,24,24,0.0000\nCC-MAIN-2024-22,audio/x-mpegurl,26,26,0.0000\nCC-MAIN-2024-22,image/gif,72,72,0.0000\nCC-MAIN-2024-22,image/jpeg,5363,5360,0.0002\nCC-MAIN-2024-22,image/png,526,524,0.0000\nCC-MAIN-2024-22,image/svg+xml,39,39,0.0000\nCC-MAIN-2024-22,image/tiff,3,3,0.0000\nCC-MAIN-2024-22,image/vnd.djvu,9,9,0.0000\nCC-MAIN-2024-22,image/webp,18,18,0.0000\nCC-MAIN-2024-22,message/rfc822,16928,16927,0.0006\nCC-MAIN-2024-22,text/asp,24,14,0.0000\nCC-MAIN-2024-22,text/aspdotnet,8,8,0.0000\nCC-MAIN-2024-22,text/calendar,887657,887411,0.0328\nCC-MAIN-2024-22,text/css,20319,20315,0.0007\nCC-MAIN-2024-22,text/csv,91774,91643,0.0034\nCC-MAIN-2024-22,text/html,2428084407,2412498965,89.6012\nCC-MAIN-2024-22,text/markdown,82,82,0.0000\nCC-MAIN-2024-22,text/plain,2892301,2890894,0.1067\nCC-MAIN-2024-22,text/prs.lines.tag,213997,213996,0.0079\nCC-MAIN-2024-22,text/tab-separated-values,9343,9333,0.0003\nCC-MAIN-2024-22,text/troff,19531,19530,
0.0007\nCC-MAIN-2024-22,text/turtle,45271,45236,0.0017\nCC-MAIN-2024-22,text/vtt,20770,20768,0.0008\nCC-MAIN-2024-22,text/x-c++src,5133,5132,0.0002\nCC-MAIN-2024-22,text/x-chdr,13175,13172,0.0005\nCC-MAIN-2024-22,text/x-csrc,26202,26189,0.0010\nCC-MAIN-2024-22,text/x-diff,32389,32385,0.0012\nCC-MAIN-2024-22,text/x-jsp,2530,2524,0.0001\nCC-MAIN-2024-22,text/x-log,54178,54178,0.0020\nCC-MAIN-2024-22,text/x-matlab,59800,59787,0.0022\nCC-MAIN-2024-22,text/x-perl,49492,49399,0.0018\nCC-MAIN-2024-22,text/x-php,93325,93074,0.0034\nCC-MAIN-2024-22,text/x-python,10909,10906,0.0004\nCC-MAIN-2024-22,text/x-vcalendar,12500,12498,0.0005\nCC-MAIN-2024-22,text/x-vcard,88973,88945,0.0033\nCC-MAIN-2024-22,text/x-web-markdown,9541,9531,0.0004\nCC-MAIN-2024-22,text/x-yaml,8785,8785,0.0003\nCC-MAIN-2024-22,video/mp4,115,115,0.0000\nCC-MAIN-2024-22,video/webm,1,1,0.0000\nCC-MAIN-2024-22,video/x-m4v,2,2,0.0000\nCC-MAIN-2024-26,<other>,315101,314891,0.0113\nCC-MAIN-2024-26,application/atom+xml,3272434,3271915,0.1170\nCC-MAIN-2024-26,application/epub+zip,52786,52656,0.0019\nCC-MAIN-2024-26,application/gpx+xml,12999,12999,0.0005\nCC-MAIN-2024-26,application/gzip,43,43,0.0000\nCC-MAIN-2024-26,application/javascript,27735,27728,0.0010\nCC-MAIN-2024-26,application/json,764415,764053,0.0273\nCC-MAIN-2024-26,application/marc,32892,32887,0.0012\nCC-MAIN-2024-26,application/mbox,46177,46130,0.0017\nCC-MAIN-2024-26,application/msword,52395,52311,0.0019\nCC-MAIN-2024-26,application/octet-stream,372970,372744,0.0133\nCC-MAIN-2024-26,application/pdf,20002346,19956706,0.7149\nCC-MAIN-2024-26,application/pgp-signature,67463,67463,0.0024\nCC-MAIN-2024-26,application/pkcs7-signature,14422,14391,0.0005\nCC-MAIN-2024-26,application/postscript,8029,8028,0.0003\nCC-MAIN-2024-26,application/rdf+xml,275904,275774,0.0099\nCC-MAIN-2024-26,application/rss+xml,2503316,2498899,0.0895\nCC-MAIN-2024-26,application/rtf,38869,38856,0.0014\nCC-MAIN-2024-26,application/text,243,243,0.0000\nCC-MAIN-2024-26,application/vnd.
android.package-archive,9,9,0.0000\nCC-MAIN-2024-26,application/vnd.google-earth.kml+xml,101160,101049,0.0036\nCC-MAIN-2024-26,application/vnd.google-earth.kmz,10145,10142,0.0004\nCC-MAIN-2024-26,application/vnd.ms-excel,35987,35947,0.0013\nCC-MAIN-2024-26,application/vnd.ms-powerpoint,6745,6743,0.0002\nCC-MAIN-2024-26,application/vnd.oasis.opendocument.spreadsheet,8621,8612,0.0003\nCC-MAIN-2024-26,application/vnd.oasis.opendocument.text,21698,21688,0.0008\nCC-MAIN-2024-26,application/vnd.openxmlformats-officedocument.presentationml.presentation,5989,5975,0.0002\nCC-MAIN-2024-26,application/vnd.openxmlformats-officedocument.spreadsheetml.sheet,37712,37394,0.0013\nCC-MAIN-2024-26,application/vnd.openxmlformats-officedocument.wordprocessingml.document,60923,60800,0.0022\nCC-MAIN-2024-26,application/x-bibtex-text-file,274360,274306,0.0098\nCC-MAIN-2024-26,application/x-bittorrent,5351,5351,0.0002\nCC-MAIN-2024-26,application/x-bzip2,2,2,0.0000\nCC-MAIN-2024-26,application/x-dosexec,1,1,0.0000\nCC-MAIN-2024-26,application/x-endnote-refer,42105,42090,0.0015\nCC-MAIN-2024-26,application/x-mobipocket-ebook,19751,19650,0.0007\nCC-MAIN-2024-26,application/x-ms-asx,3162,3161,0.0001\nCC-MAIN-2024-26,application/x-msdownload,103,97,0.0000\nCC-MAIN-2024-26,application/x-pds,33522,33522,0.0012\nCC-MAIN-2024-26,application/x-rar-compressed,4,4,0.0000\nCC-MAIN-2024-26,application/x-research-info-systems,4756,4756,0.0002\nCC-MAIN-2024-26,application/x-sh,26032,26013,0.0009\nCC-MAIN-2024-26,application/x-shockwave-flash,5027,5020,0.0002\nCC-MAIN-2024-26,application/x-stata-do,12114,12109,0.0004\nCC-MAIN-2024-26,application/x-tex,6936,6935,0.0002\nCC-MAIN-2024-26,application/x-tex-tfm,14241,14241,0.0005\nCC-MAIN-2024-26,application/x-tika-msoffice,59680,59680,0.0021\nCC-MAIN-2024-26,application/x-tika-ooxml,63740,63724,0.0023\nCC-MAIN-2024-26,application/x-wais-source,6365,6365,0.0002\nCC-MAIN-2024-26,application/x-xz,2,2,0.0000\nCC-MAIN-2024-26,application/xhtml+xml,261168997,2597656
88,9.3340\nCC-MAIN-2024-26,application/xml,1648825,1646512,0.0589\nCC-MAIN-2024-26,application/zip,1426,1426,0.0001\nCC-MAIN-2024-26,application/zlib,6991,6946,0.0002\nCC-MAIN-2024-26,audio/mpeg,144,144,0.0000\nCC-MAIN-2024-26,audio/vnd.wave,32,32,0.0000\nCC-MAIN-2024-26,audio/x-mpegurl,26,26,0.0000\nCC-MAIN-2024-26,image/gif,175,175,0.0000\nCC-MAIN-2024-26,image/jpeg,5616,5614,0.0002\nCC-MAIN-2024-26,image/png,575,575,0.0000\nCC-MAIN-2024-26,image/svg+xml,14,14,0.0000\nCC-MAIN-2024-26,image/tiff,6,6,0.0000\nCC-MAIN-2024-26,image/webp,14,14,0.0000\nCC-MAIN-2024-26,message/rfc822,17697,17695,0.0006\nCC-MAIN-2024-26,text/asp,4,4,0.0000\nCC-MAIN-2024-26,text/aspdotnet,6,6,0.0000\nCC-MAIN-2024-26,text/calendar,983594,983224,0.0352\nCC-MAIN-2024-26,text/css,22535,22531,0.0008\nCC-MAIN-2024-26,text/csv,103158,103078,0.0037\nCC-MAIN-2024-26,text/html,2501407019,2485399052,89.3983\nCC-MAIN-2024-26,text/markdown,94,94,0.0000\nCC-MAIN-2024-26,text/plain,3090459,3088619,0.1105\nCC-MAIN-2024-26,text/prs.lines.tag,227616,227606,0.0081\nCC-MAIN-2024-26,text/tab-separated-values,7035,7034,0.0003\nCC-MAIN-2024-26,text/troff,24546,24543,0.0009\nCC-MAIN-2024-26,text/turtle,53139,53133,0.0019\nCC-MAIN-2024-26,text/vtt,19812,19733,0.0007\nCC-MAIN-2024-26,text/x-c++src,5412,5410,0.0002\nCC-MAIN-2024-26,text/x-chdr,16617,16614,0.0006\nCC-MAIN-2024-26,text/x-csrc,27473,27471,0.0010\nCC-MAIN-2024-26,text/x-diff,39661,39650,0.0014\nCC-MAIN-2024-26,text/x-jsp,2081,2078,0.0001\nCC-MAIN-2024-26,text/x-log,91422,91418,0.0033\nCC-MAIN-2024-26,text/x-matlab,64488,64476,0.0023\nCC-MAIN-2024-26,text/x-perl,43858,43842,0.0016\nCC-MAIN-2024-26,text/x-php,102949,102544,0.0037\nCC-MAIN-2024-26,text/x-python,8543,8542,0.0003\nCC-MAIN-2024-26,text/x-vcalendar,13320,13313,0.0005\nCC-MAIN-2024-26,text/x-vcard,93575,93543,0.0033\nCC-MAIN-2024-26,text/x-web-markdown,10675,10670,0.0004\nCC-MAIN-2024-26,text/x-yaml,10597,10595,0.0004\nCC-MAIN-2024-26,video/mp4,17,17,0.0000\nCC-MAIN-2024-26,video/webm,1,1,0.000
0\nCC-MAIN-2024-30,<other>,325872,325398,0.0128\nCC-MAIN-2024-30,application/atom+xml,2662152,2661909,0.1045\nCC-MAIN-2024-30,application/epub+zip,51074,50954,0.0020\nCC-MAIN-2024-30,application/gpx+xml,13731,13729,0.0005\nCC-MAIN-2024-30,application/gzip,19,19,0.0000\nCC-MAIN-2024-30,application/javascript,11385,11361,0.0004\nCC-MAIN-2024-30,application/json,757719,757420,0.0298\nCC-MAIN-2024-30,application/marc,35251,35250,0.0014\nCC-MAIN-2024-30,application/mbox,54111,54049,0.0021\nCC-MAIN-2024-30,application/msword,56502,56403,0.0022\nCC-MAIN-2024-30,application/octet-stream,405149,404800,0.0159\nCC-MAIN-2024-30,application/pdf,24127180,24083853,0.9474\nCC-MAIN-2024-30,application/pgp-signature,96420,96419,0.0038\nCC-MAIN-2024-30,application/pkcs7-signature,13585,13581,0.0005\nCC-MAIN-2024-30,application/postscript,7128,7128,0.0003\nCC-MAIN-2024-30,application/rdf+xml,264284,263613,0.0104\nCC-MAIN-2024-30,application/rss+xml,2325264,2322511,0.0913\nCC-MAIN-2024-30,application/rtf,43917,43900,0.0017\nCC-MAIN-2024-30,application/text,152,152,0.0000\nCC-MAIN-2024-30,application/vnd.android.package-archive,11,11,0.0000\nCC-MAIN-2024-30,application/vnd.google-earth.kml+xml,110864,110511,0.0044\nCC-MAIN-2024-30,application/vnd.google-earth.kmz,19622,19622,0.0008\nCC-MAIN-2024-30,application/vnd.ms-excel,44119,44011,0.0017\nCC-MAIN-2024-30,application/vnd.ms-powerpoint,7086,7079,0.0003\nCC-MAIN-2024-30,application/vnd.oasis.opendocument.spreadsheet,10770,10758,0.0004\nCC-MAIN-2024-30,application/vnd.oasis.opendocument.text,22693,22685,0.0009\nCC-MAIN-2024-30,application/vnd.openxmlformats-officedocument.presentationml.presentation,6601,6587,0.0003\nCC-MAIN-2024-30,application/vnd.openxmlformats-officedocument.spreadsheetml.sheet,39338,38498,0.0015\nCC-MAIN-2024-30,application/vnd.openxmlformats-officedocument.wordprocessingml.document,64816,64517,0.0025\nCC-MAIN-2024-30,application/x-bibtex-text-file,273573,273509,0.0107\nCC-MAIN-2024-30,application/x-bittorrent,5234,5
233,0.0002\nCC-MAIN-2024-30,application/x-bzip2,1,1,0.0000\nCC-MAIN-2024-30,application/x-dosexec,3,3,0.0000\nCC-MAIN-2024-30,application/x-endnote-refer,48424,48404,0.0019\nCC-MAIN-2024-30,application/x-mobipocket-ebook,18275,18163,0.0007\nCC-MAIN-2024-30,application/x-ms-asx,4147,4146,0.0002\nCC-MAIN-2024-30,application/x-msdownload,42,37,0.0000\nCC-MAIN-2024-30,application/x-pds,38388,38388,0.0015\nCC-MAIN-2024-30,application/x-rar-compressed,4,4,0.0000\nCC-MAIN-2024-30,application/x-research-info-systems,5255,5255,0.0002\nCC-MAIN-2024-30,application/x-sh,28719,28705,0.0011\nCC-MAIN-2024-30,application/x-shockwave-flash,6510,6499,0.0003\nCC-MAIN-2024-30,application/x-stata-do,11585,11584,0.0005\nCC-MAIN-2024-30,application/x-tex,7499,7499,0.0003\nCC-MAIN-2024-30,application/x-tex-tfm,14789,14789,0.0006\nCC-MAIN-2024-30,application/x-tika-msoffice,63055,63046,0.0025\nCC-MAIN-2024-30,application/x-tika-ooxml,80483,80463,0.0032\nCC-MAIN-2024-30,application/x-wais-source,5199,5199,0.0002\nCC-MAIN-2024-30,application/x-xz,1,1,0.0000\nCC-MAIN-2024-30,application/xhtml+xml,238373523,237198953,9.3604\nCC-MAIN-2024-30,application/xml,2705024,2703193,0.1062\nCC-MAIN-2024-30,application/zip,780,779,0.0000\nCC-MAIN-2024-30,application/zlib,4558,4521,0.0002\nCC-MAIN-2024-30,audio/mpeg,310,310,0.0000\nCC-MAIN-2024-30,audio/vnd.wave,31,31,0.0000\nCC-MAIN-2024-30,audio/x-mpegurl,24,24,0.0000\nCC-MAIN-2024-30,image/gif,109,109,0.0000\nCC-MAIN-2024-30,image/jpeg,5353,5352,0.0002\nCC-MAIN-2024-30,image/png,997,993,0.0000\nCC-MAIN-2024-30,image/svg+xml,102,102,0.0000\nCC-MAIN-2024-30,image/tiff,1,1,0.0000\nCC-MAIN-2024-30,image/vnd.djvu,1,1,0.0000\nCC-MAIN-2024-30,image/webp,27,27,0.0000\nCC-MAIN-2024-30,message/rfc822,23861,23861,0.0009\nCC-MAIN-2024-30,text/asp,4,4,0.0000\nCC-MAIN-2024-30,text/aspdotnet,4,4,0.0000\nCC-MAIN-2024-30,text/calendar,934168,933925,0.0367\nCC-MAIN-2024-30,text/css,19191,19189,0.0008\nCC-MAIN-2024-30,text/csv,98160,97386,0.0039\nCC-MAIN-2024-30,text/html,
2268436770,2255456000,89.0760\nCC-MAIN-2024-30,text/markdown,64,64,0.0000\nCC-MAIN-2024-30,text/plain,2978108,2975752,0.1169\nCC-MAIN-2024-30,text/prs.lines.tag,270939,270932,0.0106\nCC-MAIN-2024-30,text/tab-separated-values,6988,6985,0.0003\nCC-MAIN-2024-30,text/troff,18247,18245,0.0007\nCC-MAIN-2024-30,text/turtle,54211,53873,0.0021\nCC-MAIN-2024-30,text/vtt,20692,20670,0.0008\nCC-MAIN-2024-30,text/x-c++src,4864,4864,0.0002\nCC-MAIN-2024-30,text/x-chdr,13331,13331,0.0005\nCC-MAIN-2024-30,text/x-csrc,22903,22901,0.0009\nCC-MAIN-2024-30,text/x-diff,47345,47332,0.0019\nCC-MAIN-2024-30,text/x-jsp,2460,2457,0.0001\nCC-MAIN-2024-30,text/x-log,65906,65905,0.0026\nCC-MAIN-2024-30,text/x-matlab,58755,58746,0.0023\nCC-MAIN-2024-30,text/x-perl,48032,48004,0.0019\nCC-MAIN-2024-30,text/x-php,90884,90617,0.0036\nCC-MAIN-2024-30,text/x-python,9590,9584,0.0004\nCC-MAIN-2024-30,text/x-vcalendar,13002,13001,0.0005\nCC-MAIN-2024-30,text/x-vcard,93103,93057,0.0037\nCC-MAIN-2024-30,text/x-web-markdown,10081,10076,0.0004\nCC-MAIN-2024-30,text/x-yaml,9823,9821,0.0004\nCC-MAIN-2024-30,video/mp4,60,60,0.0000\nCC-MAIN-2024-30,video/quicktime,3,3,0.0000\nCC-MAIN-2024-30,video/webm,5,5,0.0000\nCC-MAIN-2024-33,<other>,312510,312216,0.0135\nCC-MAIN-2024-33,application/atom+xml,2590140,2589913,0.1118\nCC-MAIN-2024-33,application/epub+zip,43942,43880,0.0019\nCC-MAIN-2024-33,application/gpx+xml,15943,15943,0.0007\nCC-MAIN-2024-33,application/gzip,51,51,0.0000\nCC-MAIN-2024-33,application/javascript,10629,10619,0.0005\nCC-MAIN-2024-33,application/json,740075,739641,0.0320\nCC-MAIN-2024-33,application/marc,33676,33672,0.0015\nCC-MAIN-2024-33,application/mbox,47416,47359,0.0020\nCC-MAIN-2024-33,application/msword,61889,61725,0.0027\nCC-MAIN-2024-33,application/octet-stream,306386,306085,0.0132\nCC-MAIN-2024-33,application/pdf,21700633,21655275,0.9370\nCC-MAIN-2024-33,application/pgp-signature,87497,87497,0.0038\nCC-MAIN-2024-33,application/pkcs7-signature,10936,10928,0.0005\nCC-MAIN-2024-33,applicat
ion/postscript,8210,8205,0.0004\nCC-MAIN-2024-33,application/rdf+xml,250641,250318,0.0108\nCC-MAIN-2024-33,application/rss+xml,2178808,2176448,0.0941\nCC-MAIN-2024-33,application/rtf,42158,42148,0.0018\nCC-MAIN-2024-33,application/text,186,186,0.0000\nCC-MAIN-2024-33,application/vnd.android.package-archive,5,5,0.0000\nCC-MAIN-2024-33,application/vnd.google-earth.kml+xml,62624,62349,0.0027\nCC-MAIN-2024-33,application/vnd.google-earth.kmz,17740,17738,0.0008\nCC-MAIN-2024-33,application/vnd.ms-excel,43873,43831,0.0019\nCC-MAIN-2024-33,application/vnd.ms-powerpoint,7189,7162,0.0003\nCC-MAIN-2024-33,application/vnd.oasis.opendocument.spreadsheet,8684,8670,0.0004\nCC-MAIN-2024-33,application/vnd.oasis.opendocument.text,20244,20199,0.0009\nCC-MAIN-2024-33,application/vnd.openxmlformats-officedocument.presentationml.presentation,5317,5257,0.0002\nCC-MAIN-2024-33,application/vnd.openxmlformats-officedocument.spreadsheetml.sheet,37661,37518,0.0016\nCC-MAIN-2024-33,application/vnd.openxmlformats-officedocument.wordprocessingml.document,60072,59777,0.0026\nCC-MAIN-2024-33,application/x-bibtex-text-file,264054,263902,0.0114\nCC-MAIN-2024-33,application/x-bittorrent,6262,6262,0.0003\nCC-MAIN-2024-33,application/x-bzip2,1,1,0.0000\nCC-MAIN-2024-33,application/x-dosexec,4,4,0.0000\nCC-MAIN-2024-33,application/x-endnote-refer,42820,42811,0.0018\nCC-MAIN-2024-33,application/x-mobipocket-ebook,17373,17319,0.0008\nCC-MAIN-2024-33,application/x-ms-asx,2545,2544,0.0001\nCC-MAIN-2024-33,application/x-msdownload,29,27,0.0000\nCC-MAIN-2024-33,application/x-pds,127223,127223,0.0055\nCC-MAIN-2024-33,application/x-rar-compressed,7,7,0.0000\nCC-MAIN-2024-33,application/x-research-info-systems,5730,5730,0.0002\nCC-MAIN-2024-33,application/x-sh,29932,29918,0.0013\nCC-MAIN-2024-33,application/x-shockwave-flash,5009,5005,0.0002\nCC-MAIN-2024-33,application/x-stata-do,10166,10164,0.0004\nCC-MAIN-2024-33,application/x-tex,7378,7373,0.0003\nCC-MAIN-2024-33,application/x-tex-tfm,25706,25706,0.0011\nCC
-MAIN-2024-33,application/x-tika-msoffice,66643,66634,0.0029\nCC-MAIN-2024-33,application/x-tika-ooxml,87852,87844,0.0038\nCC-MAIN-2024-33,application/x-wais-source,7454,7452,0.0003\nCC-MAIN-2024-33,application/x-xz,1,1,0.0000\nCC-MAIN-2024-33,application/xhtml+xml,218850044,217838598,9.4498\nCC-MAIN-2024-33,application/xml,1624581,1622803,0.0701\nCC-MAIN-2024-33,application/zip,796,796,0.0000\nCC-MAIN-2024-33,application/zlib,4327,4292,0.0002\nCC-MAIN-2024-33,audio/mpeg,477,477,0.0000\nCC-MAIN-2024-33,audio/vnd.wave,53,53,0.0000\nCC-MAIN-2024-33,audio/x-mpegurl,25,25,0.0000\nCC-MAIN-2024-33,image/gif,72,72,0.0000\nCC-MAIN-2024-33,image/jpeg,6130,6124,0.0003\nCC-MAIN-2024-33,image/png,990,990,0.0000\nCC-MAIN-2024-33,image/svg+xml,36,36,0.0000\nCC-MAIN-2024-33,image/tiff,6,6,0.0000\nCC-MAIN-2024-33,image/vnd.djvu,7,7,0.0000\nCC-MAIN-2024-33,image/webp,40,40,0.0000\nCC-MAIN-2024-33,message/rfc822,15411,15409,0.0007\nCC-MAIN-2024-33,text/asp,1,1,0.0000\nCC-MAIN-2024-33,text/aspdotnet,7,7,0.0000\nCC-MAIN-2024-33,text/calendar,844766,844542,0.0365\nCC-MAIN-2024-33,text/css,18718,18714,0.0008\nCC-MAIN-2024-33,text/csv,98267,97624,0.0042\nCC-MAIN-2024-33,text/html,2061214084,2049829982,89.0017\nCC-MAIN-2024-33,text/markdown,50,50,0.0000\nCC-MAIN-2024-33,text/plain,3011072,3004720,0.1300\nCC-MAIN-2024-33,text/prs.lines.tag,265043,265024,0.0114\nCC-MAIN-2024-33,text/tab-separated-values,5208,5207,0.0002\nCC-MAIN-2024-33,text/troff,19117,19116,0.0008\nCC-MAIN-2024-33,text/turtle,49022,49004,0.0021\nCC-MAIN-2024-33,text/vtt,17316,17310,0.0007\nCC-MAIN-2024-33,text/x-c++src,3960,3960,0.0002\nCC-MAIN-2024-33,text/x-chdr,13370,13369,0.0006\nCC-MAIN-2024-33,text/x-csrc,27239,27234,0.0012\nCC-MAIN-2024-33,text/x-diff,31274,31270,0.0014\nCC-MAIN-2024-33,text/x-jsp,2754,2748,0.0001\nCC-MAIN-2024-33,text/x-log,80292,80292,0.0035\nCC-MAIN-2024-33,text/x-matlab,58903,58891,0.0025\nCC-MAIN-2024-33,text/x-perl,48739,48735,0.0021\nCC-MAIN-2024-33,text/x-php,76640,76345,0.0033\nCC-MAIN-2024
-33,text/x-python,9600,9597,0.0004\nCC-MAIN-2024-33,text/x-vcalendar,10801,10800,0.0005\nCC-MAIN-2024-33,text/x-vcard,88814,88781,0.0038\nCC-MAIN-2024-33,text/x-web-markdown,8801,8799,0.0004\nCC-MAIN-2024-33,text/x-yaml,8182,8181,0.0004\nCC-MAIN-2024-33,video/mp4,56,56,0.0000\nCC-MAIN-2024-33,video/webm,1,1,0.0000\nCC-MAIN-2024-38,<other>,353407,353137,0.0126\nCC-MAIN-2024-38,application/atom+xml,2852501,2852201,0.1018\nCC-MAIN-2024-38,application/epub+zip,37214,37121,0.0013\nCC-MAIN-2024-38,application/gpx+xml,13690,13687,0.0005\nCC-MAIN-2024-38,application/gzip,35,35,0.0000\nCC-MAIN-2024-38,application/javascript,12037,12035,0.0004\nCC-MAIN-2024-38,application/json,738988,738483,0.0264\nCC-MAIN-2024-38,application/marc,35184,35176,0.0013\nCC-MAIN-2024-38,application/mbox,45275,45244,0.0016\nCC-MAIN-2024-38,application/msword,48820,48694,0.0017\nCC-MAIN-2024-38,application/octet-stream,382942,382658,0.0137\nCC-MAIN-2024-38,application/pdf,17247835,17208061,0.6158\nCC-MAIN-2024-38,application/pgp-signature,65409,65408,0.0023\nCC-MAIN-2024-38,application/pkcs7-signature,8900,8891,0.0003\nCC-MAIN-2024-38,application/postscript,7272,7272,0.0003\nCC-MAIN-2024-38,application/rdf+xml,252361,252114,0.0090\nCC-MAIN-2024-38,application/rss+xml,2213051,2210613,0.0790\nCC-MAIN-2024-38,application/rtf,35771,35756,0.0013\nCC-MAIN-2024-38,application/text,613,613,0.0000\nCC-MAIN-2024-38,application/vnd.google-earth.kml+xml,65093,64828,0.0023\nCC-MAIN-2024-38,application/vnd.google-earth.kmz,16723,16722,0.0006\nCC-MAIN-2024-38,application/vnd.ms-excel,34895,34728,0.0012\nCC-MAIN-2024-38,application/vnd.ms-powerpoint,8675,8661,0.0003\nCC-MAIN-2024-38,application/vnd.oasis.opendocument.spreadsheet,7879,7867,0.0003\nCC-MAIN-2024-38,application/vnd.oasis.opendocument.text,17180,17176,0.0006\nCC-MAIN-2024-38,application/vnd.openxmlformats-officedocument.presentationml.presentation,4538,4515,0.0002\nCC-MAIN-2024-38,application/vnd.openxmlformats-officedocument.spreadsheetml.sheet,32595,
32270,0.0012\nCC-MAIN-2024-38,application/vnd.openxmlformats-officedocument.wordprocessingml.document,49672,49356,0.0018\nCC-MAIN-2024-38,application/x-bibtex-text-file,269010,268935,0.0096\nCC-MAIN-2024-38,application/x-bittorrent,5323,5322,0.0002\nCC-MAIN-2024-38,application/x-dosexec,1,1,0.0000\nCC-MAIN-2024-38,application/x-endnote-refer,43222,43209,0.0015\nCC-MAIN-2024-38,application/x-mobipocket-ebook,14881,14817,0.0005\nCC-MAIN-2024-38,application/x-ms-asx,3658,3654,0.0001\nCC-MAIN-2024-38,application/x-msdownload,72,70,0.0000\nCC-MAIN-2024-38,application/x-pds,60893,60893,0.0022\nCC-MAIN-2024-38,application/x-rar-compressed,1,1,0.0000\nCC-MAIN-2024-38,application/x-research-info-systems,5957,5954,0.0002\nCC-MAIN-2024-38,application/x-sh,26616,26601,0.0010\nCC-MAIN-2024-38,application/x-shockwave-flash,4965,4959,0.0002\nCC-MAIN-2024-38,application/x-stata-do,11181,11181,0.0004\nCC-MAIN-2024-38,application/x-tex,11007,11006,0.0004\nCC-MAIN-2024-38,application/x-tex-tfm,21629,21629,0.0008\nCC-MAIN-2024-38,application/x-tika-msoffice,58436,58428,0.0021\nCC-MAIN-2024-38,application/x-tika-ooxml,67497,67472,0.0024\nCC-MAIN-2024-38,application/x-wais-source,7641,7639,0.0003\nCC-MAIN-2024-38,application/x-xz,4,4,0.0000\nCC-MAIN-2024-38,application/xhtml+xml,243654091,242611723,8.6992\nCC-MAIN-2024-38,application/xml,1635084,1633252,0.0584\nCC-MAIN-2024-38,application/zip,590,590,0.0000\nCC-MAIN-2024-38,application/zlib,2127,2102,0.0001\nCC-MAIN-2024-38,audio/mpeg,487,487,0.0000\nCC-MAIN-2024-38,audio/vnd.wave,56,56,0.0000\nCC-MAIN-2024-38,audio/x-mpegurl,21,21,0.0000\nCC-MAIN-2024-38,image/gif,64,62,0.0000\nCC-MAIN-2024-38,image/jpeg,5213,5212,0.0002\nCC-MAIN-2024-38,image/png,352,351,0.0000\nCC-MAIN-2024-38,image/svg+xml,60,60,0.0000\nCC-MAIN-2024-38,image/webp,25,25,0.0000\nCC-MAIN-2024-38,message/rfc822,22877,22873,0.0008\nCC-MAIN-2024-38,text/asp,3,3,0.0000\nCC-MAIN-2024-38,text/aspdotnet,5,5,0.0000\nCC-MAIN-2024-38,text/calendar,809261,809014,0.0289\nCC-MAIN-20
24-38,text/css,17329,17327,0.0006\nCC-MAIN-2024-38,text/csv,91259,91029,0.0033\nCC-MAIN-2024-38,text/html,2525241904,2512213727,90.1584\nCC-MAIN-2024-38,text/markdown,22,22,0.0000\nCC-MAIN-2024-38,text/plain,3417666,3412936,0.1220\nCC-MAIN-2024-38,text/prs.lines.tag,228369,228368,0.0082\nCC-MAIN-2024-38,text/tab-separated-values,5384,5380,0.0002\nCC-MAIN-2024-38,text/troff,20837,20835,0.0007\nCC-MAIN-2024-38,text/turtle,52502,52319,0.0019\nCC-MAIN-2024-38,text/vtt,15459,15454,0.0006\nCC-MAIN-2024-38,text/x-c++src,5200,5198,0.0002\nCC-MAIN-2024-38,text/x-chdr,11639,11637,0.0004\nCC-MAIN-2024-38,text/x-csrc,19890,19888,0.0007\nCC-MAIN-2024-38,text/x-diff,34576,34570,0.0012\nCC-MAIN-2024-38,text/x-jsp,2969,2965,0.0001\nCC-MAIN-2024-38,text/x-log,78146,78146,0.0028\nCC-MAIN-2024-38,text/x-matlab,61761,61753,0.0022\nCC-MAIN-2024-38,text/x-perl,45908,45906,0.0016\nCC-MAIN-2024-38,text/x-php,88007,87810,0.0031\nCC-MAIN-2024-38,text/x-python,9283,9282,0.0003\nCC-MAIN-2024-38,text/x-vcalendar,12346,12344,0.0004\nCC-MAIN-2024-38,text/x-vcard,85204,85172,0.0030\nCC-MAIN-2024-38,text/x-web-markdown,9824,9820,0.0004\nCC-MAIN-2024-38,text/x-yaml,7058,7058,0.0003\nCC-MAIN-2024-38,video/mp4,48,48,0.0000\nCC-MAIN-2024-38,video/quicktime,1,1,0.0000\nCC-MAIN-2024-38,video/webm,6,6,0.0000\nCC-MAIN-2024-38,video/x-m4v,1,1,0.0000\nCC-MAIN-2024-42,<other>,356302,355791,0.0143\nCC-MAIN-2024-42,application/atom+xml,2821050,2820781,0.1131\nCC-MAIN-2024-42,application/epub+zip,51705,51534,0.0021\nCC-MAIN-2024-42,application/gpx+xml,18763,18763,0.0008\nCC-MAIN-2024-42,application/gzip,51,51,0.0000\nCC-MAIN-2024-42,application/javascript,12112,12102,0.0005\nCC-MAIN-2024-42,application/json,762125,761653,0.0305\nCC-MAIN-2024-42,application/marc,36110,36110,0.0014\nCC-MAIN-2024-42,application/mbox,50808,50775,0.0020\nCC-MAIN-2024-42,application/msword,66571,66434,0.0027\nCC-MAIN-2024-42,application/octet-stream,359472,359174,0.0144\nCC-MAIN-2024-42,application/pdf,25859011,25804344,1.0364\nCC-MAI
N-2024-42,application/pgp-signature,108808,108808,0.0044\nCC-MAIN-2024-42,application/pkcs7-signature,12559,12559,0.0005\nCC-MAIN-2024-42,application/postscript,7426,7426,0.0003\nCC-MAIN-2024-42,application/rdf+xml,245905,245780,0.0099\nCC-MAIN-2024-42,application/rss+xml,2267157,2264999,0.0909\nCC-MAIN-2024-42,application/rtf,35748,35745,0.0014\nCC-MAIN-2024-42,application/text,767,767,0.0000\nCC-MAIN-2024-42,application/vnd.android.package-archive,3,3,0.0000\nCC-MAIN-2024-42,application/vnd.google-earth.kml+xml,63539,63476,0.0025\nCC-MAIN-2024-42,application/vnd.google-earth.kmz,21382,21377,0.0009\nCC-MAIN-2024-42,application/vnd.ms-excel,26630,26544,0.0011\nCC-MAIN-2024-42,application/vnd.ms-powerpoint,8945,8939,0.0004\nCC-MAIN-2024-42,application/vnd.oasis.opendocument.spreadsheet,15618,15606,0.0006\nCC-MAIN-2024-42,application/vnd.oasis.opendocument.text,23608,23608,0.0009\nCC-MAIN-2024-42,application/vnd.openxmlformats-officedocument.presentationml.presentation,6321,6277,0.0003\nCC-MAIN-2024-42,application/vnd.openxmlformats-officedocument.spreadsheetml.sheet,41312,40947,0.0017\nCC-MAIN-2024-42,application/vnd.openxmlformats-officedocument.wordprocessingml.document,68137,67872,0.0027\nCC-MAIN-2024-42,application/x-bibtex-text-file,299847,299794,0.0120\nCC-MAIN-2024-42,application/x-bittorrent,6503,6503,0.0003\nCC-MAIN-2024-42,application/x-dosexec,1,1,0.0000\nCC-MAIN-2024-42,application/x-endnote-refer,49124,49119,0.0020\nCC-MAIN-2024-42,application/x-mobipocket-ebook,19482,19340,0.0008\nCC-MAIN-2024-42,application/x-ms-asx,5231,5231,0.0002\nCC-MAIN-2024-42,application/x-msdownload,93,90,0.0000\nCC-MAIN-2024-42,application/x-pds,55503,55503,0.0022\nCC-MAIN-2024-42,application/x-rar-compressed,1,1,0.0000\nCC-MAIN-2024-42,application/x-research-info-systems,5090,5088,0.0002\nCC-MAIN-2024-42,application/x-sh,26415,26401,0.0011\nCC-MAIN-2024-42,application/x-shockwave-flash,5834,5824,0.0002\nCC-MAIN-2024-42,application/x-stata-do,9958,9956,0.0004\nCC-MAIN-2024-42,
application/x-tex,9481,9477,0.0004\nCC-MAIN-2024-42,application/x-tex-tfm,24498,24498,0.0010\nCC-MAIN-2024-42,application/x-tika-msoffice,67775,67767,0.0027\nCC-MAIN-2024-42,application/x-tika-ooxml,62721,62718,0.0025\nCC-MAIN-2024-42,application/x-wais-source,6814,6814,0.0003\nCC-MAIN-2024-42,application/xhtml+xml,228753437,227720980,9.1678\nCC-MAIN-2024-42,application/xml,1665404,1663514,0.0667\nCC-MAIN-2024-42,application/zip,817,817,0.0000\nCC-MAIN-2024-42,application/zlib,3695,3651,0.0001\nCC-MAIN-2024-42,audio/mpeg,329,329,0.0000\nCC-MAIN-2024-42,audio/vnd.wave,34,34,0.0000\nCC-MAIN-2024-42,audio/x-mpegurl,21,21,0.0000\nCC-MAIN-2024-42,image/gif,154,153,0.0000\nCC-MAIN-2024-42,image/jpeg,6241,6241,0.0003\nCC-MAIN-2024-42,image/png,545,538,0.0000\nCC-MAIN-2024-42,image/svg+xml,48,48,0.0000\nCC-MAIN-2024-42,image/tiff,11,11,0.0000\nCC-MAIN-2024-42,image/vnd.djvu,2,2,0.0000\nCC-MAIN-2024-42,image/webp,21,21,0.0000\nCC-MAIN-2024-42,message/rfc822,20686,20682,0.0008\nCC-MAIN-2024-42,text/asp,5,4,0.0000\nCC-MAIN-2024-42,text/aspdotnet,1,1,0.0000\nCC-MAIN-2024-42,text/calendar,998347,998092,0.0400\nCC-MAIN-2024-42,text/css,17073,17071,0.0007\nCC-MAIN-2024-42,text/csv,97807,97009,0.0039\nCC-MAIN-2024-42,text/html,2224818659,2212809426,89.1643\nCC-MAIN-2024-42,text/markdown,47,47,0.0000\nCC-MAIN-2024-42,text/plain,3978591,3950429,0.1595\nCC-MAIN-2024-42,text/prs.lines.tag,232556,232540,0.0093\nCC-MAIN-2024-42,text/tab-separated-values,7189,7188,0.0003\nCC-MAIN-2024-42,text/troff,20053,20052,0.0008\nCC-MAIN-2024-42,text/turtle,55005,54941,0.0022\nCC-MAIN-2024-42,text/vtt,17585,17569,0.0007\nCC-MAIN-2024-42,text/x-c++src,6204,6201,0.0002\nCC-MAIN-2024-42,text/x-chdr,14201,14200,0.0006\nCC-MAIN-2024-42,text/x-csrc,23575,23575,0.0009\nCC-MAIN-2024-42,text/x-diff,35745,35738,0.0014\nCC-MAIN-2024-42,text/x-jsp,2510,2496,0.0001\nCC-MAIN-2024-42,text/x-log,90087,90087,0.0036\nCC-MAIN-2024-42,text/x-matlab,63719,63699,0.0026\nCC-MAIN-2024-42,text/x-perl,43488,43452,0.0017\nCC-M
AIN-2024-42,text/x-php,69476,69264,0.0028\nCC-MAIN-2024-42,text/x-python,8888,8888,0.0004\nCC-MAIN-2024-42,text/x-vcalendar,13129,13129,0.0005\nCC-MAIN-2024-42,text/x-vcard,102044,102004,0.0041\nCC-MAIN-2024-42,text/x-web-markdown,11907,11903,0.0005\nCC-MAIN-2024-42,text/x-yaml,8971,8971,0.0004\nCC-MAIN-2024-42,video/mp4,107,107,0.0000\nCC-MAIN-2024-42,video/quicktime,2,2,0.0000\nCC-MAIN-2024-42,video/webm,21,21,0.0000\nCC-MAIN-2024-42,video/x-m4v,1,1,0.0000\nCC-MAIN-2024-46,<other>,400400,400107,0.0149\nCC-MAIN-2024-46,application/atom+xml,2720448,2720209,0.1012\nCC-MAIN-2024-46,application/epub+zip,52815,52633,0.0020\nCC-MAIN-2024-46,application/gpx+xml,15085,15085,0.0006\nCC-MAIN-2024-46,application/gzip,60,60,0.0000\nCC-MAIN-2024-46,application/javascript,11352,10991,0.0004\nCC-MAIN-2024-46,application/json,884814,884123,0.0329\nCC-MAIN-2024-46,application/marc,37604,37604,0.0014\nCC-MAIN-2024-46,application/mbox,49838,49812,0.0019\nCC-MAIN-2024-46,application/msword,54200,54037,0.0020\nCC-MAIN-2024-46,application/octet-stream,409621,409310,0.0152\nCC-MAIN-2024-46,application/pdf,21363807,21317844,0.7948\nCC-MAIN-2024-46,application/pgp-signature,89187,89179,0.0033\nCC-MAIN-2024-46,application/pkcs7-signature,11517,11505,0.0004\nCC-MAIN-2024-46,application/postscript,7631,7630,0.0003\nCC-MAIN-2024-46,application/rdf+xml,235647,235418,0.0088\nCC-MAIN-2024-46,application/rss+xml,2249933,2247824,0.0837\nCC-MAIN-2024-46,application/rtf,32567,32563,0.0012\nCC-MAIN-2024-46,application/text,816,816,0.0000\nCC-MAIN-2024-46,application/vnd.android.package-archive,6,6,0.0000\nCC-MAIN-2024-46,application/vnd.google-earth.kml+xml,80478,79832,0.0030\nCC-MAIN-2024-46,application/vnd.google-earth.kmz,20384,20383,0.0008\nCC-MAIN-2024-46,application/vnd.ms-excel,27395,27349,0.0010\nCC-MAIN-2024-46,application/vnd.ms-powerpoint,11818,11814,0.0004\nCC-MAIN-2024-46,application/vnd.oasis.opendocument.spreadsheet,9440,9434,0.0004\nCC-MAIN-2024-46,application/vnd.oasis.opendocument.te
xt,22727,22724,0.0008\nCC-MAIN-2024-46,application/vnd.openxmlformats-officedocument.presentationml.presentation,5526,5518,0.0002\nCC-MAIN-2024-46,application/vnd.openxmlformats-officedocument.spreadsheetml.sheet,36857,36711,0.0014\nCC-MAIN-2024-46,application/vnd.openxmlformats-officedocument.wordprocessingml.document,63502,63348,0.0024\nCC-MAIN-2024-46,application/x-bibtex-text-file,296333,296288,0.0110\nCC-MAIN-2024-46,application/x-bittorrent,7332,7332,0.0003\nCC-MAIN-2024-46,application/x-endnote-refer,51956,51952,0.0019\nCC-MAIN-2024-46,application/x-mobipocket-ebook,19924,19759,0.0007\nCC-MAIN-2024-46,application/x-ms-asx,4009,4005,0.0001\nCC-MAIN-2024-46,application/x-msdownload,101,96,0.0000\nCC-MAIN-2024-46,application/x-pds,50392,50392,0.0019\nCC-MAIN-2024-46,application/x-research-info-systems,3584,3580,0.0001\nCC-MAIN-2024-46,application/x-sh,29138,29127,0.0011\nCC-MAIN-2024-46,application/x-shockwave-flash,5203,5201,0.0002\nCC-MAIN-2024-46,application/x-stata-do,11279,11279,0.0004\nCC-MAIN-2024-46,application/x-tex,8935,8928,0.0003\nCC-MAIN-2024-46,application/x-tex-tfm,8856,8856,0.0003\nCC-MAIN-2024-46,application/x-tika-msoffice,54106,54087,0.0020\nCC-MAIN-2024-46,application/x-tika-ooxml,55546,55540,0.0021\nCC-MAIN-2024-46,application/x-wais-source,9917,9917,0.0004\nCC-MAIN-2024-46,application/xhtml+xml,239236712,238280694,8.9008\nCC-MAIN-2024-46,application/xml,2566061,2563543,0.0955\nCC-MAIN-2024-46,application/zip,639,638,0.0000\nCC-MAIN-2024-46,application/zlib,3958,3939,0.0001\nCC-MAIN-2024-46,audio/mpeg,299,299,0.0000\nCC-MAIN-2024-46,audio/vnd.wave,35,35,0.0000\nCC-MAIN-2024-46,audio/x-mpegurl,36,36,0.0000\nCC-MAIN-2024-46,image/gif,102,101,0.0000\nCC-MAIN-2024-46,image/jpeg,4051,4049,0.0002\nCC-MAIN-2024-46,image/png,684,679,0.0000\nCC-MAIN-2024-46,image/svg+xml,4,4,0.0000\nCC-MAIN-2024-46,image/webp,21,21,0.0000\nCC-MAIN-2024-46,message/rfc822,24014,24012,0.0009\nCC-MAIN-2024-46,text/asp,2,2,0.0000\nCC-MAIN-2024-46,text/aspdotnet,1,1,0.0000
\nCC-MAIN-2024-46,text/calendar,947795,947621,0.0353\nCC-MAIN-2024-46,text/css,14763,14761,0.0005\nCC-MAIN-2024-46,text/csv,93945,93279,0.0035\nCC-MAIN-2024-46,text/html,2410361090,2398341515,89.6775\nCC-MAIN-2024-46,text/markdown,30,30,0.0000\nCC-MAIN-2024-46,text/plain,4208932,4207881,0.1566\nCC-MAIN-2024-46,text/prs.lines.tag,243875,243854,0.0091\nCC-MAIN-2024-46,text/tab-separated-values,9594,9592,0.0004\nCC-MAIN-2024-46,text/troff,21832,21831,0.0008\nCC-MAIN-2024-46,text/turtle,53698,53556,0.0020\nCC-MAIN-2024-46,text/vtt,20602,20592,0.0008\nCC-MAIN-2024-46,text/x-c++src,7192,7192,0.0003\nCC-MAIN-2024-46,text/x-chdr,12461,12460,0.0005\nCC-MAIN-2024-46,text/x-csrc,24651,24650,0.0009\nCC-MAIN-2024-46,text/x-diff,37091,37085,0.0014\nCC-MAIN-2024-46,text/x-jsp,2344,2337,0.0001\nCC-MAIN-2024-46,text/x-log,55824,55824,0.0021\nCC-MAIN-2024-46,text/x-matlab,63017,63011,0.0023\nCC-MAIN-2024-46,text/x-perl,40922,40869,0.0015\nCC-MAIN-2024-46,text/x-php,90707,90526,0.0034\nCC-MAIN-2024-46,text/x-python,9664,9664,0.0004\nCC-MAIN-2024-46,text/x-vcalendar,14177,14177,0.0005\nCC-MAIN-2024-46,text/x-vcard,96303,96276,0.0036\nCC-MAIN-2024-46,text/x-web-markdown,12247,12210,0.0005\nCC-MAIN-2024-46,text/x-yaml,9998,9998,0.0004\nCC-MAIN-2024-46,video/mp4,288,288,0.0000\nCC-MAIN-2024-51,<other>,317692,317471,0.0121\nCC-MAIN-2024-51,application/atom+xml,2967149,2966522,0.1126\nCC-MAIN-2024-51,application/epub+zip,62525,62240,0.0024\nCC-MAIN-2024-51,application/gpx+xml,15352,15350,0.0006\nCC-MAIN-2024-51,application/gzip,722,722,0.0000\nCC-MAIN-2024-51,application/javascript,13632,13138,0.0005\nCC-MAIN-2024-51,application/json,938720,937822,0.0356\nCC-MAIN-2024-51,application/marc,42437,42436,0.0016\nCC-MAIN-2024-51,application/mbox,49692,49660,0.0019\nCC-MAIN-2024-51,application/msword,54893,54790,0.0021\nCC-MAIN-2024-51,application/octet-stream,464863,464562,0.0176\nCC-MAIN-2024-51,application/pdf,22016726,21966270,0.8354\nCC-MAIN-2024-51,application/pgp-signature,78609,78609,0.003
0\nCC-MAIN-2024-51,application/pkcs7-signature,13346,13339,0.0005\nCC-MAIN-2024-51,application/postscript,8554,8548,0.0003\nCC-MAIN-2024-51,application/rdf+xml,258260,258037,0.0098\nCC-MAIN-2024-51,application/rss+xml,2397559,2395661,0.0910\nCC-MAIN-2024-51,application/rtf,42268,42264,0.0016\nCC-MAIN-2024-51,application/text,97,97,0.0000\nCC-MAIN-2024-51,application/vnd.android.package-archive,3,3,0.0000\nCC-MAIN-2024-51,application/vnd.google-earth.kml+xml,61149,60965,0.0023\nCC-MAIN-2024-51,application/vnd.google-earth.kmz,12512,12507,0.0005\nCC-MAIN-2024-51,application/vnd.ms-excel,27356,27301,0.0010\nCC-MAIN-2024-51,application/vnd.ms-powerpoint,6406,6395,0.0002\nCC-MAIN-2024-51,application/vnd.oasis.opendocument.spreadsheet,13755,13742,0.0005\nCC-MAIN-2024-51,application/vnd.oasis.opendocument.text,24484,24474,0.0009\nCC-MAIN-2024-51,application/vnd.openxmlformats-officedocument.presentationml.presentation,6461,6443,0.0002\nCC-MAIN-2024-51,application/vnd.openxmlformats-officedocument.spreadsheetml.sheet,38511,38377,0.0015\nCC-MAIN-2024-51,application/vnd.openxmlformats-officedocument.wordprocessingml.document,63102,62927,0.0024\nCC-MAIN-2024-51,application/x-bibtex-text-file,294094,294058,0.0112\nCC-MAIN-2024-51,application/x-bittorrent,5718,5714,0.0002\nCC-MAIN-2024-51,application/x-dosexec,2,2,0.0000\nCC-MAIN-2024-51,application/x-endnote-refer,46507,46503,0.0018\nCC-MAIN-2024-51,application/x-mobipocket-ebook,24833,24554,0.0009\nCC-MAIN-2024-51,application/x-ms-asx,3412,3411,0.0001\nCC-MAIN-2024-51,application/x-msdownload,67,57,0.0000\nCC-MAIN-2024-51,application/x-pds,42408,42408,0.0016\nCC-MAIN-2024-51,application/x-rar-compressed,19,19,0.0000\nCC-MAIN-2024-51,application/x-research-info-systems,4141,4141,0.0002\nCC-MAIN-2024-51,application/x-sh,26844,26831,0.0010\nCC-MAIN-2024-51,application/x-shockwave-flash,5629,5628,0.0002\nCC-MAIN-2024-51,application/x-stata-do,11909,11909,0.0005\nCC-MAIN-2024-51,application/x-tex,8300,8300,0.0003\nCC-MAIN-2024-51,a
pplication/x-tex-tfm,11741,11741,0.0004\nCC-MAIN-2024-51,application/x-tika-msoffice,68979,68960,0.0026\nCC-MAIN-2024-51,application/x-tika-ooxml,59640,59631,0.0023\nCC-MAIN-2024-51,application/x-wais-source,9193,9183,0.0003\nCC-MAIN-2024-51,application/xhtml+xml,242689608,241517093,9.2090\nCC-MAIN-2024-51,application/xml,1733475,1731050,0.0658\nCC-MAIN-2024-51,application/zip,1100,1100,0.0000\nCC-MAIN-2024-51,application/zlib,3143,3125,0.0001\nCC-MAIN-2024-51,audio/mpeg,318,317,0.0000\nCC-MAIN-2024-51,audio/vnd.wave,32,32,0.0000\nCC-MAIN-2024-51,audio/x-mpegurl,44,44,0.0000\nCC-MAIN-2024-51,image/gif,71,70,0.0000\nCC-MAIN-2024-51,image/jpeg,6144,6144,0.0002\nCC-MAIN-2024-51,image/png,631,629,0.0000\nCC-MAIN-2024-51,image/svg+xml,5,5,0.0000\nCC-MAIN-2024-51,image/tiff,1,1,0.0000\nCC-MAIN-2024-51,image/vnd.djvu,3,3,0.0000\nCC-MAIN-2024-51,image/webp,53,52,0.0000\nCC-MAIN-2024-51,message/rfc822,29389,29380,0.0011\nCC-MAIN-2024-51,text/asp,2,2,0.0000\nCC-MAIN-2024-51,text/aspdotnet,6,6,0.0000\nCC-MAIN-2024-51,text/calendar,1030458,1030217,0.0391\nCC-MAIN-2024-51,text/css,14609,14607,0.0006\nCC-MAIN-2024-51,text/csv,104592,104343,0.0040\nCC-MAIN-2024-51,text/html,2354521897,2342274000,89.3434\nCC-MAIN-2024-51,text/markdown,100,100,0.0000\nCC-MAIN-2024-51,text/plain,3710400,3709467,0.1408\nCC-MAIN-2024-51,text/prs.lines.tag,265111,265109,0.0101\nCC-MAIN-2024-51,text/tab-separated-values,11769,11769,0.0004\nCC-MAIN-2024-51,text/troff,31658,31645,0.0012\nCC-MAIN-2024-51,text/turtle,63184,63027,0.0024\nCC-MAIN-2024-51,text/vtt,25347,25335,0.0010\nCC-MAIN-2024-51,text/x-c++src,7190,7189,0.0003\nCC-MAIN-2024-51,text/x-chdr,18200,18199,0.0007\nCC-MAIN-2024-51,text/x-csrc,27382,27381,0.0010\nCC-MAIN-2024-51,text/x-diff,34425,34417,0.0013\nCC-MAIN-2024-51,text/x-jsp,2849,2846,0.0001\nCC-MAIN-2024-51,text/x-log,74428,74428,0.0028\nCC-MAIN-2024-51,text/x-matlab,61464,61457,0.0023\nCC-MAIN-2024-51,text/x-perl,44117,44108,0.0017\nCC-MAIN-2024-51,text/x-php,85169,84923,0.0032\nCC-MAI
N-2024-51,text/x-python,9878,9872,0.0004\nCC-MAIN-2024-51,text/x-vcalendar,15855,15854,0.0006\nCC-MAIN-2024-51,text/x-vcard,96618,96518,0.0037\nCC-MAIN-2024-51,text/x-web-markdown,12651,12649,0.0005\nCC-MAIN-2024-51,text/x-yaml,8332,8332,0.0003\nCC-MAIN-2024-51,video/mp4,370,370,0.0000\nCC-MAIN-2024-51,video/quicktime,5,5,0.0000\nCC-MAIN-2024-51,video/x-m4v,2,2,0.0000\nCC-MAIN-2025-05,<other>,499922,499705,0.0165\nCC-MAIN-2025-05,application/atom+xml,3167720,3165844,0.1045\nCC-MAIN-2025-05,application/epub+zip,43534,43414,0.0014\nCC-MAIN-2025-05,application/gpx+xml,14717,14714,0.0005\nCC-MAIN-2025-05,application/gzip,36,36,0.0000\nCC-MAIN-2025-05,application/javascript,14147,14134,0.0005\nCC-MAIN-2025-05,application/json,958061,957442,0.0316\nCC-MAIN-2025-05,application/marc,38316,38315,0.0013\nCC-MAIN-2025-05,application/mbox,46885,46848,0.0015\nCC-MAIN-2025-05,application/msword,52511,52352,0.0017\nCC-MAIN-2025-05,application/octet-stream,428542,428220,0.0141\nCC-MAIN-2025-05,application/pdf,19926901,19875664,0.6574\nCC-MAIN-2025-05,application/pgp-signature,98535,98535,0.0033\nCC-MAIN-2025-05,application/pkcs7-signature,11662,11659,0.0004\nCC-MAIN-2025-05,application/postscript,10121,10121,0.0003\nCC-MAIN-2025-05,application/rdf+xml,276998,276903,0.0091\nCC-MAIN-2025-05,application/rss+xml,2445452,2443322,0.0807\nCC-MAIN-2025-05,application/rtf,41903,41897,0.0014\nCC-MAIN-2025-05,application/text,95,95,0.0000\nCC-MAIN-2025-05,application/vnd.android.package-archive,3,3,0.0000\nCC-MAIN-2025-05,application/vnd.google-earth.kml+xml,69288,68797,0.0023\nCC-MAIN-2025-05,application/vnd.google-earth.kmz,10815,10804,0.0004\nCC-MAIN-2025-05,application/vnd.ms-excel,28537,28476,0.0009\nCC-MAIN-2025-05,application/vnd.ms-powerpoint,4254,4251,0.0001\nCC-MAIN-2025-05,application/vnd.oasis.opendocument.spreadsheet,12722,12705,0.0004\nCC-MAIN-2025-05,application/vnd.oasis.opendocument.text,22173,22164,0.0007\nCC-MAIN-2025-05,application/vnd.openxmlformats-officedocument.present
ationml.presentation,6141,6115,0.0002\nCC-MAIN-2025-05,application/vnd.openxmlformats-officedocument.spreadsheetml.sheet,36139,35757,0.0012\nCC-MAIN-2025-05,application/vnd.openxmlformats-officedocument.wordprocessingml.document,61291,61001,0.0020\nCC-MAIN-2025-05,application/x-bibtex-text-file,316992,316950,0.0105\nCC-MAIN-2025-05,application/x-bittorrent,6296,6295,0.0002\nCC-MAIN-2025-05,application/x-dosexec,2,2,0.0000\nCC-MAIN-2025-05,application/x-endnote-refer,41434,41429,0.0014\nCC-MAIN-2025-05,application/x-mobipocket-ebook,14324,14232,0.0005\nCC-MAIN-2025-05,application/x-ms-asx,3556,3547,0.0001\nCC-MAIN-2025-05,application/x-msdownload,53,48,0.0000\nCC-MAIN-2025-05,application/x-pds,85785,85785,0.0028\nCC-MAIN-2025-05,application/x-rar-compressed,1,1,0.0000\nCC-MAIN-2025-05,application/x-research-info-systems,3114,3114,0.0001\nCC-MAIN-2025-05,application/x-sh,24144,24122,0.0008\nCC-MAIN-2025-05,application/x-shockwave-flash,5134,5132,0.0002\nCC-MAIN-2025-05,application/x-stata-do,10459,10459,0.0003\nCC-MAIN-2025-05,application/x-tex,9926,9923,0.0003\nCC-MAIN-2025-05,application/x-tex-tfm,20196,20196,0.0007\nCC-MAIN-2025-05,application/x-tika-msoffice,73357,73330,0.0024\nCC-MAIN-2025-05,application/x-tika-ooxml,58003,57993,0.0019\nCC-MAIN-2025-05,application/x-wais-source,8745,8745,0.0003\nCC-MAIN-2025-05,application/x-xz,4,4,0.0000\nCC-MAIN-2025-05,application/xhtml+xml,263868889,262594690,8.7049\nCC-MAIN-2025-05,application/xml,1943043,1940499,0.0641\nCC-MAIN-2025-05,application/zip,1057,1057,0.0000\nCC-MAIN-2025-05,application/zlib,3087,3051,0.0001\nCC-MAIN-2025-05,audio/mpeg,852,852,0.0000\nCC-MAIN-2025-05,audio/vnd.wave,30,30,0.0000\nCC-MAIN-2025-05,audio/x-mpegurl,39,39,0.0000\nCC-MAIN-2025-05,image/gif,36,34,0.0000\nCC-MAIN-2025-05,image/jpeg,5517,5517,0.0002\nCC-MAIN-2025-05,image/png,1977,1976,0.0001\nCC-MAIN-2025-05,image/svg+xml,2,2,0.0000\nCC-MAIN-2025-05,image/vnd.djvu,1,1,0.0000\nCC-MAIN-2025-05,image/webp,30,30,0.0000\nCC-MAIN-2025-05,message
/rfc822,23915,23911,0.0008\nCC-MAIN-2025-05,text/asp,5,5,0.0000\nCC-MAIN-2025-05,text/aspdotnet,6,6,0.0000\nCC-MAIN-2025-05,text/calendar,1040301,1039972,0.0343\nCC-MAIN-2025-05,text/css,18540,18538,0.0006\nCC-MAIN-2025-05,text/csv,109428,109278,0.0036\nCC-MAIN-2025-05,text/html,2731118776,2716213156,90.0979\nCC-MAIN-2025-05,text/markdown,54,54,0.0000\nCC-MAIN-2025-05,text/plain,3184175,3183369,0.1050\nCC-MAIN-2025-05,text/prs.lines.tag,341013,340950,0.0112\nCC-MAIN-2025-05,text/tab-separated-values,10865,10849,0.0004\nCC-MAIN-2025-05,text/troff,24946,24945,0.0008\nCC-MAIN-2025-05,text/turtle,60117,60072,0.0020\nCC-MAIN-2025-05,text/vtt,25478,25470,0.0008\nCC-MAIN-2025-05,text/x-c++src,5095,5095,0.0002\nCC-MAIN-2025-05,text/x-chdr,11441,11440,0.0004\nCC-MAIN-2025-05,text/x-csrc,18756,18750,0.0006\nCC-MAIN-2025-05,text/x-diff,30988,30980,0.0010\nCC-MAIN-2025-05,text/x-jsp,2216,2205,0.0001\nCC-MAIN-2025-05,text/x-log,68551,68504,0.0023\nCC-MAIN-2025-05,text/x-matlab,63714,63711,0.0021\nCC-MAIN-2025-05,text/x-perl,42752,42750,0.0014\nCC-MAIN-2025-05,text/x-php,105591,105234,0.0035\nCC-MAIN-2025-05,text/x-python,8138,8129,0.0003\nCC-MAIN-2025-05,text/x-vcalendar,13630,13629,0.0004\nCC-MAIN-2025-05,text/x-vcard,93516,93460,0.0031\nCC-MAIN-2025-05,text/x-web-markdown,12129,12122,0.0004\nCC-MAIN-2025-05,text/x-yaml,10445,10444,0.0003\nCC-MAIN-2025-05,video/mp4,249,249,0.0000\nCC-MAIN-2025-05,video/quicktime,1,1,0.0000\nCC-MAIN-2025-08,<other>,408908,408712,0.0153\nCC-MAIN-2025-08,application/atom+xml,3079149,3078522,0.1149\nCC-MAIN-2025-08,application/epub+zip,50468,50145,0.0019\nCC-MAIN-2025-08,application/gpx+xml,18426,18426,0.0007\nCC-MAIN-2025-08,application/gzip,12,12,0.0000\nCC-MAIN-2025-08,application/javascript,13922,13907,0.0005\nCC-MAIN-2025-08,application/json,1015104,1014092,0.0379\nCC-MAIN-2025-08,application/marc,45366,45363,0.0017\nCC-MAIN-2025-08,application/mbox,64897,64821,0.0024\nCC-MAIN-2025-08,application/msword,55078,54971,0.0021\nCC-MAIN-2025-08,appl
ication/octet-stream,433033,432455,0.0162\nCC-MAIN-2025-08,application/pdf,21005751,20957577,0.7839\nCC-MAIN-2025-08,application/pgp-signature,93491,93491,0.0035\nCC-MAIN-2025-08,application/pkcs7-signature,11295,11288,0.0004\nCC-MAIN-2025-08,application/postscript,8511,8510,0.0003\nCC-MAIN-2025-08,application/rdf+xml,263568,263393,0.0098\nCC-MAIN-2025-08,application/rss+xml,2439340,2437171,0.0910\nCC-MAIN-2025-08,application/rtf,36986,36978,0.0014\nCC-MAIN-2025-08,application/text,127,127,0.0000\nCC-MAIN-2025-08,application/vnd.android.package-archive,3,3,0.0000\nCC-MAIN-2025-08,application/vnd.google-earth.kml+xml,64411,64302,0.0024\nCC-MAIN-2025-08,application/vnd.google-earth.kmz,11089,11085,0.0004\nCC-MAIN-2025-08,application/vnd.ms-excel,28491,28438,0.0011\nCC-MAIN-2025-08,application/vnd.ms-powerpoint,4480,4474,0.0002\nCC-MAIN-2025-08,application/vnd.oasis.opendocument.spreadsheet,11686,11656,0.0004\nCC-MAIN-2025-08,application/vnd.oasis.opendocument.text,21514,21511,0.0008\nCC-MAIN-2025-08,application/vnd.openxmlformats-officedocument.presentationml.presentation,6304,6278,0.0002\nCC-MAIN-2025-08,application/vnd.openxmlformats-officedocument.spreadsheetml.sheet,36018,35894,0.0013\nCC-MAIN-2025-08,application/vnd.openxmlformats-officedocument.wordprocessingml.document,63932,63805,0.0024\nCC-MAIN-2025-08,application/x-bibtex-text-file,320121,320081,0.0119\nCC-MAIN-2025-08,application/x-bittorrent,6469,6466,0.0002\nCC-MAIN-2025-08,application/x-dosexec,2,2,0.0000\nCC-MAIN-2025-08,application/x-endnote-refer,42798,42796,0.0016\nCC-MAIN-2025-08,application/x-mobipocket-ebook,20946,20649,0.0008\nCC-MAIN-2025-08,application/x-ms-asx,4319,4314,0.0002\nCC-MAIN-2025-08,application/x-msdownload,55,49,0.0000\nCC-MAIN-2025-08,application/x-pds,42279,42279,0.0016\nCC-MAIN-2025-08,application/x-rar-compressed,3,3,0.0000\nCC-MAIN-2025-08,application/x-research-info-systems,2236,2234,0.0001\nCC-MAIN-2025-08,application/x-sh,30106,30059,0.0011\nCC-MAIN-2025-08,application/x-sh
ockwave-flash,5443,5441,0.0002\nCC-MAIN-2025-08,application/x-stata-do,13256,13252,0.0005\nCC-MAIN-2025-08,application/x-tex,8207,8204,0.0003\nCC-MAIN-2025-08,application/x-tex-tfm,17218,17218,0.0006\nCC-MAIN-2025-08,application/x-tika-msoffice,76042,76008,0.0028\nCC-MAIN-2025-08,application/x-tika-ooxml,56610,56607,0.0021\nCC-MAIN-2025-08,application/x-wais-source,8232,8232,0.0003\nCC-MAIN-2025-08,application/xhtml+xml,244867406,243723411,9.1378\nCC-MAIN-2025-08,application/xml,1994154,1991787,0.0744\nCC-MAIN-2025-08,application/zip,597,597,0.0000\nCC-MAIN-2025-08,application/zlib,7212,7188,0.0003\nCC-MAIN-2025-08,audio/mpeg,527,527,0.0000\nCC-MAIN-2025-08,audio/vnd.wave,25,25,0.0000\nCC-MAIN-2025-08,audio/x-mpegurl,36,36,0.0000\nCC-MAIN-2025-08,image/gif,55,55,0.0000\nCC-MAIN-2025-08,image/jpeg,5342,5342,0.0002\nCC-MAIN-2025-08,image/png,537,535,0.0000\nCC-MAIN-2025-08,image/svg+xml,12,12,0.0000\nCC-MAIN-2025-08,image/tiff,4,4,0.0000\nCC-MAIN-2025-08,image/vnd.djvu,1,1,0.0000\nCC-MAIN-2025-08,image/webp,40,40,0.0000\nCC-MAIN-2025-08,message/rfc822,21923,21922,0.0008\nCC-MAIN-2025-08,text/asp,3,3,0.0000\nCC-MAIN-2025-08,text/aspdotnet,4,4,0.0000\nCC-MAIN-2025-08,text/calendar,1107778,1107338,0.0413\nCC-MAIN-2025-08,text/css,15068,15066,0.0006\nCC-MAIN-2025-08,text/csv,112491,112437,0.0042\nCC-MAIN-2025-08,text/html,2397212413,2384071794,89.4580\nCC-MAIN-2025-08,text/markdown,136,136,0.0000\nCC-MAIN-2025-08,text/plain,3431228,3430279,0.1280\nCC-MAIN-2025-08,text/prs.lines.tag,310274,310256,0.0116\nCC-MAIN-2025-08,text/tab-separated-values,11043,11043,0.0004\nCC-MAIN-2025-08,text/troff,28855,28854,0.0011\nCC-MAIN-2025-08,text/turtle,65379,65258,0.0024\nCC-MAIN-2025-08,text/vtt,25289,25283,0.0009\nCC-MAIN-2025-08,text/x-c++src,6406,6406,0.0002\nCC-MAIN-2025-08,text/x-chdr,15275,15274,0.0006\nCC-MAIN-2025-08,text/x-csrc,22960,22953,0.0009\nCC-MAIN-2025-08,text/x-diff,35544,35537,0.0013\nCC-MAIN-2025-08,text/x-jsp,1939,1936,0.0001\nCC-MAIN-2025-08,text/x-log,81629,81629
,0.0030\nCC-MAIN-2025-08,text/x-matlab,71521,71505,0.0027\nCC-MAIN-2025-08,text/x-perl,45097,45095,0.0017\nCC-MAIN-2025-08,text/x-php,118564,118066,0.0044\nCC-MAIN-2025-08,text/x-python,9503,9495,0.0004\nCC-MAIN-2025-08,text/x-vcalendar,13777,13773,0.0005\nCC-MAIN-2025-08,text/x-vcard,98391,98360,0.0037\nCC-MAIN-2025-08,text/x-web-markdown,11877,11875,0.0004\nCC-MAIN-2025-08,text/x-yaml,9990,9990,0.0004\nCC-MAIN-2025-08,video/mp4,24,24,0.0000\nCC-MAIN-2025-08,video/quicktime,18,18,0.0000\nCC-MAIN-2025-08,video/webm,4,4,0.0000\nCC-MAIN-2025-08,video/x-m4v,3,3,0.0000\nCC-MAIN-2025-13,<other>,370756,370539,0.0135\nCC-MAIN-2025-13,application/atom+xml,3098706,3098084,0.1131\nCC-MAIN-2025-13,application/epub+zip,53906,53555,0.0020\nCC-MAIN-2025-13,application/gpx+xml,14108,14108,0.0005\nCC-MAIN-2025-13,application/gzip,18,18,0.0000\nCC-MAIN-2025-13,application/javascript,12465,12459,0.0005\nCC-MAIN-2025-13,application/json,921162,920831,0.0336\nCC-MAIN-2025-13,application/marc,47102,47101,0.0017\nCC-MAIN-2025-13,application/mbox,60273,60191,0.0022\nCC-MAIN-2025-13,application/msword,56410,56255,0.0021\nCC-MAIN-2025-13,application/octet-stream,518253,517930,0.0189\nCC-MAIN-2025-13,application/pdf,18893854,18848705,0.6893\nCC-MAIN-2025-13,application/pgp-signature,95217,95217,0.0035\nCC-MAIN-2025-13,application/pkcs7-signature,12149,12103,0.0004\nCC-MAIN-2025-13,application/postscript,10999,10998,0.0004\nCC-MAIN-2025-13,application/rdf+xml,281983,281851,0.0103\nCC-MAIN-2025-13,application/rss+xml,2363927,2361848,0.0862\nCC-MAIN-2025-13,application/rtf,36576,36570,0.0013\nCC-MAIN-2025-13,application/text,121,121,0.0000\nCC-MAIN-2025-13,application/vnd.android.package-archive,2,2,0.0000\nCC-MAIN-2025-13,application/vnd.google-earth.kml+xml,61384,61203,0.0022\nCC-MAIN-2025-13,application/vnd.google-earth.kmz,11707,11691,0.0004\nCC-MAIN-2025-13,application/vnd.ms-excel,29760,29475,0.0011\nCC-MAIN-2025-13,application/vnd.ms-powerpoint,4197,4169,0.0002\nCC-MAIN-2025-13,applicati
on/vnd.oasis.opendocument.spreadsheet,12512,12497,0.0005\nCC-MAIN-2025-13,application/vnd.oasis.opendocument.text,18217,18201,0.0007\nCC-MAIN-2025-13,application/vnd.openxmlformats-officedocument.presentationml.presentation,6090,6037,0.0002\nCC-MAIN-2025-13,application/vnd.openxmlformats-officedocument.spreadsheetml.sheet,41284,41158,0.0015\nCC-MAIN-2025-13,application/vnd.openxmlformats-officedocument.wordprocessingml.document,60590,60251,0.0022\nCC-MAIN-2025-13,application/x-bibtex-text-file,325108,325039,0.0119\nCC-MAIN-2025-13,application/x-bittorrent,5836,5836,0.0002\nCC-MAIN-2025-13,application/x-bzip2,3,3,0.0000\nCC-MAIN-2025-13,application/x-dosexec,1,1,0.0000\nCC-MAIN-2025-13,application/x-endnote-refer,49827,49821,0.0018\nCC-MAIN-2025-13,application/x-mobipocket-ebook,24715,24390,0.0009\nCC-MAIN-2025-13,application/x-ms-asx,4744,4744,0.0002\nCC-MAIN-2025-13,application/x-msdownload,346,343,0.0000\nCC-MAIN-2025-13,application/x-pds,85840,85840,0.0031\nCC-MAIN-2025-13,application/x-rar-compressed,1,1,0.0000\nCC-MAIN-2025-13,application/x-research-info-systems,1875,1874,0.0001\nCC-MAIN-2025-13,application/x-sh,28999,28980,0.0011\nCC-MAIN-2025-13,application/x-shockwave-flash,4070,4069,0.0001\nCC-MAIN-2025-13,application/x-stata-do,14585,14583,0.0005\nCC-MAIN-2025-13,application/x-tex,7902,7902,0.0003\nCC-MAIN-2025-13,application/x-tex-tfm,15258,15258,0.0006\nCC-MAIN-2025-13,application/x-tika-msoffice,82101,82037,0.0030\nCC-MAIN-2025-13,application/x-tika-ooxml,56876,56874,0.0021\nCC-MAIN-2025-13,application/x-wais-source,7685,7685,0.0003\nCC-MAIN-2025-13,application/xhtml+xml,241222218,240122871,8.8010\nCC-MAIN-2025-13,application/xml,1901777,1899520,0.0694\nCC-MAIN-2025-13,application/zip,783,783,0.0000\nCC-MAIN-2025-13,application/zlib,2508,2485,0.0001\nCC-MAIN-2025-13,audio/mpeg,828,828,0.0000\nCC-MAIN-2025-13,audio/vnd.wave,32,32,0.0000\nCC-MAIN-2025-13,audio/x-mpegurl,36,36,0.0000\nCC-MAIN-2025-13,image/gif,70,70,0.0000\nCC-MAIN-2025-13,image/jpeg,5224,
5224,0.0002\nCC-MAIN-2025-13,image/png,444,444,0.0000\nCC-MAIN-2025-13,image/svg+xml,8,8,0.0000\nCC-MAIN-2025-13,image/tiff,1,1,0.0000\nCC-MAIN-2025-13,image/vnd.djvu,26151,26149,0.0010\nCC-MAIN-2025-13,image/webp,40,40,0.0000\nCC-MAIN-2025-13,message/rfc822,19011,19004,0.0007\nCC-MAIN-2025-13,text/asp,1,1,0.0000\nCC-MAIN-2025-13,text/calendar,999637,999300,0.0365\nCC-MAIN-2025-13,text/css,16347,16343,0.0006\nCC-MAIN-2025-13,text/csv,110038,109946,0.0040\nCC-MAIN-2025-13,text/html,2464098263,2450362761,89.9029\nCC-MAIN-2025-13,text/markdown,98,98,0.0000\nCC-MAIN-2025-13,text/plain,3567341,3566021,0.1302\nCC-MAIN-2025-13,text/prs.lines.tag,411039,411030,0.0150\nCC-MAIN-2025-13,text/tab-separated-values,10670,10670,0.0004\nCC-MAIN-2025-13,text/troff,37953,37952,0.0014\nCC-MAIN-2025-13,text/turtle,63771,63659,0.0023\nCC-MAIN-2025-13,text/vtt,23503,23498,0.0009\nCC-MAIN-2025-13,text/x-c++src,4562,4562,0.0002\nCC-MAIN-2025-13,text/x-chdr,13053,13053,0.0005\nCC-MAIN-2025-13,text/x-csrc,21702,21701,0.0008\nCC-MAIN-2025-13,text/x-diff,35135,35132,0.0013\nCC-MAIN-2025-13,text/x-jsp,2288,2282,0.0001\nCC-MAIN-2025-13,text/x-log,90380,90378,0.0033\nCC-MAIN-2025-13,text/x-matlab,69442,69426,0.0025\nCC-MAIN-2025-13,text/x-perl,51349,51330,0.0019\nCC-MAIN-2025-13,text/x-php,88949,88768,0.0032\nCC-MAIN-2025-13,text/x-python,8824,8821,0.0003\nCC-MAIN-2025-13,text/x-vcalendar,14195,14193,0.0005\nCC-MAIN-2025-13,text/x-vcard,92537,92494,0.0034\nCC-MAIN-2025-13,text/x-web-markdown,13720,13718,0.0005\nCC-MAIN-2025-13,text/x-yaml,10581,10581,0.0004\nCC-MAIN-2025-13,video/mp4,160,160,0.0000\nCC-MAIN-2025-13,video/webm,6,6,0.0000\nCC-MAIN-2025-13,video/x-m4v,12,12,0.0000\nCC-MAIN-2025-18,<other>,376970,376666,0.0137\nCC-MAIN-2025-18,application/atom+xml,2957805,2957375,0.1077\nCC-MAIN-2025-18,application/epub+zip,62549,62242,0.0023\nCC-MAIN-2025-18,application/gpx+xml,15732,15730,0.0006\nCC-MAIN-2025-18,application/gzip,15,15,0.0000\nCC-MAIN-2025-18,application/javascript,16128,16116,0.000
6\nCC-MAIN-2025-18,application/json,886933,886472,0.0323\nCC-MAIN-2025-18,application/marc,43658,43656,0.0016\nCC-MAIN-2025-18,application/mbox,45943,45891,0.0017\nCC-MAIN-2025-18,application/msword,52567,52420,0.0019\nCC-MAIN-2025-18,application/octet-stream,513740,513408,0.0187\nCC-MAIN-2025-18,application/pdf,18698788,18653797,0.6806\nCC-MAIN-2025-18,application/pgp-signature,78667,78667,0.0029\nCC-MAIN-2025-18,application/pkcs7-signature,12380,12376,0.0005\nCC-MAIN-2025-18,application/postscript,8387,8386,0.0003\nCC-MAIN-2025-18,application/rdf+xml,263644,263517,0.0096\nCC-MAIN-2025-18,application/rss+xml,2401663,2399504,0.0874\nCC-MAIN-2025-18,application/rtf,38765,38756,0.0014\nCC-MAIN-2025-18,application/text,120,120,0.0000\nCC-MAIN-2025-18,application/vnd.android.package-archive,39,39,0.0000\nCC-MAIN-2025-18,application/vnd.google-earth.kml+xml,69272,69151,0.0025\nCC-MAIN-2025-18,application/vnd.google-earth.kmz,9251,9250,0.0003\nCC-MAIN-2025-18,application/vnd.ms-excel,33020,32945,0.0012\nCC-MAIN-2025-18,application/vnd.ms-powerpoint,4934,4927,0.0002\nCC-MAIN-2025-18,application/vnd.oasis.opendocument.spreadsheet,9196,9183,0.0003\nCC-MAIN-2025-18,application/vnd.oasis.opendocument.text,20407,20400,0.0007\nCC-MAIN-2025-18,application/vnd.openxmlformats-officedocument.presentationml.presentation,6285,6226,0.0002\nCC-MAIN-2025-18,application/vnd.openxmlformats-officedocument.spreadsheetml.sheet,47399,47263,0.0017\nCC-MAIN-2025-18,application/vnd.openxmlformats-officedocument.wordprocessingml.document,62176,61887,0.0023\nCC-MAIN-2025-18,application/x-bibtex-text-file,416892,416848,0.0152\nCC-MAIN-2025-18,application/x-bittorrent,5686,5685,0.0002\nCC-MAIN-2025-18,application/x-bzip2,1,1,0.0000\nCC-MAIN-2025-18,application/x-dosexec,3,3,0.0000\nCC-MAIN-2025-18,application/x-endnote-refer,45807,45804,0.0017\nCC-MAIN-2025-18,application/x-mobipocket-ebook,22873,22592,0.0008\nCC-MAIN-2025-18,application/x-ms-asx,2904,2904,0.0001\nCC-MAIN-2025-18,application/x-msdown
load,59,56,0.0000\nCC-MAIN-2025-18,application/x-pds,67769,67769,0.0025\nCC-MAIN-2025-18,application/x-rar-compressed,1,1,0.0000\nCC-MAIN-2025-18,application/x-research-info-systems,1839,1839,0.0001\nCC-MAIN-2025-18,application/x-sh,26700,26685,0.0010\nCC-MAIN-2025-18,application/x-shockwave-flash,3524,3521,0.0001\nCC-MAIN-2025-18,application/x-stata-do,11808,11803,0.0004\nCC-MAIN-2025-18,application/x-tex,8851,8848,0.0003\nCC-MAIN-2025-18,application/x-tex-tfm,31044,31044,0.0011\nCC-MAIN-2025-18,application/x-tika-msoffice,70643,70564,0.0026\nCC-MAIN-2025-18,application/x-tika-ooxml,55645,55619,0.0020\nCC-MAIN-2025-18,application/x-wais-source,6616,6616,0.0002\nCC-MAIN-2025-18,application/xhtml+xml,241598475,240480558,8.7939\nCC-MAIN-2025-18,application/xml,2220447,2199713,0.0808\nCC-MAIN-2025-18,application/zip,807,806,0.0000\nCC-MAIN-2025-18,application/zlib,3509,3488,0.0001\nCC-MAIN-2025-18,audio/mp4,1,1,0.0000\nCC-MAIN-2025-18,audio/mpeg,1127,1127,0.0000\nCC-MAIN-2025-18,audio/vnd.wave,31,31,0.0000\nCC-MAIN-2025-18,audio/x-mpegurl,17,17,0.0000\nCC-MAIN-2025-18,image/gif,88,86,0.0000\nCC-MAIN-2025-18,image/jpeg,5663,5661,0.0002\nCC-MAIN-2025-18,image/png,507,506,0.0000\nCC-MAIN-2025-18,image/svg+xml,30,30,0.0000\nCC-MAIN-2025-18,image/tiff,2,2,0.0000\nCC-MAIN-2025-18,image/vnd.djvu,17877,17874,0.0007\nCC-MAIN-2025-18,image/webp,134,134,0.0000\nCC-MAIN-2025-18,message/rfc822,20402,20398,0.0007\nCC-MAIN-2025-18,text/asp,2,2,0.0000\nCC-MAIN-2025-18,text/calendar,1048358,1047937,0.0382\nCC-MAIN-2025-18,text/css,15752,15748,0.0006\nCC-MAIN-2025-18,text/csv,116907,116831,0.0043\nCC-MAIN-2025-18,text/html,2469376515,2455013708,89.8826\nCC-MAIN-2025-18,text/markdown,140,140,0.0000\nCC-MAIN-2025-18,text/plain,4442552,4441231,0.1617\nCC-MAIN-2025-18,text/prs.lines.tag,319382,319354,0.0116\nCC-MAIN-2025-18,text/tab-separated-values,12074,12074,0.0004\nCC-MAIN-2025-18,text/troff,26302,26298,0.0010\nCC-MAIN-2025-18,text/turtle,65754,65675,0.0024\nCC-MAIN-2025-18,text/vtt,264
96,26489,0.0010\nCC-MAIN-2025-18,text/x-c++src,7146,7146,0.0003\nCC-MAIN-2025-18,text/x-chdr,15344,15341,0.0006\nCC-MAIN-2025-18,text/x-csrc,22271,22268,0.0008\nCC-MAIN-2025-18,text/x-diff,39249,39244,0.0014\nCC-MAIN-2025-18,text/x-jsp,1262,1257,0.0000\nCC-MAIN-2025-18,text/x-log,104953,104941,0.0038\nCC-MAIN-2025-18,text/x-matlab,49342,49331,0.0018\nCC-MAIN-2025-18,text/x-perl,49446,49441,0.0018\nCC-MAIN-2025-18,text/x-php,77141,76878,0.0028\nCC-MAIN-2025-18,text/x-python,7750,7747,0.0003\nCC-MAIN-2025-18,text/x-vcalendar,11442,11439,0.0004\nCC-MAIN-2025-18,text/x-vcard,94089,94030,0.0034\nCC-MAIN-2025-18,text/x-web-markdown,14100,14099,0.0005\nCC-MAIN-2025-18,text/x-yaml,7908,7907,0.0003\nCC-MAIN-2025-18,video/mp4,195,194,0.0000\nCC-MAIN-2025-18,video/quicktime,1,1,0.0000\nCC-MAIN-2025-18,video/webm,22,22,0.0000\nCC-MAIN-2025-21,<other>,261182,260883,0.0105\nCC-MAIN-2025-21,application/atom+xml,2642578,2642137,0.1067\nCC-MAIN-2025-21,application/epub+zip,42804,42681,0.0017\nCC-MAIN-2025-21,application/gpx+xml,14943,14943,0.0006\nCC-MAIN-2025-21,application/gzip,87,87,0.0000\nCC-MAIN-2025-21,application/javascript,13883,13879,0.0006\nCC-MAIN-2025-21,application/json,600022,599416,0.0242\nCC-MAIN-2025-21,application/marc,34713,34713,0.0014\nCC-MAIN-2025-21,application/mbox,30214,30170,0.0012\nCC-MAIN-2025-21,application/msword,32450,32181,0.0013\nCC-MAIN-2025-21,application/octet-stream,307651,307332,0.0124\nCC-MAIN-2025-21,application/pdf,14817516,14781292,0.5982\nCC-MAIN-2025-21,application/pgp-signature,31245,31240,0.0013\nCC-MAIN-2025-21,application/pkcs7-signature,8326,8326,0.0003\nCC-MAIN-2025-21,application/postscript,7980,7977,0.0003\nCC-MAIN-2025-21,application/rdf+xml,211412,211335,0.0085\nCC-MAIN-2025-21,application/rss+xml,1694690,1693113,0.0684\nCC-MAIN-2025-21,application/rtf,30126,30115,0.0012\nCC-MAIN-2025-21,application/text,97,97,0.0000\nCC-MAIN-2025-21,application/vnd.android.package-archive,5,5,0.0000\nCC-MAIN-2025-21,application/vnd.google-earth
.kml+xml,54840,54734,0.0022\nCC-MAIN-2025-21,application/vnd.google-earth.kmz,7334,7330,0.0003\nCC-MAIN-2025-21,application/vnd.ms-excel,16484,16389,0.0007\nCC-MAIN-2025-21,application/vnd.ms-powerpoint,3930,3925,0.0002\nCC-MAIN-2025-21,application/vnd.oasis.opendocument.spreadsheet,6569,6560,0.0003\nCC-MAIN-2025-21,application/vnd.oasis.opendocument.text,14930,14925,0.0006\nCC-MAIN-2025-21,application/vnd.openxmlformats-officedocument.presentationml.presentation,4934,4905,0.0002\nCC-MAIN-2025-21,application/vnd.openxmlformats-officedocument.spreadsheetml.sheet,28585,28425,0.0012\nCC-MAIN-2025-21,application/vnd.openxmlformats-officedocument.wordprocessingml.document,49849,49536,0.0020\nCC-MAIN-2025-21,application/x-bibtex-text-file,278926,278825,0.0113\nCC-MAIN-2025-21,application/x-bittorrent,4917,4917,0.0002\nCC-MAIN-2025-21,application/x-endnote-refer,39737,39725,0.0016\nCC-MAIN-2025-21,application/x-mobipocket-ebook,15866,15762,0.0006\nCC-MAIN-2025-21,application/x-ms-asx,3137,3137,0.0001\nCC-MAIN-2025-21,application/x-msdownload,200,199,0.0000\nCC-MAIN-2025-21,application/x-pds,21381,21381,0.0009\nCC-MAIN-2025-21,application/x-rar-compressed,3,3,0.0000\nCC-MAIN-2025-21,application/x-research-info-systems,1302,1301,0.0001\nCC-MAIN-2025-21,application/x-sh,19462,19444,0.0008\nCC-MAIN-2025-21,application/x-shockwave-flash,3356,3353,0.0001\nCC-MAIN-2025-21,application/x-stata-do,9708,9698,0.0004\nCC-MAIN-2025-21,application/x-tex,6257,6253,0.0003\nCC-MAIN-2025-21,application/x-tex-tfm,8203,8203,0.0003\nCC-MAIN-2025-21,application/x-tika-msoffice,44519,44464,0.0018\nCC-MAIN-2025-21,application/x-tika-ooxml,34941,34937,0.0014\nCC-MAIN-2025-21,application/x-wais-source,4221,4221,0.0002\nCC-MAIN-2025-21,application/x-xz,6,6,0.0000\nCC-MAIN-2025-21,application/xhtml+xml,207499729,206661470,8.3765\nCC-MAIN-2025-21,application/xml,1555813,1529980,0.0628\nCC-MAIN-2025-21,application/zip,326,326,0.0000\nCC-MAIN-2025-21,application/zlib,3219,3206,0.0001\nCC-MAIN-2025-21,aud
io/mpeg,206,206,0.0000\nCC-MAIN-2025-21,audio/vnd.wave,26,26,0.0000\nCC-MAIN-2025-21,audio/x-mpegurl,12,12,0.0000\nCC-MAIN-2025-21,image/gif,68,68,0.0000\nCC-MAIN-2025-21,image/jpeg,3656,3650,0.0001\nCC-MAIN-2025-21,image/png,360,357,0.0000\nCC-MAIN-2025-21,image/svg+xml,8,8,0.0000\nCC-MAIN-2025-21,image/tiff,32,32,0.0000\nCC-MAIN-2025-21,image/vnd.djvu,15695,15693,0.0006\nCC-MAIN-2025-21,image/webp,19,19,0.0000\nCC-MAIN-2025-21,message/rfc822,16086,16086,0.0006\nCC-MAIN-2025-21,text/asp,1,1,0.0000\nCC-MAIN-2025-21,text/calendar,886485,886213,0.0358\nCC-MAIN-2025-21,text/css,13370,13368,0.0005\nCC-MAIN-2025-21,text/csv,73200,72947,0.0030\nCC-MAIN-2025-21,text/html,2240732213,2228737202,90.4555\nCC-MAIN-2025-21,text/markdown,61,61,0.0000\nCC-MAIN-2025-21,text/plain,4359005,4334477,0.1760\nCC-MAIN-2025-21,text/prs.lines.tag,92117,92099,0.0037\nCC-MAIN-2025-21,text/tab-separated-values,8397,8397,0.0003\nCC-MAIN-2025-21,text/troff,9751,9748,0.0004\nCC-MAIN-2025-21,text/turtle,50316,50294,0.0020\nCC-MAIN-2025-21,text/vtt,19926,19907,0.0008\nCC-MAIN-2025-21,text/x-c++src,4163,4161,0.0002\nCC-MAIN-2025-21,text/x-chdr,12403,12402,0.0005\nCC-MAIN-2025-21,text/x-csrc,12850,12843,0.0005\nCC-MAIN-2025-21,text/x-diff,20792,20782,0.0008\nCC-MAIN-2025-21,text/x-jsp,1186,1182,0.0000\nCC-MAIN-2025-21,text/x-log,48961,48959,0.0020\nCC-MAIN-2025-21,text/x-matlab,29833,29832,0.0012\nCC-MAIN-2025-21,text/x-perl,43759,43755,0.0018\nCC-MAIN-2025-21,text/x-php,72353,72112,0.0029\nCC-MAIN-2025-21,text/x-python,5489,5486,0.0002\nCC-MAIN-2025-21,text/x-vcalendar,9633,9632,0.0004\nCC-MAIN-2025-21,text/x-vcard,81211,81105,0.0033\nCC-MAIN-2025-21,text/x-web-markdown,10607,10607,0.0004\nCC-MAIN-2025-21,text/x-yaml,6686,6686,0.0003\nCC-MAIN-2025-21,video/mp4,48,46,0.0000\nCC-MAIN-2025-21,video/quicktime,4,4,0.0000\nCC-MAIN-2025-21,video/webm,5,5,0.0000\nCC-MAIN-2025-21,video/x-m4v,1,1,0.0000\nCC-MAIN-2025-26,<other>,251253,250994,0.0105\nCC-MAIN-2025-26,application/atom+xml,3111897,3111445,0.1304\
nCC-MAIN-2025-26,application/epub+zip,50021,49881,0.0021\nCC-MAIN-2025-26,application/gpx+xml,14972,14970,0.0006\nCC-MAIN-2025-26,application/gzip,13,13,0.0000\nCC-MAIN-2025-26,application/javascript,17535,17517,0.0007\nCC-MAIN-2025-26,application/json,633416,632732,0.0266\nCC-MAIN-2025-26,application/marc,29784,29781,0.0012\nCC-MAIN-2025-26,application/mbox,34232,34204,0.0014\nCC-MAIN-2025-26,application/msword,34564,34385,0.0014\nCC-MAIN-2025-26,application/octet-stream,293162,292646,0.0123\nCC-MAIN-2025-26,application/pdf,14932117,14897649,0.6259\nCC-MAIN-2025-26,application/pgp-signature,35137,35135,0.0015\nCC-MAIN-2025-26,application/pkcs7-signature,9425,9421,0.0004\nCC-MAIN-2025-26,application/postscript,8832,8832,0.0004\nCC-MAIN-2025-26,application/rdf+xml,210283,210182,0.0088\nCC-MAIN-2025-26,application/rss+xml,1658892,1657251,0.0695\nCC-MAIN-2025-26,application/rtf,30619,30604,0.0013\nCC-MAIN-2025-26,application/text,169,169,0.0000\nCC-MAIN-2025-26,application/vnd.android.package-archive,13,13,0.0000\nCC-MAIN-2025-26,application/vnd.google-earth.kml+xml,55996,55919,0.0023\nCC-MAIN-2025-26,application/vnd.google-earth.kmz,6803,6799,0.0003\nCC-MAIN-2025-26,application/vnd.ms-excel,14730,14672,0.0006\nCC-MAIN-2025-26,application/vnd.ms-powerpoint,3412,3399,0.0001\nCC-MAIN-2025-26,application/vnd.oasis.opendocument.spreadsheet,6416,6402,0.0003\nCC-MAIN-2025-26,application/vnd.oasis.opendocument.text,14609,14595,0.0006\nCC-MAIN-2025-26,application/vnd.openxmlformats-officedocument.presentationml.presentation,4973,4926,0.0002\nCC-MAIN-2025-26,application/vnd.openxmlformats-officedocument.spreadsheetml.sheet,32031,31813,0.0013\nCC-MAIN-2025-26,application/vnd.openxmlformats-officedocument.wordprocessingml.document,47024,46753,0.0020\nCC-MAIN-2025-26,application/x-bibtex-text-file,295283,295088,0.0124\nCC-MAIN-2025-26,application/x-bittorrent,4999,4997,0.0002\nCC-MAIN-2025-26,application/x-endnote-refer,42313,42305,0.0018\nCC-MAIN-2025-26,application/x-mobipocket-
ebook,15134,15034,0.0006\nCC-MAIN-2025-26,application/x-ms-asx,2224,2223,0.0001\nCC-MAIN-2025-26,application/x-msdownload,371,371,0.0000\nCC-MAIN-2025-26,application/x-pds,28809,28809,0.0012\nCC-MAIN-2025-26,application/x-research-info-systems,1937,1937,0.0001\nCC-MAIN-2025-26,application/x-sh,16223,16207,0.0007\nCC-MAIN-2025-26,application/x-shockwave-flash,3036,3033,0.0001\nCC-MAIN-2025-26,application/x-stata-do,12506,12494,0.0005\nCC-MAIN-2025-26,application/x-tex,5097,5096,0.0002\nCC-MAIN-2025-26,application/x-tex-tfm,4663,4663,0.0002\nCC-MAIN-2025-26,application/x-tika-msoffice,48147,48140,0.0020\nCC-MAIN-2025-26,application/x-tika-ooxml,39610,39609,0.0017\nCC-MAIN-2025-26,application/x-wais-source,3861,3861,0.0002\nCC-MAIN-2025-26,application/xhtml+xml,203519681,202695888,8.5312\nCC-MAIN-2025-26,application/xml,1601845,1590821,0.0671\nCC-MAIN-2025-26,application/zip,321,321,0.0000\nCC-MAIN-2025-26,application/zlib,2549,2537,0.0001\nCC-MAIN-2025-26,audio/mpeg,495,495,0.0000\nCC-MAIN-2025-26,audio/vnd.wave,65,65,0.0000\nCC-MAIN-2025-26,audio/x-mpegurl,49,49,0.0000\nCC-MAIN-2025-26,image/gif,84,84,0.0000\nCC-MAIN-2025-26,image/jpeg,4305,4300,0.0002\nCC-MAIN-2025-26,image/png,472,471,0.0000\nCC-MAIN-2025-26,image/svg+xml,5,5,0.0000\nCC-MAIN-2025-26,image/vnd.djvu,25321,25320,0.0011\nCC-MAIN-2025-26,image/webp,53,53,0.0000\nCC-MAIN-2025-26,message/rfc822,15089,15089,0.0006\nCC-MAIN-2025-26,text/asp,3,3,0.0000\nCC-MAIN-2025-26,text/calendar,889291,889010,0.0373\nCC-MAIN-2025-26,text/css,17388,17386,0.0007\nCC-MAIN-2025-26,text/csv,73163,73028,0.0031\nCC-MAIN-2025-26,text/html,2153434189,2141846924,90.2679\nCC-MAIN-2025-26,text/markdown,65,65,0.0000\nCC-MAIN-2025-26,text/plain,3413830,3405718,0.1431\nCC-MAIN-2025-26,text/prs.lines.tag,84668,84658,0.0035\nCC-MAIN-2025-26,text/tab-separated-values,11627,11624,0.0005\nCC-MAIN-2025-26,text/troff,11278,11276,0.0005\nCC-MAIN-2025-26,text/turtle,49641,49615,0.0021\nCC-MAIN-2025-26,text/vtt,21160,21154,0.0009\nCC-MAIN-2025-2
6,text/x-c++src,3089,3089,0.0001\nCC-MAIN-2025-26,text/x-chdr,8626,8626,0.0004\nCC-MAIN-2025-26,text/x-csrc,13909,13904,0.0006\nCC-MAIN-2025-26,text/x-diff,21127,21124,0.0009\nCC-MAIN-2025-26,text/x-jsp,991,987,0.0000\nCC-MAIN-2025-26,text/x-log,46978,46977,0.0020\nCC-MAIN-2025-26,text/x-matlab,26853,26840,0.0011\nCC-MAIN-2025-26,text/x-perl,42838,42835,0.0018\nCC-MAIN-2025-26,text/x-php,70764,70605,0.0030\nCC-MAIN-2025-26,text/x-python,5378,5375,0.0002\nCC-MAIN-2025-26,text/x-vcalendar,11062,11059,0.0005\nCC-MAIN-2025-26,text/x-vcard,88793,88752,0.0037\nCC-MAIN-2025-26,text/x-web-markdown,11303,11301,0.0005\nCC-MAIN-2025-26,text/x-yaml,8775,8775,0.0004\nCC-MAIN-2025-26,video/mp4,274,274,0.0000\nCC-MAIN-2025-26,video/quicktime,7,7,0.0000\nCC-MAIN-2025-26,video/webm,2,2,0.0000\nCC-MAIN-2025-30,<other>,269557,269268,0.0111\nCC-MAIN-2025-30,application/atom+xml,3215168,3214717,0.1327\nCC-MAIN-2025-30,application/epub+zip,46900,46798,0.0019\nCC-MAIN-2025-30,application/gpx+xml,14035,14035,0.0006\nCC-MAIN-2025-30,application/gzip,17,17,0.0000\nCC-MAIN-2025-30,application/javascript,17813,17798,0.0007\nCC-MAIN-2025-30,application/json,668478,667954,0.0276\nCC-MAIN-2025-30,application/marc,30916,30910,0.0013\nCC-MAIN-2025-30,application/mbox,39508,39455,0.0016\nCC-MAIN-2025-30,application/msword,40128,40046,0.0017\nCC-MAIN-2025-30,application/octet-stream,284436,284079,0.0117\nCC-MAIN-2025-30,application/pdf,15820487,15790285,0.6530\nCC-MAIN-2025-30,application/pgp-signature,34973,34973,0.0014\nCC-MAIN-2025-30,application/pkcs7-signature,10712,10711,0.0004\nCC-MAIN-2025-30,application/postscript,10335,10327,0.0004\nCC-MAIN-2025-30,application/rdf+xml,220521,220433,0.0091\nCC-MAIN-2025-30,application/rss+xml,1678431,1677226,0.0693\nCC-MAIN-2025-30,application/rtf,31739,31729,0.0013\nCC-MAIN-2025-30,application/text,58,58,0.0000\nCC-MAIN-2025-30,application/vnd.android.package-archive,6,6,0.0000\nCC-MAIN-2025-30,application/vnd.google-earth.kml+xml,48118,48083,0.0020\nCC-MAI
N-2025-30,application/vnd.google-earth.kmz,7833,7832,0.0003\nCC-MAIN-2025-30,application/vnd.ms-excel,18550,18522,0.0008\nCC-MAIN-2025-30,application/vnd.ms-powerpoint,4321,4308,0.0002\nCC-MAIN-2025-30,application/vnd.oasis.opendocument.spreadsheet,7940,7935,0.0003\nCC-MAIN-2025-30,application/vnd.oasis.opendocument.text,17215,17208,0.0007\nCC-MAIN-2025-30,application/vnd.openxmlformats-officedocument.presentationml.presentation,6580,6558,0.0003\nCC-MAIN-2025-30,application/vnd.openxmlformats-officedocument.spreadsheetml.sheet,35386,35294,0.0015\nCC-MAIN-2025-30,application/vnd.openxmlformats-officedocument.wordprocessingml.document,53024,52849,0.0022\nCC-MAIN-2025-30,application/x-bibtex-text-file,317800,317631,0.0131\nCC-MAIN-2025-30,application/x-bittorrent,4824,4824,0.0002\nCC-MAIN-2025-30,application/x-endnote-refer,51305,51287,0.0021\nCC-MAIN-2025-30,application/x-mobipocket-ebook,15978,15876,0.0007\nCC-MAIN-2025-30,application/x-ms-asx,2808,2807,0.0001\nCC-MAIN-2025-30,application/x-msdownload,323,323,0.0000\nCC-MAIN-2025-30,application/x-pds,53511,53511,0.0022\nCC-MAIN-2025-30,application/x-rar-compressed,10,10,0.0000\nCC-MAIN-2025-30,application/x-research-info-systems,1495,1495,0.0001\nCC-MAIN-2025-30,application/x-sh,21390,21362,0.0009\nCC-MAIN-2025-30,application/x-shockwave-flash,2766,2766,0.0001\nCC-MAIN-2025-30,application/x-stata-do,9373,9366,0.0004\nCC-MAIN-2025-30,application/x-tex,5722,5721,0.0002\nCC-MAIN-2025-30,application/x-tex-tfm,7988,7988,0.0003\nCC-MAIN-2025-30,application/x-tika-msoffice,57361,57358,0.0024\nCC-MAIN-2025-30,application/x-tika-ooxml,39114,39105,0.0016\nCC-MAIN-2025-30,application/x-wais-source,4258,4258,0.0002\nCC-MAIN-2025-30,application/xhtml+xml,205022672,204209339,8.4630\nCC-MAIN-2025-30,application/xml,1660573,1650557,0.0685\nCC-MAIN-2025-30,application/zip,584,584,0.0000\nCC-MAIN-2025-30,application/zlib,2197,2183,0.0001\nCC-MAIN-2025-30,audio/mp4,1,1,0.0000\nCC-MAIN-2025-30,audio/mpeg,536,536,0.0000\nCC-MAIN-2025-30,
audio/vnd.wave,44,44,0.0000\nCC-MAIN-2025-30,audio/x-mpegurl,70,70,0.0000\nCC-MAIN-2025-30,image/gif,66,66,0.0000\nCC-MAIN-2025-30,image/jpeg,5672,5670,0.0002\nCC-MAIN-2025-30,image/png,432,430,0.0000\nCC-MAIN-2025-30,image/svg+xml,2,2,0.0000\nCC-MAIN-2025-30,image/tiff,1,1,0.0000\nCC-MAIN-2025-30,image/vnd.djvu,31356,31356,0.0013\nCC-MAIN-2025-30,image/webp,58,58,0.0000\nCC-MAIN-2025-30,message/rfc822,18144,18142,0.0007\nCC-MAIN-2025-30,text/calendar,905917,905182,0.0374\nCC-MAIN-2025-30,text/css,11690,11686,0.0005\nCC-MAIN-2025-30,text/csv,74621,74601,0.0031\nCC-MAIN-2025-30,text/html,2188729885,2176880529,90.3470\nCC-MAIN-2025-30,text/markdown,169,166,0.0000\nCC-MAIN-2025-30,text/plain,2293874,2292524,0.0947\nCC-MAIN-2025-30,text/prs.lines.tag,105982,105967,0.0044\nCC-MAIN-2025-30,text/tab-separated-values,8722,8722,0.0004\nCC-MAIN-2025-30,text/troff,13373,13373,0.0006\nCC-MAIN-2025-30,text/turtle,50988,50955,0.0021\nCC-MAIN-2025-30,text/vtt,24630,24615,0.0010\nCC-MAIN-2025-30,text/x-c++src,2822,2822,0.0001\nCC-MAIN-2025-30,text/x-chdr,8732,8732,0.0004\nCC-MAIN-2025-30,text/x-csrc,17951,17950,0.0007\nCC-MAIN-2025-30,text/x-diff,24845,24836,0.0010\nCC-MAIN-2025-30,text/x-jsp,1160,1155,0.0000\nCC-MAIN-2025-30,text/x-log,54121,54120,0.0022\nCC-MAIN-2025-30,text/x-matlab,30899,30897,0.0013\nCC-MAIN-2025-30,text/x-perl,38659,38655,0.0016\nCC-MAIN-2025-30,text/x-php,79244,79084,0.0033\nCC-MAIN-2025-30,text/x-python,6130,6129,0.0003\nCC-MAIN-2025-30,text/x-vcalendar,11501,11498,0.0005\nCC-MAIN-2025-30,text/x-vcard,90042,90004,0.0037\nCC-MAIN-2025-30,text/x-web-markdown,12264,12263,0.0005\nCC-MAIN-2025-30,text/x-yaml,10443,10443,0.0004\nCC-MAIN-2025-30,video/mp4,221,220,0.0000\nCC-MAIN-2025-30,video/quicktime,2,2,0.0000\nCC-MAIN-2025-30,video/webm,1,1,0.0000\nCC-MAIN-2025-33,<other>,254644,254042,0.0104\nCC-MAIN-2025-33,application/atom+xml,2936105,2935747,0.1202\nCC-MAIN-2025-33,application/epub+zip,48091,47943,0.0020\nCC-MAIN-2025-33,application/gpx+xml,13803,13803,0.0
006\nCC-MAIN-2025-33,application/gzip,19,19,0.0000\nCC-MAIN-2025-33,application/javascript,15868,15849,0.0006\nCC-MAIN-2025-33,application/json,640659,640343,0.0262\nCC-MAIN-2025-33,application/marc,26199,26198,0.0011\nCC-MAIN-2025-33,application/mbox,33468,33398,0.0014\nCC-MAIN-2025-33,application/msword,36448,36374,0.0015\nCC-MAIN-2025-33,application/octet-stream,389248,388409,0.0159\nCC-MAIN-2025-33,application/pdf,14486528,14457606,0.5931\nCC-MAIN-2025-33,application/pgp-signature,33106,33106,0.0014\nCC-MAIN-2025-33,application/pkcs7-signature,9235,9228,0.0004\nCC-MAIN-2025-33,application/postscript,7843,7842,0.0003\nCC-MAIN-2025-33,application/rdf+xml,207069,206949,0.0085\nCC-MAIN-2025-33,application/rss+xml,1624107,1623036,0.0665\nCC-MAIN-2025-33,application/rtf,33131,33126,0.0014\nCC-MAIN-2025-33,application/text,7,7,0.0000\nCC-MAIN-2025-33,application/vnd.android.package-archive,3,3,0.0000\nCC-MAIN-2025-33,application/vnd.google-earth.kml+xml,50892,50854,0.0021\nCC-MAIN-2025-33,application/vnd.google-earth.kmz,6690,6690,0.0003\nCC-MAIN-2025-33,application/vnd.ms-excel,16383,16380,0.0007\nCC-MAIN-2025-33,application/vnd.ms-powerpoint,3896,3885,0.0002\nCC-MAIN-2025-33,application/vnd.oasis.opendocument.spreadsheet,5698,5687,0.0002\nCC-MAIN-2025-33,application/vnd.oasis.opendocument.text,14810,14791,0.0006\nCC-MAIN-2025-33,application/vnd.openxmlformats-officedocument.presentationml.presentation,5961,5901,0.0002\nCC-MAIN-2025-33,application/vnd.openxmlformats-officedocument.spreadsheetml.sheet,33383,33327,0.0014\nCC-MAIN-2025-33,application/vnd.openxmlformats-officedocument.wordprocessingml.document,48337,48158,0.0020\nCC-MAIN-2025-33,application/x-bibtex-text-file,297719,297532,0.0122\nCC-MAIN-2025-33,application/x-bittorrent,6113,6112,0.0003\nCC-MAIN-2025-33,application/x-dosexec,1,1,0.0000\nCC-MAIN-2025-33,application/x-endnote-refer,42623,42612,0.0017\nCC-MAIN-2025-33,application/x-mobipocket-ebook,17614,17474,0.0007\nCC-MAIN-2025-33,application/x-ms-asx,26
32,2632,0.0001\nCC-MAIN-2025-33,application/x-msdownload,276,276,0.0000\nCC-MAIN-2025-33,application/x-pds,35429,35429,0.0015\nCC-MAIN-2025-33,application/x-rar-compressed,2,2,0.0000\nCC-MAIN-2025-33,application/x-research-info-systems,1195,1195,0.0000\nCC-MAIN-2025-33,application/x-sh,15870,15843,0.0006\nCC-MAIN-2025-33,application/x-shockwave-flash,2037,2034,0.0001\nCC-MAIN-2025-33,application/x-stata-do,8115,8115,0.0003\nCC-MAIN-2025-33,application/x-tex,6770,6770,0.0003\nCC-MAIN-2025-33,application/x-tex-tfm,7161,7161,0.0003\nCC-MAIN-2025-33,application/x-tika-msoffice,55038,55033,0.0023\nCC-MAIN-2025-33,application/x-tika-ooxml,37824,37802,0.0015\nCC-MAIN-2025-33,application/x-wais-source,3489,3489,0.0001\nCC-MAIN-2025-33,application/x-xz,1,1,0.0000\nCC-MAIN-2025-33,application/xhtml+xml,199355406,198606709,8.1620\nCC-MAIN-2025-33,application/xml,1593255,1583329,0.0652\nCC-MAIN-2025-33,application/zip,233,233,0.0000\nCC-MAIN-2025-33,application/zlib,4053,4004,0.0002\nCC-MAIN-2025-33,audio/mpeg,444,444,0.0000\nCC-MAIN-2025-33,audio/vnd.wave,54,54,0.0000\nCC-MAIN-2025-33,audio/x-mpegurl,55,55,0.0000\nCC-MAIN-2025-33,image/gif,29,29,0.0000\nCC-MAIN-2025-33,image/jpeg,5723,5720,0.0002\nCC-MAIN-2025-33,image/png,473,473,0.0000\nCC-MAIN-2025-33,image/svg+xml,11,11,0.0000\nCC-MAIN-2025-33,image/vnd.djvu,9556,9555,0.0004\nCC-MAIN-2025-33,image/webp,10,10,0.0000\nCC-MAIN-2025-33,message/rfc822,20586,20578,0.0008\nCC-MAIN-2025-33,text/calendar,885062,884787,0.0362\nCC-MAIN-2025-33,text/css,11637,11634,0.0005\nCC-MAIN-2025-33,text/csv,77034,76829,0.0032\nCC-MAIN-2025-33,text/html,2216347634,2204565901,90.7412\nCC-MAIN-2025-33,text/markdown,988,987,0.0000\nCC-MAIN-2025-33,text/plain,2107506,2106335,0.0863\nCC-MAIN-2025-33,text/prs.lines.tag,97936,97934,0.0040\nCC-MAIN-2025-33,text/tab-separated-values,8519,8518,0.0003\nCC-MAIN-2025-33,text/troff,12671,12671,0.0005\nCC-MAIN-2025-33,text/turtle,52242,52224,0.0021\nCC-MAIN-2025-33,text/vtt,24465,24448,0.0010\nCC-MAIN-2025-33,
text/x-c++src,3028,3026,0.0001\nCC-MAIN-2025-33,text/x-chdr,8799,8798,0.0004\nCC-MAIN-2025-33,text/x-csrc,12003,12002,0.0005\nCC-MAIN-2025-33,text/x-diff,22569,22562,0.0009\nCC-MAIN-2025-33,text/x-jsp,1341,1339,0.0001\nCC-MAIN-2025-33,text/x-log,45815,45814,0.0019\nCC-MAIN-2025-33,text/x-matlab,36295,36293,0.0015\nCC-MAIN-2025-33,text/x-perl,35550,35548,0.0015\nCC-MAIN-2025-33,text/x-php,75396,75253,0.0031\nCC-MAIN-2025-33,text/x-python,4806,4806,0.0002\nCC-MAIN-2025-33,text/x-vcalendar,10898,10894,0.0004\nCC-MAIN-2025-33,text/x-vcard,75603,75563,0.0031\nCC-MAIN-2025-33,text/x-web-markdown,15143,15140,0.0006\nCC-MAIN-2025-33,text/x-yaml,8678,8677,0.0004\nCC-MAIN-2025-33,video/mp4,430,429,0.0000\nCC-MAIN-2025-33,video/quicktime,2,2,0.0000\nCC-MAIN-2025-38,<other>,244717,244247,0.0103\nCC-MAIN-2025-38,application/atom+xml,2802469,2802104,0.1175\nCC-MAIN-2025-38,application/epub+zip,40543,40438,0.0017\nCC-MAIN-2025-38,application/gpx+xml,14162,14161,0.0006\nCC-MAIN-2025-38,application/gzip,12,12,0.0000\nCC-MAIN-2025-38,application/javascript,35359,35349,0.0015\nCC-MAIN-2025-38,application/json,661411,661134,0.0277\nCC-MAIN-2025-38,application/marc,23163,23151,0.0010\nCC-MAIN-2025-38,application/mbox,32173,32117,0.0013\nCC-MAIN-2025-38,application/msword,32757,32721,0.0014\nCC-MAIN-2025-38,application/octet-stream,255306,254967,0.0107\nCC-MAIN-2025-38,application/pdf,13644284,13616791,0.5719\nCC-MAIN-2025-38,application/pgp-signature,28901,28901,0.0012\nCC-MAIN-2025-38,application/pkcs7-signature,6202,6198,0.0003\nCC-MAIN-2025-38,application/postscript,6955,6952,0.0003\nCC-MAIN-2025-38,application/rdf+xml,196441,196388,0.0082\nCC-MAIN-2025-38,application/rss+xml,1562536,1561483,0.0655\nCC-MAIN-2025-38,application/rtf,31026,31005,0.0013\nCC-MAIN-2025-38,application/text,148,148,0.0000\nCC-MAIN-2025-38,application/vnd.android.package-archive,5,5,0.0000\nCC-MAIN-2025-38,application/vnd.google-earth.kml+xml,45654,45618,0.0019\nCC-MAIN-2025-38,application/vnd.google-earth.km
z,4685,4684,0.0002\nCC-MAIN-2025-38,application/vnd.ms-excel,17187,17156,0.0007\nCC-MAIN-2025-38,application/vnd.ms-powerpoint,3952,3946,0.0002\nCC-MAIN-2025-38,application/vnd.oasis.opendocument.spreadsheet,6507,6502,0.0003\nCC-MAIN-2025-38,application/vnd.oasis.opendocument.text,12446,12444,0.0005\nCC-MAIN-2025-38,application/vnd.openxmlformats-officedocument.presentationml.presentation,5327,5303,0.0002\nCC-MAIN-2025-38,application/vnd.openxmlformats-officedocument.spreadsheetml.sheet,28860,28780,0.0012\nCC-MAIN-2025-38,application/vnd.openxmlformats-officedocument.wordprocessingml.document,45094,44965,0.0019\nCC-MAIN-2025-38,application/x-bibtex-text-file,296583,296478,0.0124\nCC-MAIN-2025-38,application/x-bittorrent,5688,5686,0.0002\nCC-MAIN-2025-38,application/x-endnote-refer,46822,46800,0.0020\nCC-MAIN-2025-38,application/x-mobipocket-ebook,14975,14874,0.0006\nCC-MAIN-2025-38,application/x-ms-asx,4970,4970,0.0002\nCC-MAIN-2025-38,application/x-msdownload,511,504,0.0000\nCC-MAIN-2025-38,application/x-pds,21938,21934,0.0009\nCC-MAIN-2025-38,application/x-rar-compressed,2,2,0.0000\nCC-MAIN-2025-38,application/x-research-info-systems,879,879,0.0000\nCC-MAIN-2025-38,application/x-sh,20945,20902,0.0009\nCC-MAIN-2025-38,application/x-shockwave-flash,2079,2076,0.0001\nCC-MAIN-2025-38,application/x-stata-do,8456,8453,0.0004\nCC-MAIN-2025-38,application/x-tex,6436,6435,0.0003\nCC-MAIN-2025-38,application/x-tex-tfm,9526,9526,0.0004\nCC-MAIN-2025-38,application/x-tika-msoffice,44155,44141,0.0019\nCC-MAIN-2025-38,application/x-tika-ooxml,34275,34259,0.0014\nCC-MAIN-2025-38,application/x-wais-source,4303,4303,0.0002\nCC-MAIN-2025-38,application/x-xz,1,1,0.0000\nCC-MAIN-2025-38,application/xhtml+xml,185332045,184619353,7.7676\nCC-MAIN-2025-38,application/xml,1601160,1598872,0.0671\nCC-MAIN-2025-38,application/zip,339,339,0.0000\nCC-MAIN-2025-38,application/zlib,2146,2064,0.0001\nCC-MAIN-2025-38,audio/mpeg,333,333,0.0000\nCC-MAIN-2025-38,audio/vnd.wave,75,75,0.0000\nCC-MAIN-2
025-38,audio/x-mpegurl,38,38,0.0000\nCC-MAIN-2025-38,image/gif,40,40,0.0000\nCC-MAIN-2025-38,image/jpeg,4494,4492,0.0002\nCC-MAIN-2025-38,image/png,460,457,0.0000\nCC-MAIN-2025-38,image/svg+xml,8,8,0.0000\nCC-MAIN-2025-38,image/tiff,3,3,0.0000\nCC-MAIN-2025-38,image/vnd.djvu,7026,7025,0.0003\nCC-MAIN-2025-38,image/webp,54,53,0.0000\nCC-MAIN-2025-38,message/rfc822,16071,16062,0.0007\nCC-MAIN-2025-38,text/calendar,853964,853699,0.0358\nCC-MAIN-2025-38,text/css,12971,12968,0.0005\nCC-MAIN-2025-38,text/csv,73181,73173,0.0031\nCC-MAIN-2025-38,text/html,2175236630,2163383874,91.1680\nCC-MAIN-2025-38,text/markdown,2923,2907,0.0001\nCC-MAIN-2025-38,text/plain,1967442,1966680,0.0825\nCC-MAIN-2025-38,text/prs.lines.tag,105303,105301,0.0044\nCC-MAIN-2025-38,text/tab-separated-values,9773,9773,0.0004\nCC-MAIN-2025-38,text/troff,9035,9035,0.0004\nCC-MAIN-2025-38,text/turtle,45730,45724,0.0019\nCC-MAIN-2025-38,text/vtt,20468,20457,0.0009\nCC-MAIN-2025-38,text/x-c++src,3411,3404,0.0001\nCC-MAIN-2025-38,text/x-chdr,7952,7949,0.0003\nCC-MAIN-2025-38,text/x-csrc,11507,11506,0.0005\nCC-MAIN-2025-38,text/x-diff,20893,20891,0.0009\nCC-MAIN-2025-38,text/x-jsp,1288,1279,0.0001\nCC-MAIN-2025-38,text/x-log,47641,47639,0.0020\nCC-MAIN-2025-38,text/x-matlab,40075,40054,0.0017\nCC-MAIN-2025-38,text/x-perl,29792,29788,0.0012\nCC-MAIN-2025-38,text/x-php,74147,73944,0.0031\nCC-MAIN-2025-38,text/x-python,9509,9508,0.0004\nCC-MAIN-2025-38,text/x-vcalendar,11312,11311,0.0005\nCC-MAIN-2025-38,text/x-vcard,70779,70572,0.0030\nCC-MAIN-2025-38,text/x-web-markdown,16817,16814,0.0007\nCC-MAIN-2025-38,text/x-yaml,6498,6497,0.0003\nCC-MAIN-2025-38,video/mp4,49,49,0.0000\nCC-MAIN-2025-38,video/quicktime,1,1,0.0000\nCC-MAIN-2025-43,<other>,245156,244968,0.0094\nCC-MAIN-2025-43,application/atom+xml,2527239,2526890,0.0966\nCC-MAIN-2025-43,application/epub+zip,46827,46682,0.0018\nCC-MAIN-2025-43,application/gpx+xml,15279,15279,0.0006\nCC-MAIN-2025-43,application/gzip,138,138,0.0000\nCC-MAIN-2025-43,application/j
avascript,22995,22985,0.0009\nCC-MAIN-2025-43,application/json,627658,627212,0.0240\nCC-MAIN-2025-43,application/marc,25303,25299,0.0010\nCC-MAIN-2025-43,application/mbox,26736,26669,0.0010\nCC-MAIN-2025-43,application/msword,35526,35393,0.0014\nCC-MAIN-2025-43,application/octet-stream,246725,246281,0.0094\nCC-MAIN-2025-43,application/pdf,15317088,15286405,0.5853\nCC-MAIN-2025-43,application/pgp-signature,27071,27071,0.0010\nCC-MAIN-2025-43,application/pkcs7-signature,9548,9540,0.0004\nCC-MAIN-2025-43,application/postscript,6727,6726,0.0003\nCC-MAIN-2025-43,application/rdf+xml,198615,198533,0.0076\nCC-MAIN-2025-43,application/rss+xml,1629436,1628289,0.0623\nCC-MAIN-2025-43,application/rtf,31881,31873,0.0012\nCC-MAIN-2025-43,application/text,123,123,0.0000\nCC-MAIN-2025-43,application/vnd.android.package-archive,3,3,0.0000\nCC-MAIN-2025-43,application/vnd.google-earth.kml+xml,53369,53342,0.0020\nCC-MAIN-2025-43,application/vnd.google-earth.kmz,6495,6493,0.0002\nCC-MAIN-2025-43,application/vnd.ms-excel,13960,13902,0.0005\nCC-MAIN-2025-43,application/vnd.ms-powerpoint,4305,4291,0.0002\nCC-MAIN-2025-43,application/vnd.oasis.opendocument.spreadsheet,9524,9516,0.0004\nCC-MAIN-2025-43,application/vnd.oasis.opendocument.text,14297,14294,0.0005\nCC-MAIN-2025-43,application/vnd.openxmlformats-officedocument.presentationml.presentation,4933,4858,0.0002\nCC-MAIN-2025-43,application/vnd.openxmlformats-officedocument.spreadsheetml.sheet,41638,41528,0.0016\nCC-MAIN-2025-43,application/vnd.openxmlformats-officedocument.wordprocessingml.document,49269,49094,0.0019\nCC-MAIN-2025-43,application/x-bibtex-text-file,290350,290236,0.0111\nCC-MAIN-2025-43,application/x-bittorrent,5868,5864,0.0002\nCC-MAIN-2025-43,application/x-endnote-refer,45022,45002,0.0017\nCC-MAIN-2025-43,application/x-mobipocket-ebook,16566,16444,0.0006\nCC-MAIN-2025-43,application/x-ms-asx,6974,6974,0.0003\nCC-MAIN-2025-43,application/x-msdownload,192,192,0.0000\nCC-MAIN-2025-43,application/x-pds,45843,45560,0.0018\n
CC-MAIN-2025-43,application/x-rar-compressed,17,17,0.0000\nCC-MAIN-2025-43,application/x-research-info-systems,1134,1134,0.0000\nCC-MAIN-2025-43,application/x-sh,17458,17443,0.0007\nCC-MAIN-2025-43,application/x-shockwave-flash,2117,2114,0.0001\nCC-MAIN-2025-43,application/x-stata-do,7803,7799,0.0003\nCC-MAIN-2025-43,application/x-tex,7472,7472,0.0003\nCC-MAIN-2025-43,application/x-tex-tfm,6164,6164,0.0002\nCC-MAIN-2025-43,application/x-tika-msoffice,48437,48412,0.0019\nCC-MAIN-2025-43,application/x-tika-ooxml,35952,35948,0.0014\nCC-MAIN-2025-43,application/x-wais-source,3717,3717,0.0001\nCC-MAIN-2025-43,application/xhtml+xml,208201310,207459059,7.9563\nCC-MAIN-2025-43,application/xml,1630616,1628520,0.0623\nCC-MAIN-2025-43,application/zip,330,330,0.0000\nCC-MAIN-2025-43,application/zlib,2204,2139,0.0001\nCC-MAIN-2025-43,audio/mpeg,278,278,0.0000\nCC-MAIN-2025-43,audio/vnd.wave,40,40,0.0000\nCC-MAIN-2025-43,audio/x-mpegurl,59,59,0.0000\nCC-MAIN-2025-43,image/gif,156,152,0.0000\nCC-MAIN-2025-43,image/jpeg,3864,3861,0.0001\nCC-MAIN-2025-43,image/png,368,368,0.0000\nCC-MAIN-2025-43,image/svg+xml,3,3,0.0000\nCC-MAIN-2025-43,image/tiff,1,1,0.0000\nCC-MAIN-2025-43,image/vnd.djvu,7052,7046,0.0003\nCC-MAIN-2025-43,image/webp,46,46,0.0000\nCC-MAIN-2025-43,message/rfc822,14947,14944,0.0006\nCC-MAIN-2025-43,text/calendar,965837,965511,0.0369\nCC-MAIN-2025-43,text/css,14070,14070,0.0005\nCC-MAIN-2025-43,text/csv,83914,83690,0.0032\nCC-MAIN-2025-43,text/html,2381572425,2369089525,91.0110\nCC-MAIN-2025-43,text/markdown,2474,2452,0.0001\nCC-MAIN-2025-43,text/plain,1959016,1958221,0.0749\nCC-MAIN-2025-43,text/prs.lines.tag,118055,118042,0.0045\nCC-MAIN-2025-43,text/tab-separated-values,10767,10767,0.0004\nCC-MAIN-2025-43,text/troff,10992,10988,0.0004\nCC-MAIN-2025-43,text/turtle,46711,46703,0.0018\nCC-MAIN-2025-43,text/vtt,15599,15550,0.0006\nCC-MAIN-2025-43,text/x-c++src,3147,3128,0.0001\nCC-MAIN-2025-43,text/x-chdr,10804,10798,0.0004\nCC-MAIN-2025-43,text/x-csrc,9769,9739,0.0004\
nCC-MAIN-2025-43,text/x-diff,19838,19828,0.0008\nCC-MAIN-2025-43,text/x-jsp,1194,1190,0.0000\nCC-MAIN-2025-43,text/x-log,38501,38499,0.0015\nCC-MAIN-2025-43,text/x-matlab,41259,41252,0.0016\nCC-MAIN-2025-43,text/x-perl,29986,29978,0.0011\nCC-MAIN-2025-43,text/x-php,78103,77946,0.0030\nCC-MAIN-2025-43,text/x-python,5927,5927,0.0002\nCC-MAIN-2025-43,text/x-vcalendar,9283,9283,0.0004\nCC-MAIN-2025-43,text/x-vcard,83039,82983,0.0032\nCC-MAIN-2025-43,text/x-web-markdown,18744,18698,0.0007\nCC-MAIN-2025-43,text/x-yaml,7144,7144,0.0003\nCC-MAIN-2025-43,video/mp4,34,33,0.0000\nCC-MAIN-2025-43,video/quicktime,1,1,0.0000\nCC-MAIN-2025-47,<other>,240030,239819,0.0105\nCC-MAIN-2025-47,application/atom+xml,3326559,3326174,0.1450\nCC-MAIN-2025-47,application/epub+zip,44957,44851,0.0020\nCC-MAIN-2025-47,application/gpx+xml,15520,15520,0.0007\nCC-MAIN-2025-47,application/gzip,224,224,0.0000\nCC-MAIN-2025-47,application/javascript,18509,18457,0.0008\nCC-MAIN-2025-47,application/json,646438,646109,0.0282\nCC-MAIN-2025-47,application/marc,20309,20304,0.0009\nCC-MAIN-2025-47,application/mbox,28004,27961,0.0012\nCC-MAIN-2025-47,application/msword,38426,38328,0.0017\nCC-MAIN-2025-47,application/octet-stream,257809,257361,0.0112\nCC-MAIN-2025-47,application/pdf,15948974,15916300,0.6951\nCC-MAIN-2025-47,application/pgp-signature,31088,31088,0.0014\nCC-MAIN-2025-47,application/pkcs7-signature,9137,9128,0.0004\nCC-MAIN-2025-47,application/postscript,6931,6931,0.0003\nCC-MAIN-2025-47,application/rdf+xml,195225,195152,0.0085\nCC-MAIN-2025-47,application/rss+xml,1602060,1600806,0.0698\nCC-MAIN-2025-47,application/rtf,35130,35120,0.0015\nCC-MAIN-2025-47,application/text,101,101,0.0000\nCC-MAIN-2025-47,application/vnd.android.package-archive,3,3,0.0000\nCC-MAIN-2025-47,application/vnd.google-earth.kml+xml,51992,51972,0.0023\nCC-MAIN-2025-47,application/vnd.google-earth.kmz,6266,6263,0.0003\nCC-MAIN-2025-47,application/vnd.ms-excel,16017,15346,0.0007\nCC-MAIN-2025-47,application/vnd.ms-powerpoint,
4093,4086,0.0002\nCC-MAIN-2025-47,application/vnd.oasis.opendocument.spreadsheet,7716,7713,0.0003\nCC-MAIN-2025-47,application/vnd.oasis.opendocument.text,19709,19700,0.0009\nCC-MAIN-2025-47,application/vnd.openxmlformats-officedocument.presentationml.presentation,5288,5213,0.0002\nCC-MAIN-2025-47,application/vnd.openxmlformats-officedocument.spreadsheetml.sheet,37137,35875,0.0016\nCC-MAIN-2025-47,application/vnd.openxmlformats-officedocument.wordprocessingml.document,53738,53573,0.0023\nCC-MAIN-2025-47,application/x-bibtex-text-file,309373,309288,0.0135\nCC-MAIN-2025-47,application/x-bittorrent,4351,4349,0.0002\nCC-MAIN-2025-47,application/x-dosexec,1,1,0.0000\nCC-MAIN-2025-47,application/x-endnote-refer,47009,46999,0.0020\nCC-MAIN-2025-47,application/x-mobipocket-ebook,18134,18038,0.0008\nCC-MAIN-2025-47,application/x-ms-asx,2841,2841,0.0001\nCC-MAIN-2025-47,application/x-msdownload,152,152,0.0000\nCC-MAIN-2025-47,application/x-pds,36098,35858,0.0016\nCC-MAIN-2025-47,application/x-rar-compressed,7,7,0.0000\nCC-MAIN-2025-47,application/x-research-info-systems,972,972,0.0000\nCC-MAIN-2025-47,application/x-sh,18413,18403,0.0008\nCC-MAIN-2025-47,application/x-shockwave-flash,2154,2150,0.0001\nCC-MAIN-2025-47,application/x-stata-do,8713,8706,0.0004\nCC-MAIN-2025-47,application/x-tex,7005,7005,0.0003\nCC-MAIN-2025-47,application/x-tex-tfm,3287,3287,0.0001\nCC-MAIN-2025-47,application/x-tika-msoffice,52555,52538,0.0023\nCC-MAIN-2025-47,application/x-tika-ooxml,35245,35241,0.0015\nCC-MAIN-2025-47,application/x-wais-source,2986,2986,0.0001\nCC-MAIN-2025-47,application/xhtml+xml,203197061,202318332,8.8559\nCC-MAIN-2025-47,application/xml,1604351,1601353,0.0699\nCC-MAIN-2025-47,application/zip,305,305,0.0000\nCC-MAIN-2025-47,application/zlib,2849,2816,0.0001\nCC-MAIN-2025-47,audio/mp4,1,1,0.0000\nCC-MAIN-2025-47,audio/mpeg,433,433,0.0000\nCC-MAIN-2025-47,audio/vnd.wave,79,79,0.0000\nCC-MAIN-2025-47,audio/x-mpegurl,63,63,0.0000\nCC-MAIN-2025-47,image/gif,208,205,0.0000\nCC-MA
IN-2025-47,image/jpeg,2615,2609,0.0001\nCC-MAIN-2025-47,image/png,262,261,0.0000\nCC-MAIN-2025-47,image/svg+xml,6,6,0.0000\nCC-MAIN-2025-47,image/tiff,4,4,0.0000\nCC-MAIN-2025-47,image/vnd.djvu,12060,12060,0.0005\nCC-MAIN-2025-47,image/webp,197,197,0.0000\nCC-MAIN-2025-47,message/rfc822,16767,16762,0.0007\nCC-MAIN-2025-47,text/calendar,1090619,1090030,0.0475\nCC-MAIN-2025-47,text/css,15330,15328,0.0007\nCC-MAIN-2025-47,text/csv,73044,72988,0.0032\nCC-MAIN-2025-47,text/html,2062707916,2051777122,89.8990\nCC-MAIN-2025-47,text/markdown,1985,1970,0.0001\nCC-MAIN-2025-47,text/plain,1986934,1986153,0.0866\nCC-MAIN-2025-47,text/prs.lines.tag,111049,111039,0.0048\nCC-MAIN-2025-47,text/tab-separated-values,12532,12530,0.0005\nCC-MAIN-2025-47,text/troff,9385,9385,0.0004\nCC-MAIN-2025-47,text/turtle,38879,38874,0.0017\nCC-MAIN-2025-47,text/vtt,15480,15451,0.0007\nCC-MAIN-2025-47,text/x-c++src,2859,2851,0.0001\nCC-MAIN-2025-47,text/x-chdr,17798,17794,0.0008\nCC-MAIN-2025-47,text/x-csrc,10429,10426,0.0005\nCC-MAIN-2025-47,text/x-diff,19758,19758,0.0009\nCC-MAIN-2025-47,text/x-jsp,986,983,0.0000\nCC-MAIN-2025-47,text/x-log,45115,45100,0.0020\nCC-MAIN-2025-47,text/x-matlab,41031,41031,0.0018\nCC-MAIN-2025-47,text/x-perl,26143,26141,0.0011\nCC-MAIN-2025-47,text/x-php,68136,67909,0.0030\nCC-MAIN-2025-47,text/x-python,5618,5615,0.0002\nCC-MAIN-2025-47,text/x-vcalendar,9410,9409,0.0004\nCC-MAIN-2025-47,text/x-vcard,81786,81699,0.0036\nCC-MAIN-2025-47,text/x-web-markdown,17803,17802,0.0008\nCC-MAIN-2025-47,text/x-yaml,8661,8661,0.0004\nCC-MAIN-2025-47,video/mp4,275,275,0.0000\nCC-MAIN-2025-47,video/quicktime,2,2,0.0000\nCC-MAIN-2025-47,video/webm,2,2,0.0000\nCC-MAIN-2025-51,<other>,257162,256896,0.0119\nCC-MAIN-2025-51,application/atom+xml,3275474,3275155,0.1510\nCC-MAIN-2025-51,application/epub+zip,53260,53041,0.0025\nCC-MAIN-2025-51,application/gpx+xml,15756,15756,0.0007\nCC-MAIN-2025-51,application/gzip,21,21,0.0000\nCC-MAIN-2025-51,application/javascript,19856,19739,0.0009\nCC-MAIN
-2025-51,application/json,602827,602508,0.0278\nCC-MAIN-2025-51,application/marc,18995,18995,0.0009\nCC-MAIN-2025-51,application/mbox,28943,28807,0.0013\nCC-MAIN-2025-51,application/msword,38187,38052,0.0018\nCC-MAIN-2025-51,application/octet-stream,414627,414072,0.0191\nCC-MAIN-2025-51,application/pdf,15366620,15332072,0.7084\nCC-MAIN-2025-51,application/pgp-signature,32293,32293,0.0015\nCC-MAIN-2025-51,application/pkcs7-signature,8624,8617,0.0004\nCC-MAIN-2025-51,application/postscript,5571,5570,0.0003\nCC-MAIN-2025-51,application/rdf+xml,181828,181740,0.0084\nCC-MAIN-2025-51,application/rss+xml,1538559,1537369,0.0709\nCC-MAIN-2025-51,application/rtf,30080,30075,0.0014\nCC-MAIN-2025-51,application/text,479,479,0.0000\nCC-MAIN-2025-51,application/vnd.android.package-archive,7,7,0.0000\nCC-MAIN-2025-51,application/vnd.google-earth.kml+xml,49507,49475,0.0023\nCC-MAIN-2025-51,application/vnd.google-earth.kmz,5229,5229,0.0002\nCC-MAIN-2025-51,application/vnd.ms-excel,15682,15503,0.0007\nCC-MAIN-2025-51,application/vnd.ms-powerpoint,4034,4034,0.0002\nCC-MAIN-2025-51,application/vnd.oasis.opendocument.spreadsheet,7326,7316,0.0003\nCC-MAIN-2025-51,application/vnd.oasis.opendocument.text,14958,14944,0.0007\nCC-MAIN-2025-51,application/vnd.openxmlformats-officedocument.presentationml.presentation,5070,5061,0.0002\nCC-MAIN-2025-51,application/vnd.openxmlformats-officedocument.spreadsheetml.sheet,35588,35218,0.0016\nCC-MAIN-2025-51,application/vnd.openxmlformats-officedocument.wordprocessingml.document,50579,50418,0.0023\nCC-MAIN-2025-51,application/x-bibtex-text-file,315086,314978,0.0145\nCC-MAIN-2025-51,application/x-bittorrent,4900,4897,0.0002\nCC-MAIN-2025-51,application/x-endnote-refer,43343,43331,0.0020\nCC-MAIN-2025-51,application/x-mobipocket-ebook,16514,16453,0.0008\nCC-MAIN-2025-51,application/x-ms-asx,2646,2645,0.0001\nCC-MAIN-2025-51,application/x-msdownload,373,373,0.0000\nCC-MAIN-2025-51,application/x-pds,30894,30828,0.0014\nCC-MAIN-2025-51,application/x-rar-com
pressed,1,1,0.0000\nCC-MAIN-2025-51,application/x-research-info-systems,812,812,0.0000\nCC-MAIN-2025-51,application/x-sh,14812,14793,0.0007\nCC-MAIN-2025-51,application/x-shockwave-flash,1323,1320,0.0001\nCC-MAIN-2025-51,application/x-stata-do,9403,9402,0.0004\nCC-MAIN-2025-51,application/x-tex,6916,6916,0.0003\nCC-MAIN-2025-51,application/x-tex-tfm,4229,4229,0.0002\nCC-MAIN-2025-51,application/x-tika-msoffice,46163,46155,0.0021\nCC-MAIN-2025-51,application/x-tika-ooxml,37860,37848,0.0017\nCC-MAIN-2025-51,application/x-wais-source,2425,2425,0.0001\nCC-MAIN-2025-51,application/xhtml+xml,199822772,199103197,9.2123\nCC-MAIN-2025-51,application/xml,1600058,1597756,0.0738\nCC-MAIN-2025-51,application/zip,307,307,0.0000\nCC-MAIN-2025-51,application/zlib,2328,2298,0.0001\nCC-MAIN-2025-51,audio/mpeg,434,434,0.0000\nCC-MAIN-2025-51,audio/vnd.wave,59,59,0.0000\nCC-MAIN-2025-51,audio/x-mpegurl,59,59,0.0000\nCC-MAIN-2025-51,image/gif,384,383,0.0000\nCC-MAIN-2025-51,image/jpeg,2291,2285,0.0001\nCC-MAIN-2025-51,image/png,216,214,0.0000\nCC-MAIN-2025-51,image/svg+xml,8,8,0.0000\nCC-MAIN-2025-51,image/vnd.djvu,17158,17158,0.0008\nCC-MAIN-2025-51,image/webp,15,15,0.0000\nCC-MAIN-2025-51,message/rfc822,16528,16525,0.0008\nCC-MAIN-2025-51,text/calendar,998254,997959,0.0460\nCC-MAIN-2025-51,text/css,11310,11310,0.0005\nCC-MAIN-2025-51,text/csv,68867,68813,0.0032\nCC-MAIN-2025-51,text/html,1941541196,1931179658,89.5096\nCC-MAIN-2025-51,text/markdown,3350,3332,0.0002\nCC-MAIN-2025-51,text/plain,1885142,1884352,0.0869\nCC-MAIN-2025-51,text/prs.lines.tag,104534,104518,0.0048\nCC-MAIN-2025-51,text/tab-separated-values,12113,12113,0.0006\nCC-MAIN-2025-51,text/troff,12396,12396,0.0006\nCC-MAIN-2025-51,text/turtle,36591,36588,0.0017\nCC-MAIN-2025-51,text/vtt,17368,17333,0.0008\nCC-MAIN-2025-51,text/x-c++src,2684,2676,0.0001\nCC-MAIN-2025-51,text/x-chdr,12310,12309,0.0006\nCC-MAIN-2025-51,text/x-csrc,10648,10641,0.0005\nCC-MAIN-2025-51,text/x-diff,18689,18686,0.0009\nCC-MAIN-2025-51,text/x-jsp,
877,876,0.0000\nCC-MAIN-2025-51,text/x-log,33590,33577,0.0015\nCC-MAIN-2025-51,text/x-matlab,43864,43862,0.0020\nCC-MAIN-2025-51,text/x-perl,22163,22159,0.0010\nCC-MAIN-2025-51,text/x-php,52058,51894,0.0024\nCC-MAIN-2025-51,text/x-python,5749,5745,0.0003\nCC-MAIN-2025-51,text/x-vcalendar,8364,8363,0.0004\nCC-MAIN-2025-51,text/x-vcard,80583,80549,0.0037\nCC-MAIN-2025-51,text/x-web-markdown,16872,16837,0.0008\nCC-MAIN-2025-51,text/x-yaml,10138,10138,0.0005\nCC-MAIN-2025-51,video/mp4,109,109,0.0000\nCC-MAIN-2025-51,video/quicktime,1,1,0.0000\nCC-MAIN-2026-04,<other>,236172,235906,0.0101\nCC-MAIN-2026-04,application/atom+xml,3151390,3151053,0.1353\nCC-MAIN-2026-04,application/epub+zip,38475,38410,0.0017\nCC-MAIN-2026-04,application/gpx+xml,16196,16192,0.0007\nCC-MAIN-2026-04,application/gzip,9,9,0.0000\nCC-MAIN-2026-04,application/javascript,20306,20195,0.0009\nCC-MAIN-2026-04,application/json,567210,566832,0.0243\nCC-MAIN-2026-04,application/marc,16130,16130,0.0007\nCC-MAIN-2026-04,application/mbox,23687,23560,0.0010\nCC-MAIN-2026-04,application/msword,36168,36103,0.0016\nCC-MAIN-2026-04,application/octet-stream,354954,354614,0.0152\nCC-MAIN-2026-04,application/pdf,14757711,14725581,0.6335\nCC-MAIN-2026-04,application/pgp-signature,33648,33648,0.0014\nCC-MAIN-2026-04,application/pkcs7-signature,7908,7906,0.0003\nCC-MAIN-2026-04,application/postscript,5664,5663,0.0002\nCC-MAIN-2026-04,application/rdf+xml,177759,177676,0.0076\nCC-MAIN-2026-04,application/rss+xml,1539217,1538005,0.0661\nCC-MAIN-2026-04,application/rtf,26228,26221,0.0011\nCC-MAIN-2026-04,application/text,234,234,0.0000\nCC-MAIN-2026-04,application/vnd.android.package-archive,14,14,0.0000\nCC-MAIN-2026-04,application/vnd.google-earth.kml+xml,55386,55365,0.0024\nCC-MAIN-2026-04,application/vnd.google-earth.kmz,7341,7330,0.0003\nCC-MAIN-2026-04,application/vnd.ms-excel,14923,14784,0.0006\nCC-MAIN-2026-04,application/vnd.ms-powerpoint,2568,2568,0.0001\nCC-MAIN-2026-04,application/vnd.oasis.opendocument.spreads
heet,6875,6875,0.0003\nCC-MAIN-2026-04,application/vnd.oasis.opendocument.text,16413,16407,0.0007\nCC-MAIN-2026-04,application/vnd.openxmlformats-officedocument.presentationml.presentation,4793,4760,0.0002\nCC-MAIN-2026-04,application/vnd.openxmlformats-officedocument.spreadsheetml.sheet,38355,38189,0.0016\nCC-MAIN-2026-04,application/vnd.openxmlformats-officedocument.wordprocessingml.document,50543,50371,0.0022\nCC-MAIN-2026-04,application/x-bibtex-text-file,298975,298786,0.0128\nCC-MAIN-2026-04,application/x-bittorrent,15575,15570,0.0007\nCC-MAIN-2026-04,application/x-endnote-refer,33240,33232,0.0014\nCC-MAIN-2026-04,application/x-mobipocket-ebook,12971,12920,0.0006\nCC-MAIN-2026-04,application/x-ms-asx,2513,2511,0.0001\nCC-MAIN-2026-04,application/x-msdownload,196,196,0.0000\nCC-MAIN-2026-04,application/x-pds,29294,29199,0.0013\nCC-MAIN-2026-04,application/x-research-info-systems,677,677,0.0000\nCC-MAIN-2026-04,application/x-sh,18897,18880,0.0008\nCC-MAIN-2026-04,application/x-shockwave-flash,1595,1594,0.0001\nCC-MAIN-2026-04,application/x-stata-do,9998,9994,0.0004\nCC-MAIN-2026-04,application/x-tex,5425,5423,0.0002\nCC-MAIN-2026-04,application/x-tex-tfm,7422,7422,0.0003\nCC-MAIN-2026-04,application/x-tika-msoffice,46166,46161,0.0020\nCC-MAIN-2026-04,application/x-tika-ooxml,37497,37490,0.0016\nCC-MAIN-2026-04,application/x-wais-source,2581,2581,0.0001\nCC-MAIN-2026-04,application/x-xz,3,3,0.0000\nCC-MAIN-2026-04,application/xhtml+xml,195981882,195281471,8.4126\nCC-MAIN-2026-04,application/xml,1538767,1535650,0.0661\nCC-MAIN-2026-04,application/zip,241,241,0.0000\nCC-MAIN-2026-04,application/zlib,3195,3100,0.0001\nCC-MAIN-2026-04,audio/mpeg,622,622,0.0000\nCC-MAIN-2026-04,audio/vnd.wave,31,31,0.0000\nCC-MAIN-2026-04,audio/x-mpegurl,43,43,0.0000\nCC-MAIN-2026-04,image/gif,278,278,0.0000\nCC-MAIN-2026-04,image/jpeg,2399,2395,0.0001\nCC-MAIN-2026-04,image/png,230,229,0.0000\nCC-MAIN-2026-04,image/svg+xml,10,10,0.0000\nCC-MAIN-2026-04,image/tiff,4,4,0.0000\nCC-MAIN-2
026-04,image/vnd.djvu,8845,8844,0.0004\nCC-MAIN-2026-04,image/webp,43,43,0.0000\nCC-MAIN-2026-04,message/rfc822,14065,14062,0.0006\nCC-MAIN-2026-04,text/asp,2,2,0.0000\nCC-MAIN-2026-04,text/calendar,956224,955916,0.0410\nCC-MAIN-2026-04,text/css,13514,13512,0.0006\nCC-MAIN-2026-04,text/csv,74931,74476,0.0032\nCC-MAIN-2026-04,text/html,2106989446,2096204105,90.4431\nCC-MAIN-2026-04,text/markdown,3054,3039,0.0001\nCC-MAIN-2026-04,text/plain,1801923,1801157,0.0773\nCC-MAIN-2026-04,text/prs.lines.tag,92554,92551,0.0040\nCC-MAIN-2026-04,text/tab-separated-values,10394,10389,0.0004\nCC-MAIN-2026-04,text/troff,12210,12208,0.0005\nCC-MAIN-2026-04,text/turtle,30072,30072,0.0013\nCC-MAIN-2026-04,text/vtt,22550,22504,0.0010\nCC-MAIN-2026-04,text/x-c++src,3280,3278,0.0001\nCC-MAIN-2026-04,text/x-chdr,11977,11977,0.0005\nCC-MAIN-2026-04,text/x-csrc,11660,11656,0.0005\nCC-MAIN-2026-04,text/x-diff,20515,20508,0.0009\nCC-MAIN-2026-04,text/x-jsp,1094,1094,0.0000\nCC-MAIN-2026-04,text/x-log,33965,33939,0.0015\nCC-MAIN-2026-04,text/x-matlab,19511,19511,0.0008\nCC-MAIN-2026-04,text/x-perl,22882,22880,0.0010\nCC-MAIN-2026-04,text/x-php,91132,90904,0.0039\nCC-MAIN-2026-04,text/x-python,8436,8431,0.0004\nCC-MAIN-2026-04,text/x-vcalendar,7518,7517,0.0003\nCC-MAIN-2026-04,text/x-vcard,73379,73351,0.0031\nCC-MAIN-2026-04,text/x-web-markdown,27940,27845,0.0012\nCC-MAIN-2026-04,text/x-yaml,10517,10516,0.0005\nCC-MAIN-2026-04,video/mp4,114,114,0.0000\nCC-MAIN-2026-04,video/webm,4,4,0.0000\nCC-MAIN-2026-08,<other>,246312,246084,0.0114\nCC-MAIN-2026-08,application/atom+xml,3199359,3198931,0.1476\nCC-MAIN-2026-08,application/epub+zip,43087,43003,0.0020\nCC-MAIN-2026-08,application/gpx+xml,17619,17619,0.0008\nCC-MAIN-2026-08,application/gzip,10,10,0.0000\nCC-MAIN-2026-08,application/javascript,22738,22723,0.0010\nCC-MAIN-2026-08,application/json,567609,566856,0.0262\nCC-MAIN-2026-08,application/marc,15238,15236,0.0007\nCC-MAIN-2026-08,application/mbox,25935,25813,0.0012\nCC-MAIN-2026-08,application
/msword,39391,39330,0.0018\nCC-MAIN-2026-08,application/octet-stream,354984,354485,0.0164\nCC-MAIN-2026-08,application/pdf,16165875,16133271,0.7460\nCC-MAIN-2026-08,application/pgp-signature,24521,24520,0.0011\nCC-MAIN-2026-08,application/pkcs7-signature,7363,7361,0.0003\nCC-MAIN-2026-08,application/postscript,4742,4742,0.0002\nCC-MAIN-2026-08,application/rdf+xml,176109,176018,0.0081\nCC-MAIN-2026-08,application/rss+xml,1476079,1475043,0.0681\nCC-MAIN-2026-08,application/rtf,28727,28724,0.0013\nCC-MAIN-2026-08,application/text,291,291,0.0000\nCC-MAIN-2026-08,application/vnd.android.package-archive,9,9,0.0000\nCC-MAIN-2026-08,application/vnd.google-earth.kml+xml,51776,51759,0.0024\nCC-MAIN-2026-08,application/vnd.google-earth.kmz,6296,6291,0.0003\nCC-MAIN-2026-08,application/vnd.ms-excel,17444,17332,0.0008\nCC-MAIN-2026-08,application/vnd.ms-powerpoint,3148,3146,0.0001\nCC-MAIN-2026-08,application/vnd.oasis.opendocument.spreadsheet,8303,8296,0.0004\nCC-MAIN-2026-08,application/vnd.oasis.opendocument.text,17081,17076,0.0008\nCC-MAIN-2026-08,application/vnd.openxmlformats-officedocument.presentationml.presentation,5349,5338,0.0002\nCC-MAIN-2026-08,application/vnd.openxmlformats-officedocument.spreadsheetml.sheet,39854,39727,0.0018\nCC-MAIN-2026-08,application/vnd.openxmlformats-officedocument.wordprocessingml.document,53424,53188,0.0025\nCC-MAIN-2026-08,application/x-bibtex-text-file,310714,310343,0.0143\nCC-MAIN-2026-08,application/x-bittorrent,3508,3502,0.0002\nCC-MAIN-2026-08,application/x-endnote-refer,34771,34767,0.0016\nCC-MAIN-2026-08,application/x-mobipocket-ebook,14883,14823,0.0007\nCC-MAIN-2026-08,application/x-ms-asx,2691,2687,0.0001\nCC-MAIN-2026-08,application/x-msdownload,149,149,0.0000\nCC-MAIN-2026-08,application/x-pds,25292,25153,0.0012\nCC-MAIN-2026-08,application/x-rar-compressed,1,1,0.0000\nCC-MAIN-2026-08,application/x-research-info-systems,752,752,0.0000\nCC-MAIN-2026-08,application/x-sh,15832,15817,0.0007\nCC-MAIN-2026-08,application/x-shockwave-
flash,1370,1368,0.0001\nCC-MAIN-2026-08,application/x-stata-do,9914,9913,0.0005\nCC-MAIN-2026-08,application/x-tex,6012,6011,0.0003\nCC-MAIN-2026-08,application/x-tex-tfm,7449,7449,0.0003\nCC-MAIN-2026-08,application/x-tika-msoffice,49417,49404,0.0023\nCC-MAIN-2026-08,application/x-tika-ooxml,37470,37460,0.0017\nCC-MAIN-2026-08,application/x-wais-source,3073,3073,0.0001\nCC-MAIN-2026-08,application/xhtml+xml,182365669,181704542,8.4156\nCC-MAIN-2026-08,application/xml,1548014,1545715,0.0714\nCC-MAIN-2026-08,application/zip,429,429,0.0000\nCC-MAIN-2026-08,application/zlib,1990,1963,0.0001\nCC-MAIN-2026-08,audio/mpeg,674,674,0.0000\nCC-MAIN-2026-08,audio/vnd.wave,34,34,0.0000\nCC-MAIN-2026-08,audio/x-mpegurl,59,59,0.0000\nCC-MAIN-2026-08,image/gif,634,634,0.0000\nCC-MAIN-2026-08,image/jpeg,2084,2083,0.0001\nCC-MAIN-2026-08,image/png,415,413,0.0000\nCC-MAIN-2026-08,image/svg+xml,14,14,0.0000\nCC-MAIN-2026-08,image/vnd.djvu,17106,17104,0.0008\nCC-MAIN-2026-08,image/webp,33,33,0.0000\nCC-MAIN-2026-08,message/rfc822,17546,17545,0.0008\nCC-MAIN-2026-08,text/asp,4,4,0.0000\nCC-MAIN-2026-08,text/calendar,972580,972267,0.0449\nCC-MAIN-2026-08,text/css,12912,12910,0.0006\nCC-MAIN-2026-08,text/csv,74746,74594,0.0034\nCC-MAIN-2026-08,text/html,1956424316,1945737628,90.2830\nCC-MAIN-2026-08,text/markdown,6087,6016,0.0003\nCC-MAIN-2026-08,text/plain,1887367,1886276,0.0871\nCC-MAIN-2026-08,text/prs.lines.tag,106559,106556,0.0049\nCC-MAIN-2026-08,text/tab-separated-values,11175,11170,0.0005\nCC-MAIN-2026-08,text/troff,10050,10048,0.0005\nCC-MAIN-2026-08,text/turtle,30040,30037,0.0014\nCC-MAIN-2026-08,text/vtt,19786,19765,0.0009\nCC-MAIN-2026-08,text/x-c++src,3509,3507,0.0002\nCC-MAIN-2026-08,text/x-chdr,13810,13810,0.0006\nCC-MAIN-2026-08,text/x-csrc,11672,11670,0.0005\nCC-MAIN-2026-08,text/x-diff,22787,22780,0.0011\nCC-MAIN-2026-08,text/x-jsp,2498,2490,0.0001\nCC-MAIN-2026-08,text/x-log,36448,36447,0.0017\nCC-MAIN-2026-08,text/x-matlab,21327,21326,0.0010\nCC-MAIN-2026-08,text/x-perl
,27085,27080,0.0012\nCC-MAIN-2026-08,text/x-php,69388,69173,0.0032\nCC-MAIN-2026-08,text/x-python,7185,7185,0.0003\nCC-MAIN-2026-08,text/x-vcalendar,8017,8016,0.0004\nCC-MAIN-2026-08,text/x-vcard,78815,78794,0.0036\nCC-MAIN-2026-08,text/x-web-markdown,29409,29402,0.0014\nCC-MAIN-2026-08,text/x-yaml,7275,7275,0.0003\nCC-MAIN-2026-08,video/mp4,201,201,0.0000\nCC-MAIN-2026-08,video/quicktime,2,2,0.0000\nCC-MAIN-2026-12,<other>,240558,240398,0.0122\nCC-MAIN-2026-12,application/atom+xml,3015109,3014764,0.1527\nCC-MAIN-2026-12,application/epub+zip,44404,44324,0.0022\nCC-MAIN-2026-12,application/gpx+xml,15049,15047,0.0008\nCC-MAIN-2026-12,application/gzip,329,329,0.0000\nCC-MAIN-2026-12,application/javascript,21326,21306,0.0011\nCC-MAIN-2026-12,application/json,508673,507939,0.0258\nCC-MAIN-2026-12,application/marc,13491,13491,0.0007\nCC-MAIN-2026-12,application/mbox,27267,27200,0.0014\nCC-MAIN-2026-12,application/msword,33336,33197,0.0017\nCC-MAIN-2026-12,application/octet-stream,305661,305236,0.0155\nCC-MAIN-2026-12,application/pdf,16050266,16018554,0.8127\nCC-MAIN-2026-12,application/pgp-signature,32560,32560,0.0016\nCC-MAIN-2026-12,application/pkcs7-signature,8673,8672,0.0004\nCC-MAIN-2026-12,application/postscript,3161,3161,0.0002\nCC-MAIN-2026-12,application/rdf+xml,146704,146644,0.0074\nCC-MAIN-2026-12,application/rss+xml,1351565,1350708,0.0684\nCC-MAIN-2026-12,application/rtf,26078,26076,0.0013\nCC-MAIN-2026-12,application/text,90,90,0.0000\nCC-MAIN-2026-12,application/vnd.android.package-archive,13,13,0.0000\nCC-MAIN-2026-12,application/vnd.google-earth.kml+xml,49246,49224,0.0025\nCC-MAIN-2026-12,application/vnd.google-earth.kmz,9164,9163,0.0005\nCC-MAIN-2026-12,application/vnd.ms-excel,14129,13972,0.0007\nCC-MAIN-2026-12,application/vnd.ms-powerpoint,2441,2439,0.0001\nCC-MAIN-2026-12,application/vnd.oasis.opendocument.spreadsheet,8759,8748,0.0004\nCC-MAIN-2026-12,application/vnd.oasis.opendocument.text,17835,17827,0.0009\nCC-MAIN-2026-12,application/vnd.openxmlfo
rmats-officedocument.presentationml.presentation,5033,4998,0.0003\nCC-MAIN-2026-12,application/vnd.openxmlformats-officedocument.spreadsheetml.sheet,33606,33446,0.0017\nCC-MAIN-2026-12,application/vnd.openxmlformats-officedocument.wordprocessingml.document,54692,54467,0.0028\nCC-MAIN-2026-12,application/x-bibtex-text-file,282338,282062,0.0143\nCC-MAIN-2026-12,application/x-bittorrent,3830,3817,0.0002\nCC-MAIN-2026-12,application/x-bzip2,1,1,0.0000\nCC-MAIN-2026-12,application/x-endnote-refer,31404,31400,0.0016\nCC-MAIN-2026-12,application/x-mobipocket-ebook,16253,16180,0.0008\nCC-MAIN-2026-12,application/x-ms-asx,3767,3758,0.0002\nCC-MAIN-2026-12,application/x-msdownload,111,111,0.0000\nCC-MAIN-2026-12,application/x-pds,23469,23392,0.0012\nCC-MAIN-2026-12,application/x-research-info-systems,617,617,0.0000\nCC-MAIN-2026-12,application/x-sh,20260,20238,0.0010\nCC-MAIN-2026-12,application/x-shockwave-flash,1330,1327,0.0001\nCC-MAIN-2026-12,application/x-stata-do,8098,8097,0.0004\nCC-MAIN-2026-12,application/x-tex,5263,5262,0.0003\nCC-MAIN-2026-12,application/x-tex-tfm,6387,6387,0.0003\nCC-MAIN-2026-12,application/x-tika-msoffice,54577,54562,0.0028\nCC-MAIN-2026-12,application/x-tika-ooxml,36531,36527,0.0018\nCC-MAIN-2026-12,application/x-wais-source,2163,2163,0.0001\nCC-MAIN-2026-12,application/xhtml+xml,170393790,169788075,8.6282\nCC-MAIN-2026-12,application/xml,1375872,1373509,0.0697\nCC-MAIN-2026-12,application/zip,231,231,0.0000\nCC-MAIN-2026-12,application/zlib,3105,3081,0.0002\nCC-MAIN-2026-12,audio/mp4,1,1,0.0000\nCC-MAIN-2026-12,audio/mpeg,1042,1042,0.0001\nCC-MAIN-2026-12,audio/vnd.wave,22,22,0.0000\nCC-MAIN-2026-12,audio/x-mpegurl,55,55,0.0000\nCC-MAIN-2026-12,image/gif,679,679,0.0000\nCC-MAIN-2026-12,image/jpeg,4118,4118,0.0002\nCC-MAIN-2026-12,image/png,212,211,0.0000\nCC-MAIN-2026-12,image/svg+xml,7,7,0.0000\nCC-MAIN-2026-12,image/vnd.djvu,8197,8196,0.0004\nCC-MAIN-2026-12,image/webp,9,9,0.0000\nCC-MAIN-2026-12,message/rfc822,13392,13392,0.0007\nCC-MAIN-20
26-12,text/asp,3,3,0.0000\nCC-MAIN-2026-12,text/aspdotnet,1,1,0.0000\nCC-MAIN-2026-12,text/calendar,900476,900235,0.0456\nCC-MAIN-2026-12,text/css,11654,11653,0.0006\nCC-MAIN-2026-12,text/csv,62312,62283,0.0032\nCC-MAIN-2026-12,text/html,1777210837,1767115994,89.9924\nCC-MAIN-2026-12,text/markdown,48318,48073,0.0024\nCC-MAIN-2026-12,text/plain,1773218,1771873,0.0898\nCC-MAIN-2026-12,text/prs.lines.tag,131455,131449,0.0067\nCC-MAIN-2026-12,text/tab-separated-values,8237,8235,0.0004\nCC-MAIN-2026-12,text/troff,9162,9162,0.0005\nCC-MAIN-2026-12,text/turtle,23365,23364,0.0012\nCC-MAIN-2026-12,text/vtt,14977,14951,0.0008\nCC-MAIN-2026-12,text/x-c++src,3143,3096,0.0002\nCC-MAIN-2026-12,text/x-chdr,10912,10897,0.0006\nCC-MAIN-2026-12,text/x-csrc,13807,13804,0.0007\nCC-MAIN-2026-12,text/x-diff,20406,20403,0.0010\nCC-MAIN-2026-12,text/x-jsp,1589,1587,0.0001\nCC-MAIN-2026-12,text/x-log,31598,31593,0.0016\nCC-MAIN-2026-12,text/x-matlab,20001,20000,0.0010\nCC-MAIN-2026-12,text/x-perl,24872,24870,0.0013\nCC-MAIN-2026-12,text/x-php,64712,64532,0.0033\nCC-MAIN-2026-12,text/x-python,7655,7651,0.0004\nCC-MAIN-2026-12,text/x-vcalendar,8057,8055,0.0004\nCC-MAIN-2026-12,text/x-vcard,73095,73078,0.0037\nCC-MAIN-2026-12,text/x-web-markdown,26123,26115,0.0013\nCC-MAIN-2026-12,text/x-yaml,8696,8694,0.0004\nCC-MAIN-2026-12,video/mp4,204,204,0.0000\nCC-MAIN-2026-17,<other>,245008,244780,0.0112\nCC-MAIN-2026-17,application/atom+xml,3257201,3256734,0.1486\nCC-MAIN-2026-17,application/epub+zip,40099,40079,0.0018\nCC-MAIN-2026-17,application/gpx+xml,18848,18848,0.0009\nCC-MAIN-2026-17,application/gzip,260,260,0.0000\nCC-MAIN-2026-17,application/javascript,24550,24517,0.0011\nCC-MAIN-2026-17,application/json,551362,550664,0.0252\nCC-MAIN-2026-17,application/marc,14507,14507,0.0007\nCC-MAIN-2026-17,application/mbox,24813,24669,0.0011\nCC-MAIN-2026-17,application/msword,38812,38671,0.0018\nCC-MAIN-2026-17,application/octet-stream,304522,303985,0.0139\nCC-MAIN-2026-17,application/pdf,19274948,192423
80,0.8794\nCC-MAIN-2026-17,application/pgp-signature,44465,44465,0.0020\nCC-MAIN-2026-17,application/pkcs7-signature,9265,9263,0.0004\nCC-MAIN-2026-17,application/postscript,2760,2760,0.0001\nCC-MAIN-2026-17,application/rdf+xml,138832,138710,0.0063\nCC-MAIN-2026-17,application/rss+xml,1445867,1444384,0.0660\nCC-MAIN-2026-17,application/rtf,19562,19561,0.0009\nCC-MAIN-2026-17,application/text,184,184,0.0000\nCC-MAIN-2026-17,application/vnd.android.package-archive,6,6,0.0000\nCC-MAIN-2026-17,application/vnd.google-earth.kml+xml,53564,53537,0.0024\nCC-MAIN-2026-17,application/vnd.google-earth.kmz,10791,10788,0.0005\nCC-MAIN-2026-17,application/vnd.ms-excel,14578,14447,0.0007\nCC-MAIN-2026-17,application/vnd.ms-powerpoint,3473,3471,0.0002\nCC-MAIN-2026-17,application/vnd.oasis.opendocument.spreadsheet,7568,7561,0.0003\nCC-MAIN-2026-17,application/vnd.oasis.opendocument.text,19313,19307,0.0009\nCC-MAIN-2026-17,application/vnd.openxmlformats-officedocument.presentationml.presentation,5107,5076,0.0002\nCC-MAIN-2026-17,application/vnd.openxmlformats-officedocument.spreadsheetml.sheet,34668,34312,0.0016\nCC-MAIN-2026-17,application/vnd.openxmlformats-officedocument.wordprocessingml.document,61875,61685,0.0028\nCC-MAIN-2026-17,application/x-bibtex-text-file,277951,277571,0.0127\nCC-MAIN-2026-17,application/x-bittorrent,3802,3793,0.0002\nCC-MAIN-2026-17,application/x-endnote-refer,30695,30687,0.0014\nCC-MAIN-2026-17,application/x-mobipocket-ebook,12387,12379,0.0006\nCC-MAIN-2026-17,application/x-ms-asx,3652,3651,0.0002\nCC-MAIN-2026-17,application/x-msdownload,73,73,0.0000\nCC-MAIN-2026-17,application/x-pds,26698,26646,0.0012\nCC-MAIN-2026-17,application/x-rar-compressed,2,2,0.0000\nCC-MAIN-2026-17,application/x-research-info-systems,590,590,0.0000\nCC-MAIN-2026-17,application/x-sh,24279,24261,0.0011\nCC-MAIN-2026-17,application/x-shockwave-flash,1030,1030,0.0000\nCC-MAIN-2026-17,application/x-stata-do,8393,8387,0.0004\nCC-MAIN-2026-17,application/x-tex,6239,6238,0.0003\nCC-MA
IN-2026-17,application/x-tex-tfm,8141,8141,0.0004\nCC-MAIN-2026-17,application/x-tika-msoffice,52402,52389,0.0024\nCC-MAIN-2026-17,application/x-tika-ooxml,42446,42433,0.0019\nCC-MAIN-2026-17,application/x-wais-source,3115,3115,0.0001\nCC-MAIN-2026-17,application/xhtml+xml,178793494,178085054,8.1569\nCC-MAIN-2026-17,application/xml,1279158,1270943,0.0584\nCC-MAIN-2026-17,application/zip,254,254,0.0000\nCC-MAIN-2026-17,application/zlib,6681,6628,0.0003\nCC-MAIN-2026-17,audio/mp4,1,1,0.0000\nCC-MAIN-2026-17,audio/mpeg,560,560,0.0000\nCC-MAIN-2026-17,audio/vnd.wave,15,15,0.0000\nCC-MAIN-2026-17,audio/x-mpegurl,72,72,0.0000\nCC-MAIN-2026-17,image/gif,143,142,0.0000\nCC-MAIN-2026-17,image/jpeg,2857,2856,0.0001\nCC-MAIN-2026-17,image/png,259,254,0.0000\nCC-MAIN-2026-17,image/svg+xml,15,15,0.0000\nCC-MAIN-2026-17,image/tiff,4,4,0.0000\nCC-MAIN-2026-17,image/vnd.djvu,14322,14315,0.0007\nCC-MAIN-2026-17,image/webp,15,15,0.0000\nCC-MAIN-2026-17,message/rfc822,15278,15273,0.0007\nCC-MAIN-2026-17,text/calendar,928567,925275,0.0424\nCC-MAIN-2026-17,text/css,12917,12915,0.0006\nCC-MAIN-2026-17,text/csv,66149,65041,0.0030\nCC-MAIN-2026-17,text/html,1981667884,1969928963,90.4072\nCC-MAIN-2026-17,text/markdown,622732,620114,0.0284\nCC-MAIN-2026-17,text/plain,1823475,1821792,0.0832\nCC-MAIN-2026-17,text/prs.lines.tag,119165,119152,0.0054\nCC-MAIN-2026-17,text/tab-separated-values,8558,8557,0.0004\nCC-MAIN-2026-17,text/troff,11316,11310,0.0005\nCC-MAIN-2026-17,text/turtle,22757,22755,0.0010\nCC-MAIN-2026-17,text/vtt,16976,16954,0.0008\nCC-MAIN-2026-17,text/x-c++src,2932,2920,0.0001\nCC-MAIN-2026-17,text/x-chdr,10781,10775,0.0005\nCC-MAIN-2026-17,text/x-csrc,13364,13356,0.0006\nCC-MAIN-2026-17,text/x-diff,20531,20514,0.0009\nCC-MAIN-2026-17,text/x-jsp,1984,1979,0.0001\nCC-MAIN-2026-17,text/x-log,35449,35439,0.0016\nCC-MAIN-2026-17,text/x-matlab,29437,29436,0.0013\nCC-MAIN-2026-17,text/x-perl,17814,17798,0.0008\nCC-MAIN-2026-17,text/x-php,74624,74445,0.0034\nCC-MAIN-2026-17,text/x-pytho
n,6985,6983,0.0003\nCC-MAIN-2026-17,text/x-vcalendar,9396,9395,0.0004\nCC-MAIN-2026-17,text/x-vcard,79000,78970,0.0036\nCC-MAIN-2026-17,text/x-web-markdown,42198,42076,0.0019\nCC-MAIN-2026-17,text/x-yaml,9419,9417,0.0004\nCC-MAIN-2026-17,video/mp4,50,50,0.0000\nCC-MAIN-2026-17,video/quicktime,6,6,0.0000\nCC-MAIN-2026-17,video/webm,3,3,0.0000\n"
  },
  {
    "path": "plots/tld/by-year-and-continent.md",
    "content": "---\nlayout: table\ntable_include:\n- tlds-by-year-and-continent.html\n- selected-tlds-by-year.html\ntable_sortlist: \"{sortList: [[0,1]]}\"\n---\n\nTop-Level Domains By Year and Continent\n=======================================\n\nMany top-level domains can be mapped to geographic regions, for example, the country-code TLDs or regional one (`.asia`). For other domains, such as `.com` or `.net` this is not possible. \n\nThe aggregation by year and the percentage allows to better understand the long-term trends of top-level domain and geographical coverage. For the latter, TLDs are mapped to continents.\ndistribution over continents\n\n![Percentage of top-level domains by year and continent](tlds-by-year-and-continent.png)\n\n\nThe underlying data of the plot is provided in the table below or as CSV ([tlds-by-year-and-continent.csv](./tlds-by-year-and-continent.csv)).\n\nThe second table shows the percentage of the 16 most common top-level domains. The data is also provided as CSV: [selected-tlds-by-year.csv](./selected-tlds-by-year.csv)."
  },
  {
    "path": "plots/tld/comparison.md",
    "content": "---\nlayout: table\ntable_include:\n - selected-crawl-comparison-spearman-frequent-tlds.html\n - selected-crawl-comparison.html\ntable_sortlist: \"{sortList: [[4,1]]}\"\n---\n\nEstimation of Representativeness of a Recent Crawl\n==================================================\n\nThe representativeness of the November 2019 crawl (CC-MAIN-2019-47) is estimated by a comparison with the frequency of top-level domains in\n\n- the list of [top-1-million sites](http://s3.amazonaws.com/alexa-static/top-1m.csv.zip) published by [Alexa](https://support.alexa.com/hc/en-us/sections/200063274-Top-Sites), based on unique visitors and page views\n- the [Cisco Umbrella Popularity list](http://s3-us-west-1.amazonaws.com/umbrella-static/index.html) which reflects DNS usage\n- the [Majestic Million](http://downloads.majestic.com/majestic_million.csv), \"[ordered by the number of referring subnets](https://blog.majestic.com/development/majestic-million-csv-daily/)\"\n\nAll three lists have been fetched at the same time the crawl was performed. For the one million domains/sites in the lists the TLDs have been extracted, and for all TLDs the relative frequency has been calculated and compared to the relative frequency of pages, URLs, hosts and domains in the crawl. Comparisons for older crawls are available via the git version history of the project.\n\nThe first table shows [Spearman's rank correlation coefficient](https://en.wikipedia.org/wiki/Spearman%27s_rank_correlation_coefficient) (*ρ*) for the 76 TLDs which cover at least 0.05% of the URLs.  The method is similar to [Sebastian Spiegler's analysis of the 2012 crawl archives](http://commoncrawl.org/2013/08/a-look-inside-common-crawls-210tb-2012-web-corpus/).  
He reported *ρ* = 0.84 based on [W3Techs TLD usage statistics](https://w3techs.com/technologies/overview/top_level_domain/all) for comparison, which were/are derived from the top Alexa sites.\n\nAs the three lists used for comparison have a different notion of popularity, their correlation results differ.  There are also small differences between pages/URLs and hosts/domains.  It is an open question whether differences in the relative frequency by TLD are caused by Common Crawl's crawling strategy or a different average size of sites under various TLDs.\n\n\n\nThe second table shows the relative frequency per TLD for the lists and the recent crawl. The data in this table was used to calculate the correlation matrix.\n"
  },
  {
    "path": "plots/tld/groups-percentage.html",
    "content": "<table border=\"1\" class=\"dataframe tablesorter tablepercentage\">\n  <thead>\n    <tr style=\"text-align: right;\">\n      <th>type</th>\n      <th>ARPA</th>\n      <th>IDN ccTLD</th>\n      <th>IDN gTLD</th>\n      <th>ccTLD</th>\n      <th>gTLD</th>\n      <th>grTLD</th>\n      <th>sTLD</th>\n    </tr>\n    <tr>\n      <th>crawl</th>\n      <th></th>\n      <th></th>\n      <th></th>\n      <th></th>\n      <th></th>\n      <th></th>\n      <th></th>\n    </tr>\n  </thead>\n  <tbody>\n    <tr>\n      <th>CC-MAIN-2008-2009</th>\n      <td>NaN</td>\n      <td>NaN</td>\n      <td>NaN</td>\n      <td>7.49</td>\n      <td>90.30</td>\n      <td>0.55</td>\n      <td>1.66</td>\n    </tr>\n    <tr>\n      <th>CC-MAIN-2009-2010</th>\n      <td>0.00</td>\n      <td>NaN</td>\n      <td>NaN</td>\n      <td>15.37</td>\n      <td>82.30</td>\n      <td>0.37</td>\n      <td>1.96</td>\n    </tr>\n    <tr>\n      <th>CC-MAIN-2012</th>\n      <td>0.00</td>\n      <td>0.00</td>\n      <td>NaN</td>\n      <td>30.30</td>\n      <td>68.30</td>\n      <td>0.42</td>\n      <td>0.99</td>\n    </tr>\n    <tr>\n      <th>CC-MAIN-2013-20</th>\n      <td>0.00</td>\n      <td>0.00</td>\n      <td>NaN</td>\n      <td>11.89</td>\n      <td>83.69</td>\n      <td>0.06</td>\n      <td>4.36</td>\n    </tr>\n    <tr>\n      <th>CC-MAIN-2013-48</th>\n      <td>0.00</td>\n      <td>0.00</td>\n      <td>NaN</td>\n      <td>7.91</td>\n      <td>87.58</td>\n      <td>0.05</td>\n      <td>4.45</td>\n    </tr>\n    <tr>\n      <th>CC-MAIN-2014-10</th>\n      <td>0.00</td>\n      <td>0.00</td>\n      <td>NaN</td>\n      <td>7.43</td>\n      <td>87.67</td>\n      <td>0.04</td>\n      <td>4.85</td>\n    </tr>\n    <tr>\n      <th>CC-MAIN-2014-15</th>\n      <td>0.00</td>\n      <td>0.00</td>\n      <td>NaN</td>\n      <td>7.89</td>\n      <td>86.91</td>\n      <td>0.05</td>\n      <td>5.15</td>\n    </tr>\n    <tr>\n      <th>CC-MAIN-2014-23</th>\n      <td>0.00</td>\n      <td>0.00</td>\n    
  <td>0.00</td>\n      <td>7.87</td>\n      <td>87.37</td>\n      <td>0.04</td>\n      <td>4.71</td>\n    </tr>\n    <tr>\n      <th>CC-MAIN-2014-35</th>\n      <td>0.00</td>\n      <td>0.00</td>\n      <td>0.00</td>\n      <td>7.81</td>\n      <td>87.21</td>\n      <td>0.05</td>\n      <td>4.93</td>\n    </tr>\n    <tr>\n      <th>CC-MAIN-2014-41</th>\n      <td>0.00</td>\n      <td>0.00</td>\n      <td>0.00</td>\n      <td>7.77</td>\n      <td>87.22</td>\n      <td>0.05</td>\n      <td>4.96</td>\n    </tr>\n    <tr>\n      <th>CC-MAIN-2014-42</th>\n      <td>0.00</td>\n      <td>0.00</td>\n      <td>0.00</td>\n      <td>8.31</td>\n      <td>86.44</td>\n      <td>0.05</td>\n      <td>5.20</td>\n    </tr>\n    <tr>\n      <th>CC-MAIN-2014-49</th>\n      <td>0.00</td>\n      <td>0.00</td>\n      <td>0.00</td>\n      <td>8.61</td>\n      <td>86.00</td>\n      <td>0.05</td>\n      <td>5.34</td>\n    </tr>\n    <tr>\n      <th>CC-MAIN-2014-52</th>\n      <td>NaN</td>\n      <td>0.00</td>\n      <td>0.00</td>\n      <td>7.92</td>\n      <td>87.10</td>\n      <td>0.04</td>\n      <td>4.95</td>\n    </tr>\n    <tr>\n      <th>CC-MAIN-2015-06</th>\n      <td>NaN</td>\n      <td>0.00</td>\n      <td>0.00</td>\n      <td>8.02</td>\n      <td>86.86</td>\n      <td>0.04</td>\n      <td>5.09</td>\n    </tr>\n    <tr>\n      <th>CC-MAIN-2015-11</th>\n      <td>NaN</td>\n      <td>0.00</td>\n      <td>0.00</td>\n      <td>7.96</td>\n      <td>86.65</td>\n      <td>0.04</td>\n      <td>5.35</td>\n    </tr>\n    <tr>\n      <th>CC-MAIN-2015-14</th>\n      <td>NaN</td>\n      <td>0.00</td>\n      <td>0.00</td>\n      <td>8.12</td>\n      <td>86.49</td>\n      <td>0.04</td>\n      <td>5.35</td>\n    </tr>\n    <tr>\n      <th>CC-MAIN-2015-18</th>\n      <td>NaN</td>\n      <td>0.00</td>\n      <td>0.00</td>\n      <td>7.87</td>\n      <td>86.99</td>\n      <td>0.03</td>\n      <td>5.11</td>\n    </tr>\n    <tr>\n      <th>CC-MAIN-2015-22</th>\n      <td>NaN</td>\n      
<td>0.00</td>\n      <td>0.00</td>\n      <td>7.93</td>\n      <td>86.85</td>\n      <td>0.03</td>\n      <td>5.18</td>\n    </tr>\n    <tr>\n      <th>CC-MAIN-2015-27</th>\n      <td>NaN</td>\n      <td>0.00</td>\n      <td>0.00</td>\n      <td>8.02</td>\n      <td>86.81</td>\n      <td>0.04</td>\n      <td>5.13</td>\n    </tr>\n    <tr>\n      <th>CC-MAIN-2015-32</th>\n      <td>NaN</td>\n      <td>0.00</td>\n      <td>0.00</td>\n      <td>8.00</td>\n      <td>86.82</td>\n      <td>0.04</td>\n      <td>5.14</td>\n    </tr>\n    <tr>\n      <th>CC-MAIN-2015-35</th>\n      <td>NaN</td>\n      <td>0.00</td>\n      <td>0.00</td>\n      <td>8.02</td>\n      <td>86.81</td>\n      <td>0.04</td>\n      <td>5.14</td>\n    </tr>\n    <tr>\n      <th>CC-MAIN-2015-40</th>\n      <td>NaN</td>\n      <td>0.00</td>\n      <td>0.00</td>\n      <td>8.15</td>\n      <td>86.61</td>\n      <td>0.04</td>\n      <td>5.19</td>\n    </tr>\n    <tr>\n      <th>CC-MAIN-2015-48</th>\n      <td>NaN</td>\n      <td>0.00</td>\n      <td>0.00</td>\n      <td>8.09</td>\n      <td>86.70</td>\n      <td>0.04</td>\n      <td>5.17</td>\n    </tr>\n    <tr>\n      <th>CC-MAIN-2016-07</th>\n      <td>NaN</td>\n      <td>0.00</td>\n      <td>0.00</td>\n      <td>8.02</td>\n      <td>86.72</td>\n      <td>0.04</td>\n      <td>5.22</td>\n    </tr>\n    <tr>\n      <th>CC-MAIN-2016-18</th>\n      <td>0.00</td>\n      <td>0.00</td>\n      <td>0.00</td>\n      <td>7.93</td>\n      <td>86.72</td>\n      <td>0.05</td>\n      <td>5.30</td>\n    </tr>\n    <tr>\n      <th>CC-MAIN-2016-22</th>\n      <td>0.00</td>\n      <td>0.00</td>\n      <td>0.00</td>\n      <td>12.88</td>\n      <td>82.26</td>\n      <td>0.07</td>\n      <td>4.79</td>\n    </tr>\n    <tr>\n      <th>CC-MAIN-2016-26</th>\n      <td>0.00</td>\n      <td>0.01</td>\n      <td>NaN</td>\n      <td>13.06</td>\n      <td>82.32</td>\n      <td>0.08</td>\n      <td>4.54</td>\n    </tr>\n    <tr>\n      <th>CC-MAIN-2016-30</th>\n      <td>NaN</td>\n  
    <td>0.00</td>\n      <td>0.00</td>\n      <td>12.21</td>\n      <td>83.08</td>\n      <td>0.06</td>\n      <td>4.65</td>\n    </tr>\n    <tr>\n      <th>CC-MAIN-2016-36</th>\n      <td>0.00</td>\n      <td>0.00</td>\n      <td>0.00</td>\n      <td>12.89</td>\n      <td>82.44</td>\n      <td>0.06</td>\n      <td>4.60</td>\n    </tr>\n    <tr>\n      <th>CC-MAIN-2016-40</th>\n      <td>0.00</td>\n      <td>0.01</td>\n      <td>0.00</td>\n      <td>13.61</td>\n      <td>81.87</td>\n      <td>0.06</td>\n      <td>4.46</td>\n    </tr>\n    <tr>\n      <th>CC-MAIN-2016-44</th>\n      <td>0.00</td>\n      <td>0.05</td>\n      <td>0.00</td>\n      <td>30.48</td>\n      <td>66.85</td>\n      <td>0.19</td>\n      <td>2.43</td>\n    </tr>\n    <tr>\n      <th>CC-MAIN-2016-50</th>\n      <td>0.00</td>\n      <td>0.04</td>\n      <td>0.00</td>\n      <td>30.52</td>\n      <td>66.95</td>\n      <td>0.22</td>\n      <td>2.27</td>\n    </tr>\n    <tr>\n      <th>CC-MAIN-2017-04</th>\n      <td>0.00</td>\n      <td>0.06</td>\n      <td>0.00</td>\n      <td>31.82</td>\n      <td>65.84</td>\n      <td>0.26</td>\n      <td>2.03</td>\n    </tr>\n    <tr>\n      <th>CC-MAIN-2017-09</th>\n      <td>NaN</td>\n      <td>0.04</td>\n      <td>0.00</td>\n      <td>30.84</td>\n      <td>66.91</td>\n      <td>0.23</td>\n      <td>1.98</td>\n    </tr>\n    <tr>\n      <th>CC-MAIN-2017-13</th>\n      <td>NaN</td>\n      <td>0.04</td>\n      <td>0.00</td>\n      <td>31.00</td>\n      <td>67.05</td>\n      <td>0.23</td>\n      <td>1.69</td>\n    </tr>\n    <tr>\n      <th>CC-MAIN-2017-17</th>\n      <td>0.00</td>\n      <td>0.03</td>\n      <td>0.00</td>\n      <td>29.61</td>\n      <td>68.22</td>\n      <td>0.24</td>\n      <td>1.89</td>\n    </tr>\n    <tr>\n      <th>CC-MAIN-2017-22</th>\n      <td>NaN</td>\n      <td>0.05</td>\n      <td>0.00</td>\n      <td>30.21</td>\n      <td>67.96</td>\n      <td>0.22</td>\n      <td>1.56</td>\n    </tr>\n    <tr>\n      <th>CC-MAIN-2017-26</th>\n      
<td>NaN</td>\n      <td>0.04</td>\n      <td>0.00</td>\n      <td>29.49</td>\n      <td>68.95</td>\n      <td>0.22</td>\n      <td>1.30</td>\n    </tr>\n    <tr>\n      <th>CC-MAIN-2017-30</th>\n      <td>0.00</td>\n      <td>0.05</td>\n      <td>0.00</td>\n      <td>29.52</td>\n      <td>68.43</td>\n      <td>0.22</td>\n      <td>1.78</td>\n    </tr>\n    <tr>\n      <th>CC-MAIN-2017-34</th>\n      <td>NaN</td>\n      <td>0.04</td>\n      <td>0.00</td>\n      <td>28.91</td>\n      <td>69.70</td>\n      <td>0.20</td>\n      <td>1.15</td>\n    </tr>\n    <tr>\n      <th>CC-MAIN-2017-39</th>\n      <td>NaN</td>\n      <td>0.07</td>\n      <td>0.00</td>\n      <td>32.93</td>\n      <td>65.26</td>\n      <td>0.23</td>\n      <td>1.50</td>\n    </tr>\n    <tr>\n      <th>CC-MAIN-2017-43</th>\n      <td>0.00</td>\n      <td>0.05</td>\n      <td>0.00</td>\n      <td>30.01</td>\n      <td>68.40</td>\n      <td>0.22</td>\n      <td>1.32</td>\n    </tr>\n    <tr>\n      <th>CC-MAIN-2017-47</th>\n      <td>0.00</td>\n      <td>0.07</td>\n      <td>0.00</td>\n      <td>33.71</td>\n      <td>64.49</td>\n      <td>0.25</td>\n      <td>1.47</td>\n    </tr>\n    <tr>\n      <th>CC-MAIN-2017-51</th>\n      <td>0.00</td>\n      <td>0.06</td>\n      <td>0.00</td>\n      <td>31.44</td>\n      <td>66.94</td>\n      <td>0.25</td>\n      <td>1.31</td>\n    </tr>\n    <tr>\n      <th>CC-MAIN-2018-05</th>\n      <td>0.00</td>\n      <td>0.09</td>\n      <td>0.00</td>\n      <td>34.95</td>\n      <td>63.22</td>\n      <td>0.32</td>\n      <td>1.42</td>\n    </tr>\n    <tr>\n      <th>CC-MAIN-2018-09</th>\n      <td>0.00</td>\n      <td>0.09</td>\n      <td>0.00</td>\n      <td>33.39</td>\n      <td>64.87</td>\n      <td>0.31</td>\n      <td>1.34</td>\n    </tr>\n    <tr>\n      <th>CC-MAIN-2018-13</th>\n      <td>0.00</td>\n      <td>0.08</td>\n      <td>0.00</td>\n      <td>33.98</td>\n      <td>64.38</td>\n      <td>0.27</td>\n      <td>1.28</td>\n    </tr>\n    <tr>\n      
<th>CC-MAIN-2018-17</th>\n      <td>0.00</td>\n      <td>0.11</td>\n      <td>0.00</td>\n      <td>36.22</td>\n      <td>62.01</td>\n      <td>0.31</td>\n      <td>1.35</td>\n    </tr>\n    <tr>\n      <th>CC-MAIN-2018-22</th>\n      <td>0.00</td>\n      <td>0.12</td>\n      <td>0.00</td>\n      <td>36.18</td>\n      <td>62.18</td>\n      <td>0.32</td>\n      <td>1.20</td>\n    </tr>\n    <tr>\n      <th>CC-MAIN-2018-26</th>\n      <td>0.00</td>\n      <td>0.10</td>\n      <td>0.00</td>\n      <td>35.37</td>\n      <td>62.90</td>\n      <td>0.30</td>\n      <td>1.33</td>\n    </tr>\n    <tr>\n      <th>CC-MAIN-2018-30</th>\n      <td>0.00</td>\n      <td>0.11</td>\n      <td>0.00</td>\n      <td>34.36</td>\n      <td>64.20</td>\n      <td>0.30</td>\n      <td>1.04</td>\n    </tr>\n    <tr>\n      <th>CC-MAIN-2018-34</th>\n      <td>0.00</td>\n      <td>0.13</td>\n      <td>0.00</td>\n      <td>38.57</td>\n      <td>59.90</td>\n      <td>0.35</td>\n      <td>1.06</td>\n    </tr>\n    <tr>\n      <th>CC-MAIN-2018-39</th>\n      <td>0.00</td>\n      <td>0.12</td>\n      <td>0.00</td>\n      <td>38.67</td>\n      <td>59.76</td>\n      <td>0.33</td>\n      <td>1.11</td>\n    </tr>\n    <tr>\n      <th>CC-MAIN-2018-43</th>\n      <td>0.00</td>\n      <td>0.14</td>\n      <td>0.00</td>\n      <td>38.93</td>\n      <td>59.57</td>\n      <td>0.32</td>\n      <td>1.04</td>\n    </tr>\n    <tr>\n      <th>CC-MAIN-2018-47</th>\n      <td>0.00</td>\n      <td>0.16</td>\n      <td>0.01</td>\n      <td>39.52</td>\n      <td>59.01</td>\n      <td>0.33</td>\n      <td>0.97</td>\n    </tr>\n    <tr>\n      <th>CC-MAIN-2018-51</th>\n      <td>0.00</td>\n      <td>0.14</td>\n      <td>0.01</td>\n      <td>39.63</td>\n      <td>58.87</td>\n      <td>0.31</td>\n      <td>1.03</td>\n    </tr>\n    <tr>\n      <th>CC-MAIN-2019-04</th>\n      <td>0.00</td>\n      <td>0.14</td>\n      <td>0.00</td>\n      <td>39.68</td>\n      <td>58.92</td>\n      <td>0.32</td>\n      <td>0.94</td>\n    
</tr>\n    <tr>\n      <th>CC-MAIN-2019-09</th>\n      <td>0.00</td>\n      <td>0.15</td>\n      <td>0.01</td>\n      <td>40.38</td>\n      <td>58.03</td>\n      <td>0.36</td>\n      <td>1.06</td>\n    </tr>\n    <tr>\n      <th>CC-MAIN-2019-13</th>\n      <td>0.00</td>\n      <td>0.13</td>\n      <td>0.01</td>\n      <td>40.41</td>\n      <td>58.02</td>\n      <td>0.32</td>\n      <td>1.11</td>\n    </tr>\n    <tr>\n      <th>CC-MAIN-2019-18</th>\n      <td>0.00</td>\n      <td>0.13</td>\n      <td>0.01</td>\n      <td>39.94</td>\n      <td>58.29</td>\n      <td>0.34</td>\n      <td>1.29</td>\n    </tr>\n    <tr>\n      <th>CC-MAIN-2019-22</th>\n      <td>0.00</td>\n      <td>0.11</td>\n      <td>0.01</td>\n      <td>39.99</td>\n      <td>58.28</td>\n      <td>0.31</td>\n      <td>1.31</td>\n    </tr>\n    <tr>\n      <th>CC-MAIN-2019-26</th>\n      <td>0.00</td>\n      <td>0.12</td>\n      <td>0.01</td>\n      <td>39.65</td>\n      <td>58.45</td>\n      <td>0.30</td>\n      <td>1.49</td>\n    </tr>\n    <tr>\n      <th>CC-MAIN-2019-30</th>\n      <td>0.00</td>\n      <td>0.10</td>\n      <td>0.01</td>\n      <td>39.33</td>\n      <td>58.72</td>\n      <td>0.28</td>\n      <td>1.56</td>\n    </tr>\n    <tr>\n      <th>CC-MAIN-2019-35</th>\n      <td>0.00</td>\n      <td>0.12</td>\n      <td>0.01</td>\n      <td>39.51</td>\n      <td>58.53</td>\n      <td>0.28</td>\n      <td>1.55</td>\n    </tr>\n    <tr>\n      <th>CC-MAIN-2019-39</th>\n      <td>0.00</td>\n      <td>0.10</td>\n      <td>0.01</td>\n      <td>39.44</td>\n      <td>58.35</td>\n      <td>0.26</td>\n      <td>1.84</td>\n    </tr>\n    <tr>\n      <th>CC-MAIN-2019-43</th>\n      <td>NaN</td>\n      <td>0.12</td>\n      <td>0.01</td>\n      <td>39.61</td>\n      <td>58.09</td>\n      <td>0.26</td>\n      <td>1.91</td>\n    </tr>\n    <tr>\n      <th>CC-MAIN-2019-47</th>\n      <td>NaN</td>\n      <td>0.11</td>\n      <td>0.01</td>\n      <td>39.63</td>\n      <td>58.29</td>\n      <td>0.26</td>\n      
<td>1.70</td>\n    </tr>\n    <tr>\n      <th>CC-MAIN-2019-51</th>\n      <td>NaN</td>\n      <td>0.12</td>\n      <td>0.00</td>\n      <td>39.36</td>\n      <td>58.51</td>\n      <td>0.25</td>\n      <td>1.75</td>\n    </tr>\n    <tr>\n      <th>CC-MAIN-2020-05</th>\n      <td>NaN</td>\n      <td>0.13</td>\n      <td>0.01</td>\n      <td>39.96</td>\n      <td>58.01</td>\n      <td>0.24</td>\n      <td>1.65</td>\n    </tr>\n    <tr>\n      <th>CC-MAIN-2020-10</th>\n      <td>NaN</td>\n      <td>0.12</td>\n      <td>0.01</td>\n      <td>40.34</td>\n      <td>57.67</td>\n      <td>0.25</td>\n      <td>1.62</td>\n    </tr>\n    <tr>\n      <th>CC-MAIN-2020-16</th>\n      <td>NaN</td>\n      <td>0.14</td>\n      <td>0.01</td>\n      <td>41.18</td>\n      <td>56.95</td>\n      <td>0.24</td>\n      <td>1.48</td>\n    </tr>\n    <tr>\n      <th>CC-MAIN-2020-24</th>\n      <td>NaN</td>\n      <td>0.12</td>\n      <td>0.01</td>\n      <td>40.63</td>\n      <td>57.48</td>\n      <td>0.24</td>\n      <td>1.52</td>\n    </tr>\n    <tr>\n      <th>CC-MAIN-2020-29</th>\n      <td>NaN</td>\n      <td>0.14</td>\n      <td>0.01</td>\n      <td>40.90</td>\n      <td>57.20</td>\n      <td>0.24</td>\n      <td>1.51</td>\n    </tr>\n    <tr>\n      <th>CC-MAIN-2020-34</th>\n      <td>0.00</td>\n      <td>0.11</td>\n      <td>0.01</td>\n      <td>40.55</td>\n      <td>57.13</td>\n      <td>0.22</td>\n      <td>1.98</td>\n    </tr>\n    <tr>\n      <th>CC-MAIN-2020-40</th>\n      <td>0.00</td>\n      <td>0.19</td>\n      <td>0.01</td>\n      <td>42.21</td>\n      <td>55.81</td>\n      <td>0.27</td>\n      <td>1.51</td>\n    </tr>\n    <tr>\n      <th>CC-MAIN-2020-45</th>\n      <td>0.00</td>\n      <td>0.15</td>\n      <td>0.01</td>\n      <td>41.67</td>\n      <td>55.94</td>\n      <td>0.25</td>\n      <td>1.98</td>\n    </tr>\n    <tr>\n      <th>CC-MAIN-2020-50</th>\n      <td>NaN</td>\n      <td>0.16</td>\n      <td>0.01</td>\n      <td>41.66</td>\n      <td>55.96</td>\n      
<td>0.26</td>\n      <td>1.96</td>\n    </tr>\n    <tr>\n      <th>CC-MAIN-2021-04</th>\n      <td>NaN</td>\n      <td>0.17</td>\n      <td>0.01</td>\n      <td>41.61</td>\n      <td>56.25</td>\n      <td>0.26</td>\n      <td>1.71</td>\n    </tr>\n    <tr>\n      <th>CC-MAIN-2021-10</th>\n      <td>NaN</td>\n      <td>0.16</td>\n      <td>0.01</td>\n      <td>41.97</td>\n      <td>55.74</td>\n      <td>0.27</td>\n      <td>1.86</td>\n    </tr>\n    <tr>\n      <th>CC-MAIN-2021-17</th>\n      <td>NaN</td>\n      <td>0.17</td>\n      <td>0.01</td>\n      <td>42.18</td>\n      <td>55.64</td>\n      <td>0.27</td>\n      <td>1.74</td>\n    </tr>\n    <tr>\n      <th>CC-MAIN-2021-21</th>\n      <td>NaN</td>\n      <td>0.16</td>\n      <td>0.01</td>\n      <td>41.75</td>\n      <td>55.93</td>\n      <td>0.26</td>\n      <td>1.89</td>\n    </tr>\n    <tr>\n      <th>CC-MAIN-2021-25</th>\n      <td>NaN</td>\n      <td>0.15</td>\n      <td>0.01</td>\n      <td>40.80</td>\n      <td>56.75</td>\n      <td>0.25</td>\n      <td>2.04</td>\n    </tr>\n    <tr>\n      <th>CC-MAIN-2021-31</th>\n      <td>NaN</td>\n      <td>0.16</td>\n      <td>0.01</td>\n      <td>41.20</td>\n      <td>56.70</td>\n      <td>0.27</td>\n      <td>1.66</td>\n    </tr>\n    <tr>\n      <th>CC-MAIN-2021-39</th>\n      <td>0.00</td>\n      <td>0.14</td>\n      <td>0.01</td>\n      <td>41.06</td>\n      <td>56.43</td>\n      <td>0.25</td>\n      <td>2.11</td>\n    </tr>\n    <tr>\n      <th>CC-MAIN-2021-43</th>\n      <td>0.00</td>\n      <td>0.15</td>\n      <td>0.01</td>\n      <td>41.26</td>\n      <td>56.36</td>\n      <td>0.25</td>\n      <td>1.98</td>\n    </tr>\n    <tr>\n      <th>CC-MAIN-2021-49</th>\n      <td>NaN</td>\n      <td>0.12</td>\n      <td>0.01</td>\n      <td>41.06</td>\n      <td>56.10</td>\n      <td>0.24</td>\n      <td>2.47</td>\n    </tr>\n    <tr>\n      <th>CC-MAIN-2022-05</th>\n      <td>NaN</td>\n      <td>0.13</td>\n      <td>0.01</td>\n      <td>41.40</td>\n      
<td>56.07</td>\n      <td>0.25</td>\n      <td>2.15</td>\n    </tr>\n    <tr>\n      <th>CC-MAIN-2022-21</th>\n      <td>NaN</td>\n      <td>0.13</td>\n      <td>0.01</td>\n      <td>40.73</td>\n      <td>56.84</td>\n      <td>0.25</td>\n      <td>2.03</td>\n    </tr>\n    <tr>\n      <th>CC-MAIN-2022-27</th>\n      <td>NaN</td>\n      <td>0.13</td>\n      <td>0.01</td>\n      <td>40.80</td>\n      <td>56.63</td>\n      <td>0.25</td>\n      <td>2.19</td>\n    </tr>\n    <tr>\n      <th>CC-MAIN-2022-33</th>\n      <td>NaN</td>\n      <td>0.12</td>\n      <td>0.01</td>\n      <td>41.09</td>\n      <td>56.02</td>\n      <td>0.24</td>\n      <td>2.53</td>\n    </tr>\n    <tr>\n      <th>CC-MAIN-2022-40</th>\n      <td>NaN</td>\n      <td>0.15</td>\n      <td>0.01</td>\n      <td>37.01</td>\n      <td>60.38</td>\n      <td>0.27</td>\n      <td>2.18</td>\n    </tr>\n    <tr>\n      <th>CC-MAIN-2022-49</th>\n      <td>NaN</td>\n      <td>0.14</td>\n      <td>0.01</td>\n      <td>37.15</td>\n      <td>60.24</td>\n      <td>0.26</td>\n      <td>2.20</td>\n    </tr>\n    <tr>\n      <th>CC-MAIN-2023-06</th>\n      <td>0.00</td>\n      <td>0.14</td>\n      <td>0.01</td>\n      <td>37.11</td>\n      <td>60.35</td>\n      <td>0.26</td>\n      <td>2.12</td>\n    </tr>\n    <tr>\n      <th>CC-MAIN-2023-14</th>\n      <td>0.00</td>\n      <td>0.15</td>\n      <td>0.01</td>\n      <td>37.47</td>\n      <td>60.09</td>\n      <td>0.25</td>\n      <td>2.03</td>\n    </tr>\n    <tr>\n      <th>CC-MAIN-2023-23</th>\n      <td>0.00</td>\n      <td>0.15</td>\n      <td>0.01</td>\n      <td>38.16</td>\n      <td>59.37</td>\n      <td>0.25</td>\n      <td>2.05</td>\n    </tr>\n    <tr>\n      <th>CC-MAIN-2023-40</th>\n      <td>0.00</td>\n      <td>0.15</td>\n      <td>0.01</td>\n      <td>38.53</td>\n      <td>59.12</td>\n      <td>0.26</td>\n      <td>1.94</td>\n    </tr>\n    <tr>\n      <th>CC-MAIN-2023-50</th>\n      <td>0.00</td>\n      <td>0.17</td>\n      <td>0.01</td>\n      
<td>41.94</td>\n      <td>55.71</td>\n      <td>0.25</td>\n      <td>1.92</td>\n    </tr>\n    <tr>\n      <th>CC-MAIN-2024-10</th>\n      <td>0.00</td>\n      <td>0.14</td>\n      <td>0.01</td>\n      <td>42.11</td>\n      <td>55.71</td>\n      <td>0.24</td>\n      <td>1.79</td>\n    </tr>\n    <tr>\n      <th>CC-MAIN-2024-18</th>\n      <td>0.00</td>\n      <td>0.14</td>\n      <td>0.01</td>\n      <td>41.63</td>\n      <td>56.13</td>\n      <td>0.24</td>\n      <td>1.84</td>\n    </tr>\n    <tr>\n      <th>CC-MAIN-2024-22</th>\n      <td>0.00</td>\n      <td>0.14</td>\n      <td>0.01</td>\n      <td>42.43</td>\n      <td>55.34</td>\n      <td>0.23</td>\n      <td>1.84</td>\n    </tr>\n    <tr>\n      <th>CC-MAIN-2024-26</th>\n      <td>0.00</td>\n      <td>0.15</td>\n      <td>0.01</td>\n      <td>41.77</td>\n      <td>56.00</td>\n      <td>0.23</td>\n      <td>1.84</td>\n    </tr>\n    <tr>\n      <th>CC-MAIN-2024-30</th>\n      <td>0.00</td>\n      <td>0.15</td>\n      <td>0.01</td>\n      <td>42.32</td>\n      <td>55.48</td>\n      <td>0.24</td>\n      <td>1.79</td>\n    </tr>\n    <tr>\n      <th>CC-MAIN-2024-33</th>\n      <td>0.00</td>\n      <td>0.14</td>\n      <td>0.01</td>\n      <td>42.37</td>\n      <td>55.34</td>\n      <td>0.25</td>\n      <td>1.90</td>\n    </tr>\n    <tr>\n      <th>CC-MAIN-2024-38</th>\n      <td>0.00</td>\n      <td>0.16</td>\n      <td>0.01</td>\n      <td>42.92</td>\n      <td>55.00</td>\n      <td>0.24</td>\n      <td>1.67</td>\n    </tr>\n    <tr>\n      <th>CC-MAIN-2024-42</th>\n      <td>NaN</td>\n      <td>0.17</td>\n      <td>0.01</td>\n      <td>43.22</td>\n      <td>54.57</td>\n      <td>0.24</td>\n      <td>1.80</td>\n    </tr>\n    <tr>\n      <th>CC-MAIN-2024-46</th>\n      <td>NaN</td>\n      <td>0.16</td>\n      <td>0.01</td>\n      <td>42.57</td>\n      <td>55.32</td>\n      <td>0.24</td>\n      <td>1.70</td>\n    </tr>\n    <tr>\n      <th>CC-MAIN-2024-51</th>\n      <td>0.00</td>\n      <td>0.14</td>\n      
<td>0.01</td>\n      <td>42.95</td>\n      <td>54.86</td>\n      <td>0.25</td>\n      <td>1.79</td>\n    </tr>\n    <tr>\n      <th>CC-MAIN-2025-05</th>\n      <td>0.00</td>\n      <td>0.14</td>\n      <td>0.01</td>\n      <td>43.02</td>\n      <td>54.97</td>\n      <td>0.25</td>\n      <td>1.61</td>\n    </tr>\n    <tr>\n      <th>CC-MAIN-2025-08</th>\n      <td>0.00</td>\n      <td>0.14</td>\n      <td>0.01</td>\n      <td>42.83</td>\n      <td>54.96</td>\n      <td>0.25</td>\n      <td>1.81</td>\n    </tr>\n    <tr>\n      <th>CC-MAIN-2025-13</th>\n      <td>0.00</td>\n      <td>0.14</td>\n      <td>0.01</td>\n      <td>42.37</td>\n      <td>55.38</td>\n      <td>0.24</td>\n      <td>1.86</td>\n    </tr>\n    <tr>\n      <th>CC-MAIN-2025-18</th>\n      <td>0.00</td>\n      <td>0.13</td>\n      <td>0.01</td>\n      <td>42.72</td>\n      <td>55.08</td>\n      <td>0.24</td>\n      <td>1.81</td>\n    </tr>\n    <tr>\n      <th>CC-MAIN-2025-21</th>\n      <td>0.00</td>\n      <td>0.14</td>\n      <td>0.01</td>\n      <td>42.78</td>\n      <td>55.13</td>\n      <td>0.25</td>\n      <td>1.69</td>\n    </tr>\n    <tr>\n      <th>CC-MAIN-2025-26</th>\n      <td>0.00</td>\n      <td>0.15</td>\n      <td>0.01</td>\n      <td>43.05</td>\n      <td>54.81</td>\n      <td>0.26</td>\n      <td>1.74</td>\n    </tr>\n    <tr>\n      <th>CC-MAIN-2025-30</th>\n      <td>0.00</td>\n      <td>0.14</td>\n      <td>0.01</td>\n      <td>42.60</td>\n      <td>55.35</td>\n      <td>0.24</td>\n      <td>1.66</td>\n    </tr>\n    <tr>\n      <th>CC-MAIN-2025-33</th>\n      <td>0.00</td>\n      <td>0.15</td>\n      <td>0.01</td>\n      <td>44.22</td>\n      <td>53.79</td>\n      <td>0.25</td>\n      <td>1.58</td>\n    </tr>\n    <tr>\n      <th>CC-MAIN-2025-38</th>\n      <td>0.00</td>\n      <td>0.17</td>\n      <td>0.01</td>\n      <td>44.28</td>\n      <td>53.70</td>\n      <td>0.26</td>\n      <td>1.59</td>\n    </tr>\n    <tr>\n      <th>CC-MAIN-2025-43</th>\n      <td>0.00</td>\n      
<td>0.14</td>\n      <td>0.01</td>\n      <td>42.79</td>\n      <td>55.42</td>\n      <td>0.23</td>\n      <td>1.41</td>\n    </tr>\n    <tr>\n      <th>CC-MAIN-2025-47</th>\n      <td>0.00</td>\n      <td>0.16</td>\n      <td>0.01</td>\n      <td>44.57</td>\n      <td>53.44</td>\n      <td>0.24</td>\n      <td>1.57</td>\n    </tr>\n    <tr>\n      <th>CC-MAIN-2025-51</th>\n      <td>0.00</td>\n      <td>0.16</td>\n      <td>0.01</td>\n      <td>44.94</td>\n      <td>53.07</td>\n      <td>0.24</td>\n      <td>1.58</td>\n    </tr>\n    <tr>\n      <th>CC-MAIN-2026-04</th>\n      <td>0.00</td>\n      <td>0.15</td>\n      <td>0.01</td>\n      <td>44.49</td>\n      <td>53.58</td>\n      <td>0.24</td>\n      <td>1.53</td>\n    </tr>\n    <tr>\n      <th>CC-MAIN-2026-08</th>\n      <td>0.00</td>\n      <td>0.15</td>\n      <td>0.01</td>\n      <td>44.61</td>\n      <td>53.47</td>\n      <td>0.24</td>\n      <td>1.52</td>\n    </tr>\n    <tr>\n      <th>CC-MAIN-2026-12</th>\n      <td>0.00</td>\n      <td>0.16</td>\n      <td>0.01</td>\n      <td>45.16</td>\n      <td>52.90</td>\n      <td>0.24</td>\n      <td>1.53</td>\n    </tr>\n    <tr>\n      <th>CC-MAIN-2026-17</th>\n      <td>0.00</td>\n      <td>0.18</td>\n      <td>0.01</td>\n      <td>44.67</td>\n      <td>53.43</td>\n      <td>0.24</td>\n      <td>1.47</td>\n    </tr>\n  </tbody>\n</table>"
  },
  {
    "path": "plots/tld/groups.md",
    "content": "---\nlayout: table\ntable_include: groups-percentage.html\ntable_sortlist: \"{sortList: [[0,1]]}\"\n---\n\nGroups of Top-Level Domains\n===========================\n\nThe [IANA Root Zone Database](http://www.iana.org/domains/root/db) classifies top-level domains into the following groups:\n\n- [generic](https://en.wikipedia.org/wiki/Generic_top-level_domain) (\"gTLD\"), not bound to a specific country. The core is formed by `.com`, `.info`, `.net` and `.org` TLDs, but the group was later extended to a long list of generic terms (`.creditcard`, `.bike`), brands (`.apple`, `.volkswagen`), and geographical or cultural entities (`.paris`, `.kiwi`)\n- [sponsored](https://en.wikipedia.org/wiki/Generic_top-level_domain#Sponsored_gTLD) TLDs (\"sTLD\") are restricted to defined groups of users; registration of domains isn't open to everybody. That's obvious for `.gov`, `.mil`, `.edu` but also applies to `.museum` and others\n- generic-restricted (\"grTLD\"): `.biz`, `.name` and `.pro`\n- one single \"infrastructure\" TLD: `.arpa`\n- [country-code top-level domains](https://en.wikipedia.org/wiki/Country_code_top-level_domain): `.uk`, `.fr`, `.jp`, etc.\n\nThe generic and country-code TLDs include [internationalized top-level domains](https://en.wikipedia.org/wiki/Internationalized_domain_name) written in non-Latin alphabets or containing non-ASCII characters. These are listed here as separate groups:\n\n- [internationalized country-code TLD](https://en.wikipedia.org/wiki/Internationalized_country_code_top-level_domain) (\"IDN ccTLD\"): `.рф` - Russia\n- internationalized generic TLD (\"IDN gTLD\"): `.セール` - Japanese for 'sale', `.vermögensberatung` - German for 'financial consulting'\n\n\n![Percentage of top-level domain groups](groups.png)\n\nSignificant changes to the ratio between generic and country-code top-level domains happened in [May 2016](http://commoncrawl.org/2016/06/may-2016-crawl-archive-now-available/) (400 million seed donation by Moz.com) and [October 2016](http://commoncrawl.org/2016/11/october-2016-crawl-archive-now-available/), when we started to extend the crawl based on host/domain ranks and also increased the crawl size from 1.5--2 billion to about 3 billion pages.\n\nWhile country-code TLDs were underrepresented in crawls before 2016, the 30% share of country-code TLDs now comes closer to reality. In the present [Alexa top-1-million site list](http://s3.amazonaws.com/alexa-static/top-1m.csv.zip) (for details cf. [comparison of TLDs](./comparison.md)) 61% of the TLDs are generic and 38% are country-code TLDs.\n\n"
  },
  {
    "path": "plots/tld/latest-crawl-groups.html",
    "content": "<table border=\"1\" class=\"dataframe tablesorter tablesearcher\">\n  <thead>\n    <tr style=\"text-align: right;\">\n      <th></th>\n      <th>pages</th>\n      <th>urls</th>\n      <th>hosts</th>\n      <th>domains</th>\n      <th>%urls</th>\n      <th>%hosts</th>\n      <th>%domains</th>\n    </tr>\n    <tr>\n      <th>type</th>\n      <th></th>\n      <th></th>\n      <th></th>\n      <th></th>\n      <th></th>\n      <th></th>\n      <th></th>\n    </tr>\n  </thead>\n  <tbody>\n    <tr>\n      <th>gTLD</th>\n      <td>1,171,334,855</td>\n      <td>1,164,494,368</td>\n      <td>24,710,880</td>\n      <td>23,512,597</td>\n      <td>53.43</td>\n      <td>57.19</td>\n      <td>57.44</td>\n    </tr>\n    <tr>\n      <th>ccTLD</th>\n      <td>978,982,191</td>\n      <td>973,606,537</td>\n      <td>18,109,685</td>\n      <td>17,050,029</td>\n      <td>44.67</td>\n      <td>41.91</td>\n      <td>41.65</td>\n    </tr>\n    <tr>\n      <th>sTLD</th>\n      <td>32,358,184</td>\n      <td>32,108,658</td>\n      <td>187,582</td>\n      <td>180,650</td>\n      <td>1.47</td>\n      <td>0.43</td>\n      <td>0.44</td>\n    </tr>\n    <tr>\n      <th>grTLD</th>\n      <td>5,193,228</td>\n      <td>5,169,879</td>\n      <td>126,260</td>\n      <td>120,978</td>\n      <td>0.24</td>\n      <td>0.29</td>\n      <td>0.30</td>\n    </tr>\n    <tr>\n      <th>IDN ccTLD</th>\n      <td>3,840,679</td>\n      <td>3,829,455</td>\n      <td>70,933</td>\n      <td>69,059</td>\n      <td>0.18</td>\n      <td>0.16</td>\n      <td>0.17</td>\n    </tr>\n    <tr>\n      <th>IDN gTLD</th>\n      <td>172,377</td>\n      <td>171,948</td>\n      <td>4,062</td>\n      <td>3,981</td>\n      <td>0.01</td>\n      <td>0.01</td>\n      <td>0.01</td>\n    </tr>\n    <tr>\n      <th>ARPA</th>\n      <td>1</td>\n      <td>1</td>\n      <td>1</td>\n      <td>1</td>\n      <td>0.00</td>\n      <td>0.00</td>\n      <td>0.00</td>\n    </tr>\n  </tbody>\n</table>"
  },
  {
    "path": "plots/tld/latest-crawl-tlds.html",
    "content": "<table border=\"1\" class=\"dataframe tablesorter tablesearcher\">\n  <thead>\n    <tr style=\"text-align: right;\">\n      <th></th>\n      <th>pages</th>\n      <th>urls</th>\n      <th>hosts</th>\n      <th>domains</th>\n      <th>%urls</th>\n      <th>%hosts</th>\n      <th>%domains</th>\n    </tr>\n    <tr>\n      <th>tld</th>\n      <th></th>\n      <th></th>\n      <th></th>\n      <th></th>\n      <th></th>\n      <th></th>\n      <th></th>\n    </tr>\n  </thead>\n  <tbody>\n    <tr>\n      <th>com</th>\n      <td>918,035,054</td>\n      <td>912,637,644</td>\n      <td>19,928,575</td>\n      <td>18,965,474</td>\n      <td>41.88</td>\n      <td>46.12</td>\n      <td>46.33</td>\n    </tr>\n    <tr>\n      <th>org</th>\n      <td>120,478,054</td>\n      <td>119,738,931</td>\n      <td>1,831,092</td>\n      <td>1,712,048</td>\n      <td>5.49</td>\n      <td>4.24</td>\n      <td>4.18</td>\n    </tr>\n    <tr>\n      <th>ru</th>\n      <td>106,756,027</td>\n      <td>106,349,919</td>\n      <td>1,188,137</td>\n      <td>1,121,954</td>\n      <td>4.88</td>\n      <td>2.75</td>\n      <td>2.74</td>\n    </tr>\n    <tr>\n      <th>de</th>\n      <td>95,650,541</td>\n      <td>94,950,427</td>\n      <td>2,496,888</td>\n      <td>2,307,593</td>\n      <td>4.36</td>\n      <td>5.78</td>\n      <td>5.64</td>\n    </tr>\n    <tr>\n      <th>net</th>\n      <td>65,050,604</td>\n      <td>64,753,682</td>\n      <td>1,220,248</td>\n      <td>1,148,766</td>\n      <td>2.97</td>\n      <td>2.82</td>\n      <td>2.81</td>\n    </tr>\n    <tr>\n      <th>jp</th>\n      <td>50,331,104</td>\n      <td>50,090,914</td>\n      <td>731,504</td>\n      <td>691,571</td>\n      <td>2.30</td>\n      <td>1.69</td>\n      <td>1.69</td>\n    </tr>\n    <tr>\n      <th>uk</th>\n      <td>46,106,320</td>\n      <td>45,806,154</td>\n      <td>1,062,304</td>\n      <td>1,010,498</td>\n      <td>2.10</td>\n      <td>2.46</td>\n      <td>2.47</td>\n    </tr>\n    <tr>\n      
<th>fr</th>\n      <td>42,237,000</td>\n      <td>42,002,602</td>\n      <td>917,847</td>\n      <td>880,184</td>\n      <td>1.93</td>\n      <td>2.12</td>\n      <td>2.15</td>\n    </tr>\n    <tr>\n      <th>pl</th>\n      <td>41,491,471</td>\n      <td>41,309,416</td>\n      <td>634,884</td>\n      <td>603,401</td>\n      <td>1.90</td>\n      <td>1.47</td>\n      <td>1.47</td>\n    </tr>\n    <tr>\n      <th>it</th>\n      <td>38,060,552</td>\n      <td>37,875,266</td>\n      <td>662,750</td>\n      <td>627,568</td>\n      <td>1.74</td>\n      <td>1.53</td>\n      <td>1.53</td>\n    </tr>\n    <tr>\n      <th>br</th>\n      <td>37,254,474</td>\n      <td>37,094,432</td>\n      <td>562,266</td>\n      <td>525,191</td>\n      <td>1.70</td>\n      <td>1.30</td>\n      <td>1.28</td>\n    </tr>\n    <tr>\n      <th>nl</th>\n      <td>32,137,629</td>\n      <td>31,937,772</td>\n      <td>820,393</td>\n      <td>769,987</td>\n      <td>1.47</td>\n      <td>1.90</td>\n      <td>1.88</td>\n    </tr>\n    <tr>\n      <th>cz</th>\n      <td>24,497,312</td>\n      <td>24,243,284</td>\n      <td>377,628</td>\n      <td>353,443</td>\n      <td>1.11</td>\n      <td>0.87</td>\n      <td>0.86</td>\n    </tr>\n    <tr>\n      <th>cn</th>\n      <td>23,650,354</td>\n      <td>23,599,961</td>\n      <td>1,026,423</td>\n      <td>969,028</td>\n      <td>1.08</td>\n      <td>2.38</td>\n      <td>2.37</td>\n    </tr>\n    <tr>\n      <th>es</th>\n      <td>19,880,767</td>\n      <td>19,756,848</td>\n      <td>309,111</td>\n      <td>295,492</td>\n      <td>0.91</td>\n      <td>0.72</td>\n      <td>0.72</td>\n    </tr>\n    <tr>\n      <th>ua</th>\n      <td>19,359,646</td>\n      <td>19,197,917</td>\n      <td>123,964</td>\n      <td>119,024</td>\n      <td>0.88</td>\n      <td>0.29</td>\n      <td>0.29</td>\n    </tr>\n    <tr>\n      <th>au</th>\n      <td>19,300,780</td>\n      <td>19,191,339</td>\n      <td>431,138</td>\n      <td>414,215</td>\n      <td>0.88</td>\n      
<td>1.00</td>\n      <td>1.01</td>\n    </tr>\n    <tr>\n      <th>ca</th>\n      <td>18,388,028</td>\n      <td>18,282,578</td>\n      <td>399,341</td>\n      <td>382,048</td>\n      <td>0.84</td>\n      <td>0.92</td>\n      <td>0.93</td>\n    </tr>\n    <tr>\n      <th>edu</th>\n      <td>18,167,199</td>\n      <td>18,038,391</td>\n      <td>106,032</td>\n      <td>103,607</td>\n      <td>0.83</td>\n      <td>0.25</td>\n      <td>0.25</td>\n    </tr>\n    <tr>\n      <th>eu</th>\n      <td>15,928,468</td>\n      <td>15,829,300</td>\n      <td>311,177</td>\n      <td>292,747</td>\n      <td>0.73</td>\n      <td>0.72</td>\n      <td>0.72</td>\n    </tr>\n    <tr>\n      <th>in</th>\n      <td>14,703,150</td>\n      <td>14,650,031</td>\n      <td>278,968</td>\n      <td>264,109</td>\n      <td>0.67</td>\n      <td>0.65</td>\n      <td>0.65</td>\n    </tr>\n    <tr>\n      <th>se</th>\n      <td>14,641,754</td>\n      <td>14,549,917</td>\n      <td>309,180</td>\n      <td>294,004</td>\n      <td>0.67</td>\n      <td>0.72</td>\n      <td>0.72</td>\n    </tr>\n    <tr>\n      <th>ch</th>\n      <td>14,139,669</td>\n      <td>14,023,492</td>\n      <td>401,642</td>\n      <td>371,051</td>\n      <td>0.64</td>\n      <td>0.93</td>\n      <td>0.91</td>\n    </tr>\n    <tr>\n      <th>vn</th>\n      <td>13,013,793</td>\n      <td>12,962,675</td>\n      <td>129,026</td>\n      <td>123,017</td>\n      <td>0.59</td>\n      <td>0.30</td>\n      <td>0.30</td>\n    </tr>\n    <tr>\n      <th>info</th>\n      <td>12,790,040</td>\n      <td>12,741,500</td>\n      <td>220,350</td>\n      <td>207,825</td>\n      <td>0.58</td>\n      <td>0.51</td>\n      <td>0.51</td>\n    </tr>\n    <tr>\n      <th>ro</th>\n      <td>12,775,628</td>\n      <td>12,724,876</td>\n      <td>147,761</td>\n      <td>139,069</td>\n      <td>0.58</td>\n      <td>0.34</td>\n      <td>0.34</td>\n    </tr>\n    <tr>\n      <th>be</th>\n      <td>11,861,578</td>\n      <td>11,785,902</td>\n      
<td>293,514</td>\n      <td>274,881</td>\n      <td>0.54</td>\n      <td>0.68</td>\n      <td>0.67</td>\n    </tr>\n    <tr>\n      <th>dk</th>\n      <td>11,544,786</td>\n      <td>11,471,765</td>\n      <td>275,476</td>\n      <td>263,196</td>\n      <td>0.53</td>\n      <td>0.64</td>\n      <td>0.64</td>\n    </tr>\n    <tr>\n      <th>gr</th>\n      <td>11,427,100</td>\n      <td>11,386,614</td>\n      <td>145,816</td>\n      <td>136,383</td>\n      <td>0.52</td>\n      <td>0.34</td>\n      <td>0.33</td>\n    </tr>\n    <tr>\n      <th>hu</th>\n      <td>11,124,200</td>\n      <td>11,076,250</td>\n      <td>193,742</td>\n      <td>181,660</td>\n      <td>0.51</td>\n      <td>0.45</td>\n      <td>0.44</td>\n    </tr>\n    <tr>\n      <th>at</th>\n      <td>10,516,664</td>\n      <td>10,440,830</td>\n      <td>258,354</td>\n      <td>242,569</td>\n      <td>0.48</td>\n      <td>0.60</td>\n      <td>0.59</td>\n    </tr>\n    <tr>\n      <th>id</th>\n      <td>9,633,148</td>\n      <td>9,605,620</td>\n      <td>136,284</td>\n      <td>131,129</td>\n      <td>0.44</td>\n      <td>0.32</td>\n      <td>0.32</td>\n    </tr>\n    <tr>\n      <th>co</th>\n      <td>9,499,717</td>\n      <td>9,398,703</td>\n      <td>189,183</td>\n      <td>183,379</td>\n      <td>0.43</td>\n      <td>0.44</td>\n      <td>0.45</td>\n    </tr>\n    <tr>\n      <th>tw</th>\n      <td>9,396,997</td>\n      <td>9,360,501</td>\n      <td>124,182</td>\n      <td>112,077</td>\n      <td>0.43</td>\n      <td>0.29</td>\n      <td>0.27</td>\n    </tr>\n    <tr>\n      <th>tr</th>\n      <td>9,177,139</td>\n      <td>9,143,395</td>\n      <td>128,514</td>\n      <td>116,768</td>\n      <td>0.42</td>\n      <td>0.30</td>\n      <td>0.29</td>\n    </tr>\n    <tr>\n      <th>kr</th>\n      <td>9,155,743</td>\n      <td>9,128,208</td>\n      <td>195,165</td>\n      <td>163,555</td>\n      <td>0.42</td>\n      <td>0.45</td>\n      <td>0.40</td>\n    </tr>\n    <tr>\n      <th>sk</th>\n      
<td>8,689,320</td>\n      <td>8,627,849</td>\n      <td>127,792</td>\n      <td>119,007</td>\n      <td>0.40</td>\n      <td>0.30</td>\n      <td>0.29</td>\n    </tr>\n    <tr>\n      <th>gov</th>\n      <td>8,689,554</td>\n      <td>8,624,661</td>\n      <td>27,028</td>\n      <td>25,495</td>\n      <td>0.40</td>\n      <td>0.06</td>\n      <td>0.06</td>\n    </tr>\n    <tr>\n      <th>fi</th>\n      <td>7,844,908</td>\n      <td>7,794,541</td>\n      <td>144,227</td>\n      <td>137,573</td>\n      <td>0.36</td>\n      <td>0.33</td>\n      <td>0.34</td>\n    </tr>\n    <tr>\n      <th>ar</th>\n      <td>7,591,879</td>\n      <td>7,567,442</td>\n      <td>125,889</td>\n      <td>113,699</td>\n      <td>0.35</td>\n      <td>0.29</td>\n      <td>0.28</td>\n    </tr>\n    <tr>\n      <th>no</th>\n      <td>7,252,962</td>\n      <td>7,205,272</td>\n      <td>141,135</td>\n      <td>133,720</td>\n      <td>0.33</td>\n      <td>0.33</td>\n      <td>0.33</td>\n    </tr>\n    <tr>\n      <th>io</th>\n      <td>7,107,020</td>\n      <td>7,038,495</td>\n      <td>212,249</td>\n      <td>208,109</td>\n      <td>0.32</td>\n      <td>0.49</td>\n      <td>0.51</td>\n    </tr>\n    <tr>\n      <th>pt</th>\n      <td>6,500,568</td>\n      <td>6,462,776</td>\n      <td>94,760</td>\n      <td>88,054</td>\n      <td>0.30</td>\n      <td>0.22</td>\n      <td>0.22</td>\n    </tr>\n    <tr>\n      <th>mx</th>\n      <td>6,367,373</td>\n      <td>6,341,409</td>\n      <td>100,173</td>\n      <td>94,740</td>\n      <td>0.29</td>\n      <td>0.23</td>\n      <td>0.23</td>\n    </tr>\n    <tr>\n      <th>cl</th>\n      <td>5,111,970</td>\n      <td>5,088,776</td>\n      <td>81,026</td>\n      <td>77,224</td>\n      <td>0.23</td>\n      <td>0.19</td>\n      <td>0.19</td>\n    </tr>\n    <tr>\n      <th>il</th>\n      <td>4,828,801</td>\n      <td>4,804,202</td>\n      <td>79,699</td>\n      <td>76,917</td>\n      <td>0.22</td>\n      <td>0.18</td>\n      <td>0.19</td>\n    </tr>\n    <tr>\n   
   <th>by</th>\n      <td>4,666,987</td>\n      <td>4,645,396</td>\n      <td>43,329</td>\n      <td>41,266</td>\n      <td>0.21</td>\n      <td>0.10</td>\n      <td>0.10</td>\n    </tr>\n    <tr>\n      <th>za</th>\n      <td>4,509,805</td>\n      <td>4,489,262</td>\n      <td>113,557</td>\n      <td>108,413</td>\n      <td>0.21</td>\n      <td>0.26</td>\n      <td>0.26</td>\n    </tr>\n    <tr>\n      <th>tv</th>\n      <td>4,470,769</td>\n      <td>4,451,517</td>\n      <td>35,655</td>\n      <td>33,463</td>\n      <td>0.20</td>\n      <td>0.08</td>\n      <td>0.08</td>\n    </tr>\n    <tr>\n      <th>shop</th>\n      <td>4,447,572</td>\n      <td>4,435,503</td>\n      <td>74,998</td>\n      <td>73,536</td>\n      <td>0.20</td>\n      <td>0.17</td>\n      <td>0.18</td>\n    </tr>\n    <tr>\n      <th>nz</th>\n      <td>4,238,892</td>\n      <td>4,213,404</td>\n      <td>106,498</td>\n      <td>102,214</td>\n      <td>0.19</td>\n      <td>0.25</td>\n      <td>0.25</td>\n    </tr>\n    <tr>\n      <th>rs</th>\n      <td>4,128,226</td>\n      <td>4,112,394</td>\n      <td>44,174</td>\n      <td>40,978</td>\n      <td>0.19</td>\n      <td>0.10</td>\n      <td>0.10</td>\n    </tr>\n    <tr>\n      <th>lt</th>\n      <td>3,893,450</td>\n      <td>3,876,186</td>\n      <td>62,259</td>\n      <td>58,616</td>\n      <td>0.18</td>\n      <td>0.14</td>\n      <td>0.14</td>\n    </tr>\n    <tr>\n      <th>me</th>\n      <td>3,880,514</td>\n      <td>3,856,068</td>\n      <td>84,785</td>\n      <td>82,591</td>\n      <td>0.18</td>\n      <td>0.20</td>\n      <td>0.20</td>\n    </tr>\n    <tr>\n      <th>cc</th>\n      <td>3,674,616</td>\n      <td>3,658,758</td>\n      <td>75,294</td>\n      <td>72,081</td>\n      <td>0.17</td>\n      <td>0.17</td>\n      <td>0.18</td>\n    </tr>\n    <tr>\n      <th>us</th>\n      <td>3,651,299</td>\n      <td>3,628,822</td>\n      <td>93,422</td>\n      <td>89,006</td>\n      <td>0.17</td>\n      <td>0.22</td>\n      <td>0.22</td>\n    
</tr>\n    <tr>\n      <th>hr</th>\n      <td>3,501,079</td>\n      <td>3,487,007</td>\n      <td>41,729</td>\n      <td>38,628</td>\n      <td>0.16</td>\n      <td>0.10</td>\n      <td>0.09</td>\n    </tr>\n    <tr>\n      <th>ee</th>\n      <td>3,473,932</td>\n      <td>3,457,253</td>\n      <td>48,658</td>\n      <td>43,816</td>\n      <td>0.16</td>\n      <td>0.11</td>\n      <td>0.11</td>\n    </tr>\n    <tr>\n      <th>app</th>\n      <td>3,203,341</td>\n      <td>3,181,514</td>\n      <td>113,218</td>\n      <td>111,719</td>\n      <td>0.15</td>\n      <td>0.26</td>\n      <td>0.27</td>\n    </tr>\n    <tr>\n      <th>ie</th>\n      <td>3,115,239</td>\n      <td>3,097,579</td>\n      <td>54,718</td>\n      <td>52,573</td>\n      <td>0.14</td>\n      <td>0.13</td>\n      <td>0.13</td>\n    </tr>\n    <tr>\n      <th>online</th>\n      <td>3,087,616</td>\n      <td>3,071,529</td>\n      <td>79,200</td>\n      <td>77,713</td>\n      <td>0.14</td>\n      <td>0.18</td>\n      <td>0.19</td>\n    </tr>\n    <tr>\n      <th>si</th>\n      <td>3,084,130</td>\n      <td>3,070,999</td>\n      <td>42,991</td>\n      <td>39,820</td>\n      <td>0.14</td>\n      <td>0.10</td>\n      <td>0.10</td>\n    </tr>\n    <tr>\n      <th>ai</th>\n      <td>3,097,545</td>\n      <td>3,064,149</td>\n      <td>80,872</td>\n      <td>78,310</td>\n      <td>0.14</td>\n      <td>0.19</td>\n      <td>0.19</td>\n    </tr>\n    <tr>\n      <th>kz</th>\n      <td>3,053,650</td>\n      <td>3,043,287</td>\n      <td>29,245</td>\n      <td>27,871</td>\n      <td>0.14</td>\n      <td>0.07</td>\n      <td>0.07</td>\n    </tr>\n    <tr>\n      <th>bg</th>\n      <td>3,001,650</td>\n      <td>2,988,367</td>\n      <td>26,482</td>\n      <td>25,233</td>\n      <td>0.14</td>\n      <td>0.06</td>\n      <td>0.06</td>\n    </tr>\n    <tr>\n      <th>biz</th>\n      <td>2,883,480</td>\n      <td>2,871,392</td>\n      <td>74,010</td>\n      <td>70,339</td>\n      <td>0.13</td>\n      <td>0.17</td>\n      
<td>0.17</td>\n    </tr>\n    <tr>\n      <th>my</th>\n      <td>2,684,804</td>\n      <td>2,673,686</td>\n      <td>47,155</td>\n      <td>44,750</td>\n      <td>0.12</td>\n      <td>0.11</td>\n      <td>0.11</td>\n    </tr>\n    <tr>\n      <th>cat</th>\n      <td>2,616,179</td>\n      <td>2,603,022</td>\n      <td>25,079</td>\n      <td>23,585</td>\n      <td>0.12</td>\n      <td>0.06</td>\n      <td>0.06</td>\n    </tr>\n    <tr>\n      <th>hk</th>\n      <td>2,565,271</td>\n      <td>2,547,023</td>\n      <td>35,543</td>\n      <td>31,323</td>\n      <td>0.12</td>\n      <td>0.08</td>\n      <td>0.08</td>\n    </tr>\n    <tr>\n      <th>xyz</th>\n      <td>2,514,466</td>\n      <td>2,500,638</td>\n      <td>134,418</td>\n      <td>132,344</td>\n      <td>0.11</td>\n      <td>0.31</td>\n      <td>0.32</td>\n    </tr>\n    <tr>\n      <th>th</th>\n      <td>2,491,264</td>\n      <td>2,482,862</td>\n      <td>35,242</td>\n      <td>31,524</td>\n      <td>0.11</td>\n      <td>0.08</td>\n      <td>0.08</td>\n    </tr>\n    <tr>\n      <th>lv</th>\n      <td>2,262,924</td>\n      <td>2,246,863</td>\n      <td>29,827</td>\n      <td>27,263</td>\n      <td>0.10</td>\n      <td>0.07</td>\n      <td>0.07</td>\n    </tr>\n    <tr>\n      <th>ir</th>\n      <td>2,219,542</td>\n      <td>2,214,190</td>\n      <td>21,170</td>\n      <td>20,470</td>\n      <td>0.10</td>\n      <td>0.05</td>\n      <td>0.05</td>\n    </tr>\n    <tr>\n      <th>pro</th>\n      <td>2,020,737</td>\n      <td>2,011,062</td>\n      <td>47,439</td>\n      <td>46,138</td>\n      <td>0.09</td>\n      <td>0.11</td>\n      <td>0.11</td>\n    </tr>\n    <tr>\n      <th>top</th>\n      <td>2,016,773</td>\n      <td>2,006,691</td>\n      <td>88,932</td>\n      <td>87,453</td>\n      <td>0.09</td>\n      <td>0.21</td>\n      <td>0.21</td>\n    </tr>\n    <tr>\n      <th>su</th>\n      <td>1,906,416</td>\n      <td>1,899,093</td>\n      <td>20,528</td>\n      <td>19,460</td>\n      <td>0.09</td>\n      
<td>0.05</td>\n      <td>0.05</td>\n    </tr>\n    <tr>\n      <th>pe</th>\n      <td>1,900,793</td>\n      <td>1,888,595</td>\n      <td>24,702</td>\n      <td>23,504</td>\n      <td>0.09</td>\n      <td>0.06</td>\n      <td>0.06</td>\n    </tr>\n    <tr>\n      <th>news</th>\n      <td>1,891,968</td>\n      <td>1,885,549</td>\n      <td>7,614</td>\n      <td>6,911</td>\n      <td>0.09</td>\n      <td>0.02</td>\n      <td>0.02</td>\n    </tr>\n    <tr>\n      <th>pk</th>\n      <td>1,727,158</td>\n      <td>1,721,951</td>\n      <td>23,818</td>\n      <td>22,678</td>\n      <td>0.08</td>\n      <td>0.06</td>\n      <td>0.06</td>\n    </tr>\n    <tr>\n      <th>ae</th>\n      <td>1,582,478</td>\n      <td>1,573,648</td>\n      <td>27,092</td>\n      <td>25,900</td>\n      <td>0.07</td>\n      <td>0.06</td>\n      <td>0.06</td>\n    </tr>\n    <tr>\n      <th>sg</th>\n      <td>1,564,083</td>\n      <td>1,551,080</td>\n      <td>29,816</td>\n      <td>28,377</td>\n      <td>0.07</td>\n      <td>0.07</td>\n      <td>0.07</td>\n    </tr>\n    <tr>\n      <th>club</th>\n      <td>1,390,628</td>\n      <td>1,384,288</td>\n      <td>31,655</td>\n      <td>30,834</td>\n      <td>0.06</td>\n      <td>0.07</td>\n      <td>0.08</td>\n    </tr>\n    <tr>\n      <th>store</th>\n      <td>1,378,895</td>\n      <td>1,371,317</td>\n      <td>33,081</td>\n      <td>32,475</td>\n      <td>0.06</td>\n      <td>0.08</td>\n      <td>0.08</td>\n    </tr>\n    <tr>\n      <th>ng</th>\n      <td>1,345,357</td>\n      <td>1,341,787</td>\n      <td>16,206</td>\n      <td>15,491</td>\n      <td>0.06</td>\n      <td>0.04</td>\n      <td>0.04</td>\n    </tr>\n    <tr>\n      <th>ph</th>\n      <td>1,276,912</td>\n      <td>1,251,140</td>\n      <td>16,404</td>\n      <td>15,476</td>\n      <td>0.06</td>\n      <td>0.04</td>\n      <td>0.04</td>\n    </tr>\n    <tr>\n      <th>ba</th>\n      <td>1,200,399</td>\n      <td>1,196,799</td>\n      <td>11,501</td>\n      <td>10,620</td>\n      
<td>0.05</td>\n      <td>0.03</td>\n      <td>0.03</td>\n    </tr>\n    <tr>\n      <th>az</th>\n      <td>1,193,371</td>\n      <td>1,189,940</td>\n      <td>9,113</td>\n      <td>8,030</td>\n      <td>0.05</td>\n      <td>0.02</td>\n      <td>0.02</td>\n    </tr>\n    <tr>\n      <th>md</th>\n      <td>1,194,537</td>\n      <td>1,189,715</td>\n      <td>10,822</td>\n      <td>10,061</td>\n      <td>0.05</td>\n      <td>0.03</td>\n      <td>0.02</td>\n    </tr>\n    <tr>\n      <th>uy</th>\n      <td>1,161,819</td>\n      <td>1,156,512</td>\n      <td>13,550</td>\n      <td>12,493</td>\n      <td>0.05</td>\n      <td>0.03</td>\n      <td>0.03</td>\n    </tr>\n    <tr>\n      <th>is</th>\n      <td>1,116,164</td>\n      <td>1,107,682</td>\n      <td>15,528</td>\n      <td>14,723</td>\n      <td>0.05</td>\n      <td>0.04</td>\n      <td>0.04</td>\n    </tr>\n    <tr>\n      <th>dev</th>\n      <td>1,110,730</td>\n      <td>1,101,292</td>\n      <td>51,054</td>\n      <td>50,331</td>\n      <td>0.05</td>\n      <td>0.12</td>\n      <td>0.12</td>\n    </tr>\n    <tr>\n      <th>ma</th>\n      <td>1,096,675</td>\n      <td>1,092,413</td>\n      <td>14,151</td>\n      <td>13,332</td>\n      <td>0.05</td>\n      <td>0.03</td>\n      <td>0.03</td>\n    </tr>\n  </tbody>\n</table>"
  },
  {
    "path": "plots/tld/latestcrawl.md",
    "content": "---\nlayout: table\ntable_include:\n - latest-crawl-groups.html\n - latest-crawl-tlds.html\ntable_sortlist: \"{sortList: [[5,1]]}\"\ntable_searcher: \"Filter for top-level domains\"\n---\n\nTop-Level Domains of the Latest Monthly Crawl\n=============================================\n\nDetailed numbers and percentage of top-level domains (groups) in the latest monthly crawl ({{ site.latest_crawl }}). Note that [Internationalized country code TLDs (IDN ccTLDs)](https://en.wikipedia.org/wiki/List_of_Internet_top-level_domains#Internationalized_country_code_top-level_domains) are mapped to their ASCII equivalents before counting TLDs. E.g., the counts of `.ru` contain also the occurrences of [.рф](https://en.wikipedia.org/wiki/.%D1%80%D1%84).\n\n\n"
  },
  {
    "path": "plots/tld/percentage.md",
    "content": "---\nlayout: table\ntable_include: selected-crawls-percentage.html\ntable_sortlist: \"{sortList: [[7,1]]}\"\ntable_searcher: \"Filter for top-level domains\"\n---\n\nTop-Level Domains of Selected Crawls\n====================================\n\nJust the distribution (percentage / relative frequency) of URLs on top-level domains for few selected crawls, include the latest monthly crawl...  Only TLDs which reach at least 0.05% in one of the selected crawls are shown.\n"
  },
  {
    "path": "plots/tld/selected-crawl-comparison-spearman-all-tlds.html",
    "content": "<table border=\"1\" class=\"dataframe matrix\">\n  <thead>\n    <tr style=\"text-align: right;\">\n      <th></th>\n      <th>pages</th>\n      <th>urls</th>\n      <th>hosts</th>\n      <th>domains</th>\n      <th>alexa</th>\n      <th>cisco</th>\n      <th>majestic</th>\n    </tr>\n  </thead>\n  <tbody>\n    <tr>\n      <th>pages</th>\n      <td>1.000</td>\n      <td>0.999</td>\n      <td>0.975</td>\n      <td>0.974</td>\n      <td>0.924</td>\n      <td>0.824</td>\n      <td>0.886</td>\n    </tr>\n    <tr>\n      <th>urls</th>\n      <td>0.999</td>\n      <td>1.000</td>\n      <td>0.976</td>\n      <td>0.975</td>\n      <td>0.925</td>\n      <td>0.824</td>\n      <td>0.887</td>\n    </tr>\n    <tr>\n      <th>hosts</th>\n      <td>0.975</td>\n      <td>0.976</td>\n      <td>1.000</td>\n      <td>1.000</td>\n      <td>0.907</td>\n      <td>0.806</td>\n      <td>0.881</td>\n    </tr>\n    <tr>\n      <th>domains</th>\n      <td>0.974</td>\n      <td>0.975</td>\n      <td>1.000</td>\n      <td>1.000</td>\n      <td>0.905</td>\n      <td>0.805</td>\n      <td>0.878</td>\n    </tr>\n    <tr>\n      <th>alexa</th>\n      <td>0.924</td>\n      <td>0.925</td>\n      <td>0.907</td>\n      <td>0.905</td>\n      <td>1.000</td>\n      <td>0.873</td>\n      <td>0.894</td>\n    </tr>\n    <tr>\n      <th>cisco</th>\n      <td>0.824</td>\n      <td>0.824</td>\n      <td>0.806</td>\n      <td>0.805</td>\n      <td>0.873</td>\n      <td>1.000</td>\n      <td>0.839</td>\n    </tr>\n    <tr>\n      <th>majestic</th>\n      <td>0.886</td>\n      <td>0.887</td>\n      <td>0.881</td>\n      <td>0.878</td>\n      <td>0.894</td>\n      <td>0.839</td>\n      <td>1.000</td>\n    </tr>\n  </tbody>\n</table>"
  },
  {
    "path": "plots/tld/selected-crawl-comparison-spearman-frequent-tlds.html",
    "content": "<table border=\"1\" class=\"dataframe matrix\">\n  <thead>\n    <tr style=\"text-align: right;\">\n      <th></th>\n      <th>pages</th>\n      <th>urls</th>\n      <th>hosts</th>\n      <th>domains</th>\n      <th>alexa</th>\n      <th>cisco</th>\n      <th>majestic</th>\n    </tr>\n  </thead>\n  <tbody>\n    <tr>\n      <th>pages</th>\n      <td>1.000</td>\n      <td>1.000</td>\n      <td>0.869</td>\n      <td>0.862</td>\n      <td>0.812</td>\n      <td>0.734</td>\n      <td>0.812</td>\n    </tr>\n    <tr>\n      <th>urls</th>\n      <td>1.000</td>\n      <td>1.000</td>\n      <td>0.870</td>\n      <td>0.864</td>\n      <td>0.812</td>\n      <td>0.734</td>\n      <td>0.813</td>\n    </tr>\n    <tr>\n      <th>hosts</th>\n      <td>0.869</td>\n      <td>0.870</td>\n      <td>1.000</td>\n      <td>0.999</td>\n      <td>0.820</td>\n      <td>0.717</td>\n      <td>0.868</td>\n    </tr>\n    <tr>\n      <th>domains</th>\n      <td>0.862</td>\n      <td>0.864</td>\n      <td>0.999</td>\n      <td>1.000</td>\n      <td>0.819</td>\n      <td>0.721</td>\n      <td>0.873</td>\n    </tr>\n    <tr>\n      <th>alexa</th>\n      <td>0.812</td>\n      <td>0.812</td>\n      <td>0.820</td>\n      <td>0.819</td>\n      <td>1.000</td>\n      <td>0.765</td>\n      <td>0.831</td>\n    </tr>\n    <tr>\n      <th>cisco</th>\n      <td>0.734</td>\n      <td>0.734</td>\n      <td>0.717</td>\n      <td>0.721</td>\n      <td>0.765</td>\n      <td>1.000</td>\n      <td>0.825</td>\n    </tr>\n    <tr>\n      <th>majestic</th>\n      <td>0.812</td>\n      <td>0.813</td>\n      <td>0.868</td>\n      <td>0.873</td>\n      <td>0.831</td>\n      <td>0.825</td>\n      <td>1.000</td>\n    </tr>\n  </tbody>\n</table>"
  },
  {
    "path": "plots/tld/selected-crawl-comparison.html",
    "content": "<table border=\"1\" class=\"dataframe tablesorter tablepercentage\">\n  <thead>\n    <tr style=\"text-align: right;\">\n      <th></th>\n      <th>pages</th>\n      <th>urls</th>\n      <th>hosts</th>\n      <th>domains</th>\n      <th>alexa</th>\n      <th>cisco</th>\n      <th>majestic</th>\n    </tr>\n    <tr>\n      <th>tld</th>\n      <th></th>\n      <th></th>\n      <th></th>\n      <th></th>\n      <th></th>\n      <th></th>\n      <th></th>\n    </tr>\n  </thead>\n  <tbody>\n    <tr>\n      <th>hu</th>\n      <td>0.437</td>\n      <td>0.437</td>\n      <td>0.397</td>\n      <td>0.388</td>\n      <td>0.368</td>\n      <td>0.090</td>\n      <td>0.226</td>\n    </tr>\n    <tr>\n      <th>bg</th>\n      <td>0.127</td>\n      <td>0.127</td>\n      <td>0.059</td>\n      <td>0.058</td>\n      <td>0.108</td>\n      <td>0.026</td>\n      <td>0.043</td>\n    </tr>\n    <tr>\n      <th>se</th>\n      <td>0.629</td>\n      <td>0.628</td>\n      <td>0.686</td>\n      <td>0.690</td>\n      <td>0.406</td>\n      <td>0.126</td>\n      <td>0.356</td>\n    </tr>\n    <tr>\n      <th>ca</th>\n      <td>0.818</td>\n      <td>0.819</td>\n      <td>0.818</td>\n      <td>0.820</td>\n      <td>0.682</td>\n      <td>0.361</td>\n      <td>0.641</td>\n    </tr>\n    <tr>\n      <th>uk</th>\n      <td>2.300</td>\n      <td>2.295</td>\n      <td>2.630</td>\n      <td>2.623</td>\n      <td>1.684</td>\n      <td>1.130</td>\n      <td>2.567</td>\n    </tr>\n    <tr>\n      <th>jp</th>\n      <td>1.821</td>\n      <td>1.826</td>\n      <td>1.546</td>\n      <td>1.534</td>\n      <td>1.074</td>\n      <td>0.360</td>\n      <td>1.525</td>\n    </tr>\n    <tr>\n      <th>it</th>\n      <td>1.621</td>\n      <td>1.622</td>\n      <td>1.584</td>\n      <td>1.582</td>\n      <td>1.130</td>\n      <td>0.428</td>\n      <td>0.985</td>\n    </tr>\n    <tr>\n      <th>at</th>\n      <td>0.400</td>\n      <td>0.400</td>\n      <td>0.587</td>\n      <td>0.582</td>\n      
<td>0.310</td>\n      <td>0.087</td>\n      <td>0.275</td>\n    </tr>\n    <tr>\n      <th>be</th>\n      <td>0.483</td>\n      <td>0.483</td>\n      <td>0.601</td>\n      <td>0.585</td>\n      <td>0.331</td>\n      <td>0.147</td>\n      <td>0.283</td>\n    </tr>\n    <tr>\n      <th>cn</th>\n      <td>1.382</td>\n      <td>1.391</td>\n      <td>3.217</td>\n      <td>3.233</td>\n      <td>0.265</td>\n      <td>0.632</td>\n      <td>2.942</td>\n    </tr>\n    <tr>\n      <th>id</th>\n      <td>0.202</td>\n      <td>0.202</td>\n      <td>0.180</td>\n      <td>0.182</td>\n      <td>0.198</td>\n      <td>0.140</td>\n      <td>0.111</td>\n    </tr>\n    <tr>\n      <th>il</th>\n      <td>0.267</td>\n      <td>0.267</td>\n      <td>0.172</td>\n      <td>0.171</td>\n      <td>0.157</td>\n      <td>0.121</td>\n      <td>0.114</td>\n    </tr>\n    <tr>\n      <th>in</th>\n      <td>0.353</td>\n      <td>0.354</td>\n      <td>0.394</td>\n      <td>0.394</td>\n      <td>1.407</td>\n      <td>0.632</td>\n      <td>0.603</td>\n    </tr>\n    <tr>\n      <th>ir</th>\n      <td>0.240</td>\n      <td>0.240</td>\n      <td>0.235</td>\n      <td>0.231</td>\n      <td>1.293</td>\n      <td>0.078</td>\n      <td>0.323</td>\n    </tr>\n    <tr>\n      <th>kr</th>\n      <td>0.343</td>\n      <td>0.345</td>\n      <td>0.386</td>\n      <td>0.351</td>\n      <td>0.258</td>\n      <td>0.100</td>\n      <td>0.144</td>\n    </tr>\n    <tr>\n      <th>me</th>\n      <td>0.265</td>\n      <td>0.266</td>\n      <td>0.224</td>\n      <td>0.231</td>\n      <td>0.359</td>\n      <td>0.787</td>\n      <td>0.206</td>\n    </tr>\n    <tr>\n      <th>nz</th>\n      <td>0.218</td>\n      <td>0.218</td>\n      <td>0.266</td>\n      <td>0.266</td>\n      <td>0.137</td>\n      <td>0.075</td>\n      <td>0.148</td>\n    </tr>\n    <tr>\n      <th>rs</th>\n      <td>0.153</td>\n      <td>0.153</td>\n      <td>0.077</td>\n      <td>0.073</td>\n      <td>0.101</td>\n      <td>0.017</td>\n      
<td>0.045</td>\n    </tr>\n    <tr>\n      <th>ru</th>\n      <td>4.513</td>\n      <td>4.518</td>\n      <td>2.987</td>\n      <td>2.991</td>\n      <td>4.498</td>\n      <td>1.440</td>\n      <td>4.311</td>\n    </tr>\n    <tr>\n      <th>th</th>\n      <td>0.093</td>\n      <td>0.093</td>\n      <td>0.079</td>\n      <td>0.074</td>\n      <td>0.141</td>\n      <td>0.053</td>\n      <td>0.053</td>\n    </tr>\n    <tr>\n      <th>vn</th>\n      <td>0.381</td>\n      <td>0.381</td>\n      <td>0.243</td>\n      <td>0.244</td>\n      <td>0.162</td>\n      <td>0.269</td>\n      <td>0.316</td>\n    </tr>\n    <tr>\n      <th>za</th>\n      <td>0.192</td>\n      <td>0.193</td>\n      <td>0.296</td>\n      <td>0.294</td>\n      <td>0.386</td>\n      <td>0.054</td>\n      <td>0.256</td>\n    </tr>\n    <tr>\n      <th>au</th>\n      <td>0.928</td>\n      <td>0.928</td>\n      <td>1.122</td>\n      <td>1.128</td>\n      <td>1.110</td>\n      <td>0.192</td>\n      <td>0.848</td>\n    </tr>\n    <tr>\n      <th>br</th>\n      <td>1.252</td>\n      <td>1.253</td>\n      <td>1.192</td>\n      <td>1.158</td>\n      <td>2.417</td>\n      <td>0.488</td>\n      <td>0.892</td>\n    </tr>\n    <tr>\n      <th>fr</th>\n      <td>1.681</td>\n      <td>1.681</td>\n      <td>1.640</td>\n      <td>1.643</td>\n      <td>0.968</td>\n      <td>0.479</td>\n      <td>0.956</td>\n    </tr>\n    <tr>\n      <th>pl</th>\n      <td>1.479</td>\n      <td>1.479</td>\n      <td>1.360</td>\n      <td>1.346</td>\n      <td>1.551</td>\n      <td>0.339</td>\n      <td>1.154</td>\n    </tr>\n    <tr>\n      <th>us</th>\n      <td>0.224</td>\n      <td>0.224</td>\n      <td>0.252</td>\n      <td>0.253</td>\n      <td>0.335</td>\n      <td>0.396</td>\n      <td>0.660</td>\n    </tr>\n    <tr>\n      <th>fi</th>\n      <td>0.338</td>\n      <td>0.338</td>\n      <td>0.317</td>\n      <td>0.316</td>\n      <td>0.208</td>\n      <td>0.054</td>\n      <td>0.150</td>\n    </tr>\n    <tr>\n      <th>no</th>\n    
  <td>0.363</td>\n      <td>0.362</td>\n      <td>0.299</td>\n      <td>0.298</td>\n      <td>0.364</td>\n      <td>0.106</td>\n      <td>0.163</td>\n    </tr>\n    <tr>\n      <th>ar</th>\n      <td>0.205</td>\n      <td>0.205</td>\n      <td>0.216</td>\n      <td>0.206</td>\n      <td>0.481</td>\n      <td>0.064</td>\n      <td>0.148</td>\n    </tr>\n    <tr>\n      <th>ro</th>\n      <td>0.458</td>\n      <td>0.458</td>\n      <td>0.310</td>\n      <td>0.306</td>\n      <td>0.589</td>\n      <td>0.065</td>\n      <td>0.282</td>\n    </tr>\n    <tr>\n      <th>tr</th>\n      <td>0.186</td>\n      <td>0.186</td>\n      <td>0.194</td>\n      <td>0.183</td>\n      <td>0.326</td>\n      <td>0.105</td>\n      <td>0.216</td>\n    </tr>\n    <tr>\n      <th>az</th>\n      <td>0.058</td>\n      <td>0.058</td>\n      <td>0.017</td>\n      <td>0.016</td>\n      <td>0.163</td>\n      <td>0.006</td>\n      <td>0.022</td>\n    </tr>\n    <tr>\n      <th>biz</th>\n      <td>0.180</td>\n      <td>0.181</td>\n      <td>0.282</td>\n      <td>0.286</td>\n      <td>0.219</td>\n      <td>0.996</td>\n      <td>0.306</td>\n    </tr>\n    <tr>\n      <th>by</th>\n      <td>0.195</td>\n      <td>0.196</td>\n      <td>0.116</td>\n      <td>0.116</td>\n      <td>0.141</td>\n      <td>0.042</td>\n      <td>0.116</td>\n    </tr>\n    <tr>\n      <th>cat</th>\n      <td>0.164</td>\n      <td>0.164</td>\n      <td>0.068</td>\n      <td>0.065</td>\n      <td>0.051</td>\n      <td>0.011</td>\n      <td>0.048</td>\n    </tr>\n    <tr>\n      <th>cc</th>\n      <td>0.112</td>\n      <td>0.110</td>\n      <td>0.137</td>\n      <td>0.137</td>\n      <td>0.138</td>\n      <td>0.544</td>\n      <td>0.156</td>\n    </tr>\n    <tr>\n      <th>ch</th>\n      <td>0.549</td>\n      <td>0.549</td>\n      <td>0.808</td>\n      <td>0.782</td>\n      <td>0.462</td>\n      <td>0.147</td>\n      <td>0.329</td>\n    </tr>\n    <tr>\n      <th>ua</th>\n      <td>0.758</td>\n      <td>0.760</td>\n      
<td>0.429</td>\n      <td>0.435</td>\n      <td>0.592</td>\n      <td>0.259</td>\n      <td>0.402</td>\n    </tr>\n    <tr>\n      <th>cl</th>\n      <td>0.107</td>\n      <td>0.108</td>\n      <td>0.155</td>\n      <td>0.154</td>\n      <td>0.311</td>\n      <td>0.057</td>\n      <td>0.147</td>\n    </tr>\n    <tr>\n      <th>tw</th>\n      <td>0.523</td>\n      <td>0.526</td>\n      <td>0.593</td>\n      <td>0.596</td>\n      <td>0.323</td>\n      <td>0.090</td>\n      <td>0.716</td>\n    </tr>\n    <tr>\n      <th>co</th>\n      <td>0.417</td>\n      <td>0.418</td>\n      <td>0.379</td>\n      <td>0.387</td>\n      <td>0.698</td>\n      <td>0.539</td>\n      <td>0.554</td>\n    </tr>\n    <tr>\n      <th>com</th>\n      <td>46.309</td>\n      <td>46.286</td>\n      <td>47.160</td>\n      <td>47.446</td>\n      <td>47.796</td>\n      <td>58.393</td>\n      <td>49.626</td>\n    </tr>\n    <tr>\n      <th>ee</th>\n      <td>0.194</td>\n      <td>0.192</td>\n      <td>0.096</td>\n      <td>0.090</td>\n      <td>0.048</td>\n      <td>0.014</td>\n      <td>0.051</td>\n    </tr>\n    <tr>\n      <th>es</th>\n      <td>0.900</td>\n      <td>0.900</td>\n      <td>0.725</td>\n      <td>0.727</td>\n      <td>0.698</td>\n      <td>0.227</td>\n      <td>0.525</td>\n    </tr>\n    <tr>\n      <th>ge</th>\n      <td>0.053</td>\n      <td>0.054</td>\n      <td>0.023</td>\n      <td>0.022</td>\n      <td>0.036</td>\n      <td>0.005</td>\n      <td>0.025</td>\n    </tr>\n    <tr>\n      <th>gr</th>\n      <td>0.421</td>\n      <td>0.422</td>\n      <td>0.292</td>\n      <td>0.282</td>\n      <td>0.656</td>\n      <td>0.081</td>\n      <td>0.211</td>\n    </tr>\n    <tr>\n      <th>hk</th>\n      <td>0.088</td>\n      <td>0.089</td>\n      <td>0.076</td>\n      <td>0.073</td>\n      <td>0.097</td>\n      <td>0.062</td>\n      <td>0.088</td>\n    </tr>\n    <tr>\n      <th>hr</th>\n      <td>0.161</td>\n      <td>0.161</td>\n      <td>0.087</td>\n      <td>0.082</td>\n      
<td>0.110</td>\n      <td>0.021</td>\n      <td>0.065</td>\n    </tr>\n    <tr>\n      <th>kz</th>\n      <td>0.118</td>\n      <td>0.119</td>\n      <td>0.079</td>\n      <td>0.079</td>\n      <td>0.129</td>\n      <td>0.023</td>\n      <td>0.102</td>\n    </tr>\n    <tr>\n      <th>lv</th>\n      <td>0.148</td>\n      <td>0.148</td>\n      <td>0.075</td>\n      <td>0.071</td>\n      <td>0.058</td>\n      <td>0.014</td>\n      <td>0.053</td>\n    </tr>\n    <tr>\n      <th>mx</th>\n      <td>0.187</td>\n      <td>0.187</td>\n      <td>0.196</td>\n      <td>0.190</td>\n      <td>0.633</td>\n      <td>0.152</td>\n      <td>0.164</td>\n    </tr>\n    <tr>\n      <th>my</th>\n      <td>0.095</td>\n      <td>0.095</td>\n      <td>0.092</td>\n      <td>0.090</td>\n      <td>0.105</td>\n      <td>0.064</td>\n      <td>0.109</td>\n    </tr>\n    <tr>\n      <th>pt</th>\n      <td>0.254</td>\n      <td>0.255</td>\n      <td>0.182</td>\n      <td>0.178</td>\n      <td>0.213</td>\n      <td>0.119</td>\n      <td>0.129</td>\n    </tr>\n    <tr>\n      <th>sg</th>\n      <td>0.065</td>\n      <td>0.065</td>\n      <td>0.070</td>\n      <td>0.070</td>\n      <td>0.098</td>\n      <td>0.049</td>\n      <td>0.083</td>\n    </tr>\n    <tr>\n      <th>pro</th>\n      <td>0.064</td>\n      <td>0.064</td>\n      <td>0.070</td>\n      <td>0.072</td>\n      <td>0.167</td>\n      <td>0.071</td>\n      <td>0.072</td>\n    </tr>\n    <tr>\n      <th>cz</th>\n      <td>0.970</td>\n      <td>0.969</td>\n      <td>0.851</td>\n      <td>0.836</td>\n      <td>0.780</td>\n      <td>0.114</td>\n      <td>0.370</td>\n    </tr>\n    <tr>\n      <th>de</th>\n      <td>3.847</td>\n      <td>3.845</td>\n      <td>5.121</td>\n      <td>4.999</td>\n      <td>3.107</td>\n      <td>0.925</td>\n      <td>2.398</td>\n    </tr>\n    <tr>\n      <th>dk</th>\n      <td>0.395</td>\n      <td>0.394</td>\n      <td>0.537</td>\n      <td>0.538</td>\n      <td>0.317</td>\n      <td>0.125</td>\n      
<td>0.240</td>\n    </tr>\n    <tr>\n      <th>edu</th>\n      <td>1.056</td>\n      <td>1.059</td>\n      <td>0.257</td>\n      <td>0.263</td>\n      <td>0.306</td>\n      <td>1.040</td>\n      <td>0.398</td>\n    </tr>\n    <tr>\n      <th>eu</th>\n      <td>0.704</td>\n      <td>0.704</td>\n      <td>0.649</td>\n      <td>0.641</td>\n      <td>0.501</td>\n      <td>0.372</td>\n      <td>0.480</td>\n    </tr>\n    <tr>\n      <th>gov</th>\n      <td>0.358</td>\n      <td>0.357</td>\n      <td>0.055</td>\n      <td>0.053</td>\n      <td>0.107</td>\n      <td>0.511</td>\n      <td>0.172</td>\n    </tr>\n    <tr>\n      <th>ie</th>\n      <td>0.144</td>\n      <td>0.144</td>\n      <td>0.139</td>\n      <td>0.139</td>\n      <td>0.177</td>\n      <td>0.044</td>\n      <td>0.132</td>\n    </tr>\n    <tr>\n      <th>lt</th>\n      <td>0.247</td>\n      <td>0.247</td>\n      <td>0.135</td>\n      <td>0.130</td>\n      <td>0.115</td>\n      <td>0.025</td>\n      <td>0.084</td>\n    </tr>\n    <tr>\n      <th>info</th>\n      <td>1.115</td>\n      <td>1.119</td>\n      <td>0.741</td>\n      <td>0.743</td>\n      <td>0.863</td>\n      <td>0.754</td>\n      <td>1.062</td>\n    </tr>\n    <tr>\n      <th>io</th>\n      <td>0.140</td>\n      <td>0.140</td>\n      <td>0.345</td>\n      <td>0.361</td>\n      <td>0.626</td>\n      <td>0.939</td>\n      <td>0.207</td>\n    </tr>\n    <tr>\n      <th>is</th>\n      <td>0.060</td>\n      <td>0.060</td>\n      <td>0.037</td>\n      <td>0.037</td>\n      <td>0.041</td>\n      <td>0.034</td>\n      <td>0.036</td>\n    </tr>\n    <tr>\n      <th>net</th>\n      <td>3.656</td>\n      <td>3.652</td>\n      <td>3.491</td>\n      <td>3.492</td>\n      <td>4.064</td>\n      <td>15.653</td>\n      <td>4.480</td>\n    </tr>\n    <tr>\n      <th>nl</th>\n      <td>1.360</td>\n      <td>1.359</td>\n      <td>1.944</td>\n      <td>1.930</td>\n      <td>0.568</td>\n      <td>0.453</td>\n      <td>1.119</td>\n    </tr>\n    <tr>\n      
<th>nu</th>\n      <td>0.056</td>\n      <td>0.056</td>\n      <td>0.078</td>\n      <td>0.078</td>\n      <td>0.031</td>\n      <td>0.012</td>\n      <td>0.243</td>\n    </tr>\n    <tr>\n      <th>org</th>\n      <td>5.809</td>\n      <td>5.811</td>\n      <td>4.129</td>\n      <td>4.064</td>\n      <td>4.875</td>\n      <td>4.228</td>\n      <td>7.252</td>\n    </tr>\n    <tr>\n      <th>si</th>\n      <td>0.152</td>\n      <td>0.152</td>\n      <td>0.102</td>\n      <td>0.098</td>\n      <td>0.096</td>\n      <td>0.013</td>\n      <td>0.049</td>\n    </tr>\n    <tr>\n      <th>sk</th>\n      <td>0.308</td>\n      <td>0.308</td>\n      <td>0.260</td>\n      <td>0.255</td>\n      <td>0.380</td>\n      <td>0.049</td>\n      <td>0.108</td>\n    </tr>\n    <tr>\n      <th>su</th>\n      <td>0.074</td>\n      <td>0.074</td>\n      <td>0.056</td>\n      <td>0.056</td>\n      <td>0.112</td>\n      <td>0.027</td>\n      <td>0.091</td>\n    </tr>\n    <tr>\n      <th>tk</th>\n      <td>0.064</td>\n      <td>0.064</td>\n      <td>0.073</td>\n      <td>0.076</td>\n      <td>0.054</td>\n      <td>0.013</td>\n      <td>0.101</td>\n    </tr>\n    <tr>\n      <th>tv</th>\n      <td>0.222</td>\n      <td>0.222</td>\n      <td>0.109</td>\n      <td>0.108</td>\n      <td>0.325</td>\n      <td>0.384</td>\n      <td>0.202</td>\n    </tr>\n    <tr>\n      <th>club</th>\n      <td>0.105</td>\n      <td>0.105</td>\n      <td>0.132</td>\n      <td>0.137</td>\n      <td>0.188</td>\n      <td>0.097</td>\n      <td>0.815</td>\n    </tr>\n    <tr>\n      <th>xyz</th>\n      <td>0.097</td>\n      <td>0.097</td>\n      <td>0.170</td>\n      <td>0.175</td>\n      <td>0.221</td>\n      <td>0.109</td>\n      <td>0.189</td>\n    </tr>\n    <tr>\n      <th>top</th>\n      <td>0.063</td>\n      <td>0.063</td>\n      <td>0.272</td>\n      <td>0.282</td>\n      <td>0.079</td>\n      <td>0.054</td>\n      <td>0.211</td>\n    </tr>\n    <tr>\n      <th>site</th>\n      <td>0.075</td>\n      
<td>0.075</td>\n      <td>0.478</td>\n      <td>0.500</td>\n      <td>0.103</td>\n      <td>0.036</td>\n      <td>0.167</td>\n    </tr>\n    <tr>\n      <th>online</th>\n      <td>0.063</td>\n      <td>0.063</td>\n      <td>0.080</td>\n      <td>0.083</td>\n      <td>0.169</td>\n      <td>0.060</td>\n      <td>0.106</td>\n    </tr>\n    <tr>\n      <th>live</th>\n      <td>0.151</td>\n      <td>0.152</td>\n      <td>0.303</td>\n      <td>0.320</td>\n      <td>0.057</td>\n      <td>0.033</td>\n      <td>0.052</td>\n    </tr>\n    <tr>\n      <th>blog</th>\n      <td>0.097</td>\n      <td>0.097</td>\n      <td>0.093</td>\n      <td>0.098</td>\n      <td>0.031</td>\n      <td>0.004</td>\n      <td>0.007</td>\n    </tr>\n  </tbody>\n</table>"
  },
  {
    "path": "plots/tld/selected-crawls-percentage.html",
    "content": "<table border=\"1\" class=\"dataframe tablesorter tablepercentage tablesearcher\">\n  <thead>\n    <tr style=\"text-align: right;\">\n      <th>crawl</th>\n      <th>CC-MAIN-2008-2009</th>\n      <th>CC-MAIN-2012</th>\n      <th>CC-MAIN-2014-10</th>\n      <th>CC-MAIN-2016-30</th>\n      <th>CC-MAIN-2019-09</th>\n      <th>CC-MAIN-2022-49</th>\n      <th>CC-MAIN-2026-17</th>\n    </tr>\n    <tr>\n      <th>tld</th>\n      <th></th>\n      <th></th>\n      <th></th>\n      <th></th>\n      <th></th>\n      <th></th>\n      <th></th>\n    </tr>\n  </thead>\n  <tbody>\n    <tr>\n      <th>ae</th>\n      <td>0.0010</td>\n      <td>0.0101</td>\n      <td>0.0123</td>\n      <td>0.0099</td>\n      <td>0.0266</td>\n      <td>0.0452</td>\n      <td>0.0743</td>\n    </tr>\n    <tr>\n      <th>ai</th>\n      <td>0.0000</td>\n      <td>0.0004</td>\n      <td>0.0000</td>\n      <td>0.0000</td>\n      <td>0.0049</td>\n      <td>0.0257</td>\n      <td>0.1447</td>\n    </tr>\n    <tr>\n      <th>app</th>\n      <td>NaN</td>\n      <td>NaN</td>\n      <td>NaN</td>\n      <td>NaN</td>\n      <td>0.0054</td>\n      <td>0.0991</td>\n      <td>0.1502</td>\n    </tr>\n    <tr>\n      <th>ar</th>\n      <td>0.0818</td>\n      <td>0.2379</td>\n      <td>0.0991</td>\n      <td>0.0782</td>\n      <td>0.2121</td>\n      <td>0.3143</td>\n      <td>0.3572</td>\n    </tr>\n    <tr>\n      <th>at</th>\n      <td>0.0025</td>\n      <td>0.3795</td>\n      <td>0.0632</td>\n      <td>0.1555</td>\n      <td>0.4176</td>\n      <td>0.4889</td>\n      <td>0.4929</td>\n    </tr>\n    <tr>\n      <th>au</th>\n      <td>0.6008</td>\n      <td>0.9929</td>\n      <td>0.4579</td>\n      <td>0.5643</td>\n      <td>0.9371</td>\n      <td>0.2561</td>\n      <td>0.9060</td>\n    </tr>\n    <tr>\n      <th>az</th>\n      <td>0.0002</td>\n      <td>0.0060</td>\n      <td>0.0012</td>\n      <td>0.0031</td>\n      <td>0.0393</td>\n      <td>0.0407</td>\n      <td>0.0562</td>\n    </tr>\n    <tr>\n     
 <th>ba</th>\n      <td>0.0014</td>\n      <td>0.0101</td>\n      <td>0.0020</td>\n      <td>0.0028</td>\n      <td>0.0244</td>\n      <td>0.0377</td>\n      <td>0.0565</td>\n    </tr>\n    <tr>\n      <th>be</th>\n      <td>0.0024</td>\n      <td>0.3970</td>\n      <td>0.0564</td>\n      <td>0.1547</td>\n      <td>0.4498</td>\n      <td>0.6205</td>\n      <td>0.5564</td>\n    </tr>\n    <tr>\n      <th>bg</th>\n      <td>0.0010</td>\n      <td>0.0379</td>\n      <td>0.0078</td>\n      <td>0.0161</td>\n      <td>0.1108</td>\n      <td>0.1413</td>\n      <td>0.1411</td>\n    </tr>\n    <tr>\n      <th>biz</th>\n      <td>0.5548</td>\n      <td>0.3744</td>\n      <td>0.0384</td>\n      <td>0.0532</td>\n      <td>0.2749</td>\n      <td>0.1651</td>\n      <td>0.1356</td>\n    </tr>\n    <tr>\n      <th>blog</th>\n      <td>NaN</td>\n      <td>NaN</td>\n      <td>NaN</td>\n      <td>NaN</td>\n      <td>0.0886</td>\n      <td>0.1750</td>\n      <td>0.0423</td>\n    </tr>\n    <tr>\n      <th>br</th>\n      <td>0.3366</td>\n      <td>0.7638</td>\n      <td>0.2175</td>\n      <td>0.2958</td>\n      <td>1.1821</td>\n      <td>0.3424</td>\n      <td>1.7511</td>\n    </tr>\n    <tr>\n      <th>by</th>\n      <td>0.0023</td>\n      <td>0.0352</td>\n      <td>0.0009</td>\n      <td>0.0138</td>\n      <td>0.2154</td>\n      <td>0.1632</td>\n      <td>0.2193</td>\n    </tr>\n    <tr>\n      <th>ca</th>\n      <td>0.0141</td>\n      <td>0.6896</td>\n      <td>0.4689</td>\n      <td>0.5205</td>\n      <td>0.7431</td>\n      <td>0.9764</td>\n      <td>0.8631</td>\n    </tr>\n    <tr>\n      <th>cat</th>\n      <td>0.0004</td>\n      <td>0.0495</td>\n      <td>0.0103</td>\n      <td>0.0150</td>\n      <td>0.0926</td>\n      <td>0.1412</td>\n      <td>0.1229</td>\n    </tr>\n    <tr>\n      <th>cc</th>\n      <td>0.0035</td>\n      <td>0.0956</td>\n      <td>0.0404</td>\n      <td>0.1105</td>\n      <td>0.1024</td>\n      <td>0.1143</td>\n      <td>0.1727</td>\n    </tr>\n    <tr>\n   
   <th>ch</th>\n      <td>0.0033</td>\n      <td>0.5263</td>\n      <td>0.1018</td>\n      <td>0.2150</td>\n      <td>0.5639</td>\n      <td>0.6393</td>\n      <td>0.6620</td>\n    </tr>\n    <tr>\n      <th>cl</th>\n      <td>0.0010</td>\n      <td>0.0834</td>\n      <td>0.0660</td>\n      <td>0.0633</td>\n      <td>0.1189</td>\n      <td>0.2032</td>\n      <td>0.2402</td>\n    </tr>\n    <tr>\n      <th>club</th>\n      <td>NaN</td>\n      <td>NaN</td>\n      <td>0.0000</td>\n      <td>0.0004</td>\n      <td>0.0990</td>\n      <td>0.0749</td>\n      <td>0.0653</td>\n    </tr>\n    <tr>\n      <th>cn</th>\n      <td>1.0882</td>\n      <td>0.4206</td>\n      <td>0.0157</td>\n      <td>0.3095</td>\n      <td>0.8912</td>\n      <td>0.7129</td>\n      <td>1.1141</td>\n    </tr>\n    <tr>\n      <th>co</th>\n      <td>0.0165</td>\n      <td>0.0453</td>\n      <td>0.0328</td>\n      <td>0.0638</td>\n      <td>0.4111</td>\n      <td>0.4344</td>\n      <td>0.4437</td>\n    </tr>\n    <tr>\n      <th>com</th>\n      <td>71.2776</td>\n      <td>55.7739</td>\n      <td>74.6893</td>\n      <td>69.1709</td>\n      <td>46.4954</td>\n      <td>48.5718</td>\n      <td>43.0835</td>\n    </tr>\n    <tr>\n      <th>cz</th>\n      <td>0.0065</td>\n      <td>0.7823</td>\n      <td>0.0480</td>\n      <td>0.2278</td>\n      <td>1.0365</td>\n      <td>1.1044</td>\n      <td>1.1445</td>\n    </tr>\n    <tr>\n      <th>de</th>\n      <td>0.0523</td>\n      <td>4.8419</td>\n      <td>0.7005</td>\n      <td>1.5104</td>\n      <td>4.0367</td>\n      <td>4.4966</td>\n      <td>4.4824</td>\n    </tr>\n    <tr>\n      <th>dev</th>\n      <td>NaN</td>\n      <td>NaN</td>\n      <td>NaN</td>\n      <td>NaN</td>\n      <td>0.0000</td>\n      <td>0.0189</td>\n      <td>0.0520</td>\n    </tr>\n    <tr>\n      <th>dk</th>\n      <td>0.0033</td>\n      <td>0.3703</td>\n      <td>0.0803</td>\n      <td>0.1524</td>\n      <td>0.3844</td>\n      <td>0.4507</td>\n      <td>0.5416</td>\n    </tr>\n    
<tr>\n      <th>edu</th>\n      <td>1.2782</td>\n      <td>0.6178</td>\n      <td>3.0893</td>\n      <td>2.9472</td>\n      <td>0.6385</td>\n      <td>1.5058</td>\n      <td>0.8516</td>\n    </tr>\n    <tr>\n      <th>ee</th>\n      <td>0.0003</td>\n      <td>0.0481</td>\n      <td>0.0058</td>\n      <td>0.0134</td>\n      <td>0.1142</td>\n      <td>0.1539</td>\n      <td>0.1632</td>\n    </tr>\n    <tr>\n      <th>es</th>\n      <td>0.0339</td>\n      <td>0.6735</td>\n      <td>0.1764</td>\n      <td>0.2350</td>\n      <td>0.8842</td>\n      <td>1.0312</td>\n      <td>0.9327</td>\n    </tr>\n    <tr>\n      <th>eu</th>\n      <td>0.0045</td>\n      <td>0.4587</td>\n      <td>0.1181</td>\n      <td>0.1841</td>\n      <td>0.7728</td>\n      <td>0.7487</td>\n      <td>0.7473</td>\n    </tr>\n    <tr>\n      <th>fi</th>\n      <td>0.0009</td>\n      <td>0.1756</td>\n      <td>0.0262</td>\n      <td>0.0514</td>\n      <td>0.2874</td>\n      <td>0.3940</td>\n      <td>0.3680</td>\n    </tr>\n    <tr>\n      <th>fm</th>\n      <td>0.0001</td>\n      <td>0.0631</td>\n      <td>0.0582</td>\n      <td>0.0879</td>\n      <td>0.0401</td>\n      <td>0.0665</td>\n      <td>0.0452</td>\n    </tr>\n    <tr>\n      <th>fr</th>\n      <td>0.0197</td>\n      <td>1.3196</td>\n      <td>0.2698</td>\n      <td>0.4410</td>\n      <td>1.6453</td>\n      <td>1.9843</td>\n      <td>1.9828</td>\n    </tr>\n    <tr>\n      <th>gov</th>\n      <td>0.3797</td>\n      <td>0.2691</td>\n      <td>1.6173</td>\n      <td>1.5328</td>\n      <td>0.2410</td>\n      <td>0.4898</td>\n      <td>0.4072</td>\n    </tr>\n    <tr>\n      <th>gr</th>\n      <td>0.0014</td>\n      <td>0.1162</td>\n      <td>0.0574</td>\n      <td>0.0765</td>\n      <td>0.3998</td>\n      <td>0.5672</td>\n      <td>0.5375</td>\n    </tr>\n    <tr>\n      <th>hk</th>\n      <td>0.0355</td>\n      <td>0.0431</td>\n      <td>0.0170</td>\n      <td>0.0253</td>\n      <td>0.0783</td>\n      <td>0.1074</td>\n      <td>0.1202</td>\n   
 </tr>\n    <tr>\n      <th>hr</th>\n      <td>0.0034</td>\n      <td>0.0683</td>\n      <td>0.0136</td>\n      <td>0.0279</td>\n      <td>0.0949</td>\n      <td>0.1503</td>\n      <td>0.1646</td>\n    </tr>\n    <tr>\n      <th>hu</th>\n      <td>0.0025</td>\n      <td>0.3731</td>\n      <td>0.0466</td>\n      <td>0.0971</td>\n      <td>0.4631</td>\n      <td>0.5871</td>\n      <td>0.5229</td>\n    </tr>\n    <tr>\n      <th>id</th>\n      <td>0.0006</td>\n      <td>0.0648</td>\n      <td>0.0556</td>\n      <td>0.0675</td>\n      <td>0.1580</td>\n      <td>0.2769</td>\n      <td>0.4535</td>\n    </tr>\n    <tr>\n      <th>ie</th>\n      <td>0.0017</td>\n      <td>0.1182</td>\n      <td>0.0746</td>\n      <td>0.0920</td>\n      <td>0.1359</td>\n      <td>0.2019</td>\n      <td>0.1462</td>\n    </tr>\n    <tr>\n      <th>il</th>\n      <td>0.0136</td>\n      <td>0.0864</td>\n      <td>0.0216</td>\n      <td>0.0395</td>\n      <td>0.1694</td>\n      <td>0.0430</td>\n      <td>0.2268</td>\n    </tr>\n    <tr>\n      <th>in</th>\n      <td>0.0100</td>\n      <td>0.2149</td>\n      <td>0.1058</td>\n      <td>0.1037</td>\n      <td>0.4125</td>\n      <td>0.5466</td>\n      <td>0.6916</td>\n    </tr>\n    <tr>\n      <th>info</th>\n      <td>1.8063</td>\n      <td>1.3288</td>\n      <td>0.1828</td>\n      <td>0.2468</td>\n      <td>1.4361</td>\n      <td>0.7173</td>\n      <td>0.6015</td>\n    </tr>\n    <tr>\n      <th>int</th>\n      <td>0.0000</td>\n      <td>0.0135</td>\n      <td>0.0739</td>\n      <td>0.0816</td>\n      <td>0.0166</td>\n      <td>0.0328</td>\n      <td>0.0188</td>\n    </tr>\n    <tr>\n      <th>io</th>\n      <td>NaN</td>\n      <td>0.0049</td>\n      <td>0.0128</td>\n      <td>0.0189</td>\n      <td>0.1391</td>\n      <td>0.2229</td>\n      <td>0.3323</td>\n    </tr>\n    <tr>\n      <th>ir</th>\n      <td>0.0007</td>\n      <td>0.0553</td>\n      <td>0.0141</td>\n      <td>0.0144</td>\n      <td>0.3396</td>\n      <td>0.3407</td>\n      
<td>0.1045</td>\n    </tr>\n    <tr>\n      <th>is</th>\n      <td>0.0001</td>\n      <td>0.0345</td>\n      <td>0.0379</td>\n      <td>0.0362</td>\n      <td>0.0396</td>\n      <td>0.0564</td>\n      <td>0.0523</td>\n    </tr>\n    <tr>\n      <th>it</th>\n      <td>0.0439</td>\n      <td>1.3305</td>\n      <td>0.2254</td>\n      <td>0.4405</td>\n      <td>1.6564</td>\n      <td>2.0824</td>\n      <td>1.7880</td>\n    </tr>\n    <tr>\n      <th>jp</th>\n      <td>0.0518</td>\n      <td>1.1743</td>\n      <td>0.1047</td>\n      <td>0.6075</td>\n      <td>2.1451</td>\n      <td>1.5354</td>\n      <td>2.3647</td>\n    </tr>\n    <tr>\n      <th>kr</th>\n      <td>0.0009</td>\n      <td>0.0780</td>\n      <td>0.0451</td>\n      <td>0.0846</td>\n      <td>0.3447</td>\n      <td>0.3294</td>\n      <td>0.4309</td>\n    </tr>\n    <tr>\n      <th>kz</th>\n      <td>0.0003</td>\n      <td>0.0215</td>\n      <td>0.0009</td>\n      <td>0.0096</td>\n      <td>0.1191</td>\n      <td>0.1160</td>\n      <td>0.1437</td>\n    </tr>\n    <tr>\n      <th>lt</th>\n      <td>0.0003</td>\n      <td>0.0999</td>\n      <td>0.0063</td>\n      <td>0.0218</td>\n      <td>0.1428</td>\n      <td>0.1666</td>\n      <td>0.1830</td>\n    </tr>\n    <tr>\n      <th>lv</th>\n      <td>0.0013</td>\n      <td>0.0609</td>\n      <td>0.0048</td>\n      <td>0.0140</td>\n      <td>0.0987</td>\n      <td>0.1007</td>\n      <td>0.1061</td>\n    </tr>\n    <tr>\n      <th>ma</th>\n      <td>0.0008</td>\n      <td>0.0081</td>\n      <td>0.0009</td>\n      <td>0.0028</td>\n      <td>0.0206</td>\n      <td>0.0330</td>\n      <td>0.0516</td>\n    </tr>\n    <tr>\n      <th>md</th>\n      <td>0.0005</td>\n      <td>0.0168</td>\n      <td>0.0016</td>\n      <td>0.0034</td>\n      <td>0.0358</td>\n      <td>0.0423</td>\n      <td>0.0562</td>\n    </tr>\n    <tr>\n      <th>me</th>\n      <td>0.0000</td>\n      <td>0.0586</td>\n      <td>0.0367</td>\n      <td>0.0557</td>\n      <td>0.3158</td>\n      
<td>0.2102</td>\n      <td>0.1820</td>\n    </tr>\n    <tr>\n      <th>mx</th>\n      <td>0.0786</td>\n      <td>0.1460</td>\n      <td>0.0752</td>\n      <td>0.0898</td>\n      <td>0.1991</td>\n      <td>0.1443</td>\n      <td>0.2994</td>\n    </tr>\n    <tr>\n      <th>my</th>\n      <td>0.0302</td>\n      <td>0.0465</td>\n      <td>0.0285</td>\n      <td>0.0413</td>\n      <td>0.0788</td>\n      <td>0.1082</td>\n      <td>0.1262</td>\n    </tr>\n    <tr>\n      <th>net</th>\n      <td>9.1996</td>\n      <td>5.4501</td>\n      <td>3.2462</td>\n      <td>3.4269</td>\n      <td>4.3645</td>\n      <td>3.7162</td>\n      <td>3.0569</td>\n    </tr>\n    <tr>\n      <th>news</th>\n      <td>NaN</td>\n      <td>NaN</td>\n      <td>NaN</td>\n      <td>0.0017</td>\n      <td>0.0349</td>\n      <td>0.0820</td>\n      <td>0.0890</td>\n    </tr>\n    <tr>\n      <th>ng</th>\n      <td>0.0008</td>\n      <td>0.0013</td>\n      <td>0.0008</td>\n      <td>0.0010</td>\n      <td>0.0359</td>\n      <td>0.0578</td>\n      <td>0.0633</td>\n    </tr>\n    <tr>\n      <th>nl</th>\n      <td>0.0073</td>\n      <td>1.4578</td>\n      <td>0.1612</td>\n      <td>0.4426</td>\n      <td>1.4049</td>\n      <td>1.8683</td>\n      <td>1.5077</td>\n    </tr>\n    <tr>\n      <th>no</th>\n      <td>0.0063</td>\n      <td>0.2375</td>\n      <td>0.0612</td>\n      <td>0.0717</td>\n      <td>0.2697</td>\n      <td>0.3572</td>\n      <td>0.3401</td>\n    </tr>\n    <tr>\n      <th>nu</th>\n      <td>0.0001</td>\n      <td>0.0661</td>\n      <td>0.0271</td>\n      <td>0.0208</td>\n      <td>0.0746</td>\n      <td>0.0571</td>\n      <td>0.0505</td>\n    </tr>\n    <tr>\n      <th>nz</th>\n      <td>0.0322</td>\n      <td>0.2274</td>\n      <td>0.0710</td>\n      <td>0.0815</td>\n      <td>0.2161</td>\n      <td>0.0694</td>\n      <td>0.1989</td>\n    </tr>\n    <tr>\n      <th>online</th>\n      <td>NaN</td>\n      <td>NaN</td>\n      <td>NaN</td>\n      <td>0.0013</td>\n      <td>0.0662</td>\n      
<td>0.1162</td>\n      <td>0.1450</td>\n    </tr>\n    <tr>\n      <th>org</th>\n      <td>8.1008</td>\n      <td>6.0302</td>\n      <td>9.8266</td>\n      <td>10.5466</td>\n      <td>5.4654</td>\n      <td>6.5231</td>\n      <td>5.6526</td>\n    </tr>\n    <tr>\n      <th>pe</th>\n      <td>0.0155</td>\n      <td>0.0288</td>\n      <td>0.0077</td>\n      <td>0.0153</td>\n      <td>0.0462</td>\n      <td>0.0722</td>\n      <td>0.0892</td>\n    </tr>\n    <tr>\n      <th>ph</th>\n      <td>0.0157</td>\n      <td>0.0316</td>\n      <td>0.0106</td>\n      <td>0.0096</td>\n      <td>0.0389</td>\n      <td>0.0558</td>\n      <td>0.0591</td>\n    </tr>\n    <tr>\n      <th>pk</th>\n      <td>0.0074</td>\n      <td>0.0141</td>\n      <td>0.0109</td>\n      <td>0.0137</td>\n      <td>0.0410</td>\n      <td>0.0694</td>\n      <td>0.0813</td>\n    </tr>\n    <tr>\n      <th>pl</th>\n      <td>0.1857</td>\n      <td>1.8377</td>\n      <td>0.0851</td>\n      <td>0.2665</td>\n      <td>1.5367</td>\n      <td>1.6926</td>\n      <td>1.9501</td>\n    </tr>\n    <tr>\n      <th>pro</th>\n      <td>0.0000</td>\n      <td>0.0082</td>\n      <td>0.0011</td>\n      <td>0.0019</td>\n      <td>0.0706</td>\n      <td>0.0862</td>\n      <td>0.0949</td>\n    </tr>\n    <tr>\n      <th>pt</th>\n      <td>0.0178</td>\n      <td>0.1074</td>\n      <td>0.0414</td>\n      <td>0.0590</td>\n      <td>0.2079</td>\n      <td>0.2815</td>\n      <td>0.3051</td>\n    </tr>\n    <tr>\n      <th>ro</th>\n      <td>0.0191</td>\n      <td>0.5855</td>\n      <td>0.0252</td>\n      <td>0.0918</td>\n      <td>0.4788</td>\n      <td>0.5701</td>\n      <td>0.6007</td>\n    </tr>\n    <tr>\n      <th>rs</th>\n      <td>0.0002</td>\n      <td>0.0389</td>\n      <td>0.0074</td>\n      <td>0.0186</td>\n      <td>0.0934</td>\n      <td>0.1484</td>\n      <td>0.1941</td>\n    </tr>\n    <tr>\n      <th>ru</th>\n      <td>0.0533</td>\n      <td>1.7328</td>\n      <td>0.0891</td>\n      <td>0.6050</td>\n      
<td>6.1098</td>\n      <td>4.3328</td>\n      <td>5.0205</td>\n    </tr>\n    <tr>\n      <th>se</th>\n      <td>0.0019</td>\n      <td>0.5328</td>\n      <td>0.1349</td>\n      <td>0.1918</td>\n      <td>0.7078</td>\n      <td>0.6305</td>\n      <td>0.6869</td>\n    </tr>\n    <tr>\n      <th>sg</th>\n      <td>0.0229</td>\n      <td>0.0486</td>\n      <td>0.0190</td>\n      <td>0.0219</td>\n      <td>0.0636</td>\n      <td>0.0838</td>\n      <td>0.0732</td>\n    </tr>\n    <tr>\n      <th>shop</th>\n      <td>NaN</td>\n      <td>NaN</td>\n      <td>NaN</td>\n      <td>0.0000</td>\n      <td>0.0243</td>\n      <td>0.1146</td>\n      <td>0.2094</td>\n    </tr>\n    <tr>\n      <th>si</th>\n      <td>0.0027</td>\n      <td>0.0568</td>\n      <td>0.0071</td>\n      <td>0.0105</td>\n      <td>0.0895</td>\n      <td>0.1520</td>\n      <td>0.1450</td>\n    </tr>\n    <tr>\n      <th>sk</th>\n      <td>0.0010</td>\n      <td>0.1600</td>\n      <td>0.0107</td>\n      <td>0.0502</td>\n      <td>0.2658</td>\n      <td>0.3710</td>\n      <td>0.4073</td>\n    </tr>\n    <tr>\n      <th>store</th>\n      <td>NaN</td>\n      <td>NaN</td>\n      <td>NaN</td>\n      <td>0.0000</td>\n      <td>0.0090</td>\n      <td>0.0503</td>\n      <td>0.0647</td>\n    </tr>\n    <tr>\n      <th>su</th>\n      <td>0.0001</td>\n      <td>0.0304</td>\n      <td>0.0025</td>\n      <td>0.0052</td>\n      <td>0.1152</td>\n      <td>0.0838</td>\n      <td>0.0897</td>\n    </tr>\n    <tr>\n      <th>th</th>\n      <td>0.0003</td>\n      <td>0.0217</td>\n      <td>0.0206</td>\n      <td>0.0316</td>\n      <td>0.0680</td>\n      <td>0.0807</td>\n      <td>0.1172</td>\n    </tr>\n    <tr>\n      <th>tk</th>\n      <td>0.0000</td>\n      <td>0.0244</td>\n      <td>0.0015</td>\n      <td>0.0021</td>\n      <td>0.0980</td>\n      <td>0.0441</td>\n      <td>0.0024</td>\n    </tr>\n    <tr>\n      <th>top</th>\n      <td>NaN</td>\n      <td>NaN</td>\n      <td>NaN</td>\n      <td>0.0001</td>\n      
<td>0.0404</td>\n      <td>0.0696</td>\n      <td>0.0947</td>\n    </tr>\n    <tr>\n      <th>tr</th>\n      <td>0.0623</td>\n      <td>0.1155</td>\n      <td>0.0503</td>\n      <td>0.0769</td>\n      <td>0.1942</td>\n      <td>0.0918</td>\n      <td>0.4316</td>\n    </tr>\n    <tr>\n      <th>tv</th>\n      <td>0.0013</td>\n      <td>0.2583</td>\n      <td>0.1455</td>\n      <td>0.1339</td>\n      <td>0.2392</td>\n      <td>0.2082</td>\n      <td>0.2101</td>\n    </tr>\n    <tr>\n      <th>tw</th>\n      <td>0.0923</td>\n      <td>0.1091</td>\n      <td>0.0505</td>\n      <td>0.0985</td>\n      <td>0.3121</td>\n      <td>0.1671</td>\n      <td>0.4419</td>\n    </tr>\n    <tr>\n      <th>ua</th>\n      <td>0.2189</td>\n      <td>0.4141</td>\n      <td>0.0099</td>\n      <td>0.0538</td>\n      <td>0.9978</td>\n      <td>0.3662</td>\n      <td>0.9063</td>\n    </tr>\n    <tr>\n      <th>uk</th>\n      <td>4.0402</td>\n      <td>3.5017</td>\n      <td>1.5931</td>\n      <td>1.6469</td>\n      <td>2.5171</td>\n      <td>0.4003</td>\n      <td>2.1624</td>\n    </tr>\n    <tr>\n      <th>us</th>\n      <td>0.0046</td>\n      <td>0.4174</td>\n      <td>0.3289</td>\n      <td>0.2699</td>\n      <td>0.3468</td>\n      <td>0.2397</td>\n      <td>0.1713</td>\n    </tr>\n    <tr>\n      <th>uy</th>\n      <td>0.0097</td>\n      <td>0.0156</td>\n      <td>0.0025</td>\n      <td>0.0125</td>\n      <td>0.0224</td>\n      <td>0.0330</td>\n      <td>0.0546</td>\n    </tr>\n    <tr>\n      <th>vn</th>\n      <td>0.0136</td>\n      <td>0.0797</td>\n      <td>0.0500</td>\n      <td>0.0666</td>\n      <td>0.3596</td>\n      <td>0.5066</td>\n      <td>0.6119</td>\n    </tr>\n    <tr>\n      <th>ws</th>\n      <td>0.0006</td>\n      <td>0.0840</td>\n      <td>0.0109</td>\n      <td>0.0081</td>\n      <td>0.0287</td>\n      <td>0.0174</td>\n      <td>0.0162</td>\n    </tr>\n    <tr>\n      <th>xyz</th>\n      <td>NaN</td>\n      <td>NaN</td>\n      <td>NaN</td>\n      <td>0.0008</td>\n    
  <td>0.1076</td>\n      <td>0.1504</td>\n      <td>0.1180</td>\n    </tr>\n    <tr>\n      <th>za</th>\n      <td>0.0126</td>\n      <td>0.1613</td>\n      <td>0.0737</td>\n      <td>0.1455</td>\n      <td>0.2097</td>\n      <td>0.0354</td>\n      <td>0.2119</td>\n    </tr>\n  </tbody>\n</table>"
  },
  {
    "path": "plots/tld/selected-tlds-by-year.csv",
    "content": "year,com,org,ru,net,de,uk,jp,edu,fr,it,pl,nl,br,cz,au,es\n(any),51.89498041088741,6.374690312897634,4.043836128047363,3.7540135387074742,3.3057420391065255,2.0636941568332174,1.6835267130601943,1.4252882516137377,1.378812124865615,1.3646056974912153,1.2560181267062749,1.121195143198995,0.9993935660133176,0.8268963567184797,0.8218748742850955,0.7555833791162748\n2009,71.19780889022911,8.098929313625348,0.05351614532270588,9.192244767771701,0.05229943066335908,4.035882904228814,0.05172600187665833,1.2758001274752773,0.019721612003983577,0.04384950419892673,0.18616156990118463,0.007326984931601306,0.3371385283395139,0.006517566005039137,0.601235299647618,0.03384002941450515\n2010,68.93182873699625,7.140400107811788,0.46442692696666116,6.0261543153559165,1.5071477519179124,3.1231446830343264,0.5019212492802659,1.3083111025801328,0.4374130392617395,0.5685715050740612,0.48197880870021537,0.4423738714382255,0.7884784029067625,0.1696544885787117,1.0174189743866877,0.2536865504094791\n2012,55.856399418493176,6.022725691210052,1.7092228719397122,5.430585937678828,4.752871358541379,3.454940323911269,1.1427540929401447,0.6065172816762283,1.2974944702218174,1.3003447285636904,1.794793492276718,1.4343236655889144,0.7561427194830521,0.7643201919764638,0.9834737749202592,0.6679580672316351\n2013,73.07832933177185,9.397807679592292,0.0576101583509711,3.269726670817926,1.122655213970551,1.9973525831718704,0.16378503435221878,2.906697821403832,0.3795106738238928,0.33725209585561516,0.02455189987001929,0.24826465816108723,0.2165408066061675,0.09510312100280675,0.633941239564323,0.22165410747988268\n2014,73.25154993537471,9.748709303575934,0.11357902937548757,3.2006759407993606,0.8102633151462019,1.7445533155041957,0.13037620976505668,3.36436596270053,0.3023998644590416,0.2627330934011718,0.1575522142061087,0.16476339518765715,0.2801926420741301,0.05591932198087427,0.508761576408202,0.180034989378696\n2015,73.30584506468368,10.25005088968117,0.10884730008636287,3.1636125
96472046,0.755234139038026,1.6705744755475465,0.1416879605482132,3.344217600154009,0.2810126137710399,0.24869594328930453,0.13983018448402285,0.1661677306088631,0.25895815983586756,0.047732897166349104,0.5070904400084749,0.17552997164679915\n2016,64.54523740307623,8.962913504852864,2.5554470749563514,3.6593123663986775,1.9722821636683794,1.7895415990305006,0.8124400136775266,2.4817418083983913,0.6309310471298197,0.6481674607899223,0.48744016390253647,0.5113775166677983,0.43462600911804555,0.520424381598946,0.6046418501995843,0.3567211033635578\n2017,56.54142420097272,5.643604702140739,5.298772605425257,4.217553207459812,2.8272361487220534,2.030203752445904,2.094932027320141,1.0213536337719042,1.1462942617265288,1.0752783830848343,0.9875203959783877,0.7282896047329713,0.8073278394888976,0.8525616264541258,0.70379930272525,0.7080291752576782\n2018,50.06329875319154,5.277805347037557,6.059784566481229,4.411463764554048,3.493396558772616,2.2178148687676367,2.164062012953355,0.7471671647649256,1.4179426241400284,1.278994949295683,1.3704808710201752,1.0185913442100039,0.9893937030239857,0.9309126422286781,0.781953100203275,0.802891385809908\n2019,46.20532576745491,5.676807344971467,5.085952469840225,3.9819656860964496,3.8838680030819392,2.3803074166762186,1.9926785479648448,0.888637799619372,1.6682126002159616,1.6259115040790517,1.5062165054968,1.381020765676773,1.187565937889545,0.9904209503277482,0.9193488692014473,0.9006401307095173\n2020,44.965464764988575,5.680418883349085,4.851169812730146,3.7145583596844514,4.030039960587272,2.295895268261546,1.8924009010047067,1.0761603584806487,1.7504655275200778,1.7043980826477478,1.5247171265991937,1.4581695573792826,1.3056568434903515,1.0175013685624041,0.9797505695472748,0.9101720911446329\n2021,44.32560044163435,5.712679745200201,4.785891026180248,3.5893809528625042,4.147310238160972,2.3843450021653423,1.885449413654711,1.281048084913162,1.790613167633786,1.7719417632847865,1.5852346915602094,1.517795518795522,1.398618093474
787,1.0486188707374928,1.0501915728082938,0.9687100013794343\n2022,45.37548169622278,6.158432878698863,4.136582366324254,3.558225755498412,4.20563086555731,1.750006179943287,1.7826016159829337,1.488170085944872,1.8476059411985666,1.8766664931169015,1.656898832651494,1.6432687465511873,1.0531541785479854,1.0284847667932469,0.798074391363609,0.9768547566332577\n2023,46.52580333169464,6.059793038227193,4.274594205438922,3.4923339674259486,4.295582610988845,0.7721516959075141,1.6617919730015456,1.3069957401439511,1.9138263335101504,2.060756103048291,1.6413990191796046,1.7580674048160572,0.4870726818081391,1.0794611766053126,0.41106841526393656,1.018274387928326\n2024,43.64514945495107,5.509630912040156,4.400192617327216,3.3161531547511496,4.028478270272748,2.0924533910547045,2.0801574283126305,1.1379001775504274,1.7504729335015614,1.9166658226647484,1.74936524608057,1.5397250866024828,1.4133306498645226,1.0307223655323625,1.0498701103812977,0.9845486508528206\n2025,43.16689356863301,5.164674228080854,4.284308762325859,3.2709505785983404,4.1637023690852555,2.175032223492076,2.2662357981506456,1.0180548378551648,1.7219803080962657,1.738790226931858,1.6972942763569192,1.4786093202261839,1.5635812915029117,1.015281826976945,1.1162430662993146,0.9009949248586931\n2026,41.87555481631105,5.510759830749804,4.599670566972649,3.049980817631032,4.368193211724322,2.039847060234517,2.47274095181078,0.8569106252161244,1.8887017950570846,1.7983108059302308,1.8780644166455187,1.4491169071701397,1.714666149334643,1.105213042595473,0.8949063165011313,0.9262104112494509\n"
  },
  {
    "path": "plots/tld/selected-tlds-by-year.html",
    "content": "<table border=\"1\" class=\"dataframe tablepercentage tablesorter\">\n  <thead>\n    <tr style=\"text-align: right;\">\n      <th></th>\n      <th>com</th>\n      <th>org</th>\n      <th>ru</th>\n      <th>net</th>\n      <th>de</th>\n      <th>uk</th>\n      <th>jp</th>\n      <th>edu</th>\n      <th>fr</th>\n      <th>it</th>\n      <th>pl</th>\n      <th>nl</th>\n      <th>br</th>\n      <th>cz</th>\n      <th>au</th>\n      <th>es</th>\n    </tr>\n    <tr>\n      <th>year</th>\n      <th></th>\n      <th></th>\n      <th></th>\n      <th></th>\n      <th></th>\n      <th></th>\n      <th></th>\n      <th></th>\n      <th></th>\n      <th></th>\n      <th></th>\n      <th></th>\n      <th></th>\n      <th></th>\n      <th></th>\n      <th></th>\n    </tr>\n  </thead>\n  <tbody>\n    <tr>\n      <th>(any)</th>\n      <td>51.89</td>\n      <td>6.37</td>\n      <td>4.04</td>\n      <td>3.75</td>\n      <td>3.31</td>\n      <td>2.06</td>\n      <td>1.68</td>\n      <td>1.43</td>\n      <td>1.38</td>\n      <td>1.36</td>\n      <td>1.26</td>\n      <td>1.12</td>\n      <td>1.00</td>\n      <td>0.83</td>\n      <td>0.82</td>\n      <td>0.76</td>\n    </tr>\n    <tr>\n      <th>2009</th>\n      <td>71.20</td>\n      <td>8.10</td>\n      <td>0.05</td>\n      <td>9.19</td>\n      <td>0.05</td>\n      <td>4.04</td>\n      <td>0.05</td>\n      <td>1.28</td>\n      <td>0.02</td>\n      <td>0.04</td>\n      <td>0.19</td>\n      <td>0.01</td>\n      <td>0.34</td>\n      <td>0.01</td>\n      <td>0.60</td>\n      <td>0.03</td>\n    </tr>\n    <tr>\n      <th>2010</th>\n      <td>68.93</td>\n      <td>7.14</td>\n      <td>0.46</td>\n      <td>6.03</td>\n      <td>1.51</td>\n      <td>3.12</td>\n      <td>0.50</td>\n      <td>1.31</td>\n      <td>0.44</td>\n      <td>0.57</td>\n      <td>0.48</td>\n      <td>0.44</td>\n      <td>0.79</td>\n      <td>0.17</td>\n      <td>1.02</td>\n      <td>0.25</td>\n    </tr>\n    <tr>\n      <th>2012</th>\n      
<td>55.86</td>\n      <td>6.02</td>\n      <td>1.71</td>\n      <td>5.43</td>\n      <td>4.75</td>\n      <td>3.45</td>\n      <td>1.14</td>\n      <td>0.61</td>\n      <td>1.30</td>\n      <td>1.30</td>\n      <td>1.79</td>\n      <td>1.43</td>\n      <td>0.76</td>\n      <td>0.76</td>\n      <td>0.98</td>\n      <td>0.67</td>\n    </tr>\n    <tr>\n      <th>2013</th>\n      <td>73.08</td>\n      <td>9.40</td>\n      <td>0.06</td>\n      <td>3.27</td>\n      <td>1.12</td>\n      <td>2.00</td>\n      <td>0.16</td>\n      <td>2.91</td>\n      <td>0.38</td>\n      <td>0.34</td>\n      <td>0.02</td>\n      <td>0.25</td>\n      <td>0.22</td>\n      <td>0.10</td>\n      <td>0.63</td>\n      <td>0.22</td>\n    </tr>\n    <tr>\n      <th>2014</th>\n      <td>73.25</td>\n      <td>9.75</td>\n      <td>0.11</td>\n      <td>3.20</td>\n      <td>0.81</td>\n      <td>1.74</td>\n      <td>0.13</td>\n      <td>3.36</td>\n      <td>0.30</td>\n      <td>0.26</td>\n      <td>0.16</td>\n      <td>0.16</td>\n      <td>0.28</td>\n      <td>0.06</td>\n      <td>0.51</td>\n      <td>0.18</td>\n    </tr>\n    <tr>\n      <th>2015</th>\n      <td>73.31</td>\n      <td>10.25</td>\n      <td>0.11</td>\n      <td>3.16</td>\n      <td>0.76</td>\n      <td>1.67</td>\n      <td>0.14</td>\n      <td>3.34</td>\n      <td>0.28</td>\n      <td>0.25</td>\n      <td>0.14</td>\n      <td>0.17</td>\n      <td>0.26</td>\n      <td>0.05</td>\n      <td>0.51</td>\n      <td>0.18</td>\n    </tr>\n    <tr>\n      <th>2016</th>\n      <td>64.55</td>\n      <td>8.96</td>\n      <td>2.56</td>\n      <td>3.66</td>\n      <td>1.97</td>\n      <td>1.79</td>\n      <td>0.81</td>\n      <td>2.48</td>\n      <td>0.63</td>\n      <td>0.65</td>\n      <td>0.49</td>\n      <td>0.51</td>\n      <td>0.43</td>\n      <td>0.52</td>\n      <td>0.60</td>\n      <td>0.36</td>\n    </tr>\n    <tr>\n      <th>2017</th>\n      <td>56.54</td>\n      <td>5.64</td>\n      <td>5.30</td>\n      <td>4.22</td>\n      <td>2.83</td>\n    
  <td>2.03</td>\n      <td>2.09</td>\n      <td>1.02</td>\n      <td>1.15</td>\n      <td>1.08</td>\n      <td>0.99</td>\n      <td>0.73</td>\n      <td>0.81</td>\n      <td>0.85</td>\n      <td>0.70</td>\n      <td>0.71</td>\n    </tr>\n    <tr>\n      <th>2018</th>\n      <td>50.06</td>\n      <td>5.28</td>\n      <td>6.06</td>\n      <td>4.41</td>\n      <td>3.49</td>\n      <td>2.22</td>\n      <td>2.16</td>\n      <td>0.75</td>\n      <td>1.42</td>\n      <td>1.28</td>\n      <td>1.37</td>\n      <td>1.02</td>\n      <td>0.99</td>\n      <td>0.93</td>\n      <td>0.78</td>\n      <td>0.80</td>\n    </tr>\n    <tr>\n      <th>2019</th>\n      <td>46.21</td>\n      <td>5.68</td>\n      <td>5.09</td>\n      <td>3.98</td>\n      <td>3.88</td>\n      <td>2.38</td>\n      <td>1.99</td>\n      <td>0.89</td>\n      <td>1.67</td>\n      <td>1.63</td>\n      <td>1.51</td>\n      <td>1.38</td>\n      <td>1.19</td>\n      <td>0.99</td>\n      <td>0.92</td>\n      <td>0.90</td>\n    </tr>\n    <tr>\n      <th>2020</th>\n      <td>44.97</td>\n      <td>5.68</td>\n      <td>4.85</td>\n      <td>3.71</td>\n      <td>4.03</td>\n      <td>2.30</td>\n      <td>1.89</td>\n      <td>1.08</td>\n      <td>1.75</td>\n      <td>1.70</td>\n      <td>1.52</td>\n      <td>1.46</td>\n      <td>1.31</td>\n      <td>1.02</td>\n      <td>0.98</td>\n      <td>0.91</td>\n    </tr>\n    <tr>\n      <th>2021</th>\n      <td>44.33</td>\n      <td>5.71</td>\n      <td>4.79</td>\n      <td>3.59</td>\n      <td>4.15</td>\n      <td>2.38</td>\n      <td>1.89</td>\n      <td>1.28</td>\n      <td>1.79</td>\n      <td>1.77</td>\n      <td>1.59</td>\n      <td>1.52</td>\n      <td>1.40</td>\n      <td>1.05</td>\n      <td>1.05</td>\n      <td>0.97</td>\n    </tr>\n    <tr>\n      <th>2022</th>\n      <td>45.38</td>\n      <td>6.16</td>\n      <td>4.14</td>\n      <td>3.56</td>\n      <td>4.21</td>\n      <td>1.75</td>\n      <td>1.78</td>\n      <td>1.49</td>\n      <td>1.85</td>\n      <td>1.88</td>\n    
  <td>1.66</td>\n      <td>1.64</td>\n      <td>1.05</td>\n      <td>1.03</td>\n      <td>0.80</td>\n      <td>0.98</td>\n    </tr>\n    <tr>\n      <th>2023</th>\n      <td>46.53</td>\n      <td>6.06</td>\n      <td>4.27</td>\n      <td>3.49</td>\n      <td>4.30</td>\n      <td>0.77</td>\n      <td>1.66</td>\n      <td>1.31</td>\n      <td>1.91</td>\n      <td>2.06</td>\n      <td>1.64</td>\n      <td>1.76</td>\n      <td>0.49</td>\n      <td>1.08</td>\n      <td>0.41</td>\n      <td>1.02</td>\n    </tr>\n    <tr>\n      <th>2024</th>\n      <td>43.65</td>\n      <td>5.51</td>\n      <td>4.40</td>\n      <td>3.32</td>\n      <td>4.03</td>\n      <td>2.09</td>\n      <td>2.08</td>\n      <td>1.14</td>\n      <td>1.75</td>\n      <td>1.92</td>\n      <td>1.75</td>\n      <td>1.54</td>\n      <td>1.41</td>\n      <td>1.03</td>\n      <td>1.05</td>\n      <td>0.98</td>\n    </tr>\n    <tr>\n      <th>2025</th>\n      <td>43.17</td>\n      <td>5.16</td>\n      <td>4.28</td>\n      <td>3.27</td>\n      <td>4.16</td>\n      <td>2.18</td>\n      <td>2.27</td>\n      <td>1.02</td>\n      <td>1.72</td>\n      <td>1.74</td>\n      <td>1.70</td>\n      <td>1.48</td>\n      <td>1.56</td>\n      <td>1.02</td>\n      <td>1.12</td>\n      <td>0.90</td>\n    </tr>\n    <tr>\n      <th>2026</th>\n      <td>41.88</td>\n      <td>5.51</td>\n      <td>4.60</td>\n      <td>3.05</td>\n      <td>4.37</td>\n      <td>2.04</td>\n      <td>2.47</td>\n      <td>0.86</td>\n      <td>1.89</td>\n      <td>1.80</td>\n      <td>1.88</td>\n      <td>1.45</td>\n      <td>1.71</td>\n      <td>1.11</td>\n      <td>0.89</td>\n      <td>0.93</td>\n    </tr>\n  </tbody>\n</table>"
  },
  {
    "path": "plots/tld/tlds-by-year-and-continent.csv",
    "content": "year,(other),\"com,net\",org,edu,\"gov,mil\",North America,South America,Oceania,Africa,Asia,Europe\n2009,2.372710231294118,80.38104003392658,8.098021232327786,1.2756570801426825,0.3793266584367303,0.11401450241006646,0.4869093014580774,0.6385207762024301,0.025662649035679254,1.4786198795909986,4.749517655174848\n2010,1.4855696236647693,74.95629887048294,7.140239674834392,1.3082817069941184,0.5120370711261071,0.7706887698166217,0.9790683746172806,1.4112024309658973,0.1281535582272385,1.7830943051527208,9.525365614117918\n2012,1.805603499529646,61.286829663077846,6.022710391113422,0.6065157408833226,0.2674993425437423,1.313681628396945,1.1912177609532053,1.7423530678298849,0.22608598259612694,2.774087757007317,22.763415166068544\n2013,0.40492028804343894,76.34802196410801,9.397803489739635,2.906696525502064,1.4128169971802005,1.0172778318175024,0.422744478041168,1.0805405428554966,0.18532918473122176,0.8537253370084816,5.970123360972776\n2014,0.41733410009547656,76.45221478702612,9.748707889557197,3.364365474710134,1.6853772456589369,0.9603473219225983,0.5335950655704679,0.8683960090486706,0.18209174352684082,0.8291928743976551,4.958377488485904\n2015,0.3746039648183713,76.46945214130866,10.250050149794749,3.3442173587560675,1.6839290167887637,0.8405363480989,0.51476511310795,0.8530288444537862,0.17400684980450837,0.8053354007332064,4.690074812335029\n2016,0.7364446130600686,68.20454902568343,8.962913407109552,2.481741781334238,1.2664009984490998,0.9542985272580663,0.8108407328828081,1.0907254528906893,0.23798517351067525,2.482341437572674,12.771758850248698\n2017,1.3803362668953434,60.758977390531555,5.643604700478004,1.0213536334709903,0.42362111261162405,1.1501900986422446,1.3815340022573843,1.3300550265072695,0.2969733599295535,5.127185253115497,21.486169155560535\n2018,2.4722427093505788,54.47476249849602,5.277805345172555,0.7471671645009016,0.2809316181870313,1.403865320751203,1.7183262532181955,1.5125740042582414,0.40486852829194125,5.872907599
592247,25.834548958181088\n2019,2.799127291037323,50.187220637958696,5.6767993348464945,0.8886365457279859,0.3075981672638809,1.3562237983356609,2.04299088912311,1.6477873839691597,0.4757171673848548,6.62478803338319,27.993110750969645\n2020,2.7569743182402955,48.67997702017013,5.680413503464852,1.0761593392568443,0.3511239201356604,1.3601336273656373,2.180024157926504,1.6606431478052264,0.4766815781708249,7.164844271609742,28.61302511585429\n2021,2.807726498809468,47.914979148097146,5.712679477372442,1.281048024853741,0.4114774978120561,1.4514077514517278,2.343827844096823,1.7198842195845663,0.500569399436175,6.682231757594182,29.174168380891672\n2022,2.8780538409820116,48.93370393081929,6.1584324355843085,1.488169978867335,0.47988094726490643,1.5060979491331428,2.0843334295330225,1.4029550288832249,0.4837686122978544,6.370098503155943,28.214505343478958\n2023,2.9878111904742277,50.01810770292156,6.059789452591052,1.306994966782364,0.47024376514043276,1.567826346305796,1.6625261765574342,0.9366992918690097,0.4255690144713344,6.35774534328999,28.206686749596795\n2024,3.0454213699438024,46.961250802687076,5.509624833896743,1.137898922235765,0.43758927914542306,1.5944360037056953,2.627106931726031,1.6589448982493866,0.5954904899067033,7.677015083900745,28.75522138460263\n2025,3.1710095569417116,46.437826174591486,5.164672229219115,1.0180544438417627,0.43464626049835847,1.638992711199414,2.816431662118706,1.743696094446849,0.6276925586809861,8.45079220305241,28.496186105409205\n2026,3.042738116164256,44.92553232030033,5.510759424284224,0.8569105620116508,0.43252031132823504,1.593273577276783,2.966933213245479,1.4690889036041748,0.6041385687836416,8.779568331734819,29.818536671266408\n"
  },
  {
    "path": "plots/tld/tlds-by-year-and-continent.html",
    "content": "<table border=\"1\" class=\"dataframe tablepercentage tablesorter\">\n  <thead>\n    <tr style=\"text-align: right;\">\n      <th></th>\n      <th>(other)</th>\n      <th>com,net</th>\n      <th>org</th>\n      <th>edu</th>\n      <th>gov,mil</th>\n      <th>North America</th>\n      <th>South America</th>\n      <th>Oceania</th>\n      <th>Africa</th>\n      <th>Asia</th>\n      <th>Europe</th>\n    </tr>\n    <tr>\n      <th>year</th>\n      <th></th>\n      <th></th>\n      <th></th>\n      <th></th>\n      <th></th>\n      <th></th>\n      <th></th>\n      <th></th>\n      <th></th>\n      <th></th>\n      <th></th>\n    </tr>\n  </thead>\n  <tbody>\n    <tr>\n      <th>2009</th>\n      <td>2.37</td>\n      <td>80.38</td>\n      <td>8.10</td>\n      <td>1.28</td>\n      <td>0.38</td>\n      <td>0.11</td>\n      <td>0.49</td>\n      <td>0.64</td>\n      <td>0.03</td>\n      <td>1.48</td>\n      <td>4.75</td>\n    </tr>\n    <tr>\n      <th>2010</th>\n      <td>1.49</td>\n      <td>74.96</td>\n      <td>7.14</td>\n      <td>1.31</td>\n      <td>0.51</td>\n      <td>0.77</td>\n      <td>0.98</td>\n      <td>1.41</td>\n      <td>0.13</td>\n      <td>1.78</td>\n      <td>9.53</td>\n    </tr>\n    <tr>\n      <th>2012</th>\n      <td>1.81</td>\n      <td>61.29</td>\n      <td>6.02</td>\n      <td>0.61</td>\n      <td>0.27</td>\n      <td>1.31</td>\n      <td>1.19</td>\n      <td>1.74</td>\n      <td>0.23</td>\n      <td>2.77</td>\n      <td>22.76</td>\n    </tr>\n    <tr>\n      <th>2013</th>\n      <td>0.40</td>\n      <td>76.35</td>\n      <td>9.40</td>\n      <td>2.91</td>\n      <td>1.41</td>\n      <td>1.02</td>\n      <td>0.42</td>\n      <td>1.08</td>\n      <td>0.19</td>\n      <td>0.85</td>\n      <td>5.97</td>\n    </tr>\n    <tr>\n      <th>2014</th>\n      <td>0.42</td>\n      <td>76.45</td>\n      <td>9.75</td>\n      <td>3.36</td>\n      <td>1.69</td>\n      <td>0.96</td>\n      <td>0.53</td>\n      <td>0.87</td>\n      <td>0.18</td>\n   
   <td>0.83</td>\n      <td>4.96</td>\n    </tr>\n    <tr>\n      <th>2015</th>\n      <td>0.37</td>\n      <td>76.47</td>\n      <td>10.25</td>\n      <td>3.34</td>\n      <td>1.68</td>\n      <td>0.84</td>\n      <td>0.51</td>\n      <td>0.85</td>\n      <td>0.17</td>\n      <td>0.81</td>\n      <td>4.69</td>\n    </tr>\n    <tr>\n      <th>2016</th>\n      <td>0.74</td>\n      <td>68.20</td>\n      <td>8.96</td>\n      <td>2.48</td>\n      <td>1.27</td>\n      <td>0.95</td>\n      <td>0.81</td>\n      <td>1.09</td>\n      <td>0.24</td>\n      <td>2.48</td>\n      <td>12.77</td>\n    </tr>\n    <tr>\n      <th>2017</th>\n      <td>1.38</td>\n      <td>60.76</td>\n      <td>5.64</td>\n      <td>1.02</td>\n      <td>0.42</td>\n      <td>1.15</td>\n      <td>1.38</td>\n      <td>1.33</td>\n      <td>0.30</td>\n      <td>5.13</td>\n      <td>21.49</td>\n    </tr>\n    <tr>\n      <th>2018</th>\n      <td>2.47</td>\n      <td>54.47</td>\n      <td>5.28</td>\n      <td>0.75</td>\n      <td>0.28</td>\n      <td>1.40</td>\n      <td>1.72</td>\n      <td>1.51</td>\n      <td>0.40</td>\n      <td>5.87</td>\n      <td>25.83</td>\n    </tr>\n    <tr>\n      <th>2019</th>\n      <td>2.80</td>\n      <td>50.19</td>\n      <td>5.68</td>\n      <td>0.89</td>\n      <td>0.31</td>\n      <td>1.36</td>\n      <td>2.04</td>\n      <td>1.65</td>\n      <td>0.48</td>\n      <td>6.62</td>\n      <td>27.99</td>\n    </tr>\n    <tr>\n      <th>2020</th>\n      <td>2.76</td>\n      <td>48.68</td>\n      <td>5.68</td>\n      <td>1.08</td>\n      <td>0.35</td>\n      <td>1.36</td>\n      <td>2.18</td>\n      <td>1.66</td>\n      <td>0.48</td>\n      <td>7.16</td>\n      <td>28.61</td>\n    </tr>\n    <tr>\n      <th>2021</th>\n      <td>2.81</td>\n      <td>47.91</td>\n      <td>5.71</td>\n      <td>1.28</td>\n      <td>0.41</td>\n      <td>1.45</td>\n      <td>2.34</td>\n      <td>1.72</td>\n      <td>0.50</td>\n      <td>6.68</td>\n      <td>29.17</td>\n    </tr>\n    <tr>\n      
<th>2022</th>\n      <td>2.88</td>\n      <td>48.93</td>\n      <td>6.16</td>\n      <td>1.49</td>\n      <td>0.48</td>\n      <td>1.51</td>\n      <td>2.08</td>\n      <td>1.40</td>\n      <td>0.48</td>\n      <td>6.37</td>\n      <td>28.21</td>\n    </tr>\n    <tr>\n      <th>2023</th>\n      <td>2.99</td>\n      <td>50.02</td>\n      <td>6.06</td>\n      <td>1.31</td>\n      <td>0.47</td>\n      <td>1.57</td>\n      <td>1.66</td>\n      <td>0.94</td>\n      <td>0.43</td>\n      <td>6.36</td>\n      <td>28.21</td>\n    </tr>\n    <tr>\n      <th>2024</th>\n      <td>3.05</td>\n      <td>46.96</td>\n      <td>5.51</td>\n      <td>1.14</td>\n      <td>0.44</td>\n      <td>1.59</td>\n      <td>2.63</td>\n      <td>1.66</td>\n      <td>0.60</td>\n      <td>7.68</td>\n      <td>28.76</td>\n    </tr>\n    <tr>\n      <th>2025</th>\n      <td>3.17</td>\n      <td>46.44</td>\n      <td>5.16</td>\n      <td>1.02</td>\n      <td>0.43</td>\n      <td>1.64</td>\n      <td>2.82</td>\n      <td>1.74</td>\n      <td>0.63</td>\n      <td>8.45</td>\n      <td>28.50</td>\n    </tr>\n    <tr>\n      <th>2026</th>\n      <td>3.04</td>\n      <td>44.93</td>\n      <td>5.51</td>\n      <td>0.86</td>\n      <td>0.43</td>\n      <td>1.59</td>\n      <td>2.97</td>\n      <td>1.47</td>\n      <td>0.60</td>\n      <td>8.78</td>\n      <td>29.82</td>\n    </tr>\n  </tbody>\n</table>"
  },
  {
    "path": "plots/tlds.md",
    "content": "Top-Level Domains\n=================\n\n[Top-level domains](https://en.wikipedia.org/wiki/Top-level_domain) (abbrev. \"TLD\"/\"TLDs\") are a significant indicator for the representativeness of the data, whether the data set or particular crawl is biased towards certain countries, regions or languages.\n\nMetrics about top-level domains are shown on the following pages:\n\n* [Groups of TLDs](./tld/groups.md): generic vs. country-code TLDs (e.g., `.com` vs. `.jp`)\n* [TLDs of latest monthly crawl](./tld/latestcrawl.md)\n* [Estimation of representativeness](./tld/comparison.md): a comparison of a recent crawl with an external data source\n* [TLDs of selected crawls](./tld/percentage.md): lists percentage of TLDs for selected crawls from 2008--2025\n* [TLDs by year and continent](./tld/by-year-and-continent.md): TLDs which are bound to geographical regions are mapped to the corresponding continents.\n\nNote that the top-level domain is defined here as the right-most element of a host name (`com` in `www.example.com`). [Country-code second-level domains](https://en.wikipedia.org/wiki/Second-level_domain#Country-code_second-level_domains) (\"ccSLD\") and [public suffixes](https://en.wikipedia.org/wiki/Public_Suffix_List) are not covered by these metrics.\n\n"
  },
  {
    "path": "requirements.txt",
    "content": "hyperloglog==0.0.14\nisoweek==1.3.3\nmrjob==0.7.4\ntldextract==5.1.2\nujson==5.12.0\n\n# tests\npytest\njsonpickle\nsetuptools\n"
  },
  {
    "path": "requirements_plot.txt",
    "content": "ggplot==0.11.5\nidna==3.7\n#pandas==2.1.4+dfsg\npandas==2.1.4\npygraphviz==1.13\nrpy2==3.5.15\n\nmatplotlib==3.10.7\nfsspec[s3]"
  },
  {
    "path": "run_stats_hadoop.sh",
    "content": "#!/bin/bash\n\nCRAWL=\"$1\"\n\nif [ -z \"$CRAWL\" ]; then\n    echo \"Usage: $0 <CRAWL-YEAR-WEEK>\"\n    echo \"  Argument indicating year and week of crawl (e.g., 2016-40) to be processed required\"\n    exit 1\nfi\n\n\nOUTPUT_COUNT=ccstats/$CRAWL/count/\nOUTPUT_STATS=ccstats/$CRAWL/stats/\n\nhadoop fs -mkdir -p ccstats/$CRAWL/\n\n# check that output paths do not exist (jobs will fail otherwise)\nif hadoop fs -ls $OUTPUT_COUNT; then\n    echo \"Output path $OUTPUT_COUNT already exists: delete path before running the count job\"\n    exit 1\nfi\n\nif hadoop fs -ls $OUTPUT_STATS; then\n    echo \"Output path $OUTPUT_STATS already exists: delete path before running the stats job\"\n    exit 1\nfi\n\n\nset -e\nset -x\nset -o pipefail\n\n\nINPUT=\"s3a://commoncrawl/cc-index/collections/CC-MAIN-$CRAWL/indexes/cdx-*.gz\"\n\nHADOOP_USER=${HADOOP_USER:-$USER}\n\n\npython3 crawlstats.py --job=count \\\n        --no-exact-counts \\\n        -r hadoop \\\n        --jobconf \"mapreduce.map.memory.mb=720\" \\\n        --jobconf \"mapreduce.map.java.opts=-Xmx512m\" \\\n        --jobconf \"mapreduce.reduce.memory.mb=640\" \\\n        --jobconf \"mapreduce.reduce.java.opts=-Xmx512m\" \\\n        --jobconf \"mapreduce.output.fileoutputformat.compress=true\" \\\n        --output-dir hdfs:///user/$HADOOP_USER/$OUTPUT_COUNT \\\n        --no-output \\\n        --cleanup NONE \\\n        \"$INPUT\" \\\n    2>&1 | tee cc-stats.$CRAWL.count.log\n\n#for i in `seq 0 9`; do\n#    hadoop distcp ccstats/$CRAWL/count/part-0000$i.bz2 s3a://commoncrawl/crawl-analysis/CC-MAIN-$CRAWL/count/part-0000$i.bz2\n#done\nhadoop fs -rm ccstats/$CRAWL/count/_SUCCESS\nhadoop distcp -direct ccstats/$CRAWL/count s3a://commoncrawl/crawl-analysis/CC-MAIN-$CRAWL/count\n\n\npython3 crawlstats.py --job=stats \\\n        --max-top-hosts-domains=500 \\\n        --min-urls-top-host-domain=100 \\\n        --min-lang-comb-freq=50 \\\n        -r hadoop \\\n        --jobconf \"mapreduce.map.memory.mb=1200\" 
\\\n        --jobconf \"mapreduce.map.java.opts=-Xmx1024m\" \\\n        --jobconf \"mapreduce.reduce.memory.mb=1200\" \\\n        --jobconf \"mapreduce.reduce.java.opts=-Xmx1024m\" \\\n        --jobconf \"mapreduce.output.fileoutputformat.compress=true\" \\\n        --no-output \\\n        --cleanup NONE \\\n        --output-dir hdfs:///user/$HADOOP_USER/$OUTPUT_STATS \\\n        hdfs:///user/$HADOOP_USER/$OUTPUT_COUNT \\\n    2>&1 | tee cc-stats.$CRAWL.stats.log\n\nhadoop fs -mkdir -p s3a://commoncrawl/crawl-analysis/CC-MAIN-$CRAWL/stats/\nhadoop fs -cp -d -f ccstats/$CRAWL/stats/part-00000.gz s3a://commoncrawl/crawl-analysis/CC-MAIN-$CRAWL/stats/part-00000.gz\n"
  },
  {
    "path": "setup.py",
    "content": "from setuptools import setup\n\n\nsetup(\n    setup_requires=['pytest-runner'],\n    tests_require=['pytest'],\n)"
  },
  {
    "path": "site.Dockerfile",
    "content": "# See\n#    https://docs.github.com/en/pages/setting-up-a-github-pages-site-with-jekyll\n#    https://github.com/BillRaymond/my-jekyll-docker-website\n\n# As of 2024-12-15, Github pages require Ruby 3.3.4 and Jekyll 3.10.0\n# see https://pages.github.com/versions/\nFROM ruby:3.3-alpine\n\n# Add Jekyll build dependencies to Alpine\nRUN apk update\nRUN apk add --no-cache build-base gcc cmake git\n\n# Update the Ruby bundler and install Jekyll,\n# pin dependency versions to avoid conflicts\nRUN gem install bundler -v 2.5.23\nRUN gem install ffi     -v 1.17.0\nRUN gem install jekyll  -v 3.10.0\n\n\nRUN mkdir /cc-crawl-statistics\nWORKDIR /cc-crawl-statistics\n\nRUN echo -e \"source 'https://rubygems.org'\\ngem 'github-pages', group: :jekyll_plugins\" >Gemfile\nRUN bundle install\nRUN bundle exec jekyll clean\n\nCOPY index.md _config.yml ./\nCOPY _layouts/ ./_layouts/\nCOPY assets/ ./assets/\nCOPY plots/ ./plots/\n\nCMD bundle exec jekyll serve\n#CMD bundle exec jekyll serve --host 0.0.0.0\n"
  },
  {
    "path": "stats/crawler/CC-MAIN-2016-18.json",
    "content": "[\"crawl_status\", \"generator:crawldb_size\", \"CC-MAIN-2016-18\"]\t7706034375\n[\"crawl_status\", \"generator:fetch_list\", \"CC-MAIN-2016-18\"]\t4884080239\n[\"crawl_status\", \"generator:skipped_domains_overflow\", \"CC-MAIN-2016-18\"]\t1225\n[\"crawl_status\", \"fetcher:total\", \"CC-MAIN-2016-18\"]\t4823256591\n[\"crawl_status\", \"fetcher:success\", \"CC-MAIN-2016-18\"]\t1338807996\n[\"crawl_status\", \"fetcher:notmodified\", \"CC-MAIN-2016-18\"]\t327260\n[\"crawl_status\", \"fetcher:temp_moved\", \"CC-MAIN-2016-18\"]\t338160914\n[\"crawl_status\", \"fetcher:moved\", \"CC-MAIN-2016-18\"]\t1090448325\n[\"crawl_status\", \"fetcher:notfound\", \"CC-MAIN-2016-18\"]\t426625500\n[\"crawl_status\", \"fetcher:access_denied\", \"CC-MAIN-2016-18\"]\t1426295\n[\"crawl_status\", \"fetcher:gone\", \"CC-MAIN-2016-18\"]\t19915502\n[\"crawl_status\", \"fetcher:exception\", \"CC-MAIN-2016-18\"]\t82830014\n[\"crawl_status\", \"fetcher:robots_denied\", \"CC-MAIN-2016-18\"]\t521424978\n[\"crawl_status\", \"fetcher:robots_denied_maxcrawldelay\", \"CC-MAIN-2016-18\"]\t7854886\n[\"crawl_status\", \"fetcher:filter_denied\", \"CC-MAIN-2016-18\"]\t0\n[\"crawl_status\", \"fetcher:hitByThrougputThreshold\", \"CC-MAIN-2016-18\"]\t305983410\n[\"crawl_status\", \"fetcher:hitByTimeLimit\", \"CC-MAIN-2016-18\"]\t284383017\n[\"crawl_status\", \"fetcher:AboveExceptionThresholdInQueue\", \"CC-MAIN-2016-18\"]\t405068494\n[\"crawl_status\", \"fetcher:bytes_downloaded\", \"CC-MAIN-2016-18\"]\t102758408401405\n"
  },
  {
    "path": "stats/crawler/CC-MAIN-2016-22.json",
    "content": "[\"crawl_status\", \"generator:crawldb_size\", \"CC-MAIN-2016-22\"]\t8087074988\n[\"crawl_status\", \"generator:fetch_list\", \"CC-MAIN-2016-22\"]\t5261630738\n[\"crawl_status\", \"generator:skipped_domains_overflow\", \"CC-MAIN-2016-22\"]\t1227\n[\"crawl_status\", \"fetcher:total\", \"CC-MAIN-2016-22\"]\t5227623812\n[\"crawl_status\", \"fetcher:success\", \"CC-MAIN-2016-22\"]\t1468074295\n[\"crawl_status\", \"fetcher:notmodified\", \"CC-MAIN-2016-22\"]\t256139\n[\"crawl_status\", \"fetcher:temp_moved\", \"CC-MAIN-2016-22\"]\t334686475\n[\"crawl_status\", \"fetcher:moved\", \"CC-MAIN-2016-22\"]\t1117011316\n[\"crawl_status\", \"fetcher:notfound\", \"CC-MAIN-2016-22\"]\t453120454\n[\"crawl_status\", \"fetcher:access_denied\", \"CC-MAIN-2016-22\"]\t1219720\n[\"crawl_status\", \"fetcher:gone\", \"CC-MAIN-2016-22\"]\t23171460\n[\"crawl_status\", \"fetcher:exception\", \"CC-MAIN-2016-22\"]\t159901466\n[\"crawl_status\", \"fetcher:robots_denied\", \"CC-MAIN-2016-22\"]\t671241422\n[\"crawl_status\", \"fetcher:robots_denied_maxcrawldelay\", \"CC-MAIN-2016-22\"]\t7796696\n[\"crawl_status\", \"fetcher:filter_denied\", \"CC-MAIN-2016-22\"]\t492\n[\"crawl_status\", \"fetcher:hitByThrougputThreshold\", \"CC-MAIN-2016-22\"]\t299420928\n[\"crawl_status\", \"fetcher:hitByTimeLimit\", \"CC-MAIN-2016-22\"]\t255346003\n[\"crawl_status\", \"fetcher:AboveExceptionThresholdInQueue\", \"CC-MAIN-2016-22\"]\t436376946\n[\"crawl_status\", \"fetcher:bytes_downloaded\", \"CC-MAIN-2016-22\"]\t109013317353257\n"
  },
  {
    "path": "stats/crawler/CC-MAIN-2016-26.json",
    "content": "[\"crawl_status\", \"generator:crawldb_size\", \"CC-MAIN-2016-26\"]\t7180806080\n[\"crawl_status\", \"generator:fetch_list\", \"CC-MAIN-2016-26\"]\t3578181474\n[\"crawl_status\", \"generator:selected:db_fetched\", \"CC-MAIN-2016-26\"]\t1299552667\n[\"crawl_status\", \"generator:selected:db_gone\", \"CC-MAIN-2016-26\"]\t7849358\n[\"crawl_status\", \"generator:selected:db_notmodified\", \"CC-MAIN-2016-26\"]\t4542\n[\"crawl_status\", \"generator:selected:db_redir_perm\", \"CC-MAIN-2016-26\"]\t1026907236\n[\"crawl_status\", \"generator:selected:db_redir_temp\", \"CC-MAIN-2016-26\"]\t295675118\n[\"crawl_status\", \"generator:selected:db_unfetched\", \"CC-MAIN-2016-26\"]\t948192553\n[\"crawl_status\", \"generator:skipped_domains_overflow\", \"CC-MAIN-2016-26\"]\t820\n[\"crawl_status\", \"fetcher:total\", \"CC-MAIN-2016-26\"]\t3555622846\n[\"crawl_status\", \"fetcher:success\", \"CC-MAIN-2016-26\"]\t1239037032\n[\"crawl_status\", \"fetcher:notmodified\", \"CC-MAIN-2016-26\"]\t283288\n[\"crawl_status\", \"fetcher:temp_moved\", \"CC-MAIN-2016-26\"]\t281679547\n[\"crawl_status\", \"fetcher:moved\", \"CC-MAIN-2016-26\"]\t995729397\n[\"crawl_status\", \"fetcher:notfound\", \"CC-MAIN-2016-26\"]\t48853116\n[\"crawl_status\", \"fetcher:access_denied\", \"CC-MAIN-2016-26\"]\t171324\n[\"crawl_status\", \"fetcher:gone\", \"CC-MAIN-2016-26\"]\t2442289\n[\"crawl_status\", \"fetcher:exception\", \"CC-MAIN-2016-26\"]\t219056540\n[\"crawl_status\", \"fetcher:robots_denied\", \"CC-MAIN-2016-26\"]\t116429750\n[\"crawl_status\", \"fetcher:robots_denied_maxcrawldelay\", \"CC-MAIN-2016-26\"]\t271438\n[\"crawl_status\", \"fetcher:filter_denied\", \"CC-MAIN-2016-26\"]\t226\n[\"crawl_status\", \"fetcher:hitByThrougputThreshold\", \"CC-MAIN-2016-26\"]\t360488201\n[\"crawl_status\", \"fetcher:hitByTimeLimit\", \"CC-MAIN-2016-26\"]\t167326318\n[\"crawl_status\", \"fetcher:AboveExceptionThresholdInQueue\", \"CC-MAIN-2016-26\"]\t123854380\n[\"crawl_status\", 
\"fetcher:bytes_downloaded\", \"CC-MAIN-2016-26\"]\t88623547035512\n[\"crawl_status\", \"crawldb:status:db_unfetched\", \"CC-MAIN-2016-26\"]\t2959816783\n[\"crawl_status\", \"crawldb:status:db_fetched\", \"CC-MAIN-2016-26\"]\t1458288238\n[\"crawl_status\", \"crawldb:status:db_gone\", \"CC-MAIN-2016-26\"]\t1208261302\n[\"crawl_status\", \"crawldb:status:db_redir_temp\", \"CC-MAIN-2016-26\"]\t341362333\n[\"crawl_status\", \"crawldb:status:db_redir_perm\", \"CC-MAIN-2016-26\"]\t1212535320\n[\"crawl_status\", \"crawldb:status:db_notmodified\", \"CC-MAIN-2016-26\"]\t542104\n"
  },
  {
    "path": "stats/crawler/CC-MAIN-2016-30.json",
    "content": "[\"crawl_status\", \"generator:crawldb_size\", \"CC-MAIN-2016-30\"]\t7180518032\n[\"crawl_status\", \"generator:fetch_list\", \"CC-MAIN-2016-30\"]\t2973093696\n[\"crawl_status\", \"generator:selected:db_duplicate\", \"CC-MAIN-2016-30\"]\t1245810\n[\"crawl_status\", \"generator:selected:db_fetched\", \"CC-MAIN-2016-30\"]\t1329353152\n[\"crawl_status\", \"generator:selected:db_gone\", \"CC-MAIN-2016-30\"]\t8699898\n[\"crawl_status\", \"generator:selected:db_notmodified\", \"CC-MAIN-2016-30\"]\t4372\n[\"crawl_status\", \"generator:selected:db_redir_perm\", \"CC-MAIN-2016-30\"]\t682024659\n[\"crawl_status\", \"generator:selected:db_redir_temp\", \"CC-MAIN-2016-30\"]\t174730909\n[\"crawl_status\", \"generator:selected:db_unfetched\", \"CC-MAIN-2016-30\"]\t777034896\n[\"crawl_status\", \"generator:skipped_domains_overflow\", \"CC-MAIN-2016-30\"]\t703\n[\"crawl_status\", \"fetcher:total\", \"CC-MAIN-2016-30\"]\t4197629689\n[\"crawl_status\", \"fetcher:success\", \"CC-MAIN-2016-30\"]\t1810244403\n[\"crawl_status\", \"fetcher:notmodified\", \"CC-MAIN-2016-30\"]\t59201\n[\"crawl_status\", \"fetcher:temp_moved\", \"CC-MAIN-2016-30\"]\t290453958\n[\"crawl_status\", \"fetcher:moved\", \"CC-MAIN-2016-30\"]\t981585540\n[\"crawl_status\", \"fetcher:notfound\", \"CC-MAIN-2016-30\"]\t206900007\n[\"crawl_status\", \"fetcher:access_denied\", \"CC-MAIN-2016-30\"]\t324964\n[\"crawl_status\", \"fetcher:gone\", \"CC-MAIN-2016-30\"]\t9945025\n[\"crawl_status\", \"fetcher:exception\", \"CC-MAIN-2016-30\"]\t228070081\n[\"crawl_status\", \"fetcher:robots_denied\", \"CC-MAIN-2016-30\"]\t141536480\n[\"crawl_status\", \"fetcher:robots_denied_maxcrawldelay\", \"CC-MAIN-2016-30\"]\t425474\n[\"crawl_status\", \"fetcher:filter_denied\", \"CC-MAIN-2016-30\"]\t0\n[\"crawl_status\", \"fetcher:hitByThrougputThreshold\", \"CC-MAIN-2016-30\"]\t203614009\n[\"crawl_status\", \"fetcher:hitByTimeLimit\", \"CC-MAIN-2016-30\"]\t205019936\n[\"crawl_status\", 
\"fetcher:AboveExceptionThresholdInQueue\", \"CC-MAIN-2016-30\"]\t119450611\n[\"crawl_status\", \"fetcher:bytes_downloaded\", \"CC-MAIN-2016-30\"]\t152939938979003\n[\"crawl_status\", \"crawldb:status:db_unfetched\", \"CC-MAIN-2016-30\"]\t2700852810\n[\"crawl_status\", \"crawldb:status:db_fetched\", \"CC-MAIN-2016-30\"]\t1511329903\n[\"crawl_status\", \"crawldb:status:db_gone\", \"CC-MAIN-2016-30\"]\t1301660933\n[\"crawl_status\", \"crawldb:status:db_redir_temp\", \"CC-MAIN-2016-30\"]\t363167187\n[\"crawl_status\", \"crawldb:status:db_redir_perm\", \"CC-MAIN-2016-30\"]\t1302685912\n[\"crawl_status\", \"crawldb:status:db_notmodified\", \"CC-MAIN-2016-30\"]\t821287\n"
  },
  {
    "path": "stats/crawler/CC-MAIN-2016-36.json",
    "content": "[\"crawl_status\", \"generator:crawldb_size\", \"CC-MAIN-2016-36\"]\t7218846495\n[\"crawl_status\", \"generator:fetch_list\", \"CC-MAIN-2016-36\"]\t2837438550\n[\"crawl_status\", \"generator:selected:db_duplicate\", \"CC-MAIN-2016-36\"]\t4016986\n[\"crawl_status\", \"generator:selected:db_fetched\", \"CC-MAIN-2016-36\"]\t1310692190\n[\"crawl_status\", \"generator:selected:db_gone\", \"CC-MAIN-2016-36\"]\t11216926\n[\"crawl_status\", \"generator:selected:db_notmodified\", \"CC-MAIN-2016-36\"]\t4322\n[\"crawl_status\", \"generator:selected:db_redir_perm\", \"CC-MAIN-2016-36\"]\t723192092\n[\"crawl_status\", \"generator:selected:db_redir_temp\", \"CC-MAIN-2016-36\"]\t157229196\n[\"crawl_status\", \"generator:selected:db_unfetched\", \"CC-MAIN-2016-36\"]\t631086838\n[\"crawl_status\", \"generator:skipped_domains_overflow\", \"CC-MAIN-2016-36\"]\t659\n[\"crawl_status\", \"fetcher:total\", \"CC-MAIN-2016-36\"]\t3299721802\n[\"crawl_status\", \"fetcher:success\", \"CC-MAIN-2016-36\"]\t1669540210\n[\"crawl_status\", \"fetcher:notmodified\", \"CC-MAIN-2016-36\"]\t297150\n[\"crawl_status\", \"fetcher:temp_moved\", \"CC-MAIN-2016-36\"]\t141377763\n[\"crawl_status\", \"fetcher:moved\", \"CC-MAIN-2016-36\"]\t358938772\n[\"crawl_status\", \"fetcher:notfound\", \"CC-MAIN-2016-36\"]\t199755423\n[\"crawl_status\", \"fetcher:access_denied\", \"CC-MAIN-2016-36\"]\t403716\n[\"crawl_status\", \"fetcher:gone\", \"CC-MAIN-2016-36\"]\t10264655\n[\"crawl_status\", \"fetcher:exception\", \"CC-MAIN-2016-36\"]\t156733905\n[\"crawl_status\", \"fetcher:robots_denied\", \"CC-MAIN-2016-36\"]\t118198417\n[\"crawl_status\", \"fetcher:robots_denied_maxcrawldelay\", \"CC-MAIN-2016-36\"]\t354645\n[\"crawl_status\", \"fetcher:filter_denied\", \"CC-MAIN-2016-36\"]\t434913\n[\"crawl_status\", \"fetcher:hitByThrougputThreshold\", \"CC-MAIN-2016-36\"]\t376252865\n[\"crawl_status\", \"fetcher:hitByTimeLimit\", \"CC-MAIN-2016-36\"]\t138243661\n[\"crawl_status\", 
\"fetcher:AboveExceptionThresholdInQueue\", \"CC-MAIN-2016-36\"]\t128925707\n[\"crawl_status\", \"fetcher:bytes_downloaded\", \"CC-MAIN-2016-36\"]\t137795391799291\n[\"crawl_status\", \"crawldb:status:db_unfetched\", \"CC-MAIN-2016-36\"]\t2417090235\n[\"crawl_status\", \"crawldb:status:db_fetched\", \"CC-MAIN-2016-36\"]\t1513758138\n[\"crawl_status\", \"crawldb:status:db_gone\", \"CC-MAIN-2016-36\"]\t1515748969\n[\"crawl_status\", \"crawldb:status:db_redir_temp\", \"CC-MAIN-2016-36\"]\t196286452\n[\"crawl_status\", \"crawldb:status:db_redir_perm\", \"CC-MAIN-2016-36\"]\t946721948\n[\"crawl_status\", \"crawldb:status:db_notmodified\", \"CC-MAIN-2016-36\"]\t814877\n[\"crawl_status\", \"crawldb:status:db_duplicate\", \"CC-MAIN-2016-36\"]\t628425876\n"
  },
  {
    "path": "stats/crawler/CC-MAIN-2016-40.json",
    "content": "[\"crawl_status\", \"generator:crawldb_size\", \"CC-MAIN-2016-40\"]\t6936860504\n[\"crawl_status\", \"generator:fetch_list\", \"CC-MAIN-2016-40\"]\t2438332392\n[\"crawl_status\", \"generator:skipped_domains_overflow\", \"CC-MAIN-2016-40\"]\t477\n[\"crawl_status\", \"fetcher:total\", \"CC-MAIN-2016-40\"]\t2706529909\n[\"crawl_status\", \"fetcher:success\", \"CC-MAIN-2016-40\"]\t1751866875\n[\"crawl_status\", \"fetcher:notmodified\", \"CC-MAIN-2016-40\"]\t258041\n[\"crawl_status\", \"fetcher:temp_moved\", \"CC-MAIN-2016-40\"]\t78975219\n[\"crawl_status\", \"fetcher:moved\", \"CC-MAIN-2016-40\"]\t199660245\n[\"crawl_status\", \"fetcher:notfound\", \"CC-MAIN-2016-40\"]\t68408887\n[\"crawl_status\", \"fetcher:access_denied\", \"CC-MAIN-2016-40\"]\t653219\n[\"crawl_status\", \"fetcher:gone\", \"CC-MAIN-2016-40\"]\t3887018\n[\"crawl_status\", \"fetcher:exception\", \"CC-MAIN-2016-40\"]\t111251283\n[\"crawl_status\", \"fetcher:robots_denied\", \"CC-MAIN-2016-40\"]\t66420383\n[\"crawl_status\", \"fetcher:robots_denied_maxcrawldelay\", \"CC-MAIN-2016-40\"]\t434523\n[\"crawl_status\", \"fetcher:filter_denied\", \"CC-MAIN-2016-40\"]\t112653\n[\"crawl_status\", \"fetcher:hitByThrougputThreshold\", \"CC-MAIN-2016-40\"]\t280732748\n[\"crawl_status\", \"fetcher:hitByTimeLimit\", \"CC-MAIN-2016-40\"]\t37285807\n[\"crawl_status\", \"fetcher:AboveExceptionThresholdInQueue\", \"CC-MAIN-2016-40\"]\t106583008\n[\"crawl_status\", \"fetcher:bytes_downloaded\", \"CC-MAIN-2016-40\"]\t144057750380583\n[\"crawl_status\", \"crawldb:status:db_unfetched\", \"CC-MAIN-2016-40\"]\t2330387939\n[\"crawl_status\", \"crawldb:status:db_fetched\", \"CC-MAIN-2016-40\"]\t1802786208\n[\"crawl_status\", \"crawldb:status:db_gone\", \"CC-MAIN-2016-40\"]\t1819563339\n[\"crawl_status\", \"crawldb:status:db_redir_temp\", \"CC-MAIN-2016-40\"]\t162118346\n[\"crawl_status\", \"crawldb:status:db_redir_perm\", \"CC-MAIN-2016-40\"]\t633970371\n[\"crawl_status\", \"crawldb:status:db_notmodified\", 
\"CC-MAIN-2016-40\"]\t1085872\n[\"crawl_status\", \"crawldb:status:db_duplicate\", \"CC-MAIN-2016-40\"]\t624090304\n"
  },
  {
    "path": "stats/crawler/CC-MAIN-2016-44.json",
    "content": "[\"crawl_status\", \"generator:crawldb_size\", \"CC-MAIN-2016-44\"]\t9290101260\n[\"crawl_status\", \"generator:fetch_list\", \"CC-MAIN-2016-44\"]\t4298206731\n[\"crawl_status\", \"generator:selected:db_duplicate\", \"CC-MAIN-2016-44\"]\t8817659\n[\"crawl_status\", \"generator:selected:db_fetched\", \"CC-MAIN-2016-44\"]\t1585953961\n[\"crawl_status\", \"generator:selected:db_gone\", \"CC-MAIN-2016-44\"]\t14498019\n[\"crawl_status\", \"generator:selected:db_notmodified\", \"CC-MAIN-2016-44\"]\t4659\n[\"crawl_status\", \"generator:selected:db_redir_perm\", \"CC-MAIN-2016-44\"]\t320494642\n[\"crawl_status\", \"generator:selected:db_redir_temp\", \"CC-MAIN-2016-44\"]\t93221876\n[\"crawl_status\", \"generator:selected:db_unfetched\", \"CC-MAIN-2016-44\"]\t2275215915\n[\"crawl_status\", \"generator:skipped_domains_overflow\", \"CC-MAIN-2016-44\"]\t890\n[\"crawl_status\", \"fetcher:total\", \"CC-MAIN-2016-44\"]\t4825821690\n[\"crawl_status\", \"fetcher:success\", \"CC-MAIN-2016-44\"]\t3269916830\n[\"crawl_status\", \"fetcher:notmodified\", \"CC-MAIN-2016-44\"]\t293668\n[\"crawl_status\", \"fetcher:temp_moved\", \"CC-MAIN-2016-44\"]\t161241810\n[\"crawl_status\", \"fetcher:moved\", \"CC-MAIN-2016-44\"]\t436898978\n[\"crawl_status\", \"fetcher:notfound\", \"CC-MAIN-2016-44\"]\t108465290\n[\"crawl_status\", \"fetcher:access_denied\", \"CC-MAIN-2016-44\"]\t401588\n[\"crawl_status\", \"fetcher:gone\", \"CC-MAIN-2016-44\"]\t9078828\n[\"crawl_status\", \"fetcher:exception\", \"CC-MAIN-2016-44\"]\t125317919\n[\"crawl_status\", \"fetcher:robots_denied\", \"CC-MAIN-2016-44\"]\t98063081\n[\"crawl_status\", \"fetcher:robots_denied_maxcrawldelay\", \"CC-MAIN-2016-44\"]\t2000043\n[\"crawl_status\", \"fetcher:filter_denied\", \"CC-MAIN-2016-44\"]\t164830\n[\"crawl_status\", \"fetcher:hitByThrougputThreshold\", \"CC-MAIN-2016-44\"]\t336853084\n[\"crawl_status\", \"fetcher:hitByTimeLimit\", \"CC-MAIN-2016-44\"]\t142373476\n[\"crawl_status\", 
\"fetcher:AboveExceptionThresholdInQueue\", \"CC-MAIN-2016-44\"]\t134752265\n[\"crawl_status\", \"fetcher:bytes_downloaded\", \"CC-MAIN-2016-44\"]\t271050060224575\n[\"crawl_status\", \"crawldb:status:db_unfetched\", \"CC-MAIN-2016-44\"]\t3954548384\n[\"crawl_status\", \"crawldb:status:db_fetched\", \"CC-MAIN-2016-44\"]\t1889568295\n[\"crawl_status\", \"crawldb:status:db_gone\", \"CC-MAIN-2016-44\"]\t1912674627\n[\"crawl_status\", \"crawldb:status:db_redir_temp\", \"CC-MAIN-2016-44\"]\t185402241\n[\"crawl_status\", \"crawldb:status:db_redir_perm\", \"CC-MAIN-2016-44\"]\t723510573\n[\"crawl_status\", \"crawldb:status:db_notmodified\", \"CC-MAIN-2016-44\"]\t1338332\n[\"crawl_status\", \"crawldb:status:db_duplicate\", \"CC-MAIN-2016-44\"]\t623058808\n \n"
  },
  {
    "path": "stats/crawler/CC-MAIN-2016-50.json",
    "content": "[\"crawl_status\", \"generator:crawldb_size\", \"CC-MAIN-2016-50\"]\t9779597110\n[\"crawl_status\", \"generator:fetch_list\", \"CC-MAIN-2016-50\"]\t3689984208\n[\"crawl_status\", \"generator:selected:db_duplicate\", \"CC-MAIN-2016-50\"]\t10385068\n[\"crawl_status\", \"generator:selected:db_fetched\", \"CC-MAIN-2016-50\"]\t2574745733\n[\"crawl_status\", \"generator:selected:db_gone\", \"CC-MAIN-2016-50\"]\t10149030\n[\"crawl_status\", \"generator:selected:db_notmodified\", \"CC-MAIN-2016-50\"]\t307222\n[\"crawl_status\", \"generator:selected:db_redir_perm\", \"CC-MAIN-2016-50\"]\t186545660\n[\"crawl_status\", \"generator:selected:db_redir_temp\", \"CC-MAIN-2016-50\"]\t75781174\n[\"crawl_status\", \"generator:selected:db_unfetched\", \"CC-MAIN-2016-50\"]\t832070321\n[\"crawl_status\", \"generator:skipped_domains_overflow\", \"CC-MAIN-2016-50\"]\t907\n[\"crawl_status\", \"fetcher:total\", \"CC-MAIN-2016-50\"]\t3937603611\n[\"crawl_status\", \"fetcher:success\", \"CC-MAIN-2016-50\"]\t2842785646\n[\"crawl_status\", \"fetcher:notmodified\", \"CC-MAIN-2016-50\"]\t304473\n[\"crawl_status\", \"fetcher:temp_moved\", \"CC-MAIN-2016-50\"]\t106006250\n[\"crawl_status\", \"fetcher:moved\", \"CC-MAIN-2016-50\"]\t241654463\n[\"crawl_status\", \"fetcher:notfound\", \"CC-MAIN-2016-50\"]\t62077997\n[\"crawl_status\", \"fetcher:access_denied\", \"CC-MAIN-2016-50\"]\t201765\n[\"crawl_status\", \"fetcher:gone\", \"CC-MAIN-2016-50\"]\t5429486\n[\"crawl_status\", \"fetcher:exception\", \"CC-MAIN-2016-50\"]\t84941222\n[\"crawl_status\", \"fetcher:robots_denied\", \"CC-MAIN-2016-50\"]\t65484993\n[\"crawl_status\", \"fetcher:robots_denied_maxcrawldelay\", \"CC-MAIN-2016-50\"]\t796379\n[\"crawl_status\", \"fetcher:filter_denied\", \"CC-MAIN-2016-50\"]\t62476\n[\"crawl_status\", \"fetcher:hitByThrougputThreshold\", \"CC-MAIN-2016-50\"]\t272605215\n[\"crawl_status\", \"fetcher:hitByTimeLimit\", \"CC-MAIN-2016-50\"]\t137950385\n[\"crawl_status\", 
\"fetcher:AboveExceptionThresholdInQueue\", \"CC-MAIN-2016-50\"]\t117302861\n[\"crawl_status\", \"fetcher:bytes_downloaded\", \"CC-MAIN-2016-50\"]\t249899847816413\n[\"crawl_status\", \"crawldb:status:db_unfetched\", \"CC-MAIN-2016-50\"]\t2366539642\n[\"crawl_status\", \"crawldb:status:db_fetched\", \"CC-MAIN-2016-50\"]\t3283113827\n[\"crawl_status\", \"crawldb:status:db_gone\", \"CC-MAIN-2016-50\"]\t2080657701\n[\"crawl_status\", \"crawldb:status:db_redir_temp\", \"CC-MAIN-2016-50\"]\t154942192\n[\"crawl_status\", \"crawldb:status:db_redir_perm\", \"CC-MAIN-2016-50\"]\t677746136\n[\"crawl_status\", \"crawldb:status:db_notmodified\", \"CC-MAIN-2016-50\"]\t1623027\n[\"crawl_status\", \"crawldb:status:db_duplicate\", \"CC-MAIN-2016-50\"]\t1005647259\n"
  },
  {
    "path": "stats/crawler/CC-MAIN-2017-04.json",
    "content": "[\"crawl_status\", \"generator:crawldb_size\", \"CC-MAIN-2017-04\"]\t10058030146\n[\"crawl_status\", \"generator:fetch_list\", \"CC-MAIN-2017-04\"]\t3877984074\n[\"crawl_status\", \"generator:selected:db_duplicate\", \"CC-MAIN-2017-04\"]\t11057924\n[\"crawl_status\", \"generator:selected:db_fetched\", \"CC-MAIN-2017-04\"]\t2739072245\n[\"crawl_status\", \"generator:selected:db_gone\", \"CC-MAIN-2017-04\"]\t14992487\n[\"crawl_status\", \"generator:selected:db_notmodified\", \"CC-MAIN-2017-04\"]\t314424222\n[\"crawl_status\", \"generator:selected:db_redir_perm\", \"CC-MAIN-2017-04\"]\t10962061\n[\"crawl_status\", \"generator:selected:db_redir_temp\", \"CC-MAIN-2017-04\"]\t21944583\n[\"crawl_status\", \"generator:selected:db_unfetched\", \"CC-MAIN-2017-04\"]\t765530552\n[\"crawl_status\", \"generator:skipped_domains_overflow\", \"CC-MAIN-2017-04\"]\t732\n[\"crawl_status\", \"fetcher:total\", \"CC-MAIN-2017-04\"]\t4224908113\n[\"crawl_status\", \"fetcher:success\", \"CC-MAIN-2017-04\"]\t3180033761\n[\"crawl_status\", \"fetcher:notmodified\", \"CC-MAIN-2017-04\"]\t275513\n[\"crawl_status\", \"fetcher:temp_moved\", \"CC-MAIN-2017-04\"]\t89229638\n[\"crawl_status\", \"fetcher:moved\", \"CC-MAIN-2017-04\"]\t265593164\n[\"crawl_status\", \"fetcher:notfound\", \"CC-MAIN-2017-04\"]\t58423504\n[\"crawl_status\", \"fetcher:access_denied\", \"CC-MAIN-2017-04\"]\t235469\n[\"crawl_status\", \"fetcher:gone\", \"CC-MAIN-2017-04\"]\t4461790\n[\"crawl_status\", \"fetcher:exception\", \"CC-MAIN-2017-04\"]\t107204273\n[\"crawl_status\", \"fetcher:robots_denied\", \"CC-MAIN-2017-04\"]\t67843485\n[\"crawl_status\", \"fetcher:robots_denied_maxcrawldelay\", \"CC-MAIN-2017-04\"]\t482563\n[\"crawl_status\", \"fetcher:filter_denied\", \"CC-MAIN-2017-04\"]\t0\n[\"crawl_status\", \"fetcher:hitByThrougputThreshold\", \"CC-MAIN-2017-04\"]\t159756311\n[\"crawl_status\", \"fetcher:hitByTimeLimit\", \"CC-MAIN-2017-04\"]\t172009272\n[\"crawl_status\", 
\"fetcher:AboveExceptionThresholdInQueue\", \"CC-MAIN-2017-04\"]\t119359370\n[\"crawl_status\", \"fetcher:bytes_downloaded\", \"CC-MAIN-2017-04\"]\t275327597533768\n[\"crawl_status\", \"crawldb:status:db_unfetched\", \"CC-MAIN-2017-04\"]\t2404728243\n[\"crawl_status\", \"crawldb:status:db_fetched\", \"CC-MAIN-2017-04\"]\t3276551279\n[\"crawl_status\", \"crawldb:status:db_gone\", \"CC-MAIN-2017-04\"]\t2174897267\n[\"crawl_status\", \"crawldb:status:db_redir_temp\", \"CC-MAIN-2017-04\"]\t153059872\n[\"crawl_status\", \"crawldb:status:db_redir_perm\", \"CC-MAIN-2017-04\"]\t670133262\n[\"crawl_status\", \"crawldb:status:db_notmodified\", \"CC-MAIN-2017-04\"]\t317048153\n[\"crawl_status\", \"crawldb:status:db_duplicate\", \"CC-MAIN-2017-04\"]\t1061612070\n"
  },
  {
    "path": "stats/crawler/CC-MAIN-2017-09.json",
    "content": "[\"crawl_status\", \"generator:crawldb_size\", \"CC-MAIN-2017-09\"]\t10309950142\n[\"crawl_status\", \"generator:fetch_list\", \"CC-MAIN-2017-09\"]\t4435442265\n[\"crawl_status\", \"generator:selected:db_duplicate\", \"CC-MAIN-2017-09\"]\t622490924\n[\"crawl_status\", \"generator:selected:db_fetched\", \"CC-MAIN-2017-09\"]\t2661307231\n[\"crawl_status\", \"generator:selected:db_gone\", \"CC-MAIN-2017-09\"]\t75450227\n[\"crawl_status\", \"generator:selected:db_notmodified\", \"CC-MAIN-2017-09\"]\t59634488\n[\"crawl_status\", \"generator:selected:db_redir_perm\", \"CC-MAIN-2017-09\"]\t306597503\n[\"crawl_status\", \"generator:selected:db_redir_temp\", \"CC-MAIN-2017-09\"]\t90289707\n[\"crawl_status\", \"generator:selected:db_unfetched\", \"CC-MAIN-2017-09\"]\t619672185\n[\"crawl_status\", \"generator:skipped_domains_overflow\", \"CC-MAIN-2017-09\"]\t1022\n[\"crawl_status\", \"fetcher:total\", \"CC-MAIN-2017-09\"]\t5721772192\n[\"crawl_status\", \"fetcher:success\", \"CC-MAIN-2017-09\"]\t3332987429\n[\"crawl_status\", \"fetcher:notmodified\", \"CC-MAIN-2017-09\"]\t171060\n[\"crawl_status\", \"fetcher:temp_moved\", \"CC-MAIN-2017-09\"]\t347710866\n[\"crawl_status\", \"fetcher:moved\", \"CC-MAIN-2017-09\"]\t969656086\n[\"crawl_status\", \"fetcher:notfound\", \"CC-MAIN-2017-09\"]\t169237694\n[\"crawl_status\", \"fetcher:access_denied\", \"CC-MAIN-2017-09\"]\t397047\n[\"crawl_status\", \"fetcher:gone\", \"CC-MAIN-2017-09\"]\t9401372\n[\"crawl_status\", \"fetcher:exception\", \"CC-MAIN-2017-09\"]\t135915640\n[\"crawl_status\", \"fetcher:robots_denied\", \"CC-MAIN-2017-09\"]\t156316496\n[\"crawl_status\", \"fetcher:robots_denied_maxcrawldelay\", \"CC-MAIN-2017-09\"]\t810610\n[\"crawl_status\", \"fetcher:filter_denied\", \"CC-MAIN-2017-09\"]\t0\n[\"crawl_status\", \"fetcher:hitByThrougputThreshold\", \"CC-MAIN-2017-09\"]\t48503266\n[\"crawl_status\", \"fetcher:hitByTimeLimit\", \"CC-MAIN-2017-09\"]\t413684114\n[\"crawl_status\", 
\"fetcher:AboveExceptionThresholdInQueue\", \"CC-MAIN-2017-09\"]\t136980512\n[\"crawl_status\", \"fetcher:bytes_downloaded\", \"CC-MAIN-2017-09\"]\t314687710946070\n[\"crawl_status\", \"crawldb:status:db_unfetched\", \"CC-MAIN-2017-09\"]\t2207201972\n[\"crawl_status\", \"crawldb:status:db_fetched\", \"CC-MAIN-2017-09\"]\t3397576095\n[\"crawl_status\", \"crawldb:status:db_gone\", \"CC-MAIN-2017-09\"]\t2297647695\n[\"crawl_status\", \"crawldb:status:db_redir_temp\", \"CC-MAIN-2017-09\"]\t162830116\n[\"crawl_status\", \"crawldb:status:db_redir_perm\", \"CC-MAIN-2017-09\"]\t713702943\n[\"crawl_status\", \"crawldb:status:db_notmodified\", \"CC-MAIN-2017-09\"]\t418214793\n[\"crawl_status\", \"crawldb:status:db_duplicate\", \"CC-MAIN-2017-09\"]\t1112776528\n"
  },
  {
    "path": "stats/crawler/CC-MAIN-2017-13.json",
    "content": "[\"crawl_status\", \"generator:crawldb_size\", \"CC-MAIN-2017-13\"]\t11054073116\n[\"crawl_status\", \"generator:fetch_list\", \"CC-MAIN-2017-13\"]\t3953684648\n[\"crawl_status\", \"generator:selected:db_duplicate\", \"CC-MAIN-2017-13\"]\t97647536\n[\"crawl_status\", \"generator:selected:db_fetched\", \"CC-MAIN-2017-13\"]\t2552968616\n[\"crawl_status\", \"generator:selected:db_gone\", \"CC-MAIN-2017-13\"]\t10614549\n[\"crawl_status\", \"generator:selected:db_notmodified\", \"CC-MAIN-2017-13\"]\t19599792\n[\"crawl_status\", \"generator:selected:db_redir_perm\", \"CC-MAIN-2017-13\"]\t193125557\n[\"crawl_status\", \"generator:selected:db_redir_temp\", \"CC-MAIN-2017-13\"]\t43398044\n[\"crawl_status\", \"generator:selected:db_unfetched\", \"CC-MAIN-2017-13\"]\t1036330554\n[\"crawl_status\", \"generator:skipped_domains_overflow\", \"CC-MAIN-2017-13\"]\t839\n[\"crawl_status\", \"fetcher:total\", \"CC-MAIN-2017-13\"]\t4460862193\n[\"crawl_status\", \"fetcher:success\", \"CC-MAIN-2017-13\"]\t3126884662\n[\"crawl_status\", \"fetcher:notmodified\", \"CC-MAIN-2017-13\"]\t295435\n[\"crawl_status\", \"fetcher:temp_moved\", \"CC-MAIN-2017-13\"]\t124493367\n[\"crawl_status\", \"fetcher:moved\", \"CC-MAIN-2017-13\"]\t395186542\n[\"crawl_status\", \"fetcher:notfound\", \"CC-MAIN-2017-13\"]\t66203591\n[\"crawl_status\", \"fetcher:access_denied\", \"CC-MAIN-2017-13\"]\t420559\n[\"crawl_status\", \"fetcher:gone\", \"CC-MAIN-2017-13\"]\t6884720\n[\"crawl_status\", \"fetcher:exception\", \"CC-MAIN-2017-13\"]\t110366439\n[\"crawl_status\", \"fetcher:robots_denied\", \"CC-MAIN-2017-13\"]\t122993082\n[\"crawl_status\", \"fetcher:robots_denied_maxcrawldelay\", \"CC-MAIN-2017-13\"]\t333587\n[\"crawl_status\", \"fetcher:filter_denied\", \"CC-MAIN-2017-13\"]\t9673\n[\"crawl_status\", \"fetcher:hitByThrougputThreshold\", \"CC-MAIN-2017-13\"]\t235731484\n[\"crawl_status\", \"fetcher:hitByTimeLimit\", \"CC-MAIN-2017-13\"]\t153497707\n[\"crawl_status\", 
\"fetcher:AboveExceptionThresholdInQueue\", \"CC-MAIN-2017-13\"]\t117561345\n[\"crawl_status\", \"fetcher:bytes_downloaded\", \"CC-MAIN-2017-13\"]\t294485026915066\n[\"crawl_status\", \"crawldb:status:db_unfetched\", \"CC-MAIN-2017-13\"]\t2637260380\n[\"crawl_status\", \"crawldb:status:db_fetched\", \"CC-MAIN-2017-13\"]\t3365767571\n[\"crawl_status\", \"crawldb:status:db_gone\", \"CC-MAIN-2017-13\"]\t2431502897\n[\"crawl_status\", \"crawldb:status:db_redir_temp\", \"CC-MAIN-2017-13\"]\t172921755\n[\"crawl_status\", \"crawldb:status:db_redir_perm\", \"CC-MAIN-2017-13\"]\t741292462\n[\"crawl_status\", \"crawldb:status:db_notmodified\", \"CC-MAIN-2017-13\"]\t642655358\n[\"crawl_status\", \"crawldb:status:db_duplicate\", \"CC-MAIN-2017-13\"]\t1062672693\n"
  },
  {
    "path": "stats/crawler/CC-MAIN-2017-17.json",
    "content": "[\"crawl_status\", \"generator:crawldb_size\", \"CC-MAIN-2017-17\"]\t11614646341\n[\"crawl_status\", \"generator:fetch_list\", \"CC-MAIN-2017-17\"]\t3741728936\n[\"crawl_status\", \"generator:selected:db_duplicate\", \"CC-MAIN-2017-17\"]\t71131470\n[\"crawl_status\", \"generator:selected:db_fetched\", \"CC-MAIN-2017-17\"]\t2282526378\n[\"crawl_status\", \"generator:selected:db_gone\", \"CC-MAIN-2017-17\"]\t6267616\n[\"crawl_status\", \"generator:selected:db_notmodified\", \"CC-MAIN-2017-17\"]\t341740437\n[\"crawl_status\", \"generator:selected:db_redir_perm\", \"CC-MAIN-2017-17\"]\t122162500\n[\"crawl_status\", \"generator:selected:db_redir_temp\", \"CC-MAIN-2017-17\"]\t66510064\n[\"crawl_status\", \"generator:selected:db_unfetched\", \"CC-MAIN-2017-17\"]\t851390471\n[\"crawl_status\", \"generator:skipped_domains_overflow\", \"CC-MAIN-2017-17\"]\t748\n[\"crawl_status\", \"fetcher:total\", \"CC-MAIN-2017-17\"]\t4275917748\n[\"crawl_status\", \"fetcher:success\", \"CC-MAIN-2017-17\"]\t2994688505\n[\"crawl_status\", \"fetcher:notmodified\", \"CC-MAIN-2017-17\"]\t172749\n[\"crawl_status\", \"fetcher:temp_moved\", \"CC-MAIN-2017-17\"]\t148604307\n[\"crawl_status\", \"fetcher:moved\", \"CC-MAIN-2017-17\"]\t397231695\n[\"crawl_status\", \"fetcher:notfound\", \"CC-MAIN-2017-17\"]\t66746787\n[\"crawl_status\", \"fetcher:access_denied\", \"CC-MAIN-2017-17\"]\t487733\n[\"crawl_status\", \"fetcher:gone\", \"CC-MAIN-2017-17\"]\t3824609\n[\"crawl_status\", \"fetcher:exception\", \"CC-MAIN-2017-17\"]\t118088550\n[\"crawl_status\", \"fetcher:robots_denied\", \"CC-MAIN-2017-17\"]\t88277706\n[\"crawl_status\", \"fetcher:robots_denied_maxcrawldelay\", \"CC-MAIN-2017-17\"]\t366758\n[\"crawl_status\", \"fetcher:filter_denied\", \"CC-MAIN-2017-17\"]\t0\n[\"crawl_status\", \"fetcher:hitByThrougputThreshold\", \"CC-MAIN-2017-17\"]\t231613590\n[\"crawl_status\", \"fetcher:hitByTimeLimit\", \"CC-MAIN-2017-17\"]\t109166415\n[\"crawl_status\", 
\"fetcher:AboveExceptionThresholdInQueue\", \"CC-MAIN-2017-17\"]\t116648344\n[\"crawl_status\", \"fetcher:bytes_downloaded\", \"CC-MAIN-2017-17\"]\t278922874037715\n[\"crawl_status\", \"crawldb:status:db_unfetched\", \"CC-MAIN-2017-17\"]\t2448991569\n[\"crawl_status\", \"crawldb:status:db_fetched\", \"CC-MAIN-2017-17\"]\t3691674939\n[\"crawl_status\", \"crawldb:status:db_gone\", \"CC-MAIN-2017-17\"]\t2580641900\n[\"crawl_status\", \"crawldb:status:db_redir_temp\", \"CC-MAIN-2017-17\"]\t183591714\n[\"crawl_status\", \"crawldb:status:db_redir_perm\", \"CC-MAIN-2017-17\"]\t760631183\n[\"crawl_status\", \"crawldb:status:db_notmodified\", \"CC-MAIN-2017-17\"]\t827246845\n[\"crawl_status\", \"crawldb:status:db_duplicate\", \"CC-MAIN-2017-17\"]\t1121868191\n"
  },
  {
    "path": "stats/crawler/CC-MAIN-2017-22.json",
    "content": "[\"crawl_status\", \"generator:crawldb_size\", \"CC-MAIN-2017-22\"]\t12106403981\n[\"crawl_status\", \"generator:fetch_list\", \"CC-MAIN-2017-22\"]\t3949651087\n[\"crawl_status\", \"generator:selected:db_duplicate\", \"CC-MAIN-2017-22\"]\t63450080\n[\"crawl_status\", \"generator:selected:db_fetched\", \"CC-MAIN-2017-22\"]\t2325510222\n[\"crawl_status\", \"generator:selected:db_gone\", \"CC-MAIN-2017-22\"]\t102192828\n[\"crawl_status\", \"generator:selected:db_notmodified\", \"CC-MAIN-2017-22\"]\t315468944\n[\"crawl_status\", \"generator:selected:db_redir_perm\", \"CC-MAIN-2017-22\"]\t321793504\n[\"crawl_status\", \"generator:selected:db_redir_temp\", \"CC-MAIN-2017-22\"]\t64797249\n[\"crawl_status\", \"generator:selected:db_unfetched\", \"CC-MAIN-2017-22\"]\t756438260\n[\"crawl_status\", \"generator:skipped_domains_overflow\", \"CC-MAIN-2017-22\"]\t730\n[\"crawl_status\", \"fetcher:total\", \"CC-MAIN-2017-22\"]\t4797344270\n[\"crawl_status\", \"fetcher:success\", \"CC-MAIN-2017-22\"]\t3033250432\n[\"crawl_status\", \"fetcher:notmodified\", \"CC-MAIN-2017-22\"]\t257506\n[\"crawl_status\", \"fetcher:temp_moved\", \"CC-MAIN-2017-22\"]\t177345120\n[\"crawl_status\", \"fetcher:moved\", \"CC-MAIN-2017-22\"]\t692714884\n[\"crawl_status\", \"fetcher:notfound\", \"CC-MAIN-2017-22\"]\t125269358\n[\"crawl_status\", \"fetcher:access_denied\", \"CC-MAIN-2017-22\"]\t610079\n[\"crawl_status\", \"fetcher:gone\", \"CC-MAIN-2017-22\"]\t7269501\n[\"crawl_status\", \"fetcher:exception\", \"CC-MAIN-2017-22\"]\t157887225\n[\"crawl_status\", \"fetcher:robots_denied\", \"CC-MAIN-2017-22\"]\t140026583\n[\"crawl_status\", \"fetcher:robots_denied_maxcrawldelay\", \"CC-MAIN-2017-22\"]\t610881\n[\"crawl_status\", \"fetcher:hitByThrougputThreshold\", \"CC-MAIN-2017-22\"]\t214866437\n[\"crawl_status\", \"fetcher:hitByTimeLimit\", \"CC-MAIN-2017-22\"]\t122418910\n[\"crawl_status\", \"fetcher:AboveExceptionThresholdInQueue\", \"CC-MAIN-2017-22\"]\t124817354\n[\"crawl_status\", 
\"fetcher:bytes_downloaded\", \"CC-MAIN-2017-22\"]\t283596679518758\n[\"crawl_status\", \"crawldb:status:db_unfetched\", \"CC-MAIN-2017-22\"]\t2355753062\n[\"crawl_status\", \"crawldb:status:db_fetched\", \"CC-MAIN-2017-22\"]\t3961650978\n[\"crawl_status\", \"crawldb:status:db_gone\", \"CC-MAIN-2017-22\"]\t2702825542\n[\"crawl_status\", \"crawldb:status:db_redir_temp\", \"CC-MAIN-2017-22\"]\t188024529\n[\"crawl_status\", \"crawldb:status:db_redir_perm\", \"CC-MAIN-2017-22\"]\t780899750\n[\"crawl_status\", \"crawldb:status:db_notmodified\", \"CC-MAIN-2017-22\"]\t956399067\n[\"crawl_status\", \"crawldb:status:db_duplicate\", \"CC-MAIN-2017-22\"]\t1160851053\n"
  },
  {
    "path": "stats/crawler/CC-MAIN-2017-26.json",
    "content": "[\"crawl_status\", \"generator:crawldb_size\", \"CC-MAIN-2017-26\"]\t12986411417\n[\"crawl_status\", \"generator:fetch_list\", \"CC-MAIN-2017-26\"]\t4019722453\n[\"crawl_status\", \"generator:selected:db_duplicate\", \"CC-MAIN-2017-26\"]\t37878431\n[\"crawl_status\", \"generator:selected:db_fetched\", \"CC-MAIN-2017-26\"]\t2371514646\n[\"crawl_status\", \"generator:selected:db_gone\", \"CC-MAIN-2017-26\"]\t16134852\n[\"crawl_status\", \"generator:selected:db_notmodified\", \"CC-MAIN-2017-26\"]\t200859775\n[\"crawl_status\", \"generator:selected:db_redir_perm\", \"CC-MAIN-2017-26\"]\t188985115\n[\"crawl_status\", \"generator:selected:db_redir_temp\", \"CC-MAIN-2017-26\"]\t50439278\n[\"crawl_status\", \"generator:selected:db_unfetched\", \"CC-MAIN-2017-26\"]\t1153910356\n[\"crawl_status\", \"generator:skipped_domains_overflow\", \"CC-MAIN-2017-26\"]\t690\n[\"crawl_status\", \"fetcher:total\", \"CC-MAIN-2017-26\"]\t4574808620\n[\"crawl_status\", \"fetcher:success\", \"CC-MAIN-2017-26\"]\t3212658689\n[\"crawl_status\", \"fetcher:notmodified\", \"CC-MAIN-2017-26\"]\t158123\n[\"crawl_status\", \"fetcher:temp_moved\", \"CC-MAIN-2017-26\"]\t134251168\n[\"crawl_status\", \"fetcher:moved\", \"CC-MAIN-2017-26\"]\t434116921\n[\"crawl_status\", \"fetcher:notfound\", \"CC-MAIN-2017-26\"]\t71301129\n[\"crawl_status\", \"fetcher:access_denied\", \"CC-MAIN-2017-26\"]\t399669\n[\"crawl_status\", \"fetcher:gone\", \"CC-MAIN-2017-26\"]\t4168345\n[\"crawl_status\", \"fetcher:exception\", \"CC-MAIN-2017-26\"]\t157694366\n[\"crawl_status\", \"fetcher:robots_denied\", \"CC-MAIN-2017-26\"]\t92837621\n[\"crawl_status\", \"fetcher:robots_denied_maxcrawldelay\", \"CC-MAIN-2017-26\"]\t579226\n[\"crawl_status\", \"fetcher:hitByThrougputThreshold\", \"CC-MAIN-2017-26\"]\t252501231\n[\"crawl_status\", \"fetcher:hitByTimeLimit\", \"CC-MAIN-2017-26\"]\t93997300\n[\"crawl_status\", \"fetcher:AboveExceptionThresholdInQueue\", \"CC-MAIN-2017-26\"]\t120144832\n[\"crawl_status\", 
\"fetcher:bytes_downloaded\", \"CC-MAIN-2017-26\"]\t296569324705292\n[\"crawl_status\", \"crawldb:size\", \"CC-MAIN-2017-26\"]\t12986411417\n[\"crawl_status\", \"crawldb:status:db_unfetched\", \"CC-MAIN-2017-26\"]\t2750434416\n[\"crawl_status\", \"crawldb:status:db_fetched\", \"CC-MAIN-2017-26\"]\t4155811402\n[\"crawl_status\", \"crawldb:status:db_gone\", \"CC-MAIN-2017-26\"]\t2817606881\n[\"crawl_status\", \"crawldb:status:db_redir_temp\", \"CC-MAIN-2017-26\"]\t196139800\n[\"crawl_status\", \"crawldb:status:db_redir_perm\", \"CC-MAIN-2017-26\"]\t798120913\n[\"crawl_status\", \"crawldb:status:db_notmodified\", \"CC-MAIN-2017-26\"]\t1067159481\n[\"crawl_status\", \"crawldb:status:db_duplicate\", \"CC-MAIN-2017-26\"]\t1201138524\n"
  },
  {
    "path": "stats/crawler/CC-MAIN-2017-30.json",
    "content": "[\"crawl_status\", \"generator:crawldb_size\", \"CC-MAIN-2017-30\"]\t13566579384\n[\"crawl_status\", \"generator:fetch_list\", \"CC-MAIN-2017-30\"]\t4674326265\n[\"crawl_status\", \"generator:selected:db_duplicate\", \"CC-MAIN-2017-30\"]\t244590557\n[\"crawl_status\", \"generator:selected:db_fetched\", \"CC-MAIN-2017-30\"]\t1954483273\n[\"crawl_status\", \"generator:selected:db_gone\", \"CC-MAIN-2017-30\"]\t926644143\n[\"crawl_status\", \"generator:selected:db_notmodified\", \"CC-MAIN-2017-30\"]\t484776279\n[\"crawl_status\", \"generator:selected:db_redir_perm\", \"CC-MAIN-2017-30\"]\t145891163\n[\"crawl_status\", \"generator:selected:db_redir_temp\", \"CC-MAIN-2017-30\"]\t59751176\n[\"crawl_status\", \"generator:selected:db_unfetched\", \"CC-MAIN-2017-30\"]\t858189674\n[\"crawl_status\", \"generator:skipped_domains_overflow\", \"CC-MAIN-2017-30\"]\t888\n[\"crawl_status\", \"fetcher:total\", \"CC-MAIN-2017-30\"]\t5534511521\n[\"crawl_status\", \"fetcher:success\", \"CC-MAIN-2017-30\"]\t2979385367\n[\"crawl_status\", \"fetcher:notmodified\", \"CC-MAIN-2017-30\"]\t166146\n[\"crawl_status\", \"fetcher:temp_moved\", \"CC-MAIN-2017-30\"]\t201494711\n[\"crawl_status\", \"fetcher:moved\", \"CC-MAIN-2017-30\"]\t681835209\n[\"crawl_status\", \"fetcher:notfound\", \"CC-MAIN-2017-30\"]\t361022708\n[\"crawl_status\", \"fetcher:access_denied\", \"CC-MAIN-2017-30\"]\t1214525\n[\"crawl_status\", \"fetcher:gone\", \"CC-MAIN-2017-30\"]\t13615340\n[\"crawl_status\", \"fetcher:exception\", \"CC-MAIN-2017-30\"]\t251786042\n[\"crawl_status\", \"fetcher:robots_denied\", \"CC-MAIN-2017-30\"]\t501079119\n[\"crawl_status\", \"fetcher:robots_denied_maxcrawldelay\", \"CC-MAIN-2017-30\"]\t78028\n[\"crawl_status\", \"fetcher:hitByThrougputThreshold\", \"CC-MAIN-2017-30\"]\t182423929\n[\"crawl_status\", \"fetcher:hitByTimeLimit\", \"CC-MAIN-2017-30\"]\t205915625\n[\"crawl_status\", \"fetcher:AboveExceptionThresholdInQueue\", \"CC-MAIN-2017-30\"]\t154494772\n[\"crawl_status\", 
\"fetcher:bytes_downloaded\", \"CC-MAIN-2017-30\"]\t270140671637973\n[\"crawl_status\", \"crawldb:size\", \"CC-MAIN-2017-30\"]\t13566579384\n[\"crawl_status\", \"crawldb:status:db_unfetched\", \"CC-MAIN-2017-30\"]\t2458901551\n[\"crawl_status\", \"crawldb:status:db_fetched\", \"CC-MAIN-2017-30\"]\t4666914757\n[\"crawl_status\", \"crawldb:status:db_gone\", \"CC-MAIN-2017-30\"]\t2945986722\n[\"crawl_status\", \"crawldb:status:db_redir_temp\", \"CC-MAIN-2017-30\"]\t208037879\n[\"crawl_status\", \"crawldb:status:db_redir_perm\", \"CC-MAIN-2017-30\"]\t817921816\n[\"crawl_status\", \"crawldb:status:db_notmodified\", \"CC-MAIN-2017-30\"]\t1204720136\n[\"crawl_status\", \"crawldb:status:db_duplicate\", \"CC-MAIN-2017-30\"]\t1264096523\n"
  },
  {
    "path": "stats/crawler/CC-MAIN-2017-34.json",
    "content": "[\"crawl_status\", \"generator:crawldb_size\", \"CC-MAIN-2017-34\"]\t14698581608\n[\"crawl_status\", \"generator:fetch_list\", \"CC-MAIN-2017-34\"]\t4228576525\n[\"crawl_status\", \"generator:selected:db_duplicate\", \"CC-MAIN-2017-34\"]\t22188071\n[\"crawl_status\", \"generator:selected:db_fetched\", \"CC-MAIN-2017-34\"]\t2596845574\n[\"crawl_status\", \"generator:selected:db_gone\", \"CC-MAIN-2017-34\"]\t1524419\n[\"crawl_status\", \"generator:selected:db_notmodified\", \"CC-MAIN-2017-34\"]\t61446965\n[\"crawl_status\", \"generator:selected:db_orphan\", \"CC-MAIN-2017-34\"]\t1133\n[\"crawl_status\", \"generator:selected:db_redir_perm\", \"CC-MAIN-2017-34\"]\t92487034\n[\"crawl_status\", \"generator:selected:db_redir_temp\", \"CC-MAIN-2017-34\"]\t64280317\n[\"crawl_status\", \"generator:selected:db_unfetched\", \"CC-MAIN-2017-34\"]\t1389803012\n[\"crawl_status\", \"generator:skipped_domains_overflow\", \"CC-MAIN-2017-34\"]\t748\n[\"crawl_status\", \"fetcher:total\", \"CC-MAIN-2017-34\"]\t4596143944\n[\"crawl_status\", \"fetcher:success\", \"CC-MAIN-2017-34\"]\t3311349890\n[\"crawl_status\", \"fetcher:notmodified\", \"CC-MAIN-2017-34\"]\t6511421\n[\"crawl_status\", \"fetcher:temp_moved\", \"CC-MAIN-2017-34\"]\t131876745\n[\"crawl_status\", \"fetcher:moved\", \"CC-MAIN-2017-34\"]\t266235187\n[\"crawl_status\", \"fetcher:notfound\", \"CC-MAIN-2017-34\"]\t66633426\n[\"crawl_status\", \"fetcher:access_denied\", \"CC-MAIN-2017-34\"]\t335874\n[\"crawl_status\", \"fetcher:gone\", \"CC-MAIN-2017-34\"]\t3289602\n[\"crawl_status\", \"fetcher:exception\", \"CC-MAIN-2017-34\"]\t252551428\n[\"crawl_status\", \"fetcher:robots_denied\", \"CC-MAIN-2017-34\"]\t77174541\n[\"crawl_status\", \"fetcher:filter_denied\", \"CC-MAIN-2017-34\"]\t47788\n[\"crawl_status\", \"fetcher:hitByThrougputThreshold\", \"CC-MAIN-2017-34\"]\t259391103\n[\"crawl_status\", \"fetcher:hitByTimeLimit\", \"CC-MAIN-2017-34\"]\t96158581\n[\"crawl_status\", 
\"fetcher:AboveExceptionThresholdInQueue\", \"CC-MAIN-2017-34\"]\t124588358\n[\"crawl_status\", \"fetcher:bytes_downloaded\", \"CC-MAIN-2017-34\"]\t310433133466170\n[\"crawl_status\", \"crawldb:size\", \"CC-MAIN-2017-34\"]\t14698581608\n[\"crawl_status\", \"crawldb:status:db_unfetched\", \"CC-MAIN-2017-34\"]\t3076043806\n[\"crawl_status\", \"crawldb:status:db_fetched\", \"CC-MAIN-2017-34\"]\t5006935549\n[\"crawl_status\", \"crawldb:status:db_gone\", \"CC-MAIN-2017-34\"]\t2236270221\n[\"crawl_status\", \"crawldb:status:db_redir_temp\", \"CC-MAIN-2017-34\"]\t260757633\n[\"crawl_status\", \"crawldb:status:db_redir_perm\", \"CC-MAIN-2017-34\"]\t1150539535\n[\"crawl_status\", \"crawldb:status:db_notmodified\", \"CC-MAIN-2017-34\"]\t990776773\n[\"crawl_status\", \"crawldb:status:db_duplicate\", \"CC-MAIN-2017-34\"]\t1339996022\n[\"crawl_status\", \"crawldb:status:db_orphan\", \"CC-MAIN-2017-34\"]\t637262069\n"
  },
  {
    "path": "stats/crawler/CC-MAIN-2017-39.json",
    "content": "[\"crawl_status\", \"generator:crawldb_size\", \"CC-MAIN-2017-39\"]\t14981165656\n[\"crawl_status\", \"generator:fetch_list\", \"CC-MAIN-2017-39\"]\t3951178480\n[\"crawl_status\", \"generator:selected:db_duplicate\", \"CC-MAIN-2017-39\"]\t23259501\n[\"crawl_status\", \"generator:selected:db_fetched\", \"CC-MAIN-2017-39\"]\t2207968561\n[\"crawl_status\", \"generator:selected:db_gone\", \"CC-MAIN-2017-39\"]\t7220704\n[\"crawl_status\", \"generator:selected:db_notmodified\", \"CC-MAIN-2017-39\"]\t224769215\n[\"crawl_status\", \"generator:selected:db_orphan\", \"CC-MAIN-2017-39\"]\t65\n[\"crawl_status\", \"generator:selected:db_redir_perm\", \"CC-MAIN-2017-39\"]\t175188791\n[\"crawl_status\", \"generator:selected:db_redir_temp\", \"CC-MAIN-2017-39\"]\t64413243\n[\"crawl_status\", \"generator:selected:db_unfetched\", \"CC-MAIN-2017-39\"]\t1248358400\n[\"crawl_status\", \"generator:skipped_domains_overflow\", \"CC-MAIN-2017-39\"]\t713\n[\"crawl_status\", \"fetcher:total\", \"CC-MAIN-2017-39\"]\t4587378749\n[\"crawl_status\", \"fetcher:success\", \"CC-MAIN-2017-39\"]\t3070502683\n[\"crawl_status\", \"fetcher:notmodified\", \"CC-MAIN-2017-39\"]\t48612783\n[\"crawl_status\", \"fetcher:temp_moved\", \"CC-MAIN-2017-39\"]\t172102105\n[\"crawl_status\", \"fetcher:moved\", \"CC-MAIN-2017-39\"]\t481857001\n[\"crawl_status\", \"fetcher:notfound\", \"CC-MAIN-2017-39\"]\t85752794\n[\"crawl_status\", \"fetcher:access_denied\", \"CC-MAIN-2017-39\"]\t553774\n[\"crawl_status\", \"fetcher:gone\", \"CC-MAIN-2017-39\"]\t5185927\n[\"crawl_status\", \"fetcher:exception\", \"CC-MAIN-2017-39\"]\t185502116\n[\"crawl_status\", \"fetcher:robots_denied\", \"CC-MAIN-2017-39\"]\t88762359\n[\"crawl_status\", \"fetcher:filter_denied\", \"CC-MAIN-2017-39\"]\t202418\n[\"crawl_status\", \"fetcher:hitByThrougputThreshold\", \"CC-MAIN-2017-39\"]\t271810221\n[\"crawl_status\", \"fetcher:hitByTimeLimit\", \"CC-MAIN-2017-39\"]\t62735738\n[\"crawl_status\", 
\"fetcher:AboveExceptionThresholdInQueue\", \"CC-MAIN-2017-39\"]\t113798830\n[\"crawl_status\", \"fetcher:bytes_downloaded\", \"CC-MAIN-2017-39\"]\t279341049655480\n[\"crawl_status\", \"crawldb:size\", \"CC-MAIN-2017-39\"]\t14981165656\n[\"crawl_status\", \"crawldb:status:db_unfetched\", \"CC-MAIN-2017-39\"]\t3036783816\n[\"crawl_status\", \"crawldb:status:db_fetched\", \"CC-MAIN-2017-39\"]\t5498973901\n[\"crawl_status\", \"crawldb:status:db_gone\", \"CC-MAIN-2017-39\"]\t2379462200\n[\"crawl_status\", \"crawldb:status:db_redir_temp\", \"CC-MAIN-2017-39\"]\t289206929\n[\"crawl_status\", \"crawldb:status:db_redir_perm\", \"CC-MAIN-2017-39\"]\t1270055417\n[\"crawl_status\", \"crawldb:status:db_notmodified\", \"CC-MAIN-2017-39\"]\t1077659650\n[\"crawl_status\", \"crawldb:status:db_duplicate\", \"CC-MAIN-2017-39\"]\t1428053290\n[\"crawl_status\", \"crawldb:status:db_orphan\", \"CC-MAIN-2017-39\"]\t970453\n"
  },
  {
    "path": "stats/crawler/CC-MAIN-2017-43.json",
    "content": "[\"crawl_status\", \"generator:crawldb_size\", \"CC-MAIN-2017-43\"]\t15959590811\n[\"crawl_status\", \"generator:fetch_list\", \"CC-MAIN-2017-43\"]\t4775053544\n[\"crawl_status\", \"generator:selected:db_duplicate\", \"CC-MAIN-2017-43\"]\t39152551\n[\"crawl_status\", \"generator:selected:db_fetched\", \"CC-MAIN-2017-43\"]\t2867690086\n[\"crawl_status\", \"generator:selected:db_gone\", \"CC-MAIN-2017-43\"]\t1734433\n[\"crawl_status\", \"generator:selected:db_notmodified\", \"CC-MAIN-2017-43\"]\t255938231\n[\"crawl_status\", \"generator:selected:db_orphan\", \"CC-MAIN-2017-43\"]\t34\n[\"crawl_status\", \"generator:selected:db_redir_perm\", \"CC-MAIN-2017-43\"]\t221851277\n[\"crawl_status\", \"generator:selected:db_redir_temp\", \"CC-MAIN-2017-43\"]\t105351637\n[\"crawl_status\", \"generator:selected:db_unfetched\", \"CC-MAIN-2017-43\"]\t1283335295\n[\"crawl_status\", \"generator:skipped_domains_overflow\", \"CC-MAIN-2017-43\"]\t724\n[\"crawl_status\", \"fetcher:total\", \"CC-MAIN-2017-43\"]\t5591606430\n[\"crawl_status\", \"fetcher:success\", \"CC-MAIN-2017-43\"]\t3712542097\n[\"crawl_status\", \"fetcher:notmodified\", \"CC-MAIN-2017-43\"]\t66501392\n[\"crawl_status\", \"fetcher:temp_moved\", \"CC-MAIN-2017-43\"]\t216668862\n[\"crawl_status\", \"fetcher:moved\", \"CC-MAIN-2017-43\"]\t620532043\n[\"crawl_status\", \"fetcher:notfound\", \"CC-MAIN-2017-43\"]\t107578277\n[\"crawl_status\", \"fetcher:access_denied\", \"CC-MAIN-2017-43\"]\t536119\n[\"crawl_status\", \"fetcher:gone\", \"CC-MAIN-2017-43\"]\t6014667\n[\"crawl_status\", \"fetcher:exception\", \"CC-MAIN-2017-43\"]\t238497356\n[\"crawl_status\", \"fetcher:robots_denied\", \"CC-MAIN-2017-43\"]\t91764179\n[\"crawl_status\", \"fetcher:filter_denied\", \"CC-MAIN-2017-43\"]\t341552\n[\"crawl_status\", \"fetcher:hitByThrougputThreshold\", \"CC-MAIN-2017-43\"]\t400141993\n[\"crawl_status\", \"fetcher:hitByTimeLimit\", \"CC-MAIN-2017-43\"]\t10036643\n[\"crawl_status\", 
\"fetcher:AboveExceptionThresholdInQueue\", \"CC-MAIN-2017-43\"]\t120451250\n[\"crawl_status\", \"fetcher:bytes_downloaded\", \"CC-MAIN-2017-43\"]\t348748095977586\n[\"crawl_status\", \"crawldb:size\", \"CC-MAIN-2017-43\"]\t15959590811\n[\"crawl_status\", \"crawldb:status:db_unfetched\", \"CC-MAIN-2017-43\"]\t3122841352\n[\"crawl_status\", \"crawldb:status:db_fetched\", \"CC-MAIN-2017-43\"]\t5971792808\n[\"crawl_status\", \"crawldb:status:db_gone\", \"CC-MAIN-2017-43\"]\t2492882625\n[\"crawl_status\", \"crawldb:status:db_redir_temp\", \"CC-MAIN-2017-43\"]\t328298718\n[\"crawl_status\", \"crawldb:status:db_redir_perm\", \"CC-MAIN-2017-43\"]\t1443098416\n[\"crawl_status\", \"crawldb:status:db_notmodified\", \"CC-MAIN-2017-43\"]\t1035904596\n[\"crawl_status\", \"crawldb:status:db_duplicate\", \"CC-MAIN-2017-43\"]\t1557355682\n[\"crawl_status\", \"crawldb:status:db_orphan\", \"CC-MAIN-2017-43\"]\t7416614\n"
  },
  {
    "path": "stats/crawler/CC-MAIN-2017-47.json",
    "content": "[\"crawl_status\", \"generator:crawldb_size\", \"CC-MAIN-2017-47\"]\t16756526195\n[\"crawl_status\", \"generator:fetch_list\", \"CC-MAIN-2017-47\"]\t4343750079\n[\"crawl_status\", \"generator:selected:db_duplicate\", \"CC-MAIN-2017-47\"]\t32173470\n[\"crawl_status\", \"generator:selected:db_fetched\", \"CC-MAIN-2017-47\"]\t2585622128\n[\"crawl_status\", \"generator:selected:db_gone\", \"CC-MAIN-2017-47\"]\t3257941\n[\"crawl_status\", \"generator:selected:db_notmodified\", \"CC-MAIN-2017-47\"]\t256707599\n[\"crawl_status\", \"generator:selected:db_orphan\", \"CC-MAIN-2017-47\"]\t43\n[\"crawl_status\", \"generator:selected:db_redir_perm\", \"CC-MAIN-2017-47\"]\t173986929\n[\"crawl_status\", \"generator:selected:db_redir_temp\", \"CC-MAIN-2017-47\"]\t90683456\n[\"crawl_status\", \"generator:selected:db_unfetched\", \"CC-MAIN-2017-47\"]\t1201318513\n[\"crawl_status\", \"generator:skipped_domains_overflow\", \"CC-MAIN-2017-47\"]\t864\n[\"crawl_status\", \"fetcher:total\", \"CC-MAIN-2017-47\"]\t5010042149\n[\"crawl_status\", \"fetcher:success\", \"CC-MAIN-2017-47\"]\t3252728548\n[\"crawl_status\", \"fetcher:notmodified\", \"CC-MAIN-2017-47\"]\t62082353\n[\"crawl_status\", \"fetcher:temp_moved\", \"CC-MAIN-2017-47\"]\t177391378\n[\"crawl_status\", \"fetcher:moved\", \"CC-MAIN-2017-47\"]\t508693458\n[\"crawl_status\", \"fetcher:notfound\", \"CC-MAIN-2017-47\"]\t87868459\n[\"crawl_status\", \"fetcher:access_denied\", \"CC-MAIN-2017-47\"]\t702645\n[\"crawl_status\", \"fetcher:gone\", \"CC-MAIN-2017-47\"]\t5193453\n[\"crawl_status\", \"fetcher:exception\", \"CC-MAIN-2017-47\"]\t287350638\n[\"crawl_status\", \"fetcher:robots_denied\", \"CC-MAIN-2017-47\"]\t85282128\n[\"crawl_status\", \"fetcher:filter_denied\", \"CC-MAIN-2017-47\"]\t8637220\n[\"crawl_status\", \"fetcher:hitByThrougputThreshold\", \"CC-MAIN-2017-47\"]\t402820882\n[\"crawl_status\", \"fetcher:hitByTimeLimit\", \"CC-MAIN-2017-47\"]\t10562723\n[\"crawl_status\", 
\"fetcher:AboveExceptionThresholdInQueue\", \"CC-MAIN-2017-47\"]\t120728264\n[\"crawl_status\", \"fetcher:bytes_downloaded\", \"CC-MAIN-2017-47\"]\t287343034723371\n[\"crawl_status\", \"crawldb:size\", \"CC-MAIN-2017-47\"]\t16756526195\n[\"crawl_status\", \"crawldb:status:db_unfetched\", \"CC-MAIN-2017-47\"]\t3023484693\n[\"crawl_status\", \"crawldb:status:db_fetched\", \"CC-MAIN-2017-47\"]\t6367094529\n[\"crawl_status\", \"crawldb:status:db_gone\", \"CC-MAIN-2017-47\"]\t2642912081\n[\"crawl_status\", \"crawldb:status:db_redir_temp\", \"CC-MAIN-2017-47\"]\t364184547\n[\"crawl_status\", \"crawldb:status:db_redir_perm\", \"CC-MAIN-2017-47\"]\t1677626597\n[\"crawl_status\", \"crawldb:status:db_notmodified\", \"CC-MAIN-2017-47\"]\t979294749\n[\"crawl_status\", \"crawldb:status:db_duplicate\", \"CC-MAIN-2017-47\"]\t1698798693\n[\"crawl_status\", \"crawldb:status:db_orphan\", \"CC-MAIN-2017-47\"]\t3130306\n"
  },
  {
    "path": "stats/crawler/CC-MAIN-2017-51.json",
    "content": "[\"crawl_status\", \"generator:crawldb_size\", \"CC-MAIN-2017-51\"]\t17390543871\n[\"crawl_status\", \"generator:fetch_list\", \"CC-MAIN-2017-51\"]\t3809408512\n[\"crawl_status\", \"generator:selected:db_duplicate\", \"CC-MAIN-2017-51\"]\t5949427\n[\"crawl_status\", \"generator:selected:db_fetched\", \"CC-MAIN-2017-51\"]\t2729333867\n[\"crawl_status\", \"generator:selected:db_gone\", \"CC-MAIN-2017-51\"]\t103773\n[\"crawl_status\", \"generator:selected:db_notmodified\", \"CC-MAIN-2017-51\"]\t34725019\n[\"crawl_status\", \"generator:selected:db_orphan\", \"CC-MAIN-2017-51\"]\t182\n[\"crawl_status\", \"generator:selected:db_redir_perm\", \"CC-MAIN-2017-51\"]\t71007198\n[\"crawl_status\", \"generator:selected:db_redir_temp\", \"CC-MAIN-2017-51\"]\t29927486\n[\"crawl_status\", \"generator:selected:db_unfetched\", \"CC-MAIN-2017-51\"]\t938361560\n[\"crawl_status\", \"generator:skipped_domains_overflow\", \"CC-MAIN-2017-51\"]\t796\n[\"crawl_status\", \"fetcher:total\", \"CC-MAIN-2017-51\"]\t4168517598\n[\"crawl_status\", \"fetcher:success\", \"CC-MAIN-2017-51\"]\t2944314545\n[\"crawl_status\", \"fetcher:notmodified\", \"CC-MAIN-2017-51\"]\t79404292\n[\"crawl_status\", \"fetcher:temp_moved\", \"CC-MAIN-2017-51\"]\t94957871\n[\"crawl_status\", \"fetcher:moved\", \"CC-MAIN-2017-51\"]\t276852486\n[\"crawl_status\", \"fetcher:notfound\", \"CC-MAIN-2017-51\"]\t54447385\n[\"crawl_status\", \"fetcher:access_denied\", \"CC-MAIN-2017-51\"]\t383881\n[\"crawl_status\", \"fetcher:gone\", \"CC-MAIN-2017-51\"]\t3462996\n[\"crawl_status\", \"fetcher:exception\", \"CC-MAIN-2017-51\"]\t174768584\n[\"crawl_status\", \"fetcher:robots_denied\", \"CC-MAIN-2017-51\"]\t56023764\n[\"crawl_status\", \"fetcher:filter_denied\", \"CC-MAIN-2017-51\"]\t5829268\n[\"crawl_status\", \"fetcher:hitByThrougputThreshold\", \"CC-MAIN-2017-51\"]\t337477499\n[\"crawl_status\", \"fetcher:hitByTimeLimit\", \"CC-MAIN-2017-51\"]\t26504855\n[\"crawl_status\", 
\"fetcher:AboveExceptionThresholdInQueue\", \"CC-MAIN-2017-51\"]\t114090172\n[\"crawl_status\", \"fetcher:bytes_downloaded\", \"CC-MAIN-2017-51\"]\t269133016575671\n[\"crawl_status\", \"crawldb:size\", \"CC-MAIN-2017-51\"]\t17390543871\n[\"crawl_status\", \"crawldb:status:db_unfetched\", \"CC-MAIN-2017-51\"]\t2823422683\n[\"crawl_status\", \"crawldb:status:db_fetched\", \"CC-MAIN-2017-51\"]\t6620604422\n[\"crawl_status\", \"crawldb:status:db_gone\", \"CC-MAIN-2017-51\"]\t474509164\n[\"crawl_status\", \"crawldb:status:db_redir_temp\", \"CC-MAIN-2017-51\"]\t394068005\n[\"crawl_status\", \"crawldb:status:db_redir_perm\", \"CC-MAIN-2017-51\"]\t1892585141\n[\"crawl_status\", \"crawldb:status:db_notmodified\", \"CC-MAIN-2017-51\"]\t972078034\n[\"crawl_status\", \"crawldb:status:db_duplicate\", \"CC-MAIN-2017-51\"]\t500992703\n[\"crawl_status\", \"crawldb:status:db_orphan\", \"CC-MAIN-2017-51\"]\t3712283719\n"
  },
  {
    "path": "stats/crawler/CC-MAIN-2018-05.json",
    "content": "[\"crawl_status\", \"generator:crawldb_size\", \"CC-MAIN-2018-05\"]\t14985445343\n[\"crawl_status\", \"generator:fetch_list\", \"CC-MAIN-2018-05\"]\t4732788935\n[\"crawl_status\", \"generator:selected:db_duplicate\", \"CC-MAIN-2018-05\"]\t4929024\n[\"crawl_status\", \"generator:selected:db_fetched\", \"CC-MAIN-2018-05\"]\t2370015735\n[\"crawl_status\", \"generator:selected:db_gone\", \"CC-MAIN-2018-05\"]\t72263\n[\"crawl_status\", \"generator:selected:db_notmodified\", \"CC-MAIN-2018-05\"]\t255381651\n[\"crawl_status\", \"generator:selected:db_orphan\", \"CC-MAIN-2018-05\"]\t202\n[\"crawl_status\", \"generator:selected:db_redir_perm\", \"CC-MAIN-2018-05\"]\t398344669\n[\"crawl_status\", \"generator:selected:db_redir_temp\", \"CC-MAIN-2018-05\"]\t85514344\n[\"crawl_status\", \"generator:selected:db_unfetched\", \"CC-MAIN-2018-05\"]\t1618531047\n[\"crawl_status\", \"generator:skipped_domains_overflow\", \"CC-MAIN-2018-05\"]\t786\n[\"crawl_status\", \"fetcher:total\", \"CC-MAIN-2018-05\"]\t5555368862\n[\"crawl_status\", \"fetcher:success\", \"CC-MAIN-2018-05\"]\t3539656618\n[\"crawl_status\", \"fetcher:notmodified\", \"CC-MAIN-2018-05\"]\t57260633\n[\"crawl_status\", \"fetcher:temp_moved\", \"CC-MAIN-2018-05\"]\t194114941\n[\"crawl_status\", \"fetcher:moved\", \"CC-MAIN-2018-05\"]\t647907171\n[\"crawl_status\", \"fetcher:notfound\", \"CC-MAIN-2018-05\"]\t137014171\n[\"crawl_status\", \"fetcher:access_denied\", \"CC-MAIN-2018-05\"]\t1028950\n[\"crawl_status\", \"fetcher:gone\", \"CC-MAIN-2018-05\"]\t7112642\n[\"crawl_status\", \"fetcher:exception\", \"CC-MAIN-2018-05\"]\t297621012\n[\"crawl_status\", \"fetcher:robots_denied\", \"CC-MAIN-2018-05\"]\t106953112\n[\"crawl_status\", \"fetcher:filter_denied\", \"CC-MAIN-2018-05\"]\t4724008\n[\"crawl_status\", \"fetcher:hitByThrougputThreshold\", \"CC-MAIN-2018-05\"]\t306367202\n[\"crawl_status\", \"fetcher:hitByTimeLimit\", \"CC-MAIN-2018-05\"]\t136113281\n[\"crawl_status\", 
\"fetcher:AboveExceptionThresholdInQueue\", \"CC-MAIN-2018-05\"]\t119495121\n[\"crawl_status\", \"fetcher:bytes_downloaded\", \"CC-MAIN-2018-05\"]\t298385074636475\n[\"crawl_status\", \"crawldb:size\", \"CC-MAIN-2018-05\"]\t14985445343\n[\"crawl_status\", \"crawldb:status:db_unfetched\", \"CC-MAIN-2018-05\"]\t3530830470\n[\"crawl_status\", \"crawldb:status:db_fetched\", \"CC-MAIN-2018-05\"]\t6680509983\n[\"crawl_status\", \"crawldb:status:db_gone\", \"CC-MAIN-2018-05\"]\t383010192\n[\"crawl_status\", \"crawldb:status:db_redir_temp\", \"CC-MAIN-2018-05\"]\t423180270\n[\"crawl_status\", \"crawldb:status:db_redir_perm\", \"CC-MAIN-2018-05\"]\t2027169812\n[\"crawl_status\", \"crawldb:status:db_notmodified\", \"CC-MAIN-2018-05\"]\t1141286075\n[\"crawl_status\", \"crawldb:status:db_duplicate\", \"CC-MAIN-2018-05\"]\t464213456\n[\"crawl_status\", \"crawldb:status:db_orphan\", \"CC-MAIN-2018-05\"]\t335245085\n"
  },
  {
    "path": "stats/crawler/CC-MAIN-2018-09.json",
    "content": "[\"crawl_status\", \"generator:crawldb_size\", \"CC-MAIN-2018-09\"]\t15702763091\n[\"crawl_status\", \"generator:fetch_list\", \"CC-MAIN-2018-09\"]\t4629848076\n[\"crawl_status\", \"generator:selected:db_duplicate\", \"CC-MAIN-2018-09\"]\t29407204\n[\"crawl_status\", \"generator:selected:db_fetched\", \"CC-MAIN-2018-09\"]\t2714848619\n[\"crawl_status\", \"generator:selected:db_gone\", \"CC-MAIN-2018-09\"]\t7571398\n[\"crawl_status\", \"generator:selected:db_notmodified\", \"CC-MAIN-2018-09\"]\t218794961\n[\"crawl_status\", \"generator:selected:db_orphan\", \"CC-MAIN-2018-09\"]\t865133\n[\"crawl_status\", \"generator:selected:db_redir_perm\", \"CC-MAIN-2018-09\"]\t12656244\n[\"crawl_status\", \"generator:selected:db_redir_temp\", \"CC-MAIN-2018-09\"]\t26145936\n[\"crawl_status\", \"generator:selected:db_unfetched\", \"CC-MAIN-2018-09\"]\t1619558581\n[\"crawl_status\", \"generator:skipped_domains_overflow\", \"CC-MAIN-2018-09\"]\t712\n[\"crawl_status\", \"fetcher:total\", \"CC-MAIN-2018-09\"]\t5049116155\n[\"crawl_status\", \"fetcher:success\", \"CC-MAIN-2018-09\"]\t3537023788\n[\"crawl_status\", \"fetcher:notmodified\", \"CC-MAIN-2018-09\"]\t81979040\n[\"crawl_status\", \"fetcher:temp_moved\", \"CC-MAIN-2018-09\"]\t149299992\n[\"crawl_status\", \"fetcher:moved\", \"CC-MAIN-2018-09\"]\t288513288\n[\"crawl_status\", \"fetcher:notfound\", \"CC-MAIN-2018-09\"]\t91033027\n[\"crawl_status\", \"fetcher:access_denied\", \"CC-MAIN-2018-09\"]\t636989\n[\"crawl_status\", \"fetcher:gone\", \"CC-MAIN-2018-09\"]\t5999359\n[\"crawl_status\", \"fetcher:exception\", \"CC-MAIN-2018-09\"]\t353538286\n[\"crawl_status\", \"fetcher:robots_denied\", \"CC-MAIN-2018-09\"]\t66302608\n[\"crawl_status\", \"fetcher:filter_denied\", \"CC-MAIN-2018-09\"]\t1402868\n[\"crawl_status\", \"fetcher:hitByThrougputThreshold\", \"CC-MAIN-2018-09\"]\t373773900\n[\"crawl_status\", \"fetcher:hitByTimeLimit\", \"CC-MAIN-2018-09\"]\t35127662\n[\"crawl_status\", 
\"fetcher:AboveExceptionThresholdInQueue\", \"CC-MAIN-2018-09\"]\t64485348\n[\"crawl_status\", \"fetcher:bytes_downloaded\", \"CC-MAIN-2018-09\"]\t300536226999345\n[\"crawl_status\", \"crawldb:size\", \"CC-MAIN-2018-09\"]\t15702763091\n[\"crawl_status\", \"crawldb:status:db_unfetched\", \"CC-MAIN-2018-09\"]\t3375900564\n[\"crawl_status\", \"crawldb:status:db_fetched\", \"CC-MAIN-2018-09\"]\t7383766566\n[\"crawl_status\", \"crawldb:status:db_gone\", \"CC-MAIN-2018-09\"]\t312579144\n[\"crawl_status\", \"crawldb:status:db_redir_temp\", \"CC-MAIN-2018-09\"]\t122260941\n[\"crawl_status\", \"crawldb:status:db_redir_perm\", \"CC-MAIN-2018-09\"]\t268322325\n[\"crawl_status\", \"crawldb:status:db_notmodified\", \"CC-MAIN-2018-09\"]\t1162096276\n[\"crawl_status\", \"crawldb:status:db_duplicate\", \"CC-MAIN-2018-09\"]\t412199050\n[\"crawl_status\", \"crawldb:status:db_orphan\", \"CC-MAIN-2018-09\"]\t2665638225\n"
  },
  {
    "path": "stats/crawler/CC-MAIN-2018-13.json",
    "content": "[\"crawl_status\", \"generator:crawldb_size\", \"CC-MAIN-2018-13\"]\t13830972570\n[\"crawl_status\", \"generator:fetch_list\", \"CC-MAIN-2018-13\"]\t4297718457\n[\"crawl_status\", \"generator:selected:db_duplicate\", \"CC-MAIN-2018-13\"]\t68959878\n[\"crawl_status\", \"generator:selected:db_fetched\", \"CC-MAIN-2018-13\"]\t2666733933\n[\"crawl_status\", \"generator:selected:db_gone\", \"CC-MAIN-2018-13\"]\t14180528\n[\"crawl_status\", \"generator:selected:db_notmodified\", \"CC-MAIN-2018-13\"]\t307760844\n[\"crawl_status\", \"generator:selected:db_orphan\", \"CC-MAIN-2018-13\"]\t41358\n[\"crawl_status\", \"generator:selected:db_redir_perm\", \"CC-MAIN-2018-13\"]\t74011305\n[\"crawl_status\", \"generator:selected:db_redir_temp\", \"CC-MAIN-2018-13\"]\t32047111\n[\"crawl_status\", \"generator:selected:db_unfetched\", \"CC-MAIN-2018-13\"]\t1133983500\n[\"crawl_status\", \"generator:skipped_domains_overflow\", \"CC-MAIN-2018-13\"]\t723\n[\"crawl_status\", \"fetcher:total\", \"CC-MAIN-2018-13\"]\t4782794000\n[\"crawl_status\", \"fetcher:success\", \"CC-MAIN-2018-13\"]\t3285419961\n[\"crawl_status\", \"fetcher:notmodified\", \"CC-MAIN-2018-13\"]\t111508186\n[\"crawl_status\", \"fetcher:temp_moved\", \"CC-MAIN-2018-13\"]\t139828371\n[\"crawl_status\", \"fetcher:moved\", \"CC-MAIN-2018-13\"]\t357078563\n[\"crawl_status\", \"fetcher:notfound\", \"CC-MAIN-2018-13\"]\t87237419\n[\"crawl_status\", \"fetcher:access_denied\", \"CC-MAIN-2018-13\"]\t980289\n[\"crawl_status\", \"fetcher:gone\", \"CC-MAIN-2018-13\"]\t9812406\n[\"crawl_status\", \"fetcher:exception\", \"CC-MAIN-2018-13\"]\t277946089\n[\"crawl_status\", \"fetcher:robots_denied\", \"CC-MAIN-2018-13\"]\t63489021\n[\"crawl_status\", \"fetcher:filter_denied\", \"CC-MAIN-2018-13\"]\t2516967\n[\"crawl_status\", \"fetcher:hitByThrougputThreshold\", \"CC-MAIN-2018-13\"]\t368015977\n[\"crawl_status\", \"fetcher:hitByTimeLimit\", \"CC-MAIN-2018-13\"]\t8230413\n[\"crawl_status\", 
\"fetcher:AboveExceptionThresholdInQueue\", \"CC-MAIN-2018-13\"]\t70730338\n[\"crawl_status\", \"fetcher:bytes_downloaded\", \"CC-MAIN-2018-13\"]\t284337695637620\n[\"crawl_status\", \"crawldb:size\", \"CC-MAIN-2018-13\"]\t13830972570\n[\"crawl_status\", \"crawldb:status:db_unfetched\", \"CC-MAIN-2018-13\"]\t3001227883\n[\"crawl_status\", \"crawldb:status:db_fetched\", \"CC-MAIN-2018-13\"]\t7895148123\n[\"crawl_status\", \"crawldb:status:db_gone\", \"CC-MAIN-2018-13\"]\t365571188\n[\"crawl_status\", \"crawldb:status:db_redir_temp\", \"CC-MAIN-2018-13\"]\t154234976\n[\"crawl_status\", \"crawldb:status:db_redir_perm\", \"CC-MAIN-2018-13\"]\t348846564\n[\"crawl_status\", \"crawldb:status:db_notmodified\", \"CC-MAIN-2018-13\"]\t1199871167\n[\"crawl_status\", \"crawldb:status:db_duplicate\", \"CC-MAIN-2018-13\"]\t481114057\n[\"crawl_status\", \"crawldb:status:db_orphan\", \"CC-MAIN-2018-13\"]\t384958612\n"
  },
  {
    "path": "stats/crawler/CC-MAIN-2018-17.json",
    "content": "[\"crawl_status\", \"generator:crawldb_size\", \"CC-MAIN-2018-17\"]\t14071100780\n[\"crawl_status\", \"generator:fetch_list\", \"CC-MAIN-2018-17\"]\t4173609779\n[\"crawl_status\", \"generator:selected:db_duplicate\", \"CC-MAIN-2018-17\"]\t37175943\n[\"crawl_status\", \"generator:selected:db_fetched\", \"CC-MAIN-2018-17\"]\t2829798545\n[\"crawl_status\", \"generator:selected:db_gone\", \"CC-MAIN-2018-17\"]\t17359610\n[\"crawl_status\", \"generator:selected:db_notmodified\", \"CC-MAIN-2018-17\"]\t206850116\n[\"crawl_status\", \"generator:selected:db_orphan\", \"CC-MAIN-2018-17\"]\t37206\n[\"crawl_status\", \"generator:selected:db_redir_perm\", \"CC-MAIN-2018-17\"]\t27323828\n[\"crawl_status\", \"generator:selected:db_redir_temp\", \"CC-MAIN-2018-17\"]\t17589204\n[\"crawl_status\", \"generator:selected:db_unfetched\", \"CC-MAIN-2018-17\"]\t1037475327\n[\"crawl_status\", \"generator:skipped_domains_overflow\", \"CC-MAIN-2018-17\"]\t699\n[\"crawl_status\", \"fetcher:total\", \"CC-MAIN-2018-17\"]\t4547550846\n[\"crawl_status\", \"fetcher:success\", \"CC-MAIN-2018-17\"]\t3144252077\n[\"crawl_status\", \"fetcher:notmodified\", \"CC-MAIN-2018-17\"]\t100902383\n[\"crawl_status\", \"fetcher:temp_moved\", \"CC-MAIN-2018-17\"]\t105141991\n[\"crawl_status\", \"fetcher:moved\", \"CC-MAIN-2018-17\"]\t277830711\n[\"crawl_status\", \"fetcher:notfound\", \"CC-MAIN-2018-17\"]\t72302567\n[\"crawl_status\", \"fetcher:access_denied\", \"CC-MAIN-2018-17\"]\t1058355\n[\"crawl_status\", \"fetcher:gone\", \"CC-MAIN-2018-17\"]\t4052303\n[\"crawl_status\", \"fetcher:exception\", \"CC-MAIN-2018-17\"]\t344641596\n[\"crawl_status\", \"fetcher:robots_denied\", \"CC-MAIN-2018-17\"]\t57180569\n[\"crawl_status\", \"fetcher:filter_denied\", \"CC-MAIN-2018-17\"]\t2020822\n[\"crawl_status\", \"fetcher:hitByThrougputThreshold\", \"CC-MAIN-2018-17\"]\t294609224\n[\"crawl_status\", \"fetcher:hitByTimeLimit\", \"CC-MAIN-2018-17\"]\t76724326\n[\"crawl_status\", 
\"fetcher:AboveExceptionThresholdInQueue\", \"CC-MAIN-2018-17\"]\t66833922\n[\"crawl_status\", \"fetcher:bytes_downloaded\", \"CC-MAIN-2018-17\"]\t253987501232646\n[\"crawl_status\", \"crawldb:size\", \"CC-MAIN-2018-17\"]\t14071100780\n[\"crawl_status\", \"crawldb:status:db_unfetched\", \"CC-MAIN-2018-17\"]\t2970644985\n[\"crawl_status\", \"crawldb:status:db_fetched\", \"CC-MAIN-2018-17\"]\t8114915537\n[\"crawl_status\", \"crawldb:status:db_gone\", \"CC-MAIN-2018-17\"]\t362439633\n[\"crawl_status\", \"crawldb:status:db_redir_temp\", \"CC-MAIN-2018-17\"]\t135744114\n[\"crawl_status\", \"crawldb:status:db_redir_perm\", \"CC-MAIN-2018-17\"]\t301467764\n[\"crawl_status\", \"crawldb:status:db_notmodified\", \"CC-MAIN-2018-17\"]\t1206453159\n[\"crawl_status\", \"crawldb:status:db_duplicate\", \"CC-MAIN-2018-17\"]\t481125718\n[\"crawl_status\", \"crawldb:status:db_orphan\", \"CC-MAIN-2018-17\"]\t498309870\n"
  },
  {
    "path": "stats/crawler/CC-MAIN-2018-22.json",
    "content": "[\"crawl_status\", \"generator:crawldb_size\", \"CC-MAIN-2018-22\"]\t14293230909\n[\"crawl_status\", \"generator:fetch_list\", \"CC-MAIN-2018-22\"]\t3917155993\n[\"crawl_status\", \"generator:selected:db_duplicate\", \"CC-MAIN-2018-22\"]\t32465315\n[\"crawl_status\", \"generator:selected:db_fetched\", \"CC-MAIN-2018-22\"]\t2530328991\n[\"crawl_status\", \"generator:selected:db_gone\", \"CC-MAIN-2018-22\"]\t6523309\n[\"crawl_status\", \"generator:selected:db_notmodified\", \"CC-MAIN-2018-22\"]\t159576729\n[\"crawl_status\", \"generator:selected:db_orphan\", \"CC-MAIN-2018-22\"]\t27838\n[\"crawl_status\", \"generator:selected:db_redir_perm\", \"CC-MAIN-2018-22\"]\t11977848\n[\"crawl_status\", \"generator:selected:db_redir_temp\", \"CC-MAIN-2018-22\"]\t33985121\n[\"crawl_status\", \"generator:selected:db_unfetched\", \"CC-MAIN-2018-22\"]\t1142270842\n[\"crawl_status\", \"generator:skipped_domains_overflow\", \"CC-MAIN-2018-22\"]\t743\n[\"crawl_status\", \"fetcher:total\", \"CC-MAIN-2018-22\"]\t4298275561\n[\"crawl_status\", \"fetcher:success\", \"CC-MAIN-2018-22\"]\t2840416631\n[\"crawl_status\", \"fetcher:notmodified\", \"CC-MAIN-2018-22\"]\t108799877\n[\"crawl_status\", \"fetcher:temp_moved\", \"CC-MAIN-2018-22\"]\t135203413\n[\"crawl_status\", \"fetcher:moved\", \"CC-MAIN-2018-22\"]\t257427577\n[\"crawl_status\", \"fetcher:notfound\", \"CC-MAIN-2018-22\"]\t81534904\n[\"crawl_status\", \"fetcher:access_denied\", \"CC-MAIN-2018-22\"]\t976814\n[\"crawl_status\", \"fetcher:gone\", \"CC-MAIN-2018-22\"]\t3808524\n[\"crawl_status\", \"fetcher:exception\", \"CC-MAIN-2018-22\"]\t385275581\n[\"crawl_status\", \"fetcher:robots_denied\", \"CC-MAIN-2018-22\"]\t59583279\n[\"crawl_status\", \"fetcher:filter_denied\", \"CC-MAIN-2018-22\"]\t9479707\n[\"crawl_status\", \"fetcher:hitByThrougputThreshold\", \"CC-MAIN-2018-22\"]\t352030428\n[\"crawl_status\", \"fetcher:hitByTimeLimit\", \"CC-MAIN-2018-22\"]\t8512144\n[\"crawl_status\", 
\"fetcher:AboveExceptionThresholdInQueue\", \"CC-MAIN-2018-22\"]\t55226682\n[\"crawl_status\", \"fetcher:bytes_downloaded\", \"CC-MAIN-2018-22\"]\t239126191264461\n[\"crawl_status\", \"crawldb:size\", \"CC-MAIN-2018-22\"]\t14293230909\n[\"crawl_status\", \"crawldb:status:db_unfetched\", \"CC-MAIN-2018-22\"]\t3177942882\n[\"crawl_status\", \"crawldb:status:db_fetched\", \"CC-MAIN-2018-22\"]\t8103351816\n[\"crawl_status\", \"crawldb:status:db_gone\", \"CC-MAIN-2018-22\"]\t299583913\n[\"crawl_status\", \"crawldb:status:db_redir_temp\", \"CC-MAIN-2018-22\"]\t141267298\n[\"crawl_status\", \"crawldb:status:db_redir_perm\", \"CC-MAIN-2018-22\"]\t326809247\n[\"crawl_status\", \"crawldb:status:db_notmodified\", \"CC-MAIN-2018-22\"]\t1334180288\n[\"crawl_status\", \"crawldb:status:db_duplicate\", \"CC-MAIN-2018-22\"]\t432254606\n[\"crawl_status\", \"crawldb:status:db_orphan\", \"CC-MAIN-2018-22\"]\t477840859\n"
  },
  {
    "path": "stats/crawler/CC-MAIN-2018-26.json",
    "content": "[\"crawl_status\", \"generator:crawldb_size\", \"CC-MAIN-2018-26\"]\t14114634413\n[\"crawl_status\", \"generator:fetch_list\", \"CC-MAIN-2018-26\"]\t4008025120\n[\"crawl_status\", \"generator:selected:db_duplicate\", \"CC-MAIN-2018-26\"]\t32391310\n[\"crawl_status\", \"generator:selected:db_fetched\", \"CC-MAIN-2018-26\"]\t2682351796\n[\"crawl_status\", \"generator:selected:db_gone\", \"CC-MAIN-2018-26\"]\t11193645\n[\"crawl_status\", \"generator:selected:db_notmodified\", \"CC-MAIN-2018-26\"]\t247817992\n[\"crawl_status\", \"generator:selected:db_orphan\", \"CC-MAIN-2018-26\"]\t243937\n[\"crawl_status\", \"generator:selected:db_redir_perm\", \"CC-MAIN-2018-26\"]\t18750526\n[\"crawl_status\", \"generator:selected:db_redir_temp\", \"CC-MAIN-2018-26\"]\t28346965\n[\"crawl_status\", \"generator:selected:db_unfetched\", \"CC-MAIN-2018-26\"]\t986928949\n[\"crawl_status\", \"generator:skipped_domains_overflow\", \"CC-MAIN-2018-26\"]\t546\n[\"crawl_status\", \"fetcher:total\", \"CC-MAIN-2018-26\"]\t4414244040\n[\"crawl_status\", \"fetcher:success\", \"CC-MAIN-2018-26\"]\t3113935691\n[\"crawl_status\", \"fetcher:notmodified\", \"CC-MAIN-2018-26\"]\t103681263\n[\"crawl_status\", \"fetcher:temp_moved\", \"CC-MAIN-2018-26\"]\t144538017\n[\"crawl_status\", \"fetcher:moved\", \"CC-MAIN-2018-26\"]\t272764837\n[\"crawl_status\", \"fetcher:notfound\", \"CC-MAIN-2018-26\"]\t87784880\n[\"crawl_status\", \"fetcher:access_denied\", \"CC-MAIN-2018-26\"]\t735848\n[\"crawl_status\", \"fetcher:gone\", \"CC-MAIN-2018-26\"]\t3485928\n[\"crawl_status\", \"fetcher:exception\", \"CC-MAIN-2018-26\"]\t362210741\n[\"crawl_status\", \"fetcher:robots_denied\", \"CC-MAIN-2018-26\"]\t59362986\n[\"crawl_status\", \"fetcher:hitByThrougputThreshold\", \"CC-MAIN-2018-26\"]\t224376999\n[\"crawl_status\", \"fetcher:hitByTimeLimit\", \"CC-MAIN-2018-26\"]\t11492148\n[\"crawl_status\", \"fetcher:AboveExceptionThresholdInQueue\", \"CC-MAIN-2018-26\"]\t29874702\n[\"crawl_status\", 
\"fetcher:bytes_downloaded\", \"CC-MAIN-2018-26\"]\t258520269206734\n[\"crawl_status\", \"crawldb:size\", \"CC-MAIN-2018-26\"]\t14114634413\n[\"crawl_status\", \"crawldb:status:db_unfetched\", \"CC-MAIN-2018-26\"]\t1733783856\n[\"crawl_status\", \"crawldb:status:db_fetched\", \"CC-MAIN-2018-26\"]\t7339361811\n[\"crawl_status\", \"crawldb:status:db_gone\", \"CC-MAIN-2018-26\"]\t293483951\n[\"crawl_status\", \"crawldb:status:db_redir_temp\", \"CC-MAIN-2018-26\"]\t153405416\n[\"crawl_status\", \"crawldb:status:db_redir_perm\", \"CC-MAIN-2018-26\"]\t374247837\n[\"crawl_status\", \"crawldb:status:db_notmodified\", \"CC-MAIN-2018-26\"]\t1349447758\n[\"crawl_status\", \"crawldb:status:db_duplicate\", \"CC-MAIN-2018-26\"]\t423459632\n[\"crawl_status\", \"crawldb:status:db_orphan\", \"CC-MAIN-2018-26\"]\t2447444152\n"
  },
  {
    "path": "stats/crawler/CC-MAIN-2018-30.json",
    "content": "[\"crawl_status\", \"generator:crawldb_size\", \"CC-MAIN-2018-30\"]\t12336785966\n[\"crawl_status\", \"generator:fetch_list\", \"CC-MAIN-2018-30\"]\t4272792338\n[\"crawl_status\", \"generator:selected:db_duplicate\", \"CC-MAIN-2018-30\"]\t31525933\n[\"crawl_status\", \"generator:selected:db_fetched\", \"CC-MAIN-2018-30\"]\t2764181054\n[\"crawl_status\", \"generator:selected:db_gone\", \"CC-MAIN-2018-30\"]\t9295209\n[\"crawl_status\", \"generator:selected:db_notmodified\", \"CC-MAIN-2018-30\"]\t249537428\n[\"crawl_status\", \"generator:selected:db_orphan\", \"CC-MAIN-2018-30\"]\t278443\n[\"crawl_status\", \"generator:selected:db_redir_perm\", \"CC-MAIN-2018-30\"]\t78763744\n[\"crawl_status\", \"generator:selected:db_redir_temp\", \"CC-MAIN-2018-30\"]\t40791189\n[\"crawl_status\", \"generator:selected:db_unfetched\", \"CC-MAIN-2018-30\"]\t1098419338\n[\"crawl_status\", \"generator:skipped_domains_overflow\", \"CC-MAIN-2018-30\"]\t399\n[\"crawl_status\", \"fetcher:total\", \"CC-MAIN-2018-30\"]\t4804044753\n[\"crawl_status\", \"fetcher:success\", \"CC-MAIN-2018-30\"]\t3318163845\n[\"crawl_status\", \"fetcher:notmodified\", \"CC-MAIN-2018-30\"]\t99627702\n[\"crawl_status\", \"fetcher:temp_moved\", \"CC-MAIN-2018-30\"]\t182144927\n[\"crawl_status\", \"fetcher:moved\", \"CC-MAIN-2018-30\"]\t364496458\n[\"crawl_status\", \"fetcher:notfound\", \"CC-MAIN-2018-30\"]\t113435536\n[\"crawl_status\", \"fetcher:access_denied\", \"CC-MAIN-2018-30\"]\t917048\n[\"crawl_status\", \"fetcher:gone\", \"CC-MAIN-2018-30\"]\t4246537\n[\"crawl_status\", \"fetcher:exception\", \"CC-MAIN-2018-30\"]\t409227586\n[\"crawl_status\", \"fetcher:robots_denied\", \"CC-MAIN-2018-30\"]\t67774292\n[\"crawl_status\", \"fetcher:filter_denied\", \"CC-MAIN-2018-30\"]\t56584\n[\"crawl_status\", \"fetcher:hitByThrougputThreshold\", \"CC-MAIN-2018-30\"]\t210341792\n[\"crawl_status\", \"fetcher:hitByTimeLimit\", \"CC-MAIN-2018-30\"]\t488723\n[\"crawl_status\", 
\"fetcher:AboveExceptionThresholdInQueue\", \"CC-MAIN-2018-30\"]\t33123723\n[\"crawl_status\", \"fetcher:bytes_downloaded\", \"CC-MAIN-2018-30\"]\t283827031229424\n[\"crawl_status\", \"crawldb:size\", \"CC-MAIN-2018-30\"]\t12336785966\n[\"crawl_status\", \"crawldb:status:db_unfetched\", \"CC-MAIN-2018-30\"]\t1819924719\n[\"crawl_status\", \"crawldb:status:db_fetched\", \"CC-MAIN-2018-30\"]\t6349393753\n[\"crawl_status\", \"crawldb:status:db_gone\", \"CC-MAIN-2018-30\"]\t278526026\n[\"crawl_status\", \"crawldb:status:db_redir_temp\", \"CC-MAIN-2018-30\"]\t172383828\n[\"crawl_status\", \"crawldb:status:db_redir_perm\", \"CC-MAIN-2018-30\"]\t424540268\n[\"crawl_status\", \"crawldb:status:db_notmodified\", \"CC-MAIN-2018-30\"]\t1266019885\n[\"crawl_status\", \"crawldb:status:db_duplicate\", \"CC-MAIN-2018-30\"]\t378211682\n[\"crawl_status\", \"crawldb:status:db_orphan\", \"CC-MAIN-2018-30\"]\t1647785805\n"
  },
  {
    "path": "stats/crawler/CC-MAIN-2018-34.json",
    "content": "[\"crawl_status\", \"generator:crawldb_size\", \"CC-MAIN-2018-34\"]\t11304753488\n[\"crawl_status\", \"generator:fetch_list\", \"CC-MAIN-2018-34\"]\t3530776601\n[\"crawl_status\", \"generator:selected:db_duplicate\", \"CC-MAIN-2018-34\"]\t27082719\n[\"crawl_status\", \"generator:selected:db_fetched\", \"CC-MAIN-2018-34\"]\t2157338202\n[\"crawl_status\", \"generator:selected:db_gone\", \"CC-MAIN-2018-34\"]\t16260140\n[\"crawl_status\", \"generator:selected:db_notmodified\", \"CC-MAIN-2018-34\"]\t236467881\n[\"crawl_status\", \"generator:selected:db_orphan\", \"CC-MAIN-2018-34\"]\t65887\n[\"crawl_status\", \"generator:selected:db_redir_perm\", \"CC-MAIN-2018-34\"]\t64065853\n[\"crawl_status\", \"generator:selected:db_redir_temp\", \"CC-MAIN-2018-34\"]\t30648499\n[\"crawl_status\", \"generator:selected:db_unfetched\", \"CC-MAIN-2018-34\"]\t998847420\n[\"crawl_status\", \"generator:skipped_domains_overflow\", \"CC-MAIN-2018-34\"]\t335\n[\"crawl_status\", \"fetcher:total\", \"CC-MAIN-2018-34\"]\t3956782964\n[\"crawl_status\", \"fetcher:success\", \"CC-MAIN-2018-34\"]\t2735259369\n[\"crawl_status\", \"fetcher:notmodified\", \"CC-MAIN-2018-34\"]\t100121564\n[\"crawl_status\", \"fetcher:temp_moved\", \"CC-MAIN-2018-34\"]\t127120411\n[\"crawl_status\", \"fetcher:moved\", \"CC-MAIN-2018-34\"]\t310300121\n[\"crawl_status\", \"fetcher:notfound\", \"CC-MAIN-2018-34\"]\t95621653\n[\"crawl_status\", \"fetcher:access_denied\", \"CC-MAIN-2018-34\"]\t693310\n[\"crawl_status\", \"fetcher:gone\", \"CC-MAIN-2018-34\"]\t6368586\n[\"crawl_status\", \"fetcher:exception\", \"CC-MAIN-2018-34\"]\t328746273\n[\"crawl_status\", \"fetcher:robots_denied\", \"CC-MAIN-2018-34\"]\t50613072\n[\"crawl_status\", \"fetcher:filtered\", \"CC-MAIN-2018-34\"]\t17662938\n[\"crawl_status\", \"fetcher:hitByThrougputThreshold\", \"CC-MAIN-2018-34\"]\t154267033\n[\"crawl_status\", \"fetcher:hitByTimeLimit\", \"CC-MAIN-2018-34\"]\t674974\n[\"crawl_status\", 
\"fetcher:AboveExceptionThresholdInQueue\", \"CC-MAIN-2018-34\"]\t29333660\n[\"crawl_status\", \"fetcher:bytes_downloaded\", \"CC-MAIN-2018-34\"]\t246357881816816\n[\"crawl_status\", \"crawldb:size\", \"CC-MAIN-2018-34\"]\t11304753488\n[\"crawl_status\", \"crawldb:status:db_unfetched\", \"CC-MAIN-2018-34\"]\t1635807505\n[\"crawl_status\", \"crawldb:status:db_fetched\", \"CC-MAIN-2018-34\"]\t5580993899\n[\"crawl_status\", \"crawldb:status:db_gone\", \"CC-MAIN-2018-34\"]\t373290661\n[\"crawl_status\", \"crawldb:status:db_redir_temp\", \"CC-MAIN-2018-34\"]\t168159102\n[\"crawl_status\", \"crawldb:status:db_redir_perm\", \"CC-MAIN-2018-34\"]\t410307697\n[\"crawl_status\", \"crawldb:status:db_notmodified\", \"CC-MAIN-2018-34\"]\t1230145234\n[\"crawl_status\", \"crawldb:status:db_duplicate\", \"CC-MAIN-2018-34\"]\t450826491\n[\"crawl_status\", \"crawldb:status:db_orphan\", \"CC-MAIN-2018-34\"]\t1455222899\n"
  },
  {
    "path": "stats/crawler/CC-MAIN-2018-39.json",
    "content": "[\"crawl_status\", \"generator:crawldb_size\", \"CC-MAIN-2018-39\"]\t10322390017\n[\"crawl_status\", \"generator:fetch_list\", \"CC-MAIN-2018-39\"]\t3720881871\n[\"crawl_status\", \"fetcher:total\", \"CC-MAIN-2018-39\"]\t4136119072\n[\"crawl_status\", \"fetcher:success\", \"CC-MAIN-2018-39\"]\t2884119432\n[\"crawl_status\", \"fetcher:notmodified\", \"CC-MAIN-2018-39\"]\t84584691\n[\"crawl_status\", \"fetcher:temp_moved\", \"CC-MAIN-2018-39\"]\t134994515\n[\"crawl_status\", \"fetcher:moved\", \"CC-MAIN-2018-39\"]\t294096388\n[\"crawl_status\", \"fetcher:notfound\", \"CC-MAIN-2018-39\"]\t95324822\n[\"crawl_status\", \"fetcher:access_denied\", \"CC-MAIN-2018-39\"]\t737780\n[\"crawl_status\", \"fetcher:gone\", \"CC-MAIN-2018-39\"]\t6270334\n[\"crawl_status\", \"fetcher:exception\", \"CC-MAIN-2018-39\"]\t389911847\n[\"crawl_status\", \"fetcher:robots_denied\", \"CC-MAIN-2018-39\"]\t52406321\n[\"crawl_status\", \"fetcher:filtered\", \"CC-MAIN-2018-39\"]\t29927162\n[\"crawl_status\", \"fetcher:hitByThrougputThreshold\", \"CC-MAIN-2018-39\"]\t136463425\n[\"crawl_status\", \"fetcher:hitByTimeLimit\", \"CC-MAIN-2018-39\"]\t11782536\n[\"crawl_status\", \"fetcher:AboveExceptionThresholdInQueue\", \"CC-MAIN-2018-39\"]\t15499819\n[\"crawl_status\", \"fetcher:bytes_downloaded\", \"CC-MAIN-2018-39\"]\t242048461520004\n[\"crawl_status\", \"crawldb:size\", \"CC-MAIN-2018-39\"]\t10322390017\n[\"crawl_status\", \"crawldb:status:db_unfetched\", \"CC-MAIN-2018-39\"]\t1398567439\n[\"crawl_status\", \"crawldb:status:db_fetched\", \"CC-MAIN-2018-39\"]\t5488581498\n[\"crawl_status\", \"crawldb:status:db_gone\", \"CC-MAIN-2018-39\"]\t374186964\n[\"crawl_status\", \"crawldb:status:db_redir_temp\", \"CC-MAIN-2018-39\"]\t143284282\n[\"crawl_status\", \"crawldb:status:db_redir_perm\", \"CC-MAIN-2018-39\"]\t318986116\n[\"crawl_status\", \"crawldb:status:db_notmodified\", \"CC-MAIN-2018-39\"]\t1242592600\n[\"crawl_status\", \"crawldb:status:db_duplicate\", 
\"CC-MAIN-2018-39\"]\t437746486\n[\"crawl_status\", \"crawldb:status:db_orphan\", \"CC-MAIN-2018-39\"]\t918444632\n"
  },
  {
    "path": "stats/crawler/CC-MAIN-2018-43.json",
    "content": "[\"crawl_status\", \"generator:crawldb_size\", \"CC-MAIN-2018-43\"]\t10068215197\n[\"crawl_status\", \"generator:fetch_list\", \"CC-MAIN-2018-43\"]\t3813543568\n[\"crawl_status\", \"generator:selected:db_duplicate\", \"CC-MAIN-2018-43\"]\t42021732\n[\"crawl_status\", \"generator:selected:db_fetched\", \"CC-MAIN-2018-43\"]\t2445779704\n[\"crawl_status\", \"generator:selected:db_gone\", \"CC-MAIN-2018-43\"]\t16271131\n[\"crawl_status\", \"generator:selected:db_notmodified\", \"CC-MAIN-2018-43\"]\t201227801\n[\"crawl_status\", \"generator:selected:db_orphan\", \"CC-MAIN-2018-43\"]\t8285\n[\"crawl_status\", \"generator:selected:db_redir_perm\", \"CC-MAIN-2018-43\"]\t44762976\n[\"crawl_status\", \"generator:selected:db_redir_temp\", \"CC-MAIN-2018-43\"]\t44917161\n[\"crawl_status\", \"generator:selected:db_unfetched\", \"CC-MAIN-2018-43\"]\t1018554778\n[\"crawl_status\", \"generator:skipped_domains_overflow\", \"CC-MAIN-2018-43\"]\t290\n[\"crawl_status\", \"fetcher:total\", \"CC-MAIN-2018-43\"]\t4218632230\n[\"crawl_status\", \"fetcher:success\", \"CC-MAIN-2018-43\"]\t3090406673\n[\"crawl_status\", \"fetcher:notmodified\", \"CC-MAIN-2018-43\"]\t27315531\n[\"crawl_status\", \"fetcher:temp_moved\", \"CC-MAIN-2018-43\"]\t139881101\n[\"crawl_status\", \"fetcher:moved\", \"CC-MAIN-2018-43\"]\t279486840\n[\"crawl_status\", \"fetcher:notfound\", \"CC-MAIN-2018-43\"]\t94183562\n[\"crawl_status\", \"fetcher:access_denied\", \"CC-MAIN-2018-43\"]\t588332\n[\"crawl_status\", \"fetcher:gone\", \"CC-MAIN-2018-43\"]\t5121173\n[\"crawl_status\", \"fetcher:exception\", \"CC-MAIN-2018-43\"]\t339131122\n[\"crawl_status\", \"fetcher:robots_denied\", \"CC-MAIN-2018-43\"]\t58003185\n[\"crawl_status\", \"fetcher:filtered\", \"CC-MAIN-2018-43\"]\t32022037\n[\"crawl_status\", \"fetcher:hitByThrougputThreshold\", \"CC-MAIN-2018-43\"]\t131616628\n[\"crawl_status\", \"fetcher:hitByTimeLimit\", \"CC-MAIN-2018-43\"]\t7056180\n[\"crawl_status\", 
\"fetcher:AboveExceptionThresholdInQueue\", \"CC-MAIN-2018-43\"]\t13819866\n[\"crawl_status\", \"fetcher:bytes_downloaded\", \"CC-MAIN-2018-43\"]\t265205184729109\n[\"crawl_status\", \"crawldb:size\", \"CC-MAIN-2018-43\"]\t10068215197\n[\"crawl_status\", \"crawldb:status:db_unfetched\", \"CC-MAIN-2018-43\"]\t1461120982\n[\"crawl_status\", \"crawldb:status:db_fetched\", \"CC-MAIN-2018-43\"]\t5266342920\n[\"crawl_status\", \"crawldb:status:db_gone\", \"CC-MAIN-2018-43\"]\t467535814\n[\"crawl_status\", \"crawldb:status:db_redir_temp\", \"CC-MAIN-2018-43\"]\t163303086\n[\"crawl_status\", \"crawldb:status:db_redir_perm\", \"CC-MAIN-2018-43\"]\t398840989\n[\"crawl_status\", \"crawldb:status:db_notmodified\", \"CC-MAIN-2018-43\"]\t1197919494\n[\"crawl_status\", \"crawldb:status:db_duplicate\", \"CC-MAIN-2018-43\"]\t524387947\n[\"crawl_status\", \"crawldb:status:db_orphan\", \"CC-MAIN-2018-43\"]\t588763965\n"
  },
  {
    "path": "stats/crawler/CC-MAIN-2018-47.json",
    "content": "[\"crawl_status\", \"generator:crawldb_size\", \"CC-MAIN-2018-47\"]\t10372257458\n[\"crawl_status\", \"generator:fetch_list\", \"CC-MAIN-2018-47\"]\t3301990275\n[\"crawl_status\", \"generator:selected:db_duplicate\", \"CC-MAIN-2018-47\"]\t66657642\n[\"crawl_status\", \"generator:selected:db_fetched\", \"CC-MAIN-2018-47\"]\t1834016045\n[\"crawl_status\", \"generator:selected:db_gone\", \"CC-MAIN-2018-47\"]\t19516316\n[\"crawl_status\", \"generator:selected:db_notmodified\", \"CC-MAIN-2018-47\"]\t216806570\n[\"crawl_status\", \"generator:selected:db_orphan\", \"CC-MAIN-2018-47\"]\t34832\n[\"crawl_status\", \"generator:selected:db_redir_perm\", \"CC-MAIN-2018-47\"]\t70318660\n[\"crawl_status\", \"generator:selected:db_redir_temp\", \"CC-MAIN-2018-47\"]\t43035511\n[\"crawl_status\", \"generator:selected:db_unfetched\", \"CC-MAIN-2018-47\"]\t1051604699\n[\"crawl_status\", \"generator:skipped_domains_overflow\", \"CC-MAIN-2018-47\"]\t230\n[\"crawl_status\", \"fetcher:total\", \"CC-MAIN-2018-47\"]\t3656933396\n[\"crawl_status\", \"fetcher:success\", \"CC-MAIN-2018-47\"]\t2691695481\n[\"crawl_status\", \"fetcher:notmodified\", \"CC-MAIN-2018-47\"]\t23960257\n[\"crawl_status\", \"fetcher:temp_moved\", \"CC-MAIN-2018-47\"]\t134383167\n[\"crawl_status\", \"fetcher:moved\", \"CC-MAIN-2018-47\"]\t278564192\n[\"crawl_status\", \"fetcher:notfound\", \"CC-MAIN-2018-47\"]\t90330725\n[\"crawl_status\", \"fetcher:access_denied\", \"CC-MAIN-2018-47\"]\t593860\n[\"crawl_status\", \"fetcher:gone\", \"CC-MAIN-2018-47\"]\t4088303\n[\"crawl_status\", \"fetcher:exception\", \"CC-MAIN-2018-47\"]\t198376701\n[\"crawl_status\", \"fetcher:robots_denied\", \"CC-MAIN-2018-47\"]\t62439892\n[\"crawl_status\", \"fetcher:filtered\", \"CC-MAIN-2018-47\"]\t39004719\n[\"crawl_status\", \"fetcher:hitByThrougputThreshold\", \"CC-MAIN-2018-47\"]\t115949113\n[\"crawl_status\", \"fetcher:hitByTimeLimit\", \"CC-MAIN-2018-47\"]\t7502892\n[\"crawl_status\", 
\"fetcher:AboveExceptionThresholdInQueue\", \"CC-MAIN-2018-47\"]\t10044094\n[\"crawl_status\", \"fetcher:bytes_downloaded\", \"CC-MAIN-2018-47\"]\t242525017908146\n[\"crawl_status\", \"crawldb:size\", \"CC-MAIN-2018-47\"]\t10372257458\n[\"crawl_status\", \"crawldb:status:db_unfetched\", \"CC-MAIN-2018-47\"]\t1184456635\n[\"crawl_status\", \"crawldb:status:db_fetched\", \"CC-MAIN-2018-47\"]\t5461150713\n[\"crawl_status\", \"crawldb:status:db_gone\", \"CC-MAIN-2018-47\"]\t602495879\n[\"crawl_status\", \"crawldb:status:db_redir_temp\", \"CC-MAIN-2018-47\"]\t187593772\n[\"crawl_status\", \"crawldb:status:db_redir_perm\", \"CC-MAIN-2018-47\"]\t475087379\n[\"crawl_status\", \"crawldb:status:db_notmodified\", \"CC-MAIN-2018-47\"]\t1230242846\n[\"crawl_status\", \"crawldb:status:db_duplicate\", \"CC-MAIN-2018-47\"]\t627432633\n[\"crawl_status\", \"crawldb:status:db_orphan\", \"CC-MAIN-2018-47\"]\t603797601\n"
  },
  {
    "path": "stats/crawler/CC-MAIN-2018-51.json",
    "content": "[\"crawl_status\", \"generator:crawldb_size\", \"CC-MAIN-2018-51\"]\t10696257053\n[\"crawl_status\", \"generator:fetch_list\", \"CC-MAIN-2018-51\"]\t3851138781\n[\"crawl_status\", \"generator:selected:db_duplicate\", \"CC-MAIN-2018-51\"]\t46438271\n[\"crawl_status\", \"generator:selected:db_fetched\", \"CC-MAIN-2018-51\"]\t2410368563\n[\"crawl_status\", \"generator:selected:db_gone\", \"CC-MAIN-2018-51\"]\t21195653\n[\"crawl_status\", \"generator:selected:db_notmodified\", \"CC-MAIN-2018-51\"]\t202847224\n[\"crawl_status\", \"generator:selected:db_orphan\", \"CC-MAIN-2018-51\"]\t6207\n[\"crawl_status\", \"generator:selected:db_redir_perm\", \"CC-MAIN-2018-51\"]\t50264345\n[\"crawl_status\", \"generator:selected:db_redir_temp\", \"CC-MAIN-2018-51\"]\t29653778\n[\"crawl_status\", \"generator:selected:db_unfetched\", \"CC-MAIN-2018-51\"]\t1090364740\n[\"crawl_status\", \"generator:skipped_domains_overflow\", \"CC-MAIN-2018-51\"]\t268\n[\"crawl_status\", \"fetcher:total\", \"CC-MAIN-2018-51\"]\t4236751469\n[\"crawl_status\", \"fetcher:success\", \"CC-MAIN-2018-51\"]\t3219306621\n[\"crawl_status\", \"fetcher:notmodified\", \"CC-MAIN-2018-51\"]\t32755355\n[\"crawl_status\", \"fetcher:temp_moved\", \"CC-MAIN-2018-51\"]\t129749930\n[\"crawl_status\", \"fetcher:moved\", \"CC-MAIN-2018-51\"]\t275584140\n[\"crawl_status\", \"fetcher:notfound\", \"CC-MAIN-2018-51\"]\t90717237\n[\"crawl_status\", \"fetcher:access_denied\", \"CC-MAIN-2018-51\"]\t691530\n[\"crawl_status\", \"fetcher:gone\", \"CC-MAIN-2018-51\"]\t3586075\n[\"crawl_status\", \"fetcher:exception\", \"CC-MAIN-2018-51\"]\t242299052\n[\"crawl_status\", \"fetcher:robots_denied\", \"CC-MAIN-2018-51\"]\t63168563\n[\"crawl_status\", \"fetcher:filtered\", \"CC-MAIN-2018-51\"]\t48961370\n[\"crawl_status\", \"fetcher:hitByThrougputThreshold\", \"CC-MAIN-2018-51\"]\t97158339\n[\"crawl_status\", \"fetcher:hitByTimeLimit\", \"CC-MAIN-2018-51\"]\t25821635\n[\"crawl_status\", 
\"fetcher:AboveExceptionThresholdInQueue\", \"CC-MAIN-2018-51\"]\t6951622\n[\"crawl_status\", \"fetcher:bytes_downloaded\", \"CC-MAIN-2018-51\"]\t280265065707216\n[\"crawl_status\", \"crawldb:size\", \"CC-MAIN-2018-51\"]\t10696257053\n[\"crawl_status\", \"crawldb:status:db_unfetched\", \"CC-MAIN-2018-51\"]\t1213509726\n[\"crawl_status\", \"crawldb:status:db_fetched\", \"CC-MAIN-2018-51\"]\t5910211156\n[\"crawl_status\", \"crawldb:status:db_gone\", \"CC-MAIN-2018-51\"]\t681845228\n[\"crawl_status\", \"crawldb:status:db_redir_temp\", \"CC-MAIN-2018-51\"]\t192894989\n[\"crawl_status\", \"crawldb:status:db_redir_perm\", \"CC-MAIN-2018-51\"]\t468061025\n[\"crawl_status\", \"crawldb:status:db_notmodified\", \"CC-MAIN-2018-51\"]\t1240802263\n[\"crawl_status\", \"crawldb:status:db_duplicate\", \"CC-MAIN-2018-51\"]\t706307667\n[\"crawl_status\", \"crawldb:status:db_orphan\", \"CC-MAIN-2018-51\"]\t282624999\n"
  },
  {
    "path": "stats/crawler/CC-MAIN-2019-04.json",
    "content": "[\"crawl_status\", \"generator:crawldb_size\", \"CC-MAIN-2019-04\"]\t11425571649\n[\"crawl_status\", \"generator:fetch_list\", \"CC-MAIN-2019-04\"]\t3579014656\n[\"crawl_status\", \"generator:selected:db_duplicate\", \"CC-MAIN-2019-04\"]\t17047012\n[\"crawl_status\", \"generator:selected:db_fetched\", \"CC-MAIN-2019-04\"]\t2281909542\n[\"crawl_status\", \"generator:selected:db_gone\", \"CC-MAIN-2019-04\"]\t5835359\n[\"crawl_status\", \"generator:selected:db_notmodified\", \"CC-MAIN-2019-04\"]\t54071655\n[\"crawl_status\", \"generator:selected:db_orphan\", \"CC-MAIN-2019-04\"]\t19546\n[\"crawl_status\", \"generator:selected:db_redir_perm\", \"CC-MAIN-2019-04\"]\t28071252\n[\"crawl_status\", \"generator:selected:db_redir_temp\", \"CC-MAIN-2019-04\"]\t29201860\n[\"crawl_status\", \"generator:selected:db_unfetched\", \"CC-MAIN-2019-04\"]\t1162858430\n[\"crawl_status\", \"generator:skipped_domains_overflow\", \"CC-MAIN-2019-04\"]\t394\n[\"crawl_status\", \"fetcher:total\", \"CC-MAIN-2019-04\"]\t3923187910\n[\"crawl_status\", \"fetcher:success\", \"CC-MAIN-2019-04\"]\t2941135435\n[\"crawl_status\", \"fetcher:notmodified\", \"CC-MAIN-2019-04\"]\t41894460\n[\"crawl_status\", \"fetcher:temp_moved\", \"CC-MAIN-2019-04\"]\t136417987\n[\"crawl_status\", \"fetcher:moved\", \"CC-MAIN-2019-04\"]\t228992959\n[\"crawl_status\", \"fetcher:notfound\", \"CC-MAIN-2019-04\"]\t87490833\n[\"crawl_status\", \"fetcher:access_denied\", \"CC-MAIN-2019-04\"]\t707713\n[\"crawl_status\", \"fetcher:gone\", \"CC-MAIN-2019-04\"]\t3216221\n[\"crawl_status\", \"fetcher:exception\", \"CC-MAIN-2019-04\"]\t256048221\n[\"crawl_status\", \"fetcher:robots_denied\", \"CC-MAIN-2019-04\"]\t77369505\n[\"crawl_status\", \"fetcher:filtered\", \"CC-MAIN-2019-04\"]\t42272465\n[\"crawl_status\", \"fetcher:hitByThrougputThreshold\", \"CC-MAIN-2019-04\"]\t100220044\n[\"crawl_status\", \"fetcher:hitByTimeLimit\", \"CC-MAIN-2019-04\"]\t997384\n[\"crawl_status\", 
\"fetcher:AboveExceptionThresholdInQueue\", \"CC-MAIN-2019-04\"]\t6424683\n[\"crawl_status\", \"fetcher:bytes_downloaded\", \"CC-MAIN-2019-04\"]\t265131774568884\n[\"crawl_status\", \"crawldb:size\", \"CC-MAIN-2019-04\"]\t11425571649\n[\"crawl_status\", \"crawldb:status:db_unfetched\", \"CC-MAIN-2019-04\"]\t1304655900\n[\"crawl_status\", \"crawldb:status:db_fetched\", \"CC-MAIN-2019-04\"]\t5989875297\n[\"crawl_status\", \"crawldb:status:db_gone\", \"CC-MAIN-2019-04\"]\t649536320\n[\"crawl_status\", \"crawldb:status:db_redir_temp\", \"CC-MAIN-2019-04\"]\t189263437\n[\"crawl_status\", \"crawldb:status:db_redir_perm\", \"CC-MAIN-2019-04\"]\t422378341\n[\"crawl_status\", \"crawldb:status:db_notmodified\", \"CC-MAIN-2019-04\"]\t1197987241\n[\"crawl_status\", \"crawldb:status:db_duplicate\", \"CC-MAIN-2019-04\"]\t698289453\n[\"crawl_status\", \"crawldb:status:db_orphan\", \"CC-MAIN-2019-04\"]\t973585660\n"
  },
  {
    "path": "stats/crawler/CC-MAIN-2019-09.json",
    "content": "[\"crawl_status\", \"generator:crawldb_size\", \"CC-MAIN-2019-09\"]\t11395325655\n[\"crawl_status\", \"generator:fetch_list\", \"CC-MAIN-2019-09\"]\t3512447577\n[\"crawl_status\", \"generator:selected:db_duplicate\", \"CC-MAIN-2019-09\"]\t35586667\n[\"crawl_status\", \"generator:selected:db_fetched\", \"CC-MAIN-2019-09\"]\t2144960700\n[\"crawl_status\", \"generator:selected:db_gone\", \"CC-MAIN-2019-09\"]\t9121400\n[\"crawl_status\", \"generator:selected:db_notmodified\", \"CC-MAIN-2019-09\"]\t222975922\n[\"crawl_status\", \"generator:selected:db_orphan\", \"CC-MAIN-2019-09\"]\t5285\n[\"crawl_status\", \"generator:selected:db_redir_perm\", \"CC-MAIN-2019-09\"]\t40363114\n[\"crawl_status\", \"generator:selected:db_redir_temp\", \"CC-MAIN-2019-09\"]\t39297831\n[\"crawl_status\", \"generator:selected:db_unfetched\", \"CC-MAIN-2019-09\"]\t1020136658\n[\"crawl_status\", \"generator:skipped_domains_overflow\", \"CC-MAIN-2019-09\"]\t1583\n[\"crawl_status\", \"fetcher:total\", \"CC-MAIN-2019-09\"]\t3881841808\n[\"crawl_status\", \"fetcher:success\", \"CC-MAIN-2019-09\"]\t2965203537\n[\"crawl_status\", \"fetcher:notmodified\", \"CC-MAIN-2019-09\"]\t42989143\n[\"crawl_status\", \"fetcher:temp_moved\", \"CC-MAIN-2019-09\"]\t141306529\n[\"crawl_status\", \"fetcher:moved\", \"CC-MAIN-2019-09\"]\t246628046\n[\"crawl_status\", \"fetcher:notfound\", \"CC-MAIN-2019-09\"]\t96873013\n[\"crawl_status\", \"fetcher:access_denied\", \"CC-MAIN-2019-09\"]\t908140\n[\"crawl_status\", \"fetcher:gone\", \"CC-MAIN-2019-09\"]\t3237812\n[\"crawl_status\", \"fetcher:exception\", \"CC-MAIN-2019-09\"]\t247452785\n[\"crawl_status\", \"fetcher:robots_denied\", \"CC-MAIN-2019-09\"]\t70812357\n[\"crawl_status\", \"fetcher:filtered\", \"CC-MAIN-2019-09\"]\t9541247\n[\"crawl_status\", \"fetcher:hitByThrougputThreshold\", \"CC-MAIN-2019-09\"]\t31954332\n[\"crawl_status\", \"fetcher:hitByTimeLimit\", \"CC-MAIN-2019-09\"]\t474887\n[\"crawl_status\", 
\"fetcher:AboveExceptionThresholdInQueue\", \"CC-MAIN-2019-09\"]\t24459980\n[\"crawl_status\", \"fetcher:bytes_downloaded\", \"CC-MAIN-2019-09\"]\t249402241174208\n[\"crawl_status\", \"crawldb:size\", \"CC-MAIN-2019-09\"]\t11395325655\n[\"crawl_status\", \"crawldb:status:db_unfetched\", \"CC-MAIN-2019-09\"]\t1233189167\n[\"crawl_status\", \"crawldb:status:db_fetched\", \"CC-MAIN-2019-09\"]\t6068548300\n[\"crawl_status\", \"crawldb:status:db_gone\", \"CC-MAIN-2019-09\"]\t665868662\n[\"crawl_status\", \"crawldb:status:db_redir_temp\", \"CC-MAIN-2019-09\"]\t195252295\n[\"crawl_status\", \"crawldb:status:db_redir_perm\", \"CC-MAIN-2019-09\"]\t406884827\n[\"crawl_status\", \"crawldb:status:db_notmodified\", \"CC-MAIN-2019-09\"]\t1190927396\n[\"crawl_status\", \"crawldb:status:db_duplicate\", \"CC-MAIN-2019-09\"]\t698261708\n[\"crawl_status\", \"crawldb:status:db_orphan\", \"CC-MAIN-2019-09\"]\t936393300\n"
  },
  {
    "path": "stats/crawler/CC-MAIN-2019-13.json",
    "content": "[\"crawl_status\", \"generator:crawldb_size\", \"CC-MAIN-2019-13\"]\t11250692948\n[\"crawl_status\", \"generator:fetch_list\", \"CC-MAIN-2019-13\"]\t3085950972\n[\"crawl_status\", \"generator:selected:db_duplicate\", \"CC-MAIN-2019-13\"]\t36269668\n[\"crawl_status\", \"generator:selected:db_fetched\", \"CC-MAIN-2019-13\"]\t1847768013\n[\"crawl_status\", \"generator:selected:db_gone\", \"CC-MAIN-2019-13\"]\t15336277\n[\"crawl_status\", \"generator:selected:db_notmodified\", \"CC-MAIN-2019-13\"]\t206903707\n[\"crawl_status\", \"generator:selected:db_orphan\", \"CC-MAIN-2019-13\"]\t9996\n[\"crawl_status\", \"generator:selected:db_redir_perm\", \"CC-MAIN-2019-13\"]\t45785126\n[\"crawl_status\", \"generator:selected:db_redir_temp\", \"CC-MAIN-2019-13\"]\t43156143\n[\"crawl_status\", \"generator:selected:db_unfetched\", \"CC-MAIN-2019-13\"]\t890722042\n[\"crawl_status\", \"generator:skipped_domains_overflow\", \"CC-MAIN-2019-13\"]\t2696\n[\"crawl_status\", \"fetcher:total\", \"CC-MAIN-2019-13\"]\t3431317282\n[\"crawl_status\", \"fetcher:success\", \"CC-MAIN-2019-13\"]\t2614037004\n[\"crawl_status\", \"fetcher:notmodified\", \"CC-MAIN-2019-13\"]\t28321635\n[\"crawl_status\", \"fetcher:temp_moved\", \"CC-MAIN-2019-13\"]\t131441796\n[\"crawl_status\", \"fetcher:moved\", \"CC-MAIN-2019-13\"]\t229805021\n[\"crawl_status\", \"fetcher:notfound\", \"CC-MAIN-2019-13\"]\t96171191\n[\"crawl_status\", \"fetcher:access_denied\", \"CC-MAIN-2019-13\"]\t1018465\n[\"crawl_status\", \"fetcher:gone\", \"CC-MAIN-2019-13\"]\t3202891\n[\"crawl_status\", \"fetcher:exception\", \"CC-MAIN-2019-13\"]\t210258976\n[\"crawl_status\", \"fetcher:robots_denied\", \"CC-MAIN-2019-13\"]\t63447886\n[\"crawl_status\", \"fetcher:filtered\", \"CC-MAIN-2019-13\"]\t6853981\n[\"crawl_status\", \"fetcher:hitByThrougputThreshold\", \"CC-MAIN-2019-13\"]\t26712766\n[\"crawl_status\", \"fetcher:hitByTimeLimit\", \"CC-MAIN-2019-13\"]\t712952\n[\"crawl_status\", 
\"fetcher:AboveExceptionThresholdInQueue\", \"CC-MAIN-2019-13\"]\t19332718\n[\"crawl_status\", \"fetcher:bytes_downloaded\", \"CC-MAIN-2019-13\"]\t230720561471378\n[\"crawl_status\", \"crawldb:size\", \"CC-MAIN-2019-13\"]\t11250692948\n[\"crawl_status\", \"crawldb:status:db_unfetched\", \"CC-MAIN-2019-13\"]\t1139021514\n[\"crawl_status\", \"crawldb:status:db_fetched\", \"CC-MAIN-2019-13\"]\t6176794401\n[\"crawl_status\", \"crawldb:status:db_gone\", \"CC-MAIN-2019-13\"]\t696242905\n[\"crawl_status\", \"crawldb:status:db_redir_temp\", \"CC-MAIN-2019-13\"]\t208862069\n[\"crawl_status\", \"crawldb:status:db_redir_perm\", \"CC-MAIN-2019-13\"]\t417564787\n[\"crawl_status\", \"crawldb:status:db_notmodified\", \"CC-MAIN-2019-13\"]\t1102153249\n[\"crawl_status\", \"crawldb:status:db_duplicate\", \"CC-MAIN-2019-13\"]\t729892836\n[\"crawl_status\", \"crawldb:status:db_orphan\", \"CC-MAIN-2019-13\"]\t780161187\n"
  },
  {
    "path": "stats/crawler/CC-MAIN-2019-18.json",
    "content": "[\"crawl_status\", \"generator:crawldb_size\", \"CC-MAIN-2019-18\"]\t11385935631\n[\"crawl_status\", \"generator:fetch_list\", \"CC-MAIN-2019-18\"]\t2993990226\n[\"crawl_status\", \"generator:selected:db_duplicate\", \"CC-MAIN-2019-18\"]\t28597679\n[\"crawl_status\", \"generator:selected:db_fetched\", \"CC-MAIN-2019-18\"]\t1773452337\n[\"crawl_status\", \"generator:selected:db_gone\", \"CC-MAIN-2019-18\"]\t7649933\n[\"crawl_status\", \"generator:selected:db_notmodified\", \"CC-MAIN-2019-18\"]\t132611754\n[\"crawl_status\", \"generator:selected:db_orphan\", \"CC-MAIN-2019-18\"]\t7336\n[\"crawl_status\", \"generator:selected:db_redir_perm\", \"CC-MAIN-2019-18\"]\t45801433\n[\"crawl_status\", \"generator:selected:db_redir_temp\", \"CC-MAIN-2019-18\"]\t26143247\n[\"crawl_status\", \"generator:selected:db_unfetched\", \"CC-MAIN-2019-18\"]\t979726507\n[\"crawl_status\", \"generator:skipped_domains_overflow\", \"CC-MAIN-2019-18\"]\t2933\n[\"crawl_status\", \"fetcher:total\", \"CC-MAIN-2019-18\"]\t3331014082\n[\"crawl_status\", \"fetcher:success\", \"CC-MAIN-2019-18\"]\t2541879921\n[\"crawl_status\", \"fetcher:notmodified\", \"CC-MAIN-2019-18\"]\t30291091\n[\"crawl_status\", \"fetcher:temp_moved\", \"CC-MAIN-2019-18\"]\t119820842\n[\"crawl_status\", \"fetcher:moved\", \"CC-MAIN-2019-18\"]\t231211738\n[\"crawl_status\", \"fetcher:notfound\", \"CC-MAIN-2019-18\"]\t100535942\n[\"crawl_status\", \"fetcher:access_denied\", \"CC-MAIN-2019-18\"]\t830764\n[\"crawl_status\", \"fetcher:gone\", \"CC-MAIN-2019-18\"]\t6074680\n[\"crawl_status\", \"fetcher:exception\", \"CC-MAIN-2019-18\"]\t179817366\n[\"crawl_status\", \"fetcher:robots_denied\", \"CC-MAIN-2019-18\"]\t77121082\n[\"crawl_status\", \"fetcher:filtered\", \"CC-MAIN-2019-18\"]\t7364967\n[\"crawl_status\", \"fetcher:hitByThrougputThreshold\", \"CC-MAIN-2019-18\"]\t26028465\n[\"crawl_status\", \"fetcher:hitByTimeLimit\", \"CC-MAIN-2019-18\"]\t47115\n[\"crawl_status\", \"fetcher:AboveExceptionThresholdInQueue\", 
\"CC-MAIN-2019-18\"]\t9990109\n[\"crawl_status\", \"fetcher:bytes_downloaded\", \"CC-MAIN-2019-18\"]\t218295951215275\n[\"crawl_status\", \"crawldb:size\", \"CC-MAIN-2019-18\"]\t11385935631\n[\"crawl_status\", \"crawldb:status:db_unfetched\", \"CC-MAIN-2019-18\"]\t1280576094\n[\"crawl_status\", \"crawldb:status:db_fetched\", \"CC-MAIN-2019-18\"]\t6263847783\n[\"crawl_status\", \"crawldb:status:db_gone\", \"CC-MAIN-2019-18\"]\t822023933\n[\"crawl_status\", \"crawldb:status:db_redir_temp\", \"CC-MAIN-2019-18\"]\t232145284\n[\"crawl_status\", \"crawldb:status:db_redir_perm\", \"CC-MAIN-2019-18\"]\t481305946\n[\"crawl_status\", \"crawldb:status:db_notmodified\", \"CC-MAIN-2019-18\"]\t977869468\n[\"crawl_status\", \"crawldb:status:db_duplicate\", \"CC-MAIN-2019-18\"]\t839762605\n[\"crawl_status\", \"crawldb:status:db_orphan\", \"CC-MAIN-2019-18\"]\t488404518\n"
  },
  {
    "path": "stats/crawler/CC-MAIN-2019-22.json",
    "content": "[\"crawl_status\", \"generator:crawldb_size\", \"CC-MAIN-2019-22\"]\t12201452792\n[\"crawl_status\", \"generator:fetch_list\", \"CC-MAIN-2019-22\"]\t3241321519\n[\"crawl_status\", \"generator:selected:db_duplicate\", \"CC-MAIN-2019-22\"]\t24951298\n[\"crawl_status\", \"generator:selected:db_fetched\", \"CC-MAIN-2019-22\"]\t1725869710\n[\"crawl_status\", \"generator:selected:db_gone\", \"CC-MAIN-2019-22\"]\t10766653\n[\"crawl_status\", \"generator:selected:db_notmodified\", \"CC-MAIN-2019-22\"]\t99038388\n[\"crawl_status\", \"generator:selected:db_orphan\", \"CC-MAIN-2019-22\"]\t14944\n[\"crawl_status\", \"generator:selected:db_redir_perm\", \"CC-MAIN-2019-22\"]\t33537083\n[\"crawl_status\", \"generator:selected:db_redir_temp\", \"CC-MAIN-2019-22\"]\t39601883\n[\"crawl_status\", \"generator:selected:db_unfetched\", \"CC-MAIN-2019-22\"]\t1307541560\n[\"crawl_status\", \"generator:skipped_domains_overflow\", \"CC-MAIN-2019-22\"]\t3901\n[\"crawl_status\", \"fetcher:total\", \"CC-MAIN-2019-22\"]\t3605990511\n[\"crawl_status\", \"fetcher:success\", \"CC-MAIN-2019-22\"]\t2729146942\n[\"crawl_status\", \"fetcher:notmodified\", \"CC-MAIN-2019-22\"]\t28583594\n[\"crawl_status\", \"fetcher:temp_moved\", \"CC-MAIN-2019-22\"]\t151726298\n[\"crawl_status\", \"fetcher:moved\", \"CC-MAIN-2019-22\"]\t233617131\n[\"crawl_status\", \"fetcher:notfound\", \"CC-MAIN-2019-22\"]\t110834281\n[\"crawl_status\", \"fetcher:access_denied\", \"CC-MAIN-2019-22\"]\t855450\n[\"crawl_status\", \"fetcher:gone\", \"CC-MAIN-2019-22\"]\t6245949\n[\"crawl_status\", \"fetcher:exception\", \"CC-MAIN-2019-22\"]\t185493768\n[\"crawl_status\", \"fetcher:robots_denied\", \"CC-MAIN-2019-22\"]\t104616391\n[\"crawl_status\", \"fetcher:filtered\", \"CC-MAIN-2019-22\"]\t7165215\n[\"crawl_status\", \"fetcher:hitByThrougputThreshold\", \"CC-MAIN-2019-22\"]\t36245271\n[\"crawl_status\", \"fetcher:hitByTimeLimit\", \"CC-MAIN-2019-22\"]\t2583797\n[\"crawl_status\", 
\"fetcher:AboveExceptionThresholdInQueue\", \"CC-MAIN-2019-22\"]\t8876424\n[\"crawl_status\", \"fetcher:bytes_downloaded\", \"CC-MAIN-2019-22\"]\t245628751198608\n[\"crawl_status\", \"crawldb:size\", \"CC-MAIN-2019-22\"]\t12201452792\n[\"crawl_status\", \"crawldb:status:db_unfetched\", \"CC-MAIN-2019-22\"]\t1688179467\n[\"crawl_status\", \"crawldb:status:db_fetched\", \"CC-MAIN-2019-22\"]\t6436633894\n[\"crawl_status\", \"crawldb:status:db_gone\", \"CC-MAIN-2019-22\"]\t908236787\n[\"crawl_status\", \"crawldb:status:db_redir_temp\", \"CC-MAIN-2019-22\"]\t248194659\n[\"crawl_status\", \"crawldb:status:db_redir_perm\", \"CC-MAIN-2019-22\"]\t508349132\n[\"crawl_status\", \"crawldb:status:db_notmodified\", \"CC-MAIN-2019-22\"]\t1009185939\n[\"crawl_status\", \"crawldb:status:db_duplicate\", \"CC-MAIN-2019-22\"]\t890709906\n[\"crawl_status\", \"crawldb:status:db_orphan\", \"CC-MAIN-2019-22\"]\t511963008\n"
  },
  {
    "path": "stats/crawler/CC-MAIN-2019-26.json",
    "content": "[\"crawl_status\", \"generator:crawldb_size\", \"CC-MAIN-2019-26\"]\t13037540318\n[\"crawl_status\", \"generator:fetch_list\", \"CC-MAIN-2019-26\"]\t3091701437\n[\"crawl_status\", \"generator:selected:db_duplicate\", \"CC-MAIN-2019-26\"]\t6567863\n[\"crawl_status\", \"generator:selected:db_fetched\", \"CC-MAIN-2019-26\"]\t1736973207\n[\"crawl_status\", \"generator:selected:db_gone\", \"CC-MAIN-2019-26\"]\t633945\n[\"crawl_status\", \"generator:selected:db_notmodified\", \"CC-MAIN-2019-26\"]\t20627322\n[\"crawl_status\", \"generator:selected:db_orphan\", \"CC-MAIN-2019-26\"]\t7661\n[\"crawl_status\", \"generator:selected:db_redir_perm\", \"CC-MAIN-2019-26\"]\t7207839\n[\"crawl_status\", \"generator:selected:db_redir_temp\", \"CC-MAIN-2019-26\"]\t12700326\n[\"crawl_status\", \"generator:selected:db_unfetched\", \"CC-MAIN-2019-26\"]\t1306983274\n[\"crawl_status\", \"generator:skipped_domains_overflow\", \"CC-MAIN-2019-26\"]\t4322\n[\"crawl_status\", \"fetcher:total\", \"CC-MAIN-2019-26\"]\t3379152815\n[\"crawl_status\", \"fetcher:success\", \"CC-MAIN-2019-26\"]\t2632942767\n[\"crawl_status\", \"fetcher:notmodified\", \"CC-MAIN-2019-26\"]\t20177097\n[\"crawl_status\", \"fetcher:temp_moved\", \"CC-MAIN-2019-26\"]\t121677784\n[\"crawl_status\", \"fetcher:moved\", \"CC-MAIN-2019-26\"]\t182495647\n[\"crawl_status\", \"fetcher:notfound\", \"CC-MAIN-2019-26\"]\t82731932\n[\"crawl_status\", \"fetcher:access_denied\", \"CC-MAIN-2019-26\"]\t758288\n[\"crawl_status\", \"fetcher:gone\", \"CC-MAIN-2019-26\"]\t3886636\n[\"crawl_status\", \"fetcher:exception\", \"CC-MAIN-2019-26\"]\t170038529\n[\"crawl_status\", \"fetcher:robots_denied\", \"CC-MAIN-2019-26\"]\t103149264\n[\"crawl_status\", \"fetcher:filtered\", \"CC-MAIN-2019-26\"]\t5683984\n[\"crawl_status\", \"fetcher:hitByThrougputThreshold\", \"CC-MAIN-2019-26\"]\t43337460\n[\"crawl_status\", \"fetcher:hitByTimeLimit\", \"CC-MAIN-2019-26\"]\t1803943\n[\"crawl_status\", \"fetcher:AboveExceptionThresholdInQueue\", 
\"CC-MAIN-2019-26\"]\t10469484\n[\"crawl_status\", \"fetcher:bytes_downloaded\", \"CC-MAIN-2019-26\"]\t243165093483780\n[\"crawl_status\", \"crawldb:size\", \"CC-MAIN-2019-26\"]\t13037540318\n[\"crawl_status\", \"crawldb:status:db_unfetched\", \"CC-MAIN-2019-26\"]\t1884854667\n[\"crawl_status\", \"crawldb:status:db_fetched\", \"CC-MAIN-2019-26\"]\t6853556704\n[\"crawl_status\", \"crawldb:status:db_gone\", \"CC-MAIN-2019-26\"]\t985558590\n[\"crawl_status\", \"crawldb:status:db_redir_temp\", \"CC-MAIN-2019-26\"]\t264147107\n[\"crawl_status\", \"crawldb:status:db_redir_perm\", \"CC-MAIN-2019-26\"]\t528524214\n[\"crawl_status\", \"crawldb:status:db_notmodified\", \"CC-MAIN-2019-26\"]\t1061494785\n[\"crawl_status\", \"crawldb:status:db_duplicate\", \"CC-MAIN-2019-26\"]\t931485445\n[\"crawl_status\", \"crawldb:status:db_orphan\", \"CC-MAIN-2019-26\"]\t527918806\n"
  },
  {
    "path": "stats/crawler/CC-MAIN-2019-30.json",
    "content": "[\"crawl_status\", \"generator:crawldb_size\", \"CC-MAIN-2019-30\"]\t13857387307\n[\"crawl_status\", \"generator:fetch_list\", \"CC-MAIN-2019-30\"]\t3125680181\n[\"crawl_status\", \"generator:selected:db_duplicate\", \"CC-MAIN-2019-30\"]\t5988949\n[\"crawl_status\", \"generator:selected:db_fetched\", \"CC-MAIN-2019-30\"]\t1781449657\n[\"crawl_status\", \"generator:selected:db_gone\", \"CC-MAIN-2019-30\"]\t495447\n[\"crawl_status\", \"generator:selected:db_notmodified\", \"CC-MAIN-2019-30\"]\t6766806\n[\"crawl_status\", \"generator:selected:db_orphan\", \"CC-MAIN-2019-30\"]\t3546\n[\"crawl_status\", \"generator:selected:db_redir_perm\", \"CC-MAIN-2019-30\"]\t8518648\n[\"crawl_status\", \"generator:selected:db_redir_temp\", \"CC-MAIN-2019-30\"]\t25462276\n[\"crawl_status\", \"generator:selected:db_unfetched\", \"CC-MAIN-2019-30\"]\t1296994852\n[\"crawl_status\", \"generator:skipped_domains_overflow\", \"CC-MAIN-2019-30\"]\t4780\n[\"crawl_status\", \"fetcher:total\", \"CC-MAIN-2019-30\"]\t3415769631\n[\"crawl_status\", \"fetcher:success\", \"CC-MAIN-2019-30\"]\t2633907026\n[\"crawl_status\", \"fetcher:notmodified\", \"CC-MAIN-2019-30\"]\t28082880\n[\"crawl_status\", \"fetcher:temp_moved\", \"CC-MAIN-2019-30\"]\t133716550\n[\"crawl_status\", \"fetcher:moved\", \"CC-MAIN-2019-30\"]\t178972763\n[\"crawl_status\", \"fetcher:notfound\", \"CC-MAIN-2019-30\"]\t87193926\n[\"crawl_status\", \"fetcher:access_denied\", \"CC-MAIN-2019-30\"]\t785516\n[\"crawl_status\", \"fetcher:gone\", \"CC-MAIN-2019-30\"]\t3947481\n[\"crawl_status\", \"fetcher:exception\", \"CC-MAIN-2019-30\"]\t181392437\n[\"crawl_status\", \"fetcher:robots_denied\", \"CC-MAIN-2019-30\"]\t106506063\n[\"crawl_status\", \"fetcher:filtered\", \"CC-MAIN-2019-30\"]\t5391839\n[\"crawl_status\", \"fetcher:hitByThrougputThreshold\", \"CC-MAIN-2019-30\"]\t40420991\n[\"crawl_status\", \"fetcher:hitByTimeLimit\", \"CC-MAIN-2019-30\"]\t3442793\n[\"crawl_status\", \"fetcher:AboveExceptionThresholdInQueue\", 
\"CC-MAIN-2019-30\"]\t12009366\n[\"crawl_status\", \"fetcher:bytes_downloaded\", \"CC-MAIN-2019-30\"]\t247295924114121\n[\"crawl_status\", \"crawldb:size\", \"CC-MAIN-2019-30\"]\t13857387307\n[\"crawl_status\", \"crawldb:status:db_unfetched\", \"CC-MAIN-2019-30\"]\t2021409884\n[\"crawl_status\", \"crawldb:status:db_fetched\", \"CC-MAIN-2019-30\"]\t7246547798\n[\"crawl_status\", \"crawldb:status:db_gone\", \"CC-MAIN-2019-30\"]\t1030766061\n[\"crawl_status\", \"crawldb:status:db_redir_temp\", \"CC-MAIN-2019-30\"]\t288914603\n[\"crawl_status\", \"crawldb:status:db_redir_perm\", \"CC-MAIN-2019-30\"]\t542398939\n[\"crawl_status\", \"crawldb:status:db_notmodified\", \"CC-MAIN-2019-30\"]\t1145032006\n[\"crawl_status\", \"crawldb:status:db_duplicate\", \"CC-MAIN-2019-30\"]\t964983816\n[\"crawl_status\", \"crawldb:status:db_orphan\", \"CC-MAIN-2019-30\"]\t617334200\n"
  },
  {
    "path": "stats/crawler/CC-MAIN-2019-35.json",
    "content": "[\"crawl_status\", \"generator:crawldb_size\", \"CC-MAIN-2019-35\"]\t15024860128\n[\"crawl_status\", \"generator:fetch_list\", \"CC-MAIN-2019-35\"]\t3554022988\n[\"crawl_status\", \"generator:selected:db_duplicate\", \"CC-MAIN-2019-35\"]\t4975006\n[\"crawl_status\", \"generator:selected:db_fetched\", \"CC-MAIN-2019-35\"]\t1874973085\n[\"crawl_status\", \"generator:selected:db_gone\", \"CC-MAIN-2019-35\"]\t242386\n[\"crawl_status\", \"generator:selected:db_notmodified\", \"CC-MAIN-2019-35\"]\t10614977\n[\"crawl_status\", \"generator:selected:db_orphan\", \"CC-MAIN-2019-35\"]\t49882\n[\"crawl_status\", \"generator:selected:db_redir_perm\", \"CC-MAIN-2019-35\"]\t11479499\n[\"crawl_status\", \"generator:selected:db_redir_temp\", \"CC-MAIN-2019-35\"]\t13910501\n[\"crawl_status\", \"generator:selected:db_unfetched\", \"CC-MAIN-2019-35\"]\t1637777652\n[\"crawl_status\", \"generator:skipped_domains_overflow\", \"CC-MAIN-2019-35\"]\t5500\n[\"crawl_status\", \"fetcher:total\", \"CC-MAIN-2019-35\"]\t3864414952\n[\"crawl_status\", \"fetcher:success\", \"CC-MAIN-2019-35\"]\t2996282936\n[\"crawl_status\", \"fetcher:notmodified\", \"CC-MAIN-2019-35\"]\t21963694\n[\"crawl_status\", \"fetcher:temp_moved\", \"CC-MAIN-2019-35\"]\t137199511\n[\"crawl_status\", \"fetcher:moved\", \"CC-MAIN-2019-35\"]\t201760689\n[\"crawl_status\", \"fetcher:notfound\", \"CC-MAIN-2019-35\"]\t98767413\n[\"crawl_status\", \"fetcher:access_denied\", \"CC-MAIN-2019-35\"]\t860899\n[\"crawl_status\", \"fetcher:gone\", \"CC-MAIN-2019-35\"]\t4194429\n[\"crawl_status\", \"fetcher:exception\", \"CC-MAIN-2019-35\"]\t214305232\n[\"crawl_status\", \"fetcher:robots_denied\", \"CC-MAIN-2019-35\"]\t110945603\n[\"crawl_status\", \"fetcher:filtered\", \"CC-MAIN-2019-35\"]\t4658649\n[\"crawl_status\", \"fetcher:hitByThrougputThreshold\", \"CC-MAIN-2019-35\"]\t48845732\n[\"crawl_status\", \"fetcher:hitByTimeLimit\", \"CC-MAIN-2019-35\"]\t10452149\n[\"crawl_status\", 
\"fetcher:AboveExceptionThresholdInQueue\", \"CC-MAIN-2019-35\"]\t14178016\n[\"crawl_status\", \"fetcher:bytes_downloaded\", \"CC-MAIN-2019-35\"]\t286057758023033\n[\"crawl_status\", \"crawldb:size\", \"CC-MAIN-2019-35\"]\t15024860128\n[\"crawl_status\", \"crawldb:status:db_unfetched\", \"CC-MAIN-2019-35\"]\t2526865067\n[\"crawl_status\", \"crawldb:status:db_fetched\", \"CC-MAIN-2019-35\"]\t7491382315\n[\"crawl_status\", \"crawldb:status:db_gone\", \"CC-MAIN-2019-35\"]\t1105748670\n[\"crawl_status\", \"crawldb:status:db_redir_temp\", \"CC-MAIN-2019-35\"]\t312424161\n[\"crawl_status\", \"crawldb:status:db_redir_perm\", \"CC-MAIN-2019-35\"]\t557313735\n[\"crawl_status\", \"crawldb:status:db_notmodified\", \"CC-MAIN-2019-35\"]\t1205640260\n[\"crawl_status\", \"crawldb:status:db_duplicate\", \"CC-MAIN-2019-35\"]\t1010596007\n[\"crawl_status\", \"crawldb:status:db_orphan\", \"CC-MAIN-2019-35\"]\t814889913\n"
  },
  {
    "path": "stats/crawler/CC-MAIN-2019-39.json",
    "content": "[\"crawl_status\", \"generator:crawldb_size\", \"CC-MAIN-2019-39\"]\t15879390106\n[\"crawl_status\", \"generator:fetch_list\", \"CC-MAIN-2019-39\"]\t3143929897\n[\"crawl_status\", \"generator:selected:db_duplicate\", \"CC-MAIN-2019-39\"]\t1570256\n[\"crawl_status\", \"generator:selected:db_fetched\", \"CC-MAIN-2019-39\"]\t1500575708\n[\"crawl_status\", \"generator:selected:db_gone\", \"CC-MAIN-2019-39\"]\t161654\n[\"crawl_status\", \"generator:selected:db_notmodified\", \"CC-MAIN-2019-39\"]\t5389395\n[\"crawl_status\", \"generator:selected:db_orphan\", \"CC-MAIN-2019-39\"]\t9368\n[\"crawl_status\", \"generator:selected:db_redir_perm\", \"CC-MAIN-2019-39\"]\t24844895\n[\"crawl_status\", \"generator:selected:db_redir_temp\", \"CC-MAIN-2019-39\"]\t28539110\n[\"crawl_status\", \"generator:selected:db_unfetched\", \"CC-MAIN-2019-39\"]\t1582839511\n[\"crawl_status\", \"generator:skipped_domains_overflow\", \"CC-MAIN-2019-39\"]\t5742\n[\"crawl_status\", \"fetcher:total\", \"CC-MAIN-2019-39\"]\t3449909826\n[\"crawl_status\", \"fetcher:success\", \"CC-MAIN-2019-39\"]\t2599795453\n[\"crawl_status\", \"fetcher:notmodified\", \"CC-MAIN-2019-39\"]\t17663707\n[\"crawl_status\", \"fetcher:temp_moved\", \"CC-MAIN-2019-39\"]\t144450494\n[\"crawl_status\", \"fetcher:moved\", \"CC-MAIN-2019-39\"]\t191874608\n[\"crawl_status\", \"fetcher:notfound\", \"CC-MAIN-2019-39\"]\t84600666\n[\"crawl_status\", \"fetcher:access_denied\", \"CC-MAIN-2019-39\"]\t764326\n[\"crawl_status\", \"fetcher:gone\", \"CC-MAIN-2019-39\"]\t3487279\n[\"crawl_status\", \"fetcher:exception\", \"CC-MAIN-2019-39\"]\t211490464\n[\"crawl_status\", \"fetcher:robots_denied\", \"CC-MAIN-2019-39\"]\t115875148\n[\"crawl_status\", \"fetcher:filtered\", \"CC-MAIN-2019-39\"]\t3349785\n[\"crawl_status\", \"fetcher:hitByThrougputThreshold\", \"CC-MAIN-2019-39\"]\t54558158\n[\"crawl_status\", \"fetcher:hitByTimeLimit\", \"CC-MAIN-2019-39\"]\t3947320\n[\"crawl_status\", \"fetcher:AboveExceptionThresholdInQueue\", 
\"CC-MAIN-2019-39\"]\t18052418\n[\"crawl_status\", \"fetcher:bytes_downloaded\", \"CC-MAIN-2019-39\"]\t267847750399253\n[\"crawl_status\", \"crawldb:size\", \"CC-MAIN-2019-39\"]\t15879390106\n[\"crawl_status\", \"crawldb:status:db_unfetched\", \"CC-MAIN-2019-39\"]\t2773144885\n[\"crawl_status\", \"crawldb:status:db_fetched\", \"CC-MAIN-2019-39\"]\t7997105323\n[\"crawl_status\", \"crawldb:status:db_gone\", \"CC-MAIN-2019-39\"]\t1152617938\n[\"crawl_status\", \"crawldb:status:db_redir_temp\", \"CC-MAIN-2019-39\"]\t337499877\n[\"crawl_status\", \"crawldb:status:db_redir_perm\", \"CC-MAIN-2019-39\"]\t563615673\n[\"crawl_status\", \"crawldb:status:db_notmodified\", \"CC-MAIN-2019-39\"]\t1272930097\n[\"crawl_status\", \"crawldb:status:db_duplicate\", \"CC-MAIN-2019-39\"]\t1039576970\n[\"crawl_status\", \"crawldb:status:db_orphan\", \"CC-MAIN-2019-39\"]\t742899343\n"
  },
  {
    "path": "stats/crawler/CC-MAIN-2019-43.json",
    "content": "[\"crawl_status\", \"generator:crawldb_size\", \"CC-MAIN-2019-43\"]\t17009132379\n[\"crawl_status\", \"generator:fetch_list\", \"CC-MAIN-2019-43\"]\t3706625099\n[\"crawl_status\", \"generator:selected:db_duplicate\", \"CC-MAIN-2019-43\"]\t1347205\n[\"crawl_status\", \"generator:selected:db_fetched\", \"CC-MAIN-2019-43\"]\t1824793579\n[\"crawl_status\", \"generator:selected:db_gone\", \"CC-MAIN-2019-43\"]\t144553\n[\"crawl_status\", \"generator:selected:db_notmodified\", \"CC-MAIN-2019-43\"]\t9299877\n[\"crawl_status\", \"generator:selected:db_orphan\", \"CC-MAIN-2019-43\"]\t863\n[\"crawl_status\", \"generator:selected:db_redir_perm\", \"CC-MAIN-2019-43\"]\t17341820\n[\"crawl_status\", \"generator:selected:db_redir_temp\", \"CC-MAIN-2019-43\"]\t13835439\n[\"crawl_status\", \"generator:selected:db_unfetched\", \"CC-MAIN-2019-43\"]\t1839861763\n[\"crawl_status\", \"generator:skipped_domains_overflow\", \"CC-MAIN-2019-43\"]\t8073\n[\"crawl_status\", \"fetcher:total\", \"CC-MAIN-2019-43\"]\t4000682231\n[\"crawl_status\", \"fetcher:success\", \"CC-MAIN-2019-43\"]\t3059287294\n[\"crawl_status\", \"fetcher:notmodified\", \"CC-MAIN-2019-43\"]\t24576481\n[\"crawl_status\", \"fetcher:temp_moved\", \"CC-MAIN-2019-43\"]\t136685707\n[\"crawl_status\", \"fetcher:moved\", \"CC-MAIN-2019-43\"]\t203869367\n[\"crawl_status\", \"fetcher:notfound\", \"CC-MAIN-2019-43\"]\t90568122\n[\"crawl_status\", \"fetcher:access_denied\", \"CC-MAIN-2019-43\"]\t916546\n[\"crawl_status\", \"fetcher:gone\", \"CC-MAIN-2019-43\"]\t8149099\n[\"crawl_status\", \"fetcher:exception\", \"CC-MAIN-2019-43\"]\t205171451\n[\"crawl_status\", \"fetcher:robots_denied\", \"CC-MAIN-2019-43\"]\t120953714\n[\"crawl_status\", \"fetcher:filtered\", \"CC-MAIN-2019-43\"]\t65020994\n[\"crawl_status\", \"fetcher:hitByThrougputThreshold\", \"CC-MAIN-2019-43\"]\t43801063\n[\"crawl_status\", \"fetcher:hitByTimeLimit\", \"CC-MAIN-2019-43\"]\t21486545\n[\"crawl_status\", \"fetcher:AboveExceptionThresholdInQueue\", 
\"CC-MAIN-2019-43\"]\t20195848\n[\"crawl_status\", \"fetcher:bytes_downloaded\", \"CC-MAIN-2019-43\"]\t316994443555513\n[\"crawl_status\", \"crawldb:size\", \"CC-MAIN-2019-43\"]\t17009132379\n[\"crawl_status\", \"crawldb:status:db_unfetched\", \"CC-MAIN-2019-43\"]\t3171767084\n[\"crawl_status\", \"crawldb:status:db_fetched\", \"CC-MAIN-2019-43\"]\t8653065594\n[\"crawl_status\", \"crawldb:status:db_gone\", \"CC-MAIN-2019-43\"]\t1268407594\n[\"crawl_status\", \"crawldb:status:db_redir_temp\", \"CC-MAIN-2019-43\"]\t369862514\n[\"crawl_status\", \"crawldb:status:db_redir_perm\", \"CC-MAIN-2019-43\"]\t601122155\n[\"crawl_status\", \"crawldb:status:db_notmodified\", \"CC-MAIN-2019-43\"]\t1319238638\n[\"crawl_status\", \"crawldb:status:db_duplicate\", \"CC-MAIN-2019-43\"]\t1131007554\n[\"crawl_status\", \"crawldb:status:db_orphan\", \"CC-MAIN-2019-43\"]\t494661246\n"
  },
  {
    "path": "stats/crawler/CC-MAIN-2019-47.json",
    "content": "[\"crawl_status\", \"generator:crawldb_size\", \"CC-MAIN-2019-47\"]\t18304035037\n[\"crawl_status\", \"generator:fetch_list\", \"CC-MAIN-2019-47\"]\t3156069719\n[\"crawl_status\", \"generator:selected:db_duplicate\", \"CC-MAIN-2019-47\"]\t1266248\n[\"crawl_status\", \"generator:selected:db_fetched\", \"CC-MAIN-2019-47\"]\t1507713919\n[\"crawl_status\", \"generator:selected:db_gone\", \"CC-MAIN-2019-47\"]\t116271\n[\"crawl_status\", \"generator:selected:db_notmodified\", \"CC-MAIN-2019-47\"]\t6123268\n[\"crawl_status\", \"generator:selected:db_orphan\", \"CC-MAIN-2019-47\"]\t1294\n[\"crawl_status\", \"generator:selected:db_redir_perm\", \"CC-MAIN-2019-47\"]\t15222151\n[\"crawl_status\", \"generator:selected:db_redir_temp\", \"CC-MAIN-2019-47\"]\t16413664\n[\"crawl_status\", \"generator:selected:db_unfetched\", \"CC-MAIN-2019-47\"]\t1609212904\n[\"crawl_status\", \"generator:skipped_domains_overflow\", \"CC-MAIN-2019-47\"]\t17440\n[\"crawl_status\", \"fetcher:total\", \"CC-MAIN-2019-47\"]\t3415729517\n[\"crawl_status\", \"fetcher:success\", \"CC-MAIN-2019-47\"]\t2628115182\n[\"crawl_status\", \"fetcher:notmodified\", \"CC-MAIN-2019-47\"]\t14500798\n[\"crawl_status\", \"fetcher:temp_moved\", \"CC-MAIN-2019-47\"]\t122121345\n[\"crawl_status\", \"fetcher:moved\", \"CC-MAIN-2019-47\"]\t169216969\n[\"crawl_status\", \"fetcher:notfound\", \"CC-MAIN-2019-47\"]\t80515910\n[\"crawl_status\", \"fetcher:access_denied\", \"CC-MAIN-2019-47\"]\t727802\n[\"crawl_status\", \"fetcher:gone\", \"CC-MAIN-2019-47\"]\t4509788\n[\"crawl_status\", \"fetcher:exception\", \"CC-MAIN-2019-47\"]\t211120826\n[\"crawl_status\", \"fetcher:robots_denied\", \"CC-MAIN-2019-47\"]\t104178155\n[\"crawl_status\", \"fetcher:filtered\", \"CC-MAIN-2019-47\"]\t30940773\n[\"crawl_status\", \"fetcher:hitByThrougputThreshold\", \"CC-MAIN-2019-47\"]\t31543430\n[\"crawl_status\", \"fetcher:hitByTimeLimit\", \"CC-MAIN-2019-47\"]\t12519074\n[\"crawl_status\", 
\"fetcher:AboveExceptionThresholdInQueue\", \"CC-MAIN-2019-47\"]\t5719465\n[\"crawl_status\", \"fetcher:bytes_downloaded\", \"CC-MAIN-2019-47\"]\t282744454100763\n[\"crawl_status\", \"crawldb:size\", \"CC-MAIN-2019-47\"]\t18304035037\n[\"crawl_status\", \"crawldb:status:db_unfetched\", \"CC-MAIN-2019-47\"]\t3255362969\n[\"crawl_status\", \"crawldb:status:db_fetched\", \"CC-MAIN-2019-47\"]\t9323271514\n[\"crawl_status\", \"crawldb:status:db_gone\", \"CC-MAIN-2019-47\"]\t1396469513\n[\"crawl_status\", \"crawldb:status:db_redir_temp\", \"CC-MAIN-2019-47\"]\t412574427\n[\"crawl_status\", \"crawldb:status:db_redir_perm\", \"CC-MAIN-2019-47\"]\t650839553\n[\"crawl_status\", \"crawldb:status:db_notmodified\", \"CC-MAIN-2019-47\"]\t1346940424\n[\"crawl_status\", \"crawldb:status:db_duplicate\", \"CC-MAIN-2019-47\"]\t1238571606\n[\"crawl_status\", \"crawldb:status:db_orphan\", \"CC-MAIN-2019-47\"]\t680005031\n"
  },
  {
    "path": "stats/crawler/CC-MAIN-2019-51.json",
    "content": "[\"crawl_status\", \"generator:crawldb_size\", \"CC-MAIN-2019-51\"]\t19131514303\n[\"crawl_status\", \"generator:fetch_list\", \"CC-MAIN-2019-51\"]\t3024216942\n[\"crawl_status\", \"generator:selected:db_duplicate\", \"CC-MAIN-2019-51\"]\t1306071\n[\"crawl_status\", \"generator:selected:db_fetched\", \"CC-MAIN-2019-51\"]\t1505098735\n[\"crawl_status\", \"generator:selected:db_gone\", \"CC-MAIN-2019-51\"]\t80542\n[\"crawl_status\", \"generator:selected:db_notmodified\", \"CC-MAIN-2019-51\"]\t12956441\n[\"crawl_status\", \"generator:selected:db_orphan\", \"CC-MAIN-2019-51\"]\t1100\n[\"crawl_status\", \"generator:selected:db_redir_perm\", \"CC-MAIN-2019-51\"]\t11084812\n[\"crawl_status\", \"generator:selected:db_redir_temp\", \"CC-MAIN-2019-51\"]\t19564888\n[\"crawl_status\", \"generator:selected:db_unfetched\", \"CC-MAIN-2019-51\"]\t1474124353\n[\"crawl_status\", \"generator:skipped_domains_overflow\", \"CC-MAIN-2019-51\"]\t17732\n[\"crawl_status\", \"fetcher:total\", \"CC-MAIN-2019-51\"]\t3272788239\n[\"crawl_status\", \"fetcher:success\", \"CC-MAIN-2019-51\"]\t2505464002\n[\"crawl_status\", \"fetcher:notmodified\", \"CC-MAIN-2019-51\"]\t16926316\n[\"crawl_status\", \"fetcher:temp_moved\", \"CC-MAIN-2019-51\"]\t122867650\n[\"crawl_status\", \"fetcher:moved\", \"CC-MAIN-2019-51\"]\t157264491\n[\"crawl_status\", \"fetcher:notfound\", \"CC-MAIN-2019-51\"]\t80137192\n[\"crawl_status\", \"fetcher:access_denied\", \"CC-MAIN-2019-51\"]\t2368217\n[\"crawl_status\", \"fetcher:gone\", \"CC-MAIN-2019-51\"]\t4115352\n[\"crawl_status\", \"fetcher:exception\", \"CC-MAIN-2019-51\"]\t199374299\n[\"crawl_status\", \"fetcher:robots_denied\", \"CC-MAIN-2019-51\"]\t102657412\n[\"crawl_status\", \"fetcher:robots_denied_maxcrawldelay\", \"CC-MAIN-2019-51\"]\t192046\n[\"crawl_status\", \"fetcher:filtered\", \"CC-MAIN-2019-51\"]\t31419594\n[\"crawl_status\", \"fetcher:hitByThrougputThreshold\", \"CC-MAIN-2019-51\"]\t27855121\n[\"crawl_status\", \"fetcher:hitByTimeLimit\", 
\"CC-MAIN-2019-51\"]\t16637257\n[\"crawl_status\", \"fetcher:AboveExceptionThresholdInQueue\", \"CC-MAIN-2019-51\"]\t5509290\n[\"crawl_status\", \"fetcher:bytes_downloaded\", \"CC-MAIN-2019-51\"]\t262969974423043\n[\"crawl_status\", \"crawldb:size\", \"CC-MAIN-2019-51\"]\t19131514303\n[\"crawl_status\", \"crawldb:status:db_unfetched\", \"CC-MAIN-2019-51\"]\t3196755577\n[\"crawl_status\", \"crawldb:status:db_fetched\", \"CC-MAIN-2019-51\"]\t10167859677\n[\"crawl_status\", \"crawldb:status:db_gone\", \"CC-MAIN-2019-51\"]\t1460497975\n[\"crawl_status\", \"crawldb:status:db_redir_temp\", \"CC-MAIN-2019-51\"]\t434111522\n[\"crawl_status\", \"crawldb:status:db_redir_perm\", \"CC-MAIN-2019-51\"]\t667307093\n[\"crawl_status\", \"crawldb:status:db_notmodified\", \"CC-MAIN-2019-51\"]\t1409166277\n[\"crawl_status\", \"crawldb:status:db_duplicate\", \"CC-MAIN-2019-51\"]\t1288089277\n[\"crawl_status\", \"crawldb:status:db_orphan\", \"CC-MAIN-2019-51\"]\t507726905\n"
  },
  {
    "path": "stats/crawler/CC-MAIN-2020-05.json",
    "content": "[\"crawl_status\", \"generator:crawldb_size\", \"CC-MAIN-2020-05\"]\t20085156050\n[\"crawl_status\", \"generator:fetch_list\", \"CC-MAIN-2020-05\"]\t3668585586\n[\"crawl_status\", \"generator:selected:db_duplicate\", \"CC-MAIN-2020-05\"]\t1121666\n[\"crawl_status\", \"generator:selected:db_fetched\", \"CC-MAIN-2020-05\"]\t2211238775\n[\"crawl_status\", \"generator:selected:db_gone\", \"CC-MAIN-2020-05\"]\t92012\n[\"crawl_status\", \"generator:selected:db_notmodified\", \"CC-MAIN-2020-05\"]\t46330186\n[\"crawl_status\", \"generator:selected:db_orphan\", \"CC-MAIN-2020-05\"]\t3205\n[\"crawl_status\", \"generator:selected:db_redir_perm\", \"CC-MAIN-2020-05\"]\t9777744\n[\"crawl_status\", \"generator:selected:db_redir_temp\", \"CC-MAIN-2020-05\"]\t16061648\n[\"crawl_status\", \"generator:selected:db_unfetched\", \"CC-MAIN-2020-05\"]\t1383960350\n[\"crawl_status\", \"generator:skipped_domains_overflow\", \"CC-MAIN-2020-05\"]\t19775\n[\"crawl_status\", \"fetcher:total\", \"CC-MAIN-2020-05\"]\t3936673141\n[\"crawl_status\", \"fetcher:success\", \"CC-MAIN-2020-05\"]\t3143769355\n[\"crawl_status\", \"fetcher:notmodified\", \"CC-MAIN-2020-05\"]\t25246448\n[\"crawl_status\", \"fetcher:temp_moved\", \"CC-MAIN-2020-05\"]\t121955018\n[\"crawl_status\", \"fetcher:moved\", \"CC-MAIN-2020-05\"]\t167466979\n[\"crawl_status\", \"fetcher:notfound\", \"CC-MAIN-2020-05\"]\t91814694\n[\"crawl_status\", \"fetcher:access_denied\", \"CC-MAIN-2020-05\"]\t709153\n[\"crawl_status\", \"fetcher:gone\", \"CC-MAIN-2020-05\"]\t7906827\n[\"crawl_status\", \"fetcher:exception\", \"CC-MAIN-2020-05\"]\t183544591\n[\"crawl_status\", \"fetcher:robots_denied\", \"CC-MAIN-2020-05\"]\t101669489\n[\"crawl_status\", \"fetcher:robots_denied_maxcrawldelay\", \"CC-MAIN-2020-05\"]\t121394\n[\"crawl_status\", \"fetcher:filtered\", \"CC-MAIN-2020-05\"]\t32008498\n[\"crawl_status\", \"fetcher:hitByThrougputThreshold\", \"CC-MAIN-2020-05\"]\t14712314\n[\"crawl_status\", \"fetcher:hitByTimeLimit\", 
\"CC-MAIN-2020-05\"]\t39535788\n[\"crawl_status\", \"fetcher:AboveExceptionThresholdInQueue\", \"CC-MAIN-2020-05\"]\t6212593\n[\"crawl_status\", \"fetcher:bytes_downloaded\", \"CC-MAIN-2020-05\"]\t335640773090910\n[\"crawl_status\", \"crawldb:size\", \"CC-MAIN-2020-05\"]\t20085156050\n[\"crawl_status\", \"crawldb:status:db_unfetched\", \"CC-MAIN-2020-05\"]\t2831108006\n[\"crawl_status\", \"crawldb:status:db_fetched\", \"CC-MAIN-2020-05\"]\t10411154186\n[\"crawl_status\", \"crawldb:status:db_gone\", \"CC-MAIN-2020-05\"]\t1346879324\n[\"crawl_status\", \"crawldb:status:db_redir_temp\", \"CC-MAIN-2020-05\"]\t415489877\n[\"crawl_status\", \"crawldb:status:db_redir_perm\", \"CC-MAIN-2020-05\"]\t612057268\n[\"crawl_status\", \"crawldb:status:db_notmodified\", \"CC-MAIN-2020-05\"]\t1376661791\n[\"crawl_status\", \"crawldb:status:db_duplicate\", \"CC-MAIN-2020-05\"]\t1176918093\n[\"crawl_status\", \"crawldb:status:db_orphan\", \"CC-MAIN-2020-05\"]\t1914887505\n"
  },
  {
    "path": "stats/crawler/CC-MAIN-2020-10.json",
    "content": "[\"crawl_status\", \"generator:crawldb_size\", \"CC-MAIN-2020-10\"]\t19918325266\n[\"crawl_status\", \"generator:fetch_list\", \"CC-MAIN-2020-10\"]\t3330571565\n[\"crawl_status\", \"generator:selected:db_duplicate\", \"CC-MAIN-2020-10\"]\t969236\n[\"crawl_status\", \"generator:selected:db_fetched\", \"CC-MAIN-2020-10\"]\t1603252678\n[\"crawl_status\", \"generator:selected:db_gone\", \"CC-MAIN-2020-10\"]\t103194\n[\"crawl_status\", \"generator:selected:db_notmodified\", \"CC-MAIN-2020-10\"]\t59866165\n[\"crawl_status\", \"generator:selected:db_orphan\", \"CC-MAIN-2020-10\"]\t2321\n[\"crawl_status\", \"generator:selected:db_redir_perm\", \"CC-MAIN-2020-10\"]\t21213723\n[\"crawl_status\", \"generator:selected:db_redir_temp\", \"CC-MAIN-2020-10\"]\t24673635\n[\"crawl_status\", \"generator:selected:db_unfetched\", \"CC-MAIN-2020-10\"]\t1620490613\n[\"crawl_status\", \"generator:skipped_domains_overflow\", \"CC-MAIN-2020-10\"]\t11987\n[\"crawl_status\", \"fetcher:total\", \"CC-MAIN-2020-10\"]\t3619056565\n[\"crawl_status\", \"fetcher:success\", \"CC-MAIN-2020-10\"]\t2673682290\n[\"crawl_status\", \"fetcher:notmodified\", \"CC-MAIN-2020-10\"]\t20074055\n[\"crawl_status\", \"fetcher:temp_moved\", \"CC-MAIN-2020-10\"]\t144764802\n[\"crawl_status\", \"fetcher:moved\", \"CC-MAIN-2020-10\"]\t205649940\n[\"crawl_status\", \"fetcher:notfound\", \"CC-MAIN-2020-10\"]\t113969803\n[\"crawl_status\", \"fetcher:access_denied\", \"CC-MAIN-2020-10\"]\t829636\n[\"crawl_status\", \"fetcher:gone\", \"CC-MAIN-2020-10\"]\t7067208\n[\"crawl_status\", \"fetcher:exception\", \"CC-MAIN-2020-10\"]\t184323686\n[\"crawl_status\", \"fetcher:robots_denied\", \"CC-MAIN-2020-10\"]\t109151178\n[\"crawl_status\", \"fetcher:robots_denied_maxcrawldelay\", \"CC-MAIN-2020-10\"]\t102693\n[\"crawl_status\", \"fetcher:filtered\", \"CC-MAIN-2020-10\"]\t19989051\n[\"crawl_status\", \"fetcher:hitByThrougputThreshold\", \"CC-MAIN-2020-10\"]\t17186176\n[\"crawl_status\", \"fetcher:hitByTimeLimit\", 
\"CC-MAIN-2020-10\"]\t75283581\n[\"crawl_status\", \"fetcher:AboveExceptionThresholdInQueue\", \"CC-MAIN-2020-10\"]\t46982466\n[\"crawl_status\", \"fetcher:bytes_downloaded\", \"CC-MAIN-2020-10\"]\t264675728587166\n[\"crawl_status\", \"crawldb:size\", \"CC-MAIN-2020-10\"]\t19918325266\n[\"crawl_status\", \"crawldb:status:db_unfetched\", \"CC-MAIN-2020-10\"]\t2946774172\n[\"crawl_status\", \"crawldb:status:db_fetched\", \"CC-MAIN-2020-10\"]\t10719606051\n[\"crawl_status\", \"crawldb:status:db_gone\", \"CC-MAIN-2020-10\"]\t1374401689\n[\"crawl_status\", \"crawldb:status:db_redir_temp\", \"CC-MAIN-2020-10\"]\t420495999\n[\"crawl_status\", \"crawldb:status:db_redir_perm\", \"CC-MAIN-2020-10\"]\t622044013\n[\"crawl_status\", \"crawldb:status:db_notmodified\", \"CC-MAIN-2020-10\"]\t1357438756\n[\"crawl_status\", \"crawldb:status:db_duplicate\", \"CC-MAIN-2020-10\"]\t1178295354\n[\"crawl_status\", \"crawldb:status:db_orphan\", \"CC-MAIN-2020-10\"]\t1299269232\n"
  },
  {
    "path": "stats/crawler/CC-MAIN-2020-16.json",
    "content": "[\"crawl_status\", \"generator:crawldb_size\", \"CC-MAIN-2020-16\"]\t20380741760\n[\"crawl_status\", \"generator:fetch_list\", \"CC-MAIN-2020-16\"]\t3488201254\n[\"crawl_status\", \"generator:selected:db_duplicate\", \"CC-MAIN-2020-16\"]\t718305\n[\"crawl_status\", \"generator:selected:db_fetched\", \"CC-MAIN-2020-16\"]\t1821903237\n[\"crawl_status\", \"generator:selected:db_gone\", \"CC-MAIN-2020-16\"]\t69490\n[\"crawl_status\", \"generator:selected:db_notmodified\", \"CC-MAIN-2020-16\"]\t21596310\n[\"crawl_status\", \"generator:selected:db_orphan\", \"CC-MAIN-2020-16\"]\t2207\n[\"crawl_status\", \"generator:selected:db_redir_perm\", \"CC-MAIN-2020-16\"]\t16831401\n[\"crawl_status\", \"generator:selected:db_redir_temp\", \"CC-MAIN-2020-16\"]\t19938299\n[\"crawl_status\", \"generator:selected:db_unfetched\", \"CC-MAIN-2020-16\"]\t1607142005\n[\"crawl_status\", \"generator:skipped_domains_overflow\", \"CC-MAIN-2020-16\"]\t10114\n[\"crawl_status\", \"fetcher:total\", \"CC-MAIN-2020-16\"]\t3698733301\n[\"crawl_status\", \"fetcher:success\", \"CC-MAIN-2020-16\"]\t2896755264\n[\"crawl_status\", \"fetcher:notmodified\", \"CC-MAIN-2020-16\"]\t18674174\n[\"crawl_status\", \"fetcher:temp_moved\", \"CC-MAIN-2020-16\"]\t119654320\n[\"crawl_status\", \"fetcher:moved\", \"CC-MAIN-2020-16\"]\t157735997\n[\"crawl_status\", \"fetcher:notfound\", \"CC-MAIN-2020-16\"]\t80192634\n[\"crawl_status\", \"fetcher:access_denied\", \"CC-MAIN-2020-16\"]\t702088\n[\"crawl_status\", \"fetcher:gone\", \"CC-MAIN-2020-16\"]\t3018086\n[\"crawl_status\", \"fetcher:exception\", \"CC-MAIN-2020-16\"]\t138247700\n[\"crawl_status\", \"fetcher:robots_denied\", \"CC-MAIN-2020-16\"]\t95420328\n[\"crawl_status\", \"fetcher:robots_denied_maxcrawldelay\", \"CC-MAIN-2020-16\"]\t104480\n[\"crawl_status\", \"fetcher:filtered\", \"CC-MAIN-2020-16\"]\t10852307\n[\"crawl_status\", \"fetcher:redirect_count_exceeded\", \"CC-MAIN-2020-16\"]\t1602691\n[\"crawl_status\", 
\"fetcher:redirect_deduplicated\", \"CC-MAIN-2020-16\"]\t32232266\n[\"crawl_status\", \"fetcher:hitByThrougputThreshold\", \"CC-MAIN-2020-16\"]\t13029233\n[\"crawl_status\", \"fetcher:hitByTimeLimit\", \"CC-MAIN-2020-16\"]\t83717088\n[\"crawl_status\", \"fetcher:AboveExceptionThresholdInQueue\", \"CC-MAIN-2020-16\"]\t46794645\n[\"crawl_status\", \"fetcher:bytes_downloaded\", \"CC-MAIN-2020-16\"]\t312280547326383\n[\"crawl_status\", \"crawldb:size\", \"CC-MAIN-2020-16\"]\t20380741760\n[\"crawl_status\", \"crawldb:status:db_unfetched\", \"CC-MAIN-2020-16\"]\t2916211638\n[\"crawl_status\", \"crawldb:status:db_fetched\", \"CC-MAIN-2020-16\"]\t11231558010\n[\"crawl_status\", \"crawldb:status:db_gone\", \"CC-MAIN-2020-16\"]\t1569635611\n[\"crawl_status\", \"crawldb:status:db_redir_temp\", \"CC-MAIN-2020-16\"]\t430415403\n[\"crawl_status\", \"crawldb:status:db_redir_perm\", \"CC-MAIN-2020-16\"]\t630128775\n[\"crawl_status\", \"crawldb:status:db_notmodified\", \"CC-MAIN-2020-16\"]\t1338108574\n[\"crawl_status\", \"crawldb:status:db_duplicate\", \"CC-MAIN-2020-16\"]\t1327513455\n[\"crawl_status\", \"crawldb:status:db_orphan\", \"CC-MAIN-2020-16\"]\t937170294\n"
  },
  {
    "path": "stats/crawler/CC-MAIN-2020-24.json",
    "content": "[\"crawl_status\", \"generator:crawldb_size\", \"CC-MAIN-2020-24\"]\t21097779271\n[\"crawl_status\", \"generator:fetch_list\", \"CC-MAIN-2020-24\"]\t3637934268\n[\"crawl_status\", \"generator:selected:db_duplicate\", \"CC-MAIN-2020-24\"]\t1285706\n[\"crawl_status\", \"generator:selected:db_fetched\", \"CC-MAIN-2020-24\"]\t2181427232\n[\"crawl_status\", \"generator:selected:db_gone\", \"CC-MAIN-2020-24\"]\t164421\n[\"crawl_status\", \"generator:selected:db_notmodified\", \"CC-MAIN-2020-24\"]\t4838325\n[\"crawl_status\", \"generator:selected:db_orphan\", \"CC-MAIN-2020-24\"]\t57247\n[\"crawl_status\", \"generator:selected:db_redir_perm\", \"CC-MAIN-2020-24\"]\t4595670\n[\"crawl_status\", \"generator:selected:db_redir_temp\", \"CC-MAIN-2020-24\"]\t12692668\n[\"crawl_status\", \"generator:selected:db_unfetched\", \"CC-MAIN-2020-24\"]\t1432872999\n[\"crawl_status\", \"generator:skipped_domains_overflow\", \"CC-MAIN-2020-24\"]\t13976\n[\"crawl_status\", \"fetcher:total\", \"CC-MAIN-2020-24\"]\t3955587295\n[\"crawl_status\", \"fetcher:success\", \"CC-MAIN-2020-24\"]\t2770235619\n[\"crawl_status\", \"fetcher:notmodified\", \"CC-MAIN-2020-24\"]\t22629264\n[\"crawl_status\", \"fetcher:temp_moved\", \"CC-MAIN-2020-24\"]\t134157178\n[\"crawl_status\", \"fetcher:moved\", \"CC-MAIN-2020-24\"]\t242238484\n[\"crawl_status\", \"fetcher:notfound\", \"CC-MAIN-2020-24\"]\t158510590\n[\"crawl_status\", \"fetcher:access_denied\", \"CC-MAIN-2020-24\"]\t969685\n[\"crawl_status\", \"fetcher:gone\", \"CC-MAIN-2020-24\"]\t5487484\n[\"crawl_status\", \"fetcher:exception\", \"CC-MAIN-2020-24\"]\t250465653\n[\"crawl_status\", \"fetcher:robots_denied\", \"CC-MAIN-2020-24\"]\t101836538\n[\"crawl_status\", \"fetcher:robots_denied_maxcrawldelay\", \"CC-MAIN-2020-24\"]\t130646\n[\"crawl_status\", \"fetcher:filtered\", \"CC-MAIN-2020-24\"]\t34715027\n[\"crawl_status\", \"fetcher:redirect_count_exceeded\", \"CC-MAIN-2020-24\"]\t1978890\n[\"crawl_status\", 
\"fetcher:redirect_deduplicated\", \"CC-MAIN-2020-24\"]\t52471522\n[\"crawl_status\", \"fetcher:hitByThrougputThreshold\", \"CC-MAIN-2020-24\"]\t2039603\n[\"crawl_status\", \"fetcher:hitByTimeLimit\", \"CC-MAIN-2020-24\"]\t124783214\n[\"crawl_status\", \"fetcher:AboveExceptionThresholdInQueue\", \"CC-MAIN-2020-24\"]\t52937898\n[\"crawl_status\", \"fetcher:bytes_downloaded\", \"CC-MAIN-2020-24\"]\t284936918032978\n[\"crawl_status\", \"crawldb:size\", \"CC-MAIN-2020-24\"]\t21097779271\n[\"crawl_status\", \"crawldb:status:db_unfetched\", \"CC-MAIN-2020-24\"]\t2611718412\n[\"crawl_status\", \"crawldb:status:db_fetched\", \"CC-MAIN-2020-24\"]\t11490176195\n[\"crawl_status\", \"crawldb:status:db_gone\", \"CC-MAIN-2020-24\"]\t1382791180\n[\"crawl_status\", \"crawldb:status:db_redir_temp\", \"CC-MAIN-2020-24\"]\t379969069\n[\"crawl_status\", \"crawldb:status:db_redir_perm\", \"CC-MAIN-2020-24\"]\t536206995\n[\"crawl_status\", \"crawldb:status:db_notmodified\", \"CC-MAIN-2020-24\"]\t1284102995\n[\"crawl_status\", \"crawldb:status:db_duplicate\", \"CC-MAIN-2020-24\"]\t1192874017\n[\"crawl_status\", \"crawldb:status:db_orphan\", \"CC-MAIN-2020-24\"]\t2219940408\n"
  },
  {
    "path": "stats/crawler/CC-MAIN-2020-29.json",
    "content": "[\"crawl_status\", \"generator:crawldb_size\", \"CC-MAIN-2020-29\"]\t20528820728\n[\"crawl_status\", \"generator:fetch_list\", \"CC-MAIN-2020-29\"]\t4073198154\n[\"crawl_status\", \"generator:selected:db_duplicate\", \"CC-MAIN-2020-29\"]\t1065277\n[\"crawl_status\", \"generator:selected:db_fetched\", \"CC-MAIN-2020-29\"]\t2621276554\n[\"crawl_status\", \"generator:selected:db_gone\", \"CC-MAIN-2020-29\"]\t87960\n[\"crawl_status\", \"generator:selected:db_notmodified\", \"CC-MAIN-2020-29\"]\t4603310\n[\"crawl_status\", \"generator:selected:db_orphan\", \"CC-MAIN-2020-29\"]\t19313\n[\"crawl_status\", \"generator:selected:db_redir_perm\", \"CC-MAIN-2020-29\"]\t13957105\n[\"crawl_status\", \"generator:selected:db_redir_temp\", \"CC-MAIN-2020-29\"]\t15099451\n[\"crawl_status\", \"generator:selected:db_unfetched\", \"CC-MAIN-2020-29\"]\t1417089184\n[\"crawl_status\", \"generator:skipped_domains_overflow\", \"CC-MAIN-2020-29\"]\t16112\n[\"crawl_status\", \"fetcher:total\", \"CC-MAIN-2020-29\"]\t4168069863\n[\"crawl_status\", \"fetcher:success\", \"CC-MAIN-2020-29\"]\t3079189122\n[\"crawl_status\", \"fetcher:notmodified\", \"CC-MAIN-2020-29\"]\t21484094\n[\"crawl_status\", \"fetcher:temp_moved\", \"CC-MAIN-2020-29\"]\t130028601\n[\"crawl_status\", \"fetcher:moved\", \"CC-MAIN-2020-29\"]\t241756269\n[\"crawl_status\", \"fetcher:notfound\", \"CC-MAIN-2020-29\"]\t134199822\n[\"crawl_status\", \"fetcher:access_denied\", \"CC-MAIN-2020-29\"]\t983796\n[\"crawl_status\", \"fetcher:gone\", \"CC-MAIN-2020-29\"]\t5399946\n[\"crawl_status\", \"fetcher:exception\", \"CC-MAIN-2020-29\"]\t217772669\n[\"crawl_status\", \"fetcher:robots_denied\", \"CC-MAIN-2020-29\"]\t96494114\n[\"crawl_status\", \"fetcher:robots_denied_maxcrawldelay\", \"CC-MAIN-2020-29\"]\t134922\n[\"crawl_status\", \"fetcher:filtered\", \"CC-MAIN-2020-29\"]\t36165088\n[\"crawl_status\", \"fetcher:redirect_count_exceeded\", \"CC-MAIN-2020-29\"]\t2027922\n[\"crawl_status\", 
\"fetcher:redirect_deduplicated\", \"CC-MAIN-2020-29\"]\t48430230\n[\"crawl_status\", \"fetcher:hitByThrougputThreshold\", \"CC-MAIN-2020-29\"]\t3586576\n[\"crawl_status\", \"fetcher:hitByTimeLimit\", \"CC-MAIN-2020-29\"]\t105665665\n[\"crawl_status\", \"fetcher:AboveExceptionThresholdInQueue\", \"CC-MAIN-2020-29\"]\t44751027\n[\"crawl_status\", \"fetcher:bytes_downloaded\", \"CC-MAIN-2020-29\"]\t332782304577866\n[\"crawl_status\", \"crawldb:size\", \"CC-MAIN-2020-29\"]\t20528820728\n[\"crawl_status\", \"crawldb:status:db_unfetched\", \"CC-MAIN-2020-29\"]\t2667329075\n[\"crawl_status\", \"crawldb:status:db_fetched\", \"CC-MAIN-2020-29\"]\t11551270706\n[\"crawl_status\", \"crawldb:status:db_gone\", \"CC-MAIN-2020-29\"]\t1391470539\n[\"crawl_status\", \"crawldb:status:db_redir_temp\", \"CC-MAIN-2020-29\"]\t377736669\n[\"crawl_status\", \"crawldb:status:db_redir_perm\", \"CC-MAIN-2020-29\"]\t541842801\n[\"crawl_status\", \"crawldb:status:db_notmodified\", \"CC-MAIN-2020-29\"]\t1291142246\n[\"crawl_status\", \"crawldb:status:db_duplicate\", \"CC-MAIN-2020-29\"]\t1179403381\n[\"crawl_status\", \"crawldb:status:db_orphan\", \"CC-MAIN-2020-29\"]\t1528625311\n"
  },
  {
    "path": "stats/crawler/CC-MAIN-2020-34.json",
    "content": "[\"crawl_status\", \"generator:crawldb_size\", \"CC-MAIN-2020-34\"]\t20403113647\n[\"crawl_status\", \"generator:fetch_list\", \"CC-MAIN-2020-34\"]\t3108580994\n[\"crawl_status\", \"generator:selected:db_duplicate\", \"CC-MAIN-2020-34\"]\t1036828\n[\"crawl_status\", \"generator:selected:db_fetched\", \"CC-MAIN-2020-34\"]\t1781618067\n[\"crawl_status\", \"generator:selected:db_gone\", \"CC-MAIN-2020-34\"]\t78051\n[\"crawl_status\", \"generator:selected:db_notmodified\", \"CC-MAIN-2020-34\"]\t4614840\n[\"crawl_status\", \"generator:selected:db_orphan\", \"CC-MAIN-2020-34\"]\t24133\n[\"crawl_status\", \"generator:selected:db_redir_perm\", \"CC-MAIN-2020-34\"]\t15910596\n[\"crawl_status\", \"generator:selected:db_redir_temp\", \"CC-MAIN-2020-34\"]\t18605686\n[\"crawl_status\", \"generator:selected:db_unfetched\", \"CC-MAIN-2020-34\"]\t1286692793\n[\"crawl_status\", \"generator:skipped_domains_overflow\", \"CC-MAIN-2020-34\"]\t12295\n[\"crawl_status\", \"fetcher:total\", \"CC-MAIN-2020-34\"]\t3380185917\n[\"crawl_status\", \"fetcher:success\", \"CC-MAIN-2020-34\"]\t2452118051\n[\"crawl_status\", \"fetcher:notmodified\", \"CC-MAIN-2020-34\"]\t17324426\n[\"crawl_status\", \"fetcher:temp_moved\", \"CC-MAIN-2020-34\"]\t130128973\n[\"crawl_status\", \"fetcher:moved\", \"CC-MAIN-2020-34\"]\t212575569\n[\"crawl_status\", \"fetcher:notfound\", \"CC-MAIN-2020-34\"]\t103667934\n[\"crawl_status\", \"fetcher:access_denied\", \"CC-MAIN-2020-34\"]\t975564\n[\"crawl_status\", \"fetcher:gone\", \"CC-MAIN-2020-34\"]\t4293686\n[\"crawl_status\", \"fetcher:exception\", \"CC-MAIN-2020-34\"]\t167008581\n[\"crawl_status\", \"fetcher:robots_denied\", \"CC-MAIN-2020-34\"]\t103151371\n[\"crawl_status\", \"fetcher:robots_denied_maxcrawldelay\", \"CC-MAIN-2020-34\"]\t105843\n[\"crawl_status\", \"fetcher:filtered\", \"CC-MAIN-2020-34\"]\t40335680\n[\"crawl_status\", \"fetcher:redirect_count_exceeded\", \"CC-MAIN-2020-34\"]\t2102071\n[\"crawl_status\", 
\"fetcher:redirect_deduplicated\", \"CC-MAIN-2020-34\"]\t43649577\n[\"crawl_status\", \"fetcher:hitByThrougputThreshold\", \"CC-MAIN-2020-34\"]\t28963182\n[\"crawl_status\", \"fetcher:hitByTimeLimit\", \"CC-MAIN-2020-34\"]\t15805765\n[\"crawl_status\", \"fetcher:AboveExceptionThresholdInQueue\", \"CC-MAIN-2020-34\"]\t57979644\n[\"crawl_status\", \"fetcher:bytes_downloaded\", \"CC-MAIN-2020-34\"]\t261708608732153\n[\"crawl_status\", \"crawldb:size\", \"CC-MAIN-2020-34\"]\t20403113647\n[\"crawl_status\", \"crawldb:status:db_unfetched\", \"CC-MAIN-2020-34\"]\t2433303004\n[\"crawl_status\", \"crawldb:status:db_fetched\", \"CC-MAIN-2020-34\"]\t11562709592\n[\"crawl_status\", \"crawldb:status:db_gone\", \"CC-MAIN-2020-34\"]\t1369232998\n[\"crawl_status\", \"crawldb:status:db_redir_temp\", \"CC-MAIN-2020-34\"]\t328085012\n[\"crawl_status\", \"crawldb:status:db_redir_perm\", \"CC-MAIN-2020-34\"]\t475362874\n[\"crawl_status\", \"crawldb:status:db_notmodified\", \"CC-MAIN-2020-34\"]\t1296917973\n[\"crawl_status\", \"crawldb:status:db_duplicate\", \"CC-MAIN-2020-34\"]\t1156895281\n[\"crawl_status\", \"crawldb:status:db_orphan\", \"CC-MAIN-2020-34\"]\t1780606913\n"
  },
  {
    "path": "stats/crawler/CC-MAIN-2020-40.json",
    "content": "[\"crawl_status\", \"generator:crawldb_size\", \"CC-MAIN-2020-40\"]\t21173047327\n[\"crawl_status\", \"generator:fetch_list\", \"CC-MAIN-2020-40\"]\t4371144186\n[\"crawl_status\", \"generator:selected:db_duplicate\", \"CC-MAIN-2020-40\"]\t1050318\n[\"crawl_status\", \"generator:selected:db_fetched\", \"CC-MAIN-2020-40\"]\t2203752401\n[\"crawl_status\", \"generator:selected:db_gone\", \"CC-MAIN-2020-40\"]\t76076\n[\"crawl_status\", \"generator:selected:db_notmodified\", \"CC-MAIN-2020-40\"]\t5324666\n[\"crawl_status\", \"generator:selected:db_orphan\", \"CC-MAIN-2020-40\"]\t20326\n[\"crawl_status\", \"generator:selected:db_redir_perm\", \"CC-MAIN-2020-40\"]\t14636142\n[\"crawl_status\", \"generator:selected:db_redir_temp\", \"CC-MAIN-2020-40\"]\t21189179\n[\"crawl_status\", \"generator:selected:db_unfetched\", \"CC-MAIN-2020-40\"]\t2125095078\n[\"crawl_status\", \"generator:skipped_domains_overflow\", \"CC-MAIN-2020-40\"]\t12421\n[\"crawl_status\", \"fetcher:total\", \"CC-MAIN-2020-40\"]\t4646202620\n[\"crawl_status\", \"fetcher:success\", \"CC-MAIN-2020-40\"]\t3479666684\n[\"crawl_status\", \"fetcher:notmodified\", \"CC-MAIN-2020-40\"]\t21422070\n[\"crawl_status\", \"fetcher:temp_moved\", \"CC-MAIN-2020-40\"]\t146170973\n[\"crawl_status\", \"fetcher:moved\", \"CC-MAIN-2020-40\"]\t249922920\n[\"crawl_status\", \"fetcher:notfound\", \"CC-MAIN-2020-40\"]\t132228734\n[\"crawl_status\", \"fetcher:access_denied\", \"CC-MAIN-2020-40\"]\t920866\n[\"crawl_status\", \"fetcher:gone\", \"CC-MAIN-2020-40\"]\t4717126\n[\"crawl_status\", \"fetcher:exception\", \"CC-MAIN-2020-40\"]\t207540975\n[\"crawl_status\", \"fetcher:robots_denied\", \"CC-MAIN-2020-40\"]\t108490858\n[\"crawl_status\", \"fetcher:robots_denied_maxcrawldelay\", \"CC-MAIN-2020-40\"]\t188433\n[\"crawl_status\", \"fetcher:filtered\", \"CC-MAIN-2020-40\"]\t37555035\n[\"crawl_status\", \"fetcher:redirect_count_exceeded\", \"CC-MAIN-2020-40\"]\t2030383\n[\"crawl_status\", 
\"fetcher:redirect_deduplicated\", \"CC-MAIN-2020-40\"]\t47860646\n[\"crawl_status\", \"fetcher:hitByThrougputThreshold\", \"CC-MAIN-2020-40\"]\t2758467\n[\"crawl_status\", \"fetcher:hitByTimeLimit\", \"CC-MAIN-2020-40\"]\t147388413\n[\"crawl_status\", \"fetcher:AboveExceptionThresholdInQueue\", \"CC-MAIN-2020-40\"]\t57340037\n[\"crawl_status\", \"fetcher:bytes_downloaded\", \"CC-MAIN-2020-40\"]\t379687151165375\n[\"crawl_status\", \"crawldb:size\", \"CC-MAIN-2020-40\"]\t21173047327\n[\"crawl_status\", \"crawldb:status:db_unfetched\", \"CC-MAIN-2020-40\"]\t3823419718\n[\"crawl_status\", \"crawldb:status:db_fetched\", \"CC-MAIN-2020-40\"]\t11109911962\n[\"crawl_status\", \"crawldb:status:db_gone\", \"CC-MAIN-2020-40\"]\t1138156112\n[\"crawl_status\", \"crawldb:status:db_redir_temp\", \"CC-MAIN-2020-40\"]\t324775626\n[\"crawl_status\", \"crawldb:status:db_redir_perm\", \"CC-MAIN-2020-40\"]\t468113459\n[\"crawl_status\", \"crawldb:status:db_notmodified\", \"CC-MAIN-2020-40\"]\t1210112001\n[\"crawl_status\", \"crawldb:status:db_duplicate\", \"CC-MAIN-2020-40\"]\t1015337830\n[\"crawl_status\", \"crawldb:status:db_orphan\", \"CC-MAIN-2020-40\"]\t2083220619\n"
  },
  {
    "path": "stats/crawler/CC-MAIN-2020-45.json",
    "content": "[\"crawl_status\", \"generator:crawldb_size\", \"CC-MAIN-2020-45\"]\t21531016513\n[\"crawl_status\", \"generator:fetch_list\", \"CC-MAIN-2020-45\"]\t3253602367\n[\"crawl_status\", \"generator:selected:db_duplicate\", \"CC-MAIN-2020-45\"]\t984923\n[\"crawl_status\", \"generator:selected:db_fetched\", \"CC-MAIN-2020-45\"]\t1237974864\n[\"crawl_status\", \"generator:selected:db_gone\", \"CC-MAIN-2020-45\"]\t57289\n[\"crawl_status\", \"generator:selected:db_notmodified\", \"CC-MAIN-2020-45\"]\t4977772\n[\"crawl_status\", \"generator:selected:db_orphan\", \"CC-MAIN-2020-45\"]\t18434\n[\"crawl_status\", \"generator:selected:db_redir_perm\", \"CC-MAIN-2020-45\"]\t12051004\n[\"crawl_status\", \"generator:selected:db_redir_temp\", \"CC-MAIN-2020-45\"]\t9818576\n[\"crawl_status\", \"generator:selected:db_unfetched\", \"CC-MAIN-2020-45\"]\t1987719505\n[\"crawl_status\", \"generator:skipped_domains_overflow\", \"CC-MAIN-2020-45\"]\t8593\n[\"crawl_status\", \"fetcher:total\", \"CC-MAIN-2020-45\"]\t3540127936\n[\"crawl_status\", \"fetcher:success\", \"CC-MAIN-2020-45\"]\t2735297287\n[\"crawl_status\", \"fetcher:notmodified\", \"CC-MAIN-2020-45\"]\t11505024\n[\"crawl_status\", \"fetcher:temp_moved\", \"CC-MAIN-2020-45\"]\t135053928\n[\"crawl_status\", \"fetcher:moved\", \"CC-MAIN-2020-45\"]\t196274120\n[\"crawl_status\", \"fetcher:notfound\", \"CC-MAIN-2020-45\"]\t84115672\n[\"crawl_status\", \"fetcher:access_denied\", \"CC-MAIN-2020-45\"]\t873990\n[\"crawl_status\", \"fetcher:gone\", \"CC-MAIN-2020-45\"]\t3515645\n[\"crawl_status\", \"fetcher:exception\", \"CC-MAIN-2020-45\"]\t106753932\n[\"crawl_status\", \"fetcher:robots_denied\", \"CC-MAIN-2020-45\"]\t112182282\n[\"crawl_status\", \"fetcher:robots_denied_maxcrawldelay\", \"CC-MAIN-2020-45\"]\t120869\n[\"crawl_status\", \"fetcher:filtered\", \"CC-MAIN-2020-45\"]\t27778099\n[\"crawl_status\", \"fetcher:redirect_count_exceeded\", \"CC-MAIN-2020-45\"]\t1994960\n[\"crawl_status\", \"fetcher:redirect_deduplicated\", 
\"CC-MAIN-2020-45\"]\t40136769\n[\"crawl_status\", \"fetcher:hitByThrougputThreshold\", \"CC-MAIN-2020-45\"]\t32645583\n[\"crawl_status\", \"fetcher:hitByTimeLimit\", \"CC-MAIN-2020-45\"]\t4986022\n[\"crawl_status\", \"fetcher:AboveExceptionThresholdInQueue\", \"CC-MAIN-2020-45\"]\t46893754\n[\"crawl_status\", \"fetcher:bytes_downloaded\", \"CC-MAIN-2020-45\"]\t308010284999097\n[\"crawl_status\", \"crawldb:size\", \"CC-MAIN-2020-45\"]\t21531016513\n[\"crawl_status\", \"crawldb:status:db_unfetched\", \"CC-MAIN-2020-45\"]\t4013679532\n[\"crawl_status\", \"crawldb:status:db_fetched\", \"CC-MAIN-2020-45\"]\t11644427153\n[\"crawl_status\", \"crawldb:status:db_gone\", \"CC-MAIN-2020-45\"]\t1143950643\n[\"crawl_status\", \"crawldb:status:db_redir_temp\", \"CC-MAIN-2020-45\"]\t327728343\n[\"crawl_status\", \"crawldb:status:db_redir_perm\", \"CC-MAIN-2020-45\"]\t496821771\n[\"crawl_status\", \"crawldb:status:db_notmodified\", \"CC-MAIN-2020-45\"]\t1214801317\n[\"crawl_status\", \"crawldb:status:db_duplicate\", \"CC-MAIN-2020-45\"]\t1039815597\n[\"crawl_status\", \"crawldb:status:db_orphan\", \"CC-MAIN-2020-45\"]\t1649792157\n"
  },
  {
    "path": "stats/crawler/CC-MAIN-2020-50.json",
    "content": "[\"crawl_status\", \"generator:crawldb_size\", \"CC-MAIN-2020-50\"]\t22014556091\n[\"crawl_status\", \"generator:fetch_list\", \"CC-MAIN-2020-50\"]\t3179455369\n[\"crawl_status\", \"generator:selected:db_duplicate\", \"CC-MAIN-2020-50\"]\t1022491\n[\"crawl_status\", \"generator:selected:db_fetched\", \"CC-MAIN-2020-50\"]\t1403907454\n[\"crawl_status\", \"generator:selected:db_gone\", \"CC-MAIN-2020-50\"]\t70866\n[\"crawl_status\", \"generator:selected:db_notmodified\", \"CC-MAIN-2020-50\"]\t5141827\n[\"crawl_status\", \"generator:selected:db_orphan\", \"CC-MAIN-2020-50\"]\t6078\n[\"crawl_status\", \"generator:selected:db_redir_perm\", \"CC-MAIN-2020-50\"]\t15164883\n[\"crawl_status\", \"generator:selected:db_redir_temp\", \"CC-MAIN-2020-50\"]\t12674137\n[\"crawl_status\", \"generator:selected:db_unfetched\", \"CC-MAIN-2020-50\"]\t1741467633\n[\"crawl_status\", \"generator:skipped_domains_overflow\", \"CC-MAIN-2020-50\"]\t7712\n[\"crawl_status\", \"fetcher:total\", \"CC-MAIN-2020-50\"]\t3415109586\n[\"crawl_status\", \"fetcher:success\", \"CC-MAIN-2020-50\"]\t2642459905\n[\"crawl_status\", \"fetcher:notmodified\", \"CC-MAIN-2020-50\"]\t14561039\n[\"crawl_status\", \"fetcher:temp_moved\", \"CC-MAIN-2020-50\"]\t124330607\n[\"crawl_status\", \"fetcher:moved\", \"CC-MAIN-2020-50\"]\t179128143\n[\"crawl_status\", \"fetcher:notfound\", \"CC-MAIN-2020-50\"]\t81746295\n[\"crawl_status\", \"fetcher:access_denied\", \"CC-MAIN-2020-50\"]\t926089\n[\"crawl_status\", \"fetcher:gone\", \"CC-MAIN-2020-50\"]\t3422291\n[\"crawl_status\", \"fetcher:exception\", \"CC-MAIN-2020-50\"]\t122434328\n[\"crawl_status\", \"fetcher:robots_denied\", \"CC-MAIN-2020-50\"]\t109265380\n[\"crawl_status\", \"fetcher:robots_denied_maxcrawldelay\", \"CC-MAIN-2020-50\"]\t185522\n[\"crawl_status\", \"fetcher:filtered\", \"CC-MAIN-2020-50\"]\t8928876\n[\"crawl_status\", \"fetcher:redirect_count_exceeded\", \"CC-MAIN-2020-50\"]\t2062818\n[\"crawl_status\", \"fetcher:redirect_deduplicated\", 
\"CC-MAIN-2020-50\"]\t37764630\n[\"crawl_status\", \"fetcher:hitByThrougputThreshold\", \"CC-MAIN-2020-50\"]\t21076209\n[\"crawl_status\", \"fetcher:hitByTimeLimit\", \"CC-MAIN-2020-50\"]\t10866258\n[\"crawl_status\", \"fetcher:AboveExceptionThresholdInQueue\", \"CC-MAIN-2020-50\"]\t55951196\n[\"crawl_status\", \"fetcher:bytes_downloaded\", \"CC-MAIN-2020-50\"]\t296858065294325\n[\"crawl_status\", \"crawldb:size\", \"CC-MAIN-2020-50\"]\t22014556091\n[\"crawl_status\", \"crawldb:status:db_unfetched\", \"CC-MAIN-2020-50\"]\t3968496666\n[\"crawl_status\", \"crawldb:status:db_fetched\", \"CC-MAIN-2020-50\"]\t12297968183\n[\"crawl_status\", \"crawldb:status:db_gone\", \"CC-MAIN-2020-50\"]\t1111198736\n[\"crawl_status\", \"crawldb:status:db_redir_temp\", \"CC-MAIN-2020-50\"]\t393524347\n[\"crawl_status\", \"crawldb:status:db_redir_perm\", \"CC-MAIN-2020-50\"]\t585973504\n[\"crawl_status\", \"crawldb:status:db_notmodified\", \"CC-MAIN-2020-50\"]\t1175926356\n[\"crawl_status\", \"crawldb:status:db_duplicate\", \"CC-MAIN-2020-50\"]\t1045427105\n[\"crawl_status\", \"crawldb:status:db_orphan\", \"CC-MAIN-2020-50\"]\t1436041194\n"
  },
  {
    "path": "stats/crawler/CC-MAIN-2021-04.json",
    "content": "[\"crawl_status\", \"generator:crawldb_size\", \"CC-MAIN-2021-04\"]\t22704928999\n[\"crawl_status\", \"generator:fetch_list\", \"CC-MAIN-2021-04\"]\t3980206624\n[\"crawl_status\", \"generator:selected:db_duplicate\", \"CC-MAIN-2021-04\"]\t1059166\n[\"crawl_status\", \"generator:selected:db_fetched\", \"CC-MAIN-2021-04\"]\t2145623932\n[\"crawl_status\", \"generator:selected:db_gone\", \"CC-MAIN-2021-04\"]\t76460\n[\"crawl_status\", \"generator:selected:db_notmodified\", \"CC-MAIN-2021-04\"]\t5544952\n[\"crawl_status\", \"generator:selected:db_orphan\", \"CC-MAIN-2021-04\"]\t13591\n[\"crawl_status\", \"generator:selected:db_redir_perm\", \"CC-MAIN-2021-04\"]\t17792209\n[\"crawl_status\", \"generator:selected:db_redir_temp\", \"CC-MAIN-2021-04\"]\t17326509\n[\"crawl_status\", \"generator:selected:db_unfetched\", \"CC-MAIN-2021-04\"]\t1792769805\n[\"crawl_status\", \"generator:skipped_domains_overflow\", \"CC-MAIN-2021-04\"]\t9320\n[\"crawl_status\", \"fetcher:total\", \"CC-MAIN-2021-04\"]\t4304731128\n[\"crawl_status\", \"fetcher:success\", \"CC-MAIN-2021-04\"]\t3409444621\n[\"crawl_status\", \"fetcher:notmodified\", \"CC-MAIN-2021-04\"]\t23666907\n[\"crawl_status\", \"fetcher:temp_moved\", \"CC-MAIN-2021-04\"]\t133952596\n[\"crawl_status\", \"fetcher:moved\", \"CC-MAIN-2021-04\"]\t212581925\n[\"crawl_status\", \"fetcher:notfound\", \"CC-MAIN-2021-04\"]\t105535443\n[\"crawl_status\", \"fetcher:access_denied\", \"CC-MAIN-2021-04\"]\t980927\n[\"crawl_status\", \"fetcher:gone\", \"CC-MAIN-2021-04\"]\t4031652\n[\"crawl_status\", \"fetcher:exception\", \"CC-MAIN-2021-04\"]\t148320153\n[\"crawl_status\", \"fetcher:robots_denied\", \"CC-MAIN-2021-04\"]\t109606192\n[\"crawl_status\", \"fetcher:robots_denied_maxcrawldelay\", \"CC-MAIN-2021-04\"]\t143857\n[\"crawl_status\", \"fetcher:filtered\", \"CC-MAIN-2021-04\"]\t4129763\n[\"crawl_status\", \"fetcher:redirect_count_exceeded\", \"CC-MAIN-2021-04\"]\t2606640\n[\"crawl_status\", 
\"fetcher:redirect_deduplicated\", \"CC-MAIN-2021-04\"]\t45292256\n[\"crawl_status\", \"fetcher:hitByThrougputThreshold\", \"CC-MAIN-2021-04\"]\t11426935\n[\"crawl_status\", \"fetcher:hitByTimeLimit\", \"CC-MAIN-2021-04\"]\t42826071\n[\"crawl_status\", \"fetcher:AboveExceptionThresholdInQueue\", \"CC-MAIN-2021-04\"]\t50185190\n[\"crawl_status\", \"fetcher:bytes_downloaded\", \"CC-MAIN-2021-04\"]\t387617418169542\n[\"crawl_status\", \"crawldb:size\", \"CC-MAIN-2021-04\"]\t22704928999\n[\"crawl_status\", \"crawldb:status:db_unfetched\", \"CC-MAIN-2021-04\"]\t4286112571\n[\"crawl_status\", \"crawldb:status:db_fetched\", \"CC-MAIN-2021-04\"]\t12206803964\n[\"crawl_status\", \"crawldb:status:db_gone\", \"CC-MAIN-2021-04\"]\t1113131343\n[\"crawl_status\", \"crawldb:status:db_redir_temp\", \"CC-MAIN-2021-04\"]\t401279933\n[\"crawl_status\", \"crawldb:status:db_redir_perm\", \"CC-MAIN-2021-04\"]\t595411182\n[\"crawl_status\", \"crawldb:status:db_notmodified\", \"CC-MAIN-2021-04\"]\t1098610883\n[\"crawl_status\", \"crawldb:status:db_duplicate\", \"CC-MAIN-2021-04\"]\t1042496692\n[\"crawl_status\", \"crawldb:status:db_orphan\", \"CC-MAIN-2021-04\"]\t1961082431\n"
  },
  {
    "path": "stats/crawler/CC-MAIN-2021-10.json",
    "content": "[\"crawl_status\", \"generator:crawldb_size\", \"CC-MAIN-2021-10\"]\t22937361361\n[\"crawl_status\", \"generator:fetch_list\", \"CC-MAIN-2021-10\"]\t3209033070\n[\"crawl_status\", \"generator:selected:db_duplicate\", \"CC-MAIN-2021-10\"]\t1008309\n[\"crawl_status\", \"generator:selected:db_fetched\", \"CC-MAIN-2021-10\"]\t1409923637\n[\"crawl_status\", \"generator:selected:db_gone\", \"CC-MAIN-2021-10\"]\t68073\n[\"crawl_status\", \"generator:selected:db_notmodified\", \"CC-MAIN-2021-10\"]\t7522380\n[\"crawl_status\", \"generator:selected:db_orphan\", \"CC-MAIN-2021-10\"]\t13009\n[\"crawl_status\", \"generator:selected:db_redir_perm\", \"CC-MAIN-2021-10\"]\t10309568\n[\"crawl_status\", \"generator:selected:db_redir_temp\", \"CC-MAIN-2021-10\"]\t15619815\n[\"crawl_status\", \"generator:selected:db_unfetched\", \"CC-MAIN-2021-10\"]\t1764568279\n[\"crawl_status\", \"generator:skipped_domains_overflow\", \"CC-MAIN-2021-10\"]\t5156\n[\"crawl_status\", \"fetcher:total\", \"CC-MAIN-2021-10\"]\t3425118952\n[\"crawl_status\", \"fetcher:success\", \"CC-MAIN-2021-10\"]\t2734510630\n[\"crawl_status\", \"fetcher:notmodified\", \"CC-MAIN-2021-10\"]\t12320903\n[\"crawl_status\", \"fetcher:temp_moved\", \"CC-MAIN-2021-10\"]\t122603830\n[\"crawl_status\", \"fetcher:moved\", \"CC-MAIN-2021-10\"]\t166129219\n[\"crawl_status\", \"fetcher:notfound\", \"CC-MAIN-2021-10\"]\t76212254\n[\"crawl_status\", \"fetcher:access_denied\", \"CC-MAIN-2021-10\"]\t778303\n[\"crawl_status\", \"fetcher:gone\", \"CC-MAIN-2021-10\"]\t3135279\n[\"crawl_status\", \"fetcher:exception\", \"CC-MAIN-2021-10\"]\t102400191\n[\"crawl_status\", \"fetcher:robots_denied\", \"CC-MAIN-2021-10\"]\t100100750\n[\"crawl_status\", \"fetcher:robots_denied_maxcrawldelay\", \"CC-MAIN-2021-10\"]\t107464\n[\"crawl_status\", \"fetcher:filtered\", \"CC-MAIN-2021-10\"]\t2875435\n[\"crawl_status\", \"fetcher:redirect_count_exceeded\", \"CC-MAIN-2021-10\"]\t1905649\n[\"crawl_status\", 
\"fetcher:redirect_deduplicated\", \"CC-MAIN-2021-10\"]\t35671817\n[\"crawl_status\", \"fetcher:hitByThrougputThreshold\", \"CC-MAIN-2021-10\"]\t13110664\n[\"crawl_status\", \"fetcher:hitByTimeLimit\", \"CC-MAIN-2021-10\"]\t13527407\n[\"crawl_status\", \"fetcher:AboveExceptionThresholdInQueue\", \"CC-MAIN-2021-10\"]\t39729157\n[\"crawl_status\", \"fetcher:bytes_downloaded\", \"CC-MAIN-2021-10\"]\t312710741699590\n[\"crawl_status\", \"crawldb:size\", \"CC-MAIN-2021-10\"]\t22937361361\n[\"crawl_status\", \"crawldb:status:db_unfetched\", \"CC-MAIN-2021-10\"]\t3774278312\n[\"crawl_status\", \"crawldb:status:db_fetched\", \"CC-MAIN-2021-10\"]\t12676125866\n[\"crawl_status\", \"crawldb:status:db_gone\", \"CC-MAIN-2021-10\"]\t1143565384\n[\"crawl_status\", \"crawldb:status:db_redir_temp\", \"CC-MAIN-2021-10\"]\t407980478\n[\"crawl_status\", \"crawldb:status:db_redir_perm\", \"CC-MAIN-2021-10\"]\t620102017\n[\"crawl_status\", \"crawldb:status:db_notmodified\", \"CC-MAIN-2021-10\"]\t1106333792\n[\"crawl_status\", \"crawldb:status:db_duplicate\", \"CC-MAIN-2021-10\"]\t1056177611\n[\"crawl_status\", \"crawldb:status:db_orphan\", \"CC-MAIN-2021-10\"]\t2152797901\n"
  },
  {
    "path": "stats/crawler/CC-MAIN-2021-17.json",
    "content": "[\"crawl_status\", \"generator:crawldb_size\", \"CC-MAIN-2021-17\"]\t21968054310\n[\"crawl_status\", \"generator:fetch_list\", \"CC-MAIN-2021-17\"]\t3709617713\n[\"crawl_status\", \"generator:selected:db_duplicate\", \"CC-MAIN-2021-17\"]\t976344\n[\"crawl_status\", \"generator:selected:db_fetched\", \"CC-MAIN-2021-17\"]\t1795745671\n[\"crawl_status\", \"generator:selected:db_gone\", \"CC-MAIN-2021-17\"]\t69779\n[\"crawl_status\", \"generator:selected:db_notmodified\", \"CC-MAIN-2021-17\"]\t15740866\n[\"crawl_status\", \"generator:selected:db_orphan\", \"CC-MAIN-2021-17\"]\t23092\n[\"crawl_status\", \"generator:selected:db_redir_perm\", \"CC-MAIN-2021-17\"]\t12013497\n[\"crawl_status\", \"generator:selected:db_redir_temp\", \"CC-MAIN-2021-17\"]\t21204523\n[\"crawl_status\", \"generator:selected:db_unfetched\", \"CC-MAIN-2021-17\"]\t1863843941\n[\"crawl_status\", \"generator:skipped_domains_overflow\", \"CC-MAIN-2021-17\"]\t5554\n[\"crawl_status\", \"fetcher:total\", \"CC-MAIN-2021-17\"]\t3920902135\n[\"crawl_status\", \"fetcher:success\", \"CC-MAIN-2021-17\"]\t3127001582\n[\"crawl_status\", \"fetcher:notmodified\", \"CC-MAIN-2021-17\"]\t14621976\n[\"crawl_status\", \"fetcher:temp_moved\", \"CC-MAIN-2021-17\"]\t132987823\n[\"crawl_status\", \"fetcher:moved\", \"CC-MAIN-2021-17\"]\t153518702\n[\"crawl_status\", \"fetcher:notfound\", \"CC-MAIN-2021-17\"]\t94327292\n[\"crawl_status\", \"fetcher:access_denied\", \"CC-MAIN-2021-17\"]\t877526\n[\"crawl_status\", \"fetcher:gone\", \"CC-MAIN-2021-17\"]\t3423393\n[\"crawl_status\", \"fetcher:exception\", \"CC-MAIN-2021-17\"]\t88346680\n[\"crawl_status\", \"fetcher:robots_denied\", \"CC-MAIN-2021-17\"]\t117396947\n[\"crawl_status\", \"fetcher:robots_denied_maxcrawldelay\", \"CC-MAIN-2021-17\"]\t78604\n[\"crawl_status\", \"fetcher:filtered\", \"CC-MAIN-2021-17\"]\t2821863\n[\"crawl_status\", \"fetcher:redirect_count_exceeded\", \"CC-MAIN-2021-17\"]\t1332452\n[\"crawl_status\", \"fetcher:redirect_deduplicated\", 
\"CC-MAIN-2021-17\"]\t40410343\n[\"crawl_status\", \"fetcher:hitByThrougputThreshold\", \"CC-MAIN-2021-17\"]\t15847466\n[\"crawl_status\", \"fetcher:hitByTimeLimit\", \"CC-MAIN-2021-17\"]\t10391333\n[\"crawl_status\", \"fetcher:AboveExceptionThresholdInQueue\", \"CC-MAIN-2021-17\"]\t117518153\n[\"crawl_status\", \"fetcher:bytes_downloaded\", \"CC-MAIN-2021-17\"]\t352138053661199\n[\"crawl_status\", \"crawldb:size\", \"CC-MAIN-2021-17\"]\t23144531730\n[\"crawl_status\", \"crawldb:status:db_unfetched\", \"CC-MAIN-2021-17\"]\t3907505417\n[\"crawl_status\", \"crawldb:status:db_fetched\", \"CC-MAIN-2021-17\"]\t13134056830\n[\"crawl_status\", \"crawldb:status:db_gone\", \"CC-MAIN-2021-17\"]\t1164575344\n[\"crawl_status\", \"crawldb:status:db_redir_temp\", \"CC-MAIN-2021-17\"]\t379122900\n[\"crawl_status\", \"crawldb:status:db_redir_perm\", \"CC-MAIN-2021-17\"]\t582479322\n[\"crawl_status\", \"crawldb:status:db_notmodified\", \"CC-MAIN-2021-17\"]\t1086399934\n[\"crawl_status\", \"crawldb:status:db_duplicate\", \"CC-MAIN-2021-17\"]\t1071678206\n[\"crawl_status\", \"crawldb:status:db_orphan\", \"CC-MAIN-2021-17\"]\t1818713777\n"
  },
  {
    "path": "stats/crawler/CC-MAIN-2021-21.json",
    "content": "[\"crawl_status\", \"generator:crawldb_size\", \"CC-MAIN-2021-21\"]\t23713955373\n[\"crawl_status\", \"generator:fetch_list\", \"CC-MAIN-2021-21\"]\t3464062412\n[\"crawl_status\", \"generator:selected:db_duplicate\", \"CC-MAIN-2021-21\"]\t3353616\n[\"crawl_status\", \"generator:selected:db_fetched\", \"CC-MAIN-2021-21\"]\t1346822315\n[\"crawl_status\", \"generator:selected:db_gone\", \"CC-MAIN-2021-21\"]\t53017\n[\"crawl_status\", \"generator:selected:db_notmodified\", \"CC-MAIN-2021-21\"]\t151250902\n[\"crawl_status\", \"generator:selected:db_orphan\", \"CC-MAIN-2021-21\"]\t2646\n[\"crawl_status\", \"generator:selected:db_redir_perm\", \"CC-MAIN-2021-21\"]\t11689253\n[\"crawl_status\", \"generator:selected:db_redir_temp\", \"CC-MAIN-2021-21\"]\t18219275\n[\"crawl_status\", \"generator:selected:db_unfetched\", \"CC-MAIN-2021-21\"]\t1932671388\n[\"crawl_status\", \"generator:skipped_domains_overflow\", \"CC-MAIN-2021-21\"]\t6074\n[\"crawl_status\", \"fetcher:total\", \"CC-MAIN-2021-21\"]\t3667368943\n[\"crawl_status\", \"fetcher:success\", \"CC-MAIN-2021-21\"]\t2631391117\n[\"crawl_status\", \"fetcher:notmodified\", \"CC-MAIN-2021-21\"]\t12291299\n[\"crawl_status\", \"fetcher:temp_moved\", \"CC-MAIN-2021-21\"]\t137287136\n[\"crawl_status\", \"fetcher:moved\", \"CC-MAIN-2021-21\"]\t176674355\n[\"crawl_status\", \"fetcher:notfound\", \"CC-MAIN-2021-21\"]\t133469271\n[\"crawl_status\", \"fetcher:access_denied\", \"CC-MAIN-2021-21\"]\t1375419\n[\"crawl_status\", \"fetcher:gone\", \"CC-MAIN-2021-21\"]\t4141543\n[\"crawl_status\", \"fetcher:exception\", \"CC-MAIN-2021-21\"]\t152372383\n[\"crawl_status\", \"fetcher:robots_denied\", \"CC-MAIN-2021-21\"]\t113067314\n[\"crawl_status\", \"fetcher:robots_denied_maxcrawldelay\", \"CC-MAIN-2021-21\"]\t79995\n[\"crawl_status\", \"fetcher:filtered\", \"CC-MAIN-2021-21\"]\t6101279\n[\"crawl_status\", \"fetcher:redirect_count_exceeded\", \"CC-MAIN-2021-21\"]\t1327786\n[\"crawl_status\", 
\"fetcher:redirect_deduplicated\", \"CC-MAIN-2021-21\"]\t41047506\n[\"crawl_status\", \"fetcher:hitByThrougputThreshold\", \"CC-MAIN-2021-21\"]\t14660411\n[\"crawl_status\", \"fetcher:hitByTimeLimit\", \"CC-MAIN-2021-21\"]\t11075164\n[\"crawl_status\", \"fetcher:AboveExceptionThresholdInQueue\", \"CC-MAIN-2021-21\"]\t231006965\n[\"crawl_status\", \"fetcher:bytes_downloaded\", \"CC-MAIN-2021-21\"]\t311264250882666\n[\"crawl_status\", \"crawldb:size\", \"CC-MAIN-2021-21\"]\t23713955373\n[\"crawl_status\", \"crawldb:status:db_unfetched\", \"CC-MAIN-2021-21\"]\t4615640332\n[\"crawl_status\", \"crawldb:status:db_fetched\", \"CC-MAIN-2021-21\"]\t13455648147\n[\"crawl_status\", \"crawldb:status:db_gone\", \"CC-MAIN-2021-21\"]\t1219602381\n[\"crawl_status\", \"crawldb:status:db_redir_temp\", \"CC-MAIN-2021-21\"]\t431976698\n[\"crawl_status\", \"crawldb:status:db_redir_perm\", \"CC-MAIN-2021-21\"]\t611179955\n[\"crawl_status\", \"crawldb:status:db_notmodified\", \"CC-MAIN-2021-21\"]\t1075723453\n[\"crawl_status\", \"crawldb:status:db_duplicate\", \"CC-MAIN-2021-21\"]\t1147514566\n[\"crawl_status\", \"crawldb:status:db_orphan\", \"CC-MAIN-2021-21\"]\t1156669841\n"
  },
  {
    "path": "stats/crawler/CC-MAIN-2021-25.json",
    "content": "[\"crawl_status\", \"generator:crawldb_size\", \"CC-MAIN-2021-25\"]\t3080558881\n[\"crawl_status\", \"generator:fetch_list\", \"CC-MAIN-2021-25\"]\t3080558881\n[\"crawl_status\", \"fetcher:total\", \"CC-MAIN-2021-25\"]\t3285121939\n[\"crawl_status\", \"fetcher:success\", \"CC-MAIN-2021-25\"]\t2455171959\n[\"crawl_status\", \"fetcher:notmodified\", \"CC-MAIN-2021-25\"]\t11183164\n[\"crawl_status\", \"fetcher:temp_moved\", \"CC-MAIN-2021-25\"]\t105205569\n[\"crawl_status\", \"fetcher:moved\", \"CC-MAIN-2021-25\"]\t155786618\n[\"crawl_status\", \"fetcher:notfound\", \"CC-MAIN-2021-25\"]\t105405147\n[\"crawl_status\", \"fetcher:access_denied\", \"CC-MAIN-2021-25\"]\t995371\n[\"crawl_status\", \"fetcher:gone\", \"CC-MAIN-2021-25\"]\t3673969\n[\"crawl_status\", \"fetcher:exception\", \"CC-MAIN-2021-25\"]\t125777337\n[\"crawl_status\", \"fetcher:robots_denied\", \"CC-MAIN-2021-25\"]\t95756141\n[\"crawl_status\", \"fetcher:robots_denied_maxcrawldelay\", \"CC-MAIN-2021-25\"]\t25258\n[\"crawl_status\", \"fetcher:filtered\", \"CC-MAIN-2021-25\"]\t7258722\n[\"crawl_status\", \"fetcher:redirect_count_exceeded\", \"CC-MAIN-2021-25\"]\t1222341\n[\"crawl_status\", \"fetcher:redirect_deduplicated\", \"CC-MAIN-2021-25\"]\t37763920\n[\"crawl_status\", \"fetcher:hitByThrougputThreshold\", \"CC-MAIN-2021-25\"]\t14712488\n[\"crawl_status\", \"fetcher:hitByTimeLimit\", \"CC-MAIN-2021-25\"]\t9709994\n[\"crawl_status\", \"fetcher:AboveExceptionThresholdInQueue\", \"CC-MAIN-2021-25\"]\t155473941\n[\"crawl_status\", \"fetcher:bytes_downloaded\", \"CC-MAIN-2021-25\"]\t290946448700164\n[\"crawl_status\", \"crawldb:size\", \"CC-MAIN-2021-25\"]\t24800457807\n[\"crawl_status\", \"crawldb:status:db_unfetched\", \"CC-MAIN-2021-25\"]\t4686648268\n[\"crawl_status\", \"crawldb:status:db_fetched\", \"CC-MAIN-2021-25\"]\t14551473174\n[\"crawl_status\", \"crawldb:status:db_gone\", \"CC-MAIN-2021-25\"]\t1440720582\n[\"crawl_status\", \"crawldb:status:db_redir_temp\", 
\"CC-MAIN-2021-25\"]\t441151277\n[\"crawl_status\", \"crawldb:status:db_redir_perm\", \"CC-MAIN-2021-25\"]\t603351871\n[\"crawl_status\", \"crawldb:status:db_notmodified\", \"CC-MAIN-2021-25\"]\t1011741947\n[\"crawl_status\", \"crawldb:status:db_duplicate\", \"CC-MAIN-2021-25\"]\t1323907039\n[\"crawl_status\", \"crawldb:status:db_orphan\", \"CC-MAIN-2021-25\"]\t741463649\n"
  },
  {
    "path": "stats/crawler/CC-MAIN-2021-31.json",
    "content": "[\"crawl_status\", \"generator:crawldb_size\", \"CC-MAIN-2021-31\"]\t26047830277\n[\"crawl_status\", \"generator:fetch_list\", \"CC-MAIN-2021-31\"]\t3840646040\n[\"crawl_status\", \"generator:selected:db_duplicate\", \"CC-MAIN-2021-31\"]\t1989358\n[\"crawl_status\", \"generator:selected:db_fetched\", \"CC-MAIN-2021-31\"]\t2210722599\n[\"crawl_status\", \"generator:selected:db_gone\", \"CC-MAIN-2021-31\"]\t82308\n[\"crawl_status\", \"generator:selected:db_notmodified\", \"CC-MAIN-2021-31\"]\t24092338\n[\"crawl_status\", \"generator:selected:db_orphan\", \"CC-MAIN-2021-31\"]\t20825\n[\"crawl_status\", \"generator:selected:db_redir_perm\", \"CC-MAIN-2021-31\"]\t18607811\n[\"crawl_status\", \"generator:selected:db_redir_temp\", \"CC-MAIN-2021-31\"]\t13532841\n[\"crawl_status\", \"generator:selected:db_unfetched\", \"CC-MAIN-2021-31\"]\t1571597960\n[\"crawl_status\", \"generator:skipped_domains_overflow\", \"CC-MAIN-2021-31\"]\t9014\n[\"crawl_status\", \"fetcher:total\", \"CC-MAIN-2021-31\"]\t4042568803\n[\"crawl_status\", \"fetcher:success\", \"CC-MAIN-2021-31\"]\t3163682448\n[\"crawl_status\", \"fetcher:notmodified\", \"CC-MAIN-2021-31\"]\t19975742\n[\"crawl_status\", \"fetcher:temp_moved\", \"CC-MAIN-2021-31\"]\t105105103\n[\"crawl_status\", \"fetcher:moved\", \"CC-MAIN-2021-31\"]\t158530723\n[\"crawl_status\", \"fetcher:notfound\", \"CC-MAIN-2021-31\"]\t112886143\n[\"crawl_status\", \"fetcher:access_denied\", \"CC-MAIN-2021-31\"]\t885491\n[\"crawl_status\", \"fetcher:gone\", \"CC-MAIN-2021-31\"]\t3893078\n[\"crawl_status\", \"fetcher:exception\", \"CC-MAIN-2021-31\"]\t136343523\n[\"crawl_status\", \"fetcher:robots_denied\", \"CC-MAIN-2021-31\"]\t96819617\n[\"crawl_status\", \"fetcher:robots_denied_maxcrawldelay\", \"CC-MAIN-2021-31\"]\t28384\n[\"crawl_status\", \"fetcher:filtered\", \"CC-MAIN-2021-31\"]\t10036129\n[\"crawl_status\", \"fetcher:redirect_count_exceeded\", \"CC-MAIN-2021-31\"]\t1176969\n[\"crawl_status\", 
\"fetcher:redirect_deduplicated\", \"CC-MAIN-2021-31\"]\t37862997\n[\"crawl_status\", \"fetcher:hitByThrougputThreshold\", \"CC-MAIN-2021-31\"]\t1994850\n[\"crawl_status\", \"fetcher:hitByTimeLimit\", \"CC-MAIN-2021-31\"]\t38900573\n[\"crawl_status\", \"fetcher:AboveExceptionThresholdInQueue\", \"CC-MAIN-2021-31\"]\t154447033\n[\"crawl_status\", \"fetcher:bytes_downloaded\", \"CC-MAIN-2021-31\"]\t397552775848124\n[\"crawl_status\", \"crawldb:size\", \"CC-MAIN-2021-31\"]\t26047830277\n[\"crawl_status\", \"crawldb:status:db_unfetched\", \"CC-MAIN-2021-31\"]\t4576610281\n[\"crawl_status\", \"crawldb:status:db_fetched\", \"CC-MAIN-2021-31\"]\t14820522928\n[\"crawl_status\", \"crawldb:status:db_gone\", \"CC-MAIN-2021-31\"]\t1316943908\n[\"crawl_status\", \"crawldb:status:db_redir_temp\", \"CC-MAIN-2021-31\"]\t373301656\n[\"crawl_status\", \"crawldb:status:db_redir_perm\", \"CC-MAIN-2021-31\"]\t518558657\n[\"crawl_status\", \"crawldb:status:db_notmodified\", \"CC-MAIN-2021-31\"]\t965929408\n[\"crawl_status\", \"crawldb:status:db_duplicate\", \"CC-MAIN-2021-31\"]\t1214292931\n[\"crawl_status\", \"crawldb:status:db_orphan\", \"CC-MAIN-2021-31\"]\t2261670508\n"
  },
  {
    "path": "stats/crawler/CC-MAIN-2021-39.json",
    "content": "[\"crawl_status\", \"generator:crawldb_size\", \"CC-MAIN-2021-39\"]\t26294713963\n[\"crawl_status\", \"generator:fetch_list\", \"CC-MAIN-2021-39\"]\t3590999547\n[\"crawl_status\", \"generator:selected:db_duplicate\", \"CC-MAIN-2021-39\"]\t2040894\n[\"crawl_status\", \"generator:selected:db_fetched\", \"CC-MAIN-2021-39\"]\t1563906707\n[\"crawl_status\", \"generator:selected:db_gone\", \"CC-MAIN-2021-39\"]\t81712\n[\"crawl_status\", \"generator:selected:db_notmodified\", \"CC-MAIN-2021-39\"]\t35259229\n[\"crawl_status\", \"generator:selected:db_orphan\", \"CC-MAIN-2021-39\"]\t15222\n[\"crawl_status\", \"generator:selected:db_redir_perm\", \"CC-MAIN-2021-39\"]\t14488274\n[\"crawl_status\", \"generator:selected:db_redir_temp\", \"CC-MAIN-2021-39\"]\t15976320\n[\"crawl_status\", \"generator:selected:db_unfetched\", \"CC-MAIN-2021-39\"]\t1959231189\n[\"crawl_status\", \"generator:skipped_domains_overflow\", \"CC-MAIN-2021-39\"]\t8137\n[\"crawl_status\", \"fetcher:total\", \"CC-MAIN-2021-39\"]\t3883613334\n[\"crawl_status\", \"fetcher:success\", \"CC-MAIN-2021-39\"]\t2966078302\n[\"crawl_status\", \"fetcher:notmodified\", \"CC-MAIN-2021-39\"]\t16785975\n[\"crawl_status\", \"fetcher:temp_moved\", \"CC-MAIN-2021-39\"]\t145459252\n[\"crawl_status\", \"fetcher:moved\", \"CC-MAIN-2021-39\"]\t186926808\n[\"crawl_status\", \"fetcher:notfound\", \"CC-MAIN-2021-39\"]\t109920161\n[\"crawl_status\", \"fetcher:access_denied\", \"CC-MAIN-2021-39\"]\t1042137\n[\"crawl_status\", \"fetcher:gone\", \"CC-MAIN-2021-39\"]\t4965056\n[\"crawl_status\", \"fetcher:exception\", \"CC-MAIN-2021-39\"]\t117553743\n[\"crawl_status\", \"fetcher:robots_denied\", \"CC-MAIN-2021-39\"]\t131475018\n[\"crawl_status\", \"fetcher:robots_denied_maxcrawldelay\", \"CC-MAIN-2021-39\"]\t113050\n[\"crawl_status\", \"fetcher:filtered\", \"CC-MAIN-2021-39\"]\t14400833\n[\"crawl_status\", \"fetcher:redirect_count_exceeded\", \"CC-MAIN-2021-39\"]\t2101068\n[\"crawl_status\", 
\"fetcher:redirect_deduplicated\", \"CC-MAIN-2021-39\"]\t43967454\n[\"crawl_status\", \"fetcher:hitByThrougputThreshold\", \"CC-MAIN-2021-39\"]\t17599652\n[\"crawl_status\", \"fetcher:hitByTimeLimit\", \"CC-MAIN-2021-39\"]\t6192180\n[\"crawl_status\", \"fetcher:AboveExceptionThresholdInQueue\", \"CC-MAIN-2021-39\"]\t119032645\n[\"crawl_status\", \"fetcher:bytes_downloaded\", \"CC-MAIN-2021-39\"]\t345966372054467\n[\"crawl_status\", \"crawldb:size\", \"CC-MAIN-2021-39\"]\t26294713963\n[\"crawl_status\", \"crawldb:status:db_unfetched\", \"CC-MAIN-2021-39\"]\t4287031164\n[\"crawl_status\", \"crawldb:status:db_fetched\", \"CC-MAIN-2021-39\"]\t14156853204\n[\"crawl_status\", \"crawldb:status:db_gone\", \"CC-MAIN-2021-39\"]\t1335336524\n[\"crawl_status\", \"crawldb:status:db_redir_temp\", \"CC-MAIN-2021-39\"]\t358225761\n[\"crawl_status\", \"crawldb:status:db_redir_perm\", \"CC-MAIN-2021-39\"]\t487966283\n[\"crawl_status\", \"crawldb:status:db_notmodified\", \"CC-MAIN-2021-39\"]\t952000426\n[\"crawl_status\", \"crawldb:status:db_duplicate\", \"CC-MAIN-2021-39\"]\t1191749370\n[\"crawl_status\", \"crawldb:status:db_orphan\", \"CC-MAIN-2021-39\"]\t3525551231\n"
  },
  {
    "path": "stats/crawler/CC-MAIN-2021-43.json",
    "content": "[\"crawl_status\", \"generator:crawldb_size\", \"CC-MAIN-2021-43\"]\t25464021170\n[\"crawl_status\", \"generator:fetch_list\", \"CC-MAIN-2021-43\"]\t3937733264\n[\"crawl_status\", \"generator:selected:db_duplicate\", \"CC-MAIN-2021-43\"]\t1983861\n[\"crawl_status\", \"generator:selected:db_fetched\", \"CC-MAIN-2021-43\"]\t1854461177\n[\"crawl_status\", \"generator:selected:db_gone\", \"CC-MAIN-2021-43\"]\t63338\n[\"crawl_status\", \"generator:selected:db_notmodified\", \"CC-MAIN-2021-43\"]\t25799254\n[\"crawl_status\", \"generator:selected:db_orphan\", \"CC-MAIN-2021-43\"]\t3162\n[\"crawl_status\", \"generator:selected:db_redir_perm\", \"CC-MAIN-2021-43\"]\t10211369\n[\"crawl_status\", \"generator:selected:db_redir_temp\", \"CC-MAIN-2021-43\"]\t22818130\n[\"crawl_status\", \"generator:selected:db_unfetched\", \"CC-MAIN-2021-43\"]\t2022392973\n[\"crawl_status\", \"generator:skipped_domains_overflow\", \"CC-MAIN-2021-43\"]\t12446\n[\"crawl_status\", \"fetcher:total\", \"CC-MAIN-2021-43\"]\t4186134473\n[\"crawl_status\", \"fetcher:success\", \"CC-MAIN-2021-43\"]\t3324131032\n[\"crawl_status\", \"fetcher:notmodified\", \"CC-MAIN-2021-43\"]\t14630482\n[\"crawl_status\", \"fetcher:temp_moved\", \"CC-MAIN-2021-43\"]\t145556185\n[\"crawl_status\", \"fetcher:moved\", \"CC-MAIN-2021-43\"]\t178731966\n[\"crawl_status\", \"fetcher:notfound\", \"CC-MAIN-2021-43\"]\t100938453\n[\"crawl_status\", \"fetcher:access_denied\", \"CC-MAIN-2021-43\"]\t950898\n[\"crawl_status\", \"fetcher:gone\", \"CC-MAIN-2021-43\"]\t4096594\n[\"crawl_status\", \"fetcher:exception\", \"CC-MAIN-2021-43\"]\t98462156\n[\"crawl_status\", \"fetcher:robots_denied\", \"CC-MAIN-2021-43\"]\t130594727\n[\"crawl_status\", \"fetcher:robots_denied_maxcrawldelay\", \"CC-MAIN-2021-43\"]\t104943\n[\"crawl_status\", \"fetcher:filtered\", \"CC-MAIN-2021-43\"]\t11977365\n[\"crawl_status\", \"fetcher:redirect_count_exceeded\", \"CC-MAIN-2021-43\"]\t1989656\n[\"crawl_status\", 
\"fetcher:redirect_deduplicated\", \"CC-MAIN-2021-43\"]\t41461498\n[\"crawl_status\", \"fetcher:hitByThrougputThreshold\", \"CC-MAIN-2021-43\"]\t9550211\n[\"crawl_status\", \"fetcher:hitByTimeLimit\", \"CC-MAIN-2021-43\"]\t20279220\n[\"crawl_status\", \"fetcher:AboveExceptionThresholdInQueue\", \"CC-MAIN-2021-43\"]\t102679087\n[\"crawl_status\", \"fetcher:bytes_downloaded\", \"CC-MAIN-2021-43\"]\t401669845241384\n[\"crawl_status\", \"crawldb:size\", \"CC-MAIN-2021-43\"]\t25464021170\n[\"crawl_status\", \"crawldb:status:db_unfetched\", \"CC-MAIN-2021-43\"]\t4538253558\n[\"crawl_status\", \"crawldb:status:db_fetched\", \"CC-MAIN-2021-43\"]\t14498712038\n[\"crawl_status\", \"crawldb:status:db_gone\", \"CC-MAIN-2021-43\"]\t1364684317\n[\"crawl_status\", \"crawldb:status:db_redir_temp\", \"CC-MAIN-2021-43\"]\t425461053\n[\"crawl_status\", \"crawldb:status:db_redir_perm\", \"CC-MAIN-2021-43\"]\t573281092\n[\"crawl_status\", \"crawldb:status:db_notmodified\", \"CC-MAIN-2021-43\"]\t949691889\n[\"crawl_status\", \"crawldb:status:db_duplicate\", \"CC-MAIN-2021-43\"]\t1188033683\n[\"crawl_status\", \"crawldb:status:db_orphan\", \"CC-MAIN-2021-43\"]\t1925903540\n"
  },
  {
    "path": "stats/crawler/CC-MAIN-2021-49.json",
    "content": "[\"crawl_status\", \"generator:crawldb_size\", \"CC-MAIN-2021-49\"]\t26305572235\n[\"crawl_status\", \"generator:fetch_list\", \"CC-MAIN-2021-49\"]\t3148703091\n[\"crawl_status\", \"generator:selected:db_duplicate\", \"CC-MAIN-2021-49\"]\t4829937\n[\"crawl_status\", \"generator:selected:db_fetched\", \"CC-MAIN-2021-49\"]\t945024916\n[\"crawl_status\", \"generator:selected:db_gone\", \"CC-MAIN-2021-49\"]\t85286\n[\"crawl_status\", \"generator:selected:db_notmodified\", \"CC-MAIN-2021-49\"]\t32528064\n[\"crawl_status\", \"generator:selected:db_orphan\", \"CC-MAIN-2021-49\"]\t11706\n[\"crawl_status\", \"generator:selected:db_redir_perm\", \"CC-MAIN-2021-49\"]\t14476721\n[\"crawl_status\", \"generator:selected:db_redir_temp\", \"CC-MAIN-2021-49\"]\t18545016\n[\"crawl_status\", \"generator:selected:db_unfetched\", \"CC-MAIN-2021-49\"]\t2133201445\n[\"crawl_status\", \"generator:skipped_domains_overflow\", \"CC-MAIN-2021-49\"]\t9465\n[\"crawl_status\", \"fetcher:total\", \"CC-MAIN-2021-49\"]\t3453904596\n[\"crawl_status\", \"fetcher:success\", \"CC-MAIN-2021-49\"]\t2531182805\n[\"crawl_status\", \"fetcher:notmodified\", \"CC-MAIN-2021-49\"]\t9243543\n[\"crawl_status\", \"fetcher:temp_moved\", \"CC-MAIN-2021-49\"]\t158675939\n[\"crawl_status\", \"fetcher:moved\", \"CC-MAIN-2021-49\"]\t195910097\n[\"crawl_status\", \"fetcher:notfound\", \"CC-MAIN-2021-49\"]\t112657682\n[\"crawl_status\", \"fetcher:access_denied\", \"CC-MAIN-2021-49\"]\t1102096\n[\"crawl_status\", \"fetcher:gone\", \"CC-MAIN-2021-49\"]\t4813770\n[\"crawl_status\", \"fetcher:exception\", \"CC-MAIN-2021-49\"]\t111119341\n[\"crawl_status\", \"fetcher:robots_denied\", \"CC-MAIN-2021-49\"]\t138736362\n[\"crawl_status\", \"fetcher:robots_denied_maxcrawldelay\", \"CC-MAIN-2021-49\"]\t81298\n[\"crawl_status\", \"fetcher:filtered\", \"CC-MAIN-2021-49\"]\t6269460\n[\"crawl_status\", \"fetcher:redirect_count_exceeded\", \"CC-MAIN-2021-49\"]\t2207606\n[\"crawl_status\", 
\"fetcher:redirect_deduplicated\", \"CC-MAIN-2021-49\"]\t44297127\n[\"crawl_status\", \"fetcher:hitByThrougputThreshold\", \"CC-MAIN-2021-49\"]\t16083689\n[\"crawl_status\", \"fetcher:hitByTimeLimit\", \"CC-MAIN-2021-49\"]\t6477072\n[\"crawl_status\", \"fetcher:AboveExceptionThresholdInQueue\", \"CC-MAIN-2021-49\"]\t115046709\n[\"crawl_status\", \"fetcher:bytes_downloaded\", \"CC-MAIN-2021-49\"]\t313104969748282\n[\"crawl_status\", \"crawldb:size\", \"CC-MAIN-2021-49\"]\t26305572235\n[\"crawl_status\", \"crawldb:status:db_unfetched\", \"CC-MAIN-2021-49\"]\t4743912642\n[\"crawl_status\", \"crawldb:status:db_fetched\", \"CC-MAIN-2021-49\"]\t14778217357\n[\"crawl_status\", \"crawldb:status:db_gone\", \"CC-MAIN-2021-49\"]\t1414015596\n[\"crawl_status\", \"crawldb:status:db_redir_temp\", \"CC-MAIN-2021-49\"]\t432723796\n[\"crawl_status\", \"crawldb:status:db_redir_perm\", \"CC-MAIN-2021-49\"]\t576227529\n[\"crawl_status\", \"crawldb:status:db_notmodified\", \"CC-MAIN-2021-49\"]\t958438742\n[\"crawl_status\", \"crawldb:status:db_duplicate\", \"CC-MAIN-2021-49\"]\t1195987543\n[\"crawl_status\", \"crawldb:status:db_orphan\", \"CC-MAIN-2021-49\"]\t2206049030\n"
  },
  {
    "path": "stats/crawler/CC-MAIN-2022-05.json",
    "content": "[\"crawl_status\", \"generator:crawldb_size\", \"CC-MAIN-2022-05\"]\t26716610822\n[\"crawl_status\", \"generator:fetch_list\", \"CC-MAIN-2022-05\"]\t3546030954\n[\"crawl_status\", \"generator:selected:db_duplicate\", \"CC-MAIN-2022-05\"]\t9175675\n[\"crawl_status\", \"generator:selected:db_fetched\", \"CC-MAIN-2022-05\"]\t1545201888\n[\"crawl_status\", \"generator:selected:db_gone\", \"CC-MAIN-2022-05\"]\t80870\n[\"crawl_status\", \"generator:selected:db_notmodified\", \"CC-MAIN-2022-05\"]\t22587592\n[\"crawl_status\", \"generator:selected:db_orphan\", \"CC-MAIN-2022-05\"]\t22871\n[\"crawl_status\", \"generator:selected:db_redir_perm\", \"CC-MAIN-2022-05\"]\t9112349\n[\"crawl_status\", \"generator:selected:db_redir_temp\", \"CC-MAIN-2022-05\"]\t12243260\n[\"crawl_status\", \"generator:selected:db_unfetched\", \"CC-MAIN-2022-05\"]\t1947606449\n[\"crawl_status\", \"generator:skipped_domains_overflow\", \"CC-MAIN-2022-05\"]\t17090\n[\"crawl_status\", \"fetcher:total\", \"CC-MAIN-2022-05\"]\t3742707359\n[\"crawl_status\", \"fetcher:success\", \"CC-MAIN-2022-05\"]\t2974668205\n[\"crawl_status\", \"fetcher:notmodified\", \"CC-MAIN-2022-05\"]\t13244379\n[\"crawl_status\", \"fetcher:temp_moved\", \"CC-MAIN-2022-05\"]\t126987435\n[\"crawl_status\", \"fetcher:moved\", \"CC-MAIN-2022-05\"]\t161226101\n[\"crawl_status\", \"fetcher:notfound\", \"CC-MAIN-2022-05\"]\t94350449\n[\"crawl_status\", \"fetcher:access_denied\", \"CC-MAIN-2022-05\"]\t961378\n[\"crawl_status\", \"fetcher:gone\", \"CC-MAIN-2022-05\"]\t3905415\n[\"crawl_status\", \"fetcher:exception\", \"CC-MAIN-2022-05\"]\t63409947\n[\"crawl_status\", \"fetcher:robots_denied\", \"CC-MAIN-2022-05\"]\t134888834\n[\"crawl_status\", \"fetcher:robots_denied_maxcrawldelay\", \"CC-MAIN-2022-05\"]\t55057\n[\"crawl_status\", \"fetcher:filtered\", \"CC-MAIN-2022-05\"]\t11232257\n[\"crawl_status\", \"fetcher:redirect_count_exceeded\", \"CC-MAIN-2022-05\"]\t577306\n[\"crawl_status\", \"fetcher:redirect_deduplicated\", 
\"CC-MAIN-2022-05\"]\t39994831\n[\"crawl_status\", \"fetcher:hitByThrougputThreshold\", \"CC-MAIN-2022-05\"]\t31765834\n[\"crawl_status\", \"fetcher:hitByTimeLimit\", \"CC-MAIN-2022-05\"]\t5405484\n[\"crawl_status\", \"fetcher:AboveExceptionThresholdInQueue\", \"CC-MAIN-2022-05\"]\t79974984\n[\"crawl_status\", \"fetcher:bytes_downloaded\", \"CC-MAIN-2022-05\"]\t356280025224500\n[\"crawl_status\", \"crawldb:size\", \"CC-MAIN-2022-05\"]\t26716610822\n[\"crawl_status\", \"crawldb:status:db_unfetched\", \"CC-MAIN-2022-05\"]\t4661816549\n[\"crawl_status\", \"crawldb:status:db_fetched\", \"CC-MAIN-2022-05\"]\t15134324328\n[\"crawl_status\", \"crawldb:status:db_gone\", \"CC-MAIN-2022-05\"]\t1454982882\n[\"crawl_status\", \"crawldb:status:db_redir_temp\", \"CC-MAIN-2022-05\"]\t393498035\n[\"crawl_status\", \"crawldb:status:db_redir_perm\", \"CC-MAIN-2022-05\"]\t528357067\n[\"crawl_status\", \"crawldb:status:db_notmodified\", \"CC-MAIN-2022-05\"]\t928711331\n[\"crawl_status\", \"crawldb:status:db_duplicate\", \"CC-MAIN-2022-05\"]\t1218752689\n[\"crawl_status\", \"crawldb:status:db_orphan\", \"CC-MAIN-2022-05\"]\t2396167941\n"
  },
  {
    "path": "stats/crawler/CC-MAIN-2022-21.json",
    "content": "[\"crawl_status\", \"generator:crawldb_size\", \"CC-MAIN-2022-21\"]\t27142123347\n[\"crawl_status\", \"generator:fetch_list\", \"CC-MAIN-2022-21\"]\t4077272510\n[\"crawl_status\", \"generator:selected:db_duplicate\", \"CC-MAIN-2022-21\"]\t11488862\n[\"crawl_status\", \"generator:selected:db_fetched\", \"CC-MAIN-2022-21\"]\t1864530724\n[\"crawl_status\", \"generator:selected:db_gone\", \"CC-MAIN-2022-21\"]\t84716\n[\"crawl_status\", \"generator:selected:db_notmodified\", \"CC-MAIN-2022-21\"]\t22550907\n[\"crawl_status\", \"generator:selected:db_orphan\", \"CC-MAIN-2022-21\"]\t24205\n[\"crawl_status\", \"generator:selected:db_redir_perm\", \"CC-MAIN-2022-21\"]\t26179355\n[\"crawl_status\", \"generator:selected:db_redir_temp\", \"CC-MAIN-2022-21\"]\t19866721\n[\"crawl_status\", \"generator:selected:db_unfetched\", \"CC-MAIN-2022-21\"]\t2132547020\n[\"crawl_status\", \"generator:skipped_domains_overflow\", \"CC-MAIN-2022-21\"]\t17676\n[\"crawl_status\", \"fetcher:total\", \"CC-MAIN-2022-21\"]\t4383835156\n[\"crawl_status\", \"fetcher:success\", \"CC-MAIN-2022-21\"]\t3456340061\n[\"crawl_status\", \"fetcher:notmodified\", \"CC-MAIN-2022-21\"]\t14268392\n[\"crawl_status\", \"fetcher:temp_moved\", \"CC-MAIN-2022-21\"]\t145737291\n[\"crawl_status\", \"fetcher:moved\", \"CC-MAIN-2022-21\"]\t218323216\n[\"crawl_status\", \"fetcher:notfound\", \"CC-MAIN-2022-21\"]\t119739099\n[\"crawl_status\", \"fetcher:access_denied\", \"CC-MAIN-2022-21\"]\t1170588\n[\"crawl_status\", \"fetcher:gone\", \"CC-MAIN-2022-21\"]\t5067169\n[\"crawl_status\", \"fetcher:exception\", \"CC-MAIN-2022-21\"]\t40038857\n[\"crawl_status\", \"fetcher:robots_denied\", \"CC-MAIN-2022-21\"]\t132096504\n[\"crawl_status\", \"fetcher:robots_denied_maxcrawldelay\", \"CC-MAIN-2022-21\"]\t43923\n[\"crawl_status\", \"fetcher:filtered\", \"CC-MAIN-2022-21\"]\t3666993\n[\"crawl_status\", \"fetcher:redirect_count_exceeded\", \"CC-MAIN-2022-21\"]\t645933\n[\"crawl_status\", 
\"fetcher:redirect_deduplicated\", \"CC-MAIN-2022-21\"]\t47395938\n[\"crawl_status\", \"fetcher:hitByThrougputThreshold\", \"CC-MAIN-2022-21\"]\t50129016\n[\"crawl_status\", \"fetcher:hitByTimeLimit\", \"CC-MAIN-2022-21\"]\t3690212\n[\"crawl_status\", \"fetcher:AboveExceptionThresholdInQueue\", \"CC-MAIN-2022-21\"]\t145420915\n[\"crawl_status\", \"fetcher:bytes_downloaded\", \"CC-MAIN-2022-21\"]\t464350498317425\n[\"crawl_status\", \"crawldb:size\", \"CC-MAIN-2022-21\"]\t27142123347\n[\"crawl_status\", \"crawldb:status:db_unfetched\", \"CC-MAIN-2022-21\"]\t4005585825\n[\"crawl_status\", \"crawldb:status:db_fetched\", \"CC-MAIN-2022-21\"]\t13233075166\n[\"crawl_status\", \"crawldb:status:db_gone\", \"CC-MAIN-2022-21\"]\t1134070636\n[\"crawl_status\", \"crawldb:status:db_redir_temp\", \"CC-MAIN-2022-21\"]\t364446474\n[\"crawl_status\", \"crawldb:status:db_redir_perm\", \"CC-MAIN-2022-21\"]\t484685748\n[\"crawl_status\", \"crawldb:status:db_notmodified\", \"CC-MAIN-2022-21\"]\t811061055\n[\"crawl_status\", \"crawldb:status:db_duplicate\", \"CC-MAIN-2022-21\"]\t1004179005\n[\"crawl_status\", \"crawldb:status:db_orphan\", \"CC-MAIN-2022-21\"]\t6105019438\n"
  },
  {
    "path": "stats/crawler/CC-MAIN-2022-27.json",
    "content": "[\"crawl_status\", \"generator:crawldb_size\", \"CC-MAIN-2022-27\"]\t23976620914\n[\"crawl_status\", \"generator:fetch_list\", \"CC-MAIN-2022-27\"]\t3657633022\n[\"crawl_status\", \"generator:selected:db_duplicate\", \"CC-MAIN-2022-27\"]\t8063666\n[\"crawl_status\", \"generator:selected:db_fetched\", \"CC-MAIN-2022-27\"]\t1538082910\n[\"crawl_status\", \"generator:selected:db_gone\", \"CC-MAIN-2022-27\"]\t71823\n[\"crawl_status\", \"generator:selected:db_notmodified\", \"CC-MAIN-2022-27\"]\t15686867\n[\"crawl_status\", \"generator:selected:db_orphan\", \"CC-MAIN-2022-27\"]\t16893\n[\"crawl_status\", \"generator:selected:db_redir_perm\", \"CC-MAIN-2022-27\"]\t27315592\n[\"crawl_status\", \"generator:selected:db_redir_temp\", \"CC-MAIN-2022-27\"]\t20515601\n[\"crawl_status\", \"generator:selected:db_unfetched\", \"CC-MAIN-2022-27\"]\t2047879670\n[\"crawl_status\", \"generator:skipped_domains_overflow\", \"CC-MAIN-2022-27\"]\t26423\n[\"crawl_status\", \"fetcher:total\", \"CC-MAIN-2022-27\"]\t3957265447\n[\"crawl_status\", \"fetcher:success\", \"CC-MAIN-2022-27\"]\t3117835780\n[\"crawl_status\", \"fetcher:notmodified\", \"CC-MAIN-2022-27\"]\t13339554\n[\"crawl_status\", \"fetcher:temp_moved\", \"CC-MAIN-2022-27\"]\t142024709\n[\"crawl_status\", \"fetcher:moved\", \"CC-MAIN-2022-27\"]\t188077576\n[\"crawl_status\", \"fetcher:notfound\", \"CC-MAIN-2022-27\"]\t97598112\n[\"crawl_status\", \"fetcher:access_denied\", \"CC-MAIN-2022-27\"]\t1062203\n[\"crawl_status\", \"fetcher:gone\", \"CC-MAIN-2022-27\"]\t4234690\n[\"crawl_status\", \"fetcher:exception\", \"CC-MAIN-2022-27\"]\t32994498\n[\"crawl_status\", \"fetcher:robots_denied\", \"CC-MAIN-2022-27\"]\t123726208\n[\"crawl_status\", \"fetcher:robots_denied_maxcrawldelay\", \"CC-MAIN-2022-27\"]\t41638\n[\"crawl_status\", \"fetcher:robots_defer_visits_dropped\", \"CC-MAIN-2022-27\"]\t63340\n[\"crawl_status\", \"fetcher:filtered\", \"CC-MAIN-2022-27\"]\t2900169\n[\"crawl_status\", 
\"fetcher:redirect_count_exceeded\", \"CC-MAIN-2022-27\"]\t650300\n[\"crawl_status\", \"fetcher:redirect_deduplicated\", \"CC-MAIN-2022-27\"]\t41402592\n[\"crawl_status\", \"fetcher:hitByThrougputThreshold\", \"CC-MAIN-2022-27\"]\t46964832\n[\"crawl_status\", \"fetcher:hitByTimeLimit\", \"CC-MAIN-2022-27\"]\t3724079\n[\"crawl_status\", \"fetcher:AboveExceptionThresholdInQueue\", \"CC-MAIN-2022-27\"]\t140625167\n[\"crawl_status\", \"fetcher:bytes_downloaded\", \"CC-MAIN-2022-27\"]\t409311866035754\n[\"crawl_status\", \"crawldb:size\", \"CC-MAIN-2022-27\"]\t23976620914\n[\"crawl_status\", \"crawldb:status:db_unfetched\", \"CC-MAIN-2022-27\"]\t4013453062\n[\"crawl_status\", \"crawldb:status:db_fetched\", \"CC-MAIN-2022-27\"]\t13593877262\n[\"crawl_status\", \"crawldb:status:db_gone\", \"CC-MAIN-2022-27\"]\t1152962168\n[\"crawl_status\", \"crawldb:status:db_redir_temp\", \"CC-MAIN-2022-27\"]\t300884220\n[\"crawl_status\", \"crawldb:status:db_redir_perm\", \"CC-MAIN-2022-27\"]\t436310915\n[\"crawl_status\", \"crawldb:status:db_notmodified\", \"CC-MAIN-2022-27\"]\t798503139\n[\"crawl_status\", \"crawldb:status:db_duplicate\", \"CC-MAIN-2022-27\"]\t990418841\n[\"crawl_status\", \"crawldb:status:db_orphan\", \"CC-MAIN-2022-27\"]\t2690211307\n"
  },
  {
    "path": "stats/crawler/CC-MAIN-2022-33.json",
    "content": "[\"crawl_status\", \"generator:crawldb_size\", \"CC-MAIN-2022-33\"]\t24023318047\n[\"crawl_status\", \"generator:fetch_list\", \"CC-MAIN-2022-33\"]\t3319887725\n[\"crawl_status\", \"generator:selected:db_duplicate\", \"CC-MAIN-2022-33\"]\t13057123\n[\"crawl_status\", \"generator:selected:db_fetched\", \"CC-MAIN-2022-33\"]\t1242180253\n[\"crawl_status\", \"generator:selected:db_gone\", \"CC-MAIN-2022-33\"]\t88373\n[\"crawl_status\", \"generator:selected:db_notmodified\", \"CC-MAIN-2022-33\"]\t35404318\n[\"crawl_status\", \"generator:selected:db_orphan\", \"CC-MAIN-2022-33\"]\t12124\n[\"crawl_status\", \"generator:selected:db_redir_perm\", \"CC-MAIN-2022-33\"]\t24895403\n[\"crawl_status\", \"generator:selected:db_redir_temp\", \"CC-MAIN-2022-33\"]\t30408135\n[\"crawl_status\", \"generator:selected:db_unfetched\", \"CC-MAIN-2022-33\"]\t1973841996\n[\"crawl_status\", \"generator:skipped_domains_overflow\", \"CC-MAIN-2022-33\"]\t29789\n[\"crawl_status\", \"fetcher:total\", \"CC-MAIN-2022-33\"]\t3690895430\n[\"crawl_status\", \"fetcher:success\", \"CC-MAIN-2022-33\"]\t2599832705\n[\"crawl_status\", \"fetcher:notmodified\", \"CC-MAIN-2022-33\"]\t14037766\n[\"crawl_status\", \"fetcher:temp_moved\", \"CC-MAIN-2022-33\"]\t158428944\n[\"crawl_status\", \"fetcher:moved\", \"CC-MAIN-2022-33\"]\t244963642\n[\"crawl_status\", \"fetcher:notfound\", \"CC-MAIN-2022-33\"]\t157689380\n[\"crawl_status\", \"fetcher:access_denied\", \"CC-MAIN-2022-33\"]\t1085605\n[\"crawl_status\", \"fetcher:gone\", \"CC-MAIN-2022-33\"]\t5583675\n[\"crawl_status\", \"fetcher:exception\", \"CC-MAIN-2022-33\"]\t45162065\n[\"crawl_status\", \"fetcher:robots_denied\", \"CC-MAIN-2022-33\"]\t131125981\n[\"crawl_status\", \"fetcher:robots_denied_maxcrawldelay\", \"CC-MAIN-2022-33\"]\t40142\n[\"crawl_status\", \"fetcher:robots_defer_visits_dropped\", \"CC-MAIN-2022-33\"]\t71393\n[\"crawl_status\", \"fetcher:filtered\", \"CC-MAIN-2022-33\"]\t6178102\n[\"crawl_status\", 
\"fetcher:redirect_count_exceeded\", \"CC-MAIN-2022-33\"]\t685872\n[\"crawl_status\", \"fetcher:redirect_deduplicated\", \"CC-MAIN-2022-33\"]\t53827063\n[\"crawl_status\", \"fetcher:hitByThrougputThreshold\", \"CC-MAIN-2022-33\"]\t54371741\n[\"crawl_status\", \"fetcher:hitByTimeLimit\", \"CC-MAIN-2022-33\"]\t911406\n[\"crawl_status\", \"fetcher:AboveExceptionThresholdInQueue\", \"CC-MAIN-2022-33\"]\t216899948\n[\"crawl_status\", \"fetcher:bytes_downloaded\", \"CC-MAIN-2022-33\"]\t325938798447071\n[\"crawl_status\", \"crawldb:size\", \"CC-MAIN-2022-33\"]\t24023318047\n[\"crawl_status\", \"crawldb:status:db_unfetched\", \"CC-MAIN-2022-33\"]\t4850665649\n[\"crawl_status\", \"crawldb:status:db_fetched\", \"CC-MAIN-2022-33\"]\t13978690608\n[\"crawl_status\", \"crawldb:status:db_gone\", \"CC-MAIN-2022-33\"]\t1152374564\n[\"crawl_status\", \"crawldb:status:db_redir_temp\", \"CC-MAIN-2022-33\"]\t285420720\n[\"crawl_status\", \"crawldb:status:db_redir_perm\", \"CC-MAIN-2022-33\"]\t408368522\n[\"crawl_status\", \"crawldb:status:db_notmodified\", \"CC-MAIN-2022-33\"]\t799365619\n[\"crawl_status\", \"crawldb:status:db_duplicate\", \"CC-MAIN-2022-33\"]\t1003428846\n[\"crawl_status\", \"crawldb:status:db_orphan\", \"CC-MAIN-2022-33\"]\t1545003519\n"
  },
  {
    "path": "stats/crawler/CC-MAIN-2022-40.json",
    "content": "[\"crawl_status\", \"generator:crawldb_size\", \"CC-MAIN-2022-40\"]\t25121487097\n[\"crawl_status\", \"generator:fetch_list\", \"CC-MAIN-2022-40\"]\t3921032705\n[\"crawl_status\", \"generator:selected:db_duplicate\", \"CC-MAIN-2022-40\"]\t5729155\n[\"crawl_status\", \"generator:selected:db_fetched\", \"CC-MAIN-2022-40\"]\t1954468917\n[\"crawl_status\", \"generator:selected:db_gone\", \"CC-MAIN-2022-40\"]\t78677\n[\"crawl_status\", \"generator:selected:db_notmodified\", \"CC-MAIN-2022-40\"]\t21409408\n[\"crawl_status\", \"generator:selected:db_orphan\", \"CC-MAIN-2022-40\"]\t12181\n[\"crawl_status\", \"generator:selected:db_redir_perm\", \"CC-MAIN-2022-40\"]\t15983182\n[\"crawl_status\", \"generator:selected:db_redir_temp\", \"CC-MAIN-2022-40\"]\t12602560\n[\"crawl_status\", \"generator:selected:db_unfetched\", \"CC-MAIN-2022-40\"]\t1910748625\n[\"crawl_status\", \"generator:skipped_domains_overflow\", \"CC-MAIN-2022-40\"]\t27276\n[\"crawl_status\", \"fetcher:total\", \"CC-MAIN-2022-40\"]\t4177803855\n[\"crawl_status\", \"fetcher:success\", \"CC-MAIN-2022-40\"]\t3185182948\n[\"crawl_status\", \"fetcher:notmodified\", \"CC-MAIN-2022-40\"]\t17270873\n[\"crawl_status\", \"fetcher:temp_moved\", \"CC-MAIN-2022-40\"]\t108947580\n[\"crawl_status\", \"fetcher:moved\", \"CC-MAIN-2022-40\"]\t173696671\n[\"crawl_status\", \"fetcher:notfound\", \"CC-MAIN-2022-40\"]\t105196765\n[\"crawl_status\", \"fetcher:access_denied\", \"CC-MAIN-2022-40\"]\t1001170\n[\"crawl_status\", \"fetcher:gone\", \"CC-MAIN-2022-40\"]\t4186870\n[\"crawl_status\", \"fetcher:exception\", \"CC-MAIN-2022-40\"]\t43738895\n[\"crawl_status\", \"fetcher:robots_denied\", \"CC-MAIN-2022-40\"]\t115533365\n[\"crawl_status\", \"fetcher:robots_denied_maxcrawldelay\", \"CC-MAIN-2022-40\"]\t36986\n[\"crawl_status\", \"fetcher:robots_defer_visits_dropped\", \"CC-MAIN-2022-40\"]\t70113\n[\"crawl_status\", \"fetcher:filtered\", \"CC-MAIN-2022-40\"]\t55946779\n[\"crawl_status\", 
\"fetcher:redirect_count_exceeded\", \"CC-MAIN-2022-40\"]\t560655\n[\"crawl_status\", \"fetcher:redirect_deduplicated\", \"CC-MAIN-2022-40\"]\t40274209\n[\"crawl_status\", \"fetcher:hitByThrougputThreshold\", \"CC-MAIN-2022-40\"]\t46566423\n[\"crawl_status\", \"fetcher:hitByTimeLimit\", \"CC-MAIN-2022-40\"]\t18106580\n[\"crawl_status\", \"fetcher:AboveExceptionThresholdInQueue\", \"CC-MAIN-2022-40\"]\t261486973\n[\"crawl_status\", \"fetcher:bytes_downloaded\", \"CC-MAIN-2022-40\"]\t420316789740924\n[\"crawl_status\", \"crawldb:size\", \"CC-MAIN-2022-40\"]\t25121487097\n[\"crawl_status\", \"crawldb:status:db_unfetched\", \"CC-MAIN-2022-40\"]\t4917226945\n[\"crawl_status\", \"crawldb:status:db_fetched\", \"CC-MAIN-2022-40\"]\t14307835903\n[\"crawl_status\", \"crawldb:status:db_gone\", \"CC-MAIN-2022-40\"]\t1171418776\n[\"crawl_status\", \"crawldb:status:db_redir_temp\", \"CC-MAIN-2022-40\"]\t273326382\n[\"crawl_status\", \"crawldb:status:db_redir_perm\", \"CC-MAIN-2022-40\"]\t389451993\n[\"crawl_status\", \"crawldb:status:db_notmodified\", \"CC-MAIN-2022-40\"]\t781979237\n[\"crawl_status\", \"crawldb:status:db_duplicate\", \"CC-MAIN-2022-40\"]\t1003573994\n[\"crawl_status\", \"crawldb:status:db_orphan\", \"CC-MAIN-2022-40\"]\t2276673867\n"
  },
  {
    "path": "stats/crawler/CC-MAIN-2022-49.json",
    "content": "[\"crawl_status\", \"generator:crawldb_size\", \"CC-MAIN-2022-49\"]\t25536843285\n[\"crawl_status\", \"generator:fetch_list\", \"CC-MAIN-2022-49\"]\t4255410360\n[\"crawl_status\", \"generator:selected:db_duplicate\", \"CC-MAIN-2022-49\"]\t5956883\n[\"crawl_status\", \"generator:selected:db_fetched\", \"CC-MAIN-2022-49\"]\t2193406271\n[\"crawl_status\", \"generator:selected:db_gone\", \"CC-MAIN-2022-49\"]\t80685\n[\"crawl_status\", \"generator:selected:db_notmodified\", \"CC-MAIN-2022-49\"]\t28661240\n[\"crawl_status\", \"generator:selected:db_orphan\", \"CC-MAIN-2022-49\"]\t3016\n[\"crawl_status\", \"generator:selected:db_redir_perm\", \"CC-MAIN-2022-49\"]\t14102193\n[\"crawl_status\", \"generator:selected:db_redir_temp\", \"CC-MAIN-2022-49\"]\t14710564\n[\"crawl_status\", \"generator:selected:db_unfetched\", \"CC-MAIN-2022-49\"]\t1998489508\n[\"crawl_status\", \"generator:skipped_domains_overflow\", \"CC-MAIN-2022-49\"]\t31019\n[\"crawl_status\", \"fetcher:total\", \"CC-MAIN-2022-49\"]\t4532479335\n[\"crawl_status\", \"fetcher:success\", \"CC-MAIN-2022-49\"]\t3389743574\n[\"crawl_status\", \"fetcher:notmodified\", \"CC-MAIN-2022-49\"]\t20618364\n[\"crawl_status\", \"fetcher:temp_moved\", \"CC-MAIN-2022-49\"]\t120947003\n[\"crawl_status\", \"fetcher:moved\", \"CC-MAIN-2022-49\"]\t192499939\n[\"crawl_status\", \"fetcher:notfound\", \"CC-MAIN-2022-49\"]\t128794342\n[\"crawl_status\", \"fetcher:access_denied\", \"CC-MAIN-2022-49\"]\t1136398\n[\"crawl_status\", \"fetcher:gone\", \"CC-MAIN-2022-49\"]\t5046250\n[\"crawl_status\", \"fetcher:exception\", \"CC-MAIN-2022-49\"]\t48117534\n[\"crawl_status\", \"fetcher:robots_denied\", \"CC-MAIN-2022-49\"]\t131864675\n[\"crawl_status\", \"fetcher:robots_denied_maxcrawldelay\", \"CC-MAIN-2022-49\"]\t35389\n[\"crawl_status\", \"fetcher:robots_defer_visits_dropped\", \"CC-MAIN-2022-49\"]\t71093\n[\"crawl_status\", \"fetcher:filtered\", \"CC-MAIN-2022-49\"]\t98970499\n[\"crawl_status\", 
\"fetcher:redirect_count_exceeded\", \"CC-MAIN-2022-49\"]\t612502\n[\"crawl_status\", \"fetcher:redirect_deduplicated\", \"CC-MAIN-2022-49\"]\t45772589\n[\"crawl_status\", \"fetcher:hitByThrougputThreshold\", \"CC-MAIN-2022-49\"]\t12274922\n[\"crawl_status\", \"fetcher:hitByTimeLimit\", \"CC-MAIN-2022-49\"]\t73176285\n[\"crawl_status\", \"fetcher:AboveExceptionThresholdInQueue\", \"CC-MAIN-2022-49\"]\t262797977\n[\"crawl_status\", \"fetcher:bytes_downloaded\", \"CC-MAIN-2022-49\"]\t469959139089780\n[\"crawl_status\", \"crawldb:size\", \"CC-MAIN-2022-49\"]\t25536843285\n[\"crawl_status\", \"crawldb:status:db_unfetched\", \"CC-MAIN-2022-49\"]\t4969342509\n[\"crawl_status\", \"crawldb:status:db_fetched\", \"CC-MAIN-2022-49\"]\t13222758843\n[\"crawl_status\", \"crawldb:status:db_gone\", \"CC-MAIN-2022-49\"]\t1091128929\n[\"crawl_status\", \"crawldb:status:db_redir_temp\", \"CC-MAIN-2022-49\"]\t313589732\n[\"crawl_status\", \"crawldb:status:db_redir_perm\", \"CC-MAIN-2022-49\"]\t453225498\n[\"crawl_status\", \"crawldb:status:db_notmodified\", \"CC-MAIN-2022-49\"]\t732975391\n[\"crawl_status\", \"crawldb:status:db_duplicate\", \"CC-MAIN-2022-49\"]\t971080766\n[\"crawl_status\", \"crawldb:status:db_orphan\", \"CC-MAIN-2022-49\"]\t3782741617\n"
  },
  {
    "path": "stats/crawler/CC-MAIN-2023-06.json",
    "content": "[\"crawl_status\", \"generator:crawldb_size\", \"CC-MAIN-2023-06\"]\t24063833984\n[\"crawl_status\", \"generator:fetch_list\", \"CC-MAIN-2023-06\"]\t3796595064\n[\"crawl_status\", \"generator:selected:db_duplicate\", \"CC-MAIN-2023-06\"]\t5116269\n[\"crawl_status\", \"generator:selected:db_fetched\", \"CC-MAIN-2023-06\"]\t2005944628\n[\"crawl_status\", \"generator:selected:db_gone\", \"CC-MAIN-2023-06\"]\t102995\n[\"crawl_status\", \"generator:selected:db_notmodified\", \"CC-MAIN-2023-06\"]\t24966483\n[\"crawl_status\", \"generator:selected:db_orphan\", \"CC-MAIN-2023-06\"]\t7903\n[\"crawl_status\", \"generator:selected:db_redir_perm\", \"CC-MAIN-2023-06\"]\t10054864\n[\"crawl_status\", \"generator:selected:db_redir_temp\", \"CC-MAIN-2023-06\"]\t20281034\n[\"crawl_status\", \"generator:selected:db_unfetched\", \"CC-MAIN-2023-06\"]\t1730120888\n[\"crawl_status\", \"generator:skipped_domains_overflow\", \"CC-MAIN-2023-06\"]\t24256\n[\"crawl_status\", \"fetcher:total\", \"CC-MAIN-2023-06\"]\t4019880276\n[\"crawl_status\", \"fetcher:success\", \"CC-MAIN-2023-06\"]\t3192983431\n[\"crawl_status\", \"fetcher:notmodified\", \"CC-MAIN-2023-06\"]\t16239596\n[\"crawl_status\", \"fetcher:temp_moved\", \"CC-MAIN-2023-06\"]\t102126347\n[\"crawl_status\", \"fetcher:moved\", \"CC-MAIN-2023-06\"]\t153321346\n[\"crawl_status\", \"fetcher:notfound\", \"CC-MAIN-2023-06\"]\t104754889\n[\"crawl_status\", \"fetcher:access_denied\", \"CC-MAIN-2023-06\"]\t922548\n[\"crawl_status\", \"fetcher:gone\", \"CC-MAIN-2023-06\"]\t4080867\n[\"crawl_status\", \"fetcher:exception\", \"CC-MAIN-2023-06\"]\t31022916\n[\"crawl_status\", \"fetcher:robots_denied\", \"CC-MAIN-2023-06\"]\t94296468\n[\"crawl_status\", \"fetcher:robots_denied_maxcrawldelay\", \"CC-MAIN-2023-06\"]\t19018\n[\"crawl_status\", \"fetcher:robots_defer_visits_dropped\", \"CC-MAIN-2023-06\"]\t76930\n[\"crawl_status\", \"fetcher:filtered\", \"CC-MAIN-2023-06\"]\t49907750\n[\"crawl_status\", 
\"fetcher:redirect_count_exceeded\", \"CC-MAIN-2023-06\"]\t533293\n[\"crawl_status\", \"fetcher:redirect_deduplicated\", \"CC-MAIN-2023-06\"]\t37582534\n[\"crawl_status\", \"fetcher:hitByThrougputThreshold\", \"CC-MAIN-2023-06\"]\t48249189\n[\"crawl_status\", \"fetcher:hitByTimeLimit\", \"CC-MAIN-2023-06\"]\t12371626\n[\"crawl_status\", \"fetcher:AboveExceptionThresholdInQueue\", \"CC-MAIN-2023-06\"]\t171391528\n[\"crawl_status\", \"fetcher:bytes_downloaded\", \"CC-MAIN-2023-06\"]\t446948428961642\n[\"crawl_status\", \"crawldb:size\", \"CC-MAIN-2023-06\"]\t24063833984\n[\"crawl_status\", \"crawldb:status:db_unfetched\", \"CC-MAIN-2023-06\"]\t3622484808\n[\"crawl_status\", \"crawldb:status:db_fetched\", \"CC-MAIN-2023-06\"]\t13070859324\n[\"crawl_status\", \"crawldb:status:db_gone\", \"CC-MAIN-2023-06\"]\t1325571164\n[\"crawl_status\", \"crawldb:status:db_redir_temp\", \"CC-MAIN-2023-06\"]\t302359397\n[\"crawl_status\", \"crawldb:status:db_redir_perm\", \"CC-MAIN-2023-06\"]\t446248225\n[\"crawl_status\", \"crawldb:status:db_notmodified\", \"CC-MAIN-2023-06\"]\t734683485\n[\"crawl_status\", \"crawldb:status:db_duplicate\", \"CC-MAIN-2023-06\"]\t1132063986\n[\"crawl_status\", \"crawldb:status:db_orphan\", \"CC-MAIN-2023-06\"]\t3429563595\n"
  },
  {
    "path": "stats/crawler/CC-MAIN-2023-14.json",
    "content": "[\"crawl_status\", \"generator:crawldb_size\", \"CC-MAIN-2023-14\"]\t23193639650\n[\"crawl_status\", \"generator:fetch_list\", \"CC-MAIN-2023-14\"]\t3788776021\n[\"crawl_status\", \"generator:selected:db_duplicate\", \"CC-MAIN-2023-14\"]\t6257378\n[\"crawl_status\", \"generator:selected:db_fetched\", \"CC-MAIN-2023-14\"]\t1844740888\n[\"crawl_status\", \"generator:selected:db_gone\", \"CC-MAIN-2023-14\"]\t1635491\n[\"crawl_status\", \"generator:selected:db_notmodified\", \"CC-MAIN-2023-14\"]\t36398443\n[\"crawl_status\", \"generator:selected:db_orphan\", \"CC-MAIN-2023-14\"]\t11803\n[\"crawl_status\", \"generator:selected:db_redir_perm\", \"CC-MAIN-2023-14\"]\t14080068\n[\"crawl_status\", \"generator:selected:db_redir_temp\", \"CC-MAIN-2023-14\"]\t16850051\n[\"crawl_status\", \"generator:selected:db_unfetched\", \"CC-MAIN-2023-14\"]\t1868801899\n[\"crawl_status\", \"generator:skipped_domains_overflow\", \"CC-MAIN-2023-14\"]\t30006\n[\"crawl_status\", \"fetcher:total\", \"CC-MAIN-2023-14\"]\t4034063018\n[\"crawl_status\", \"fetcher:success\", \"CC-MAIN-2023-14\"]\t3124887981\n[\"crawl_status\", \"fetcher:notmodified\", \"CC-MAIN-2023-14\"]\t15540229\n[\"crawl_status\", \"fetcher:temp_moved\", \"CC-MAIN-2023-14\"]\t102646420\n[\"crawl_status\", \"fetcher:moved\", \"CC-MAIN-2023-14\"]\t164675144\n[\"crawl_status\", \"fetcher:notfound\", \"CC-MAIN-2023-14\"]\t107786599\n[\"crawl_status\", \"fetcher:access_denied\", \"CC-MAIN-2023-14\"]\t940998\n[\"crawl_status\", \"fetcher:gone\", \"CC-MAIN-2023-14\"]\t4249486\n[\"crawl_status\", \"fetcher:exception\", \"CC-MAIN-2023-14\"]\t36075488\n[\"crawl_status\", \"fetcher:robots_denied\", \"CC-MAIN-2023-14\"]\t108911483\n[\"crawl_status\", \"fetcher:robots_denied_maxcrawldelay\", \"CC-MAIN-2023-14\"]\t26878\n[\"crawl_status\", \"fetcher:robots_defer_visits_dropped\", \"CC-MAIN-2023-14\"]\t68967\n[\"crawl_status\", \"fetcher:filtered\", \"CC-MAIN-2023-14\"]\t84097649\n[\"crawl_status\", 
\"fetcher:redirect_count_exceeded\", \"CC-MAIN-2023-14\"]\t678881\n[\"crawl_status\", \"fetcher:redirect_deduplicated\", \"CC-MAIN-2023-14\"]\t37738168\n[\"crawl_status\", \"fetcher:hitByThrougputThreshold\", \"CC-MAIN-2023-14\"]\t52504178\n[\"crawl_status\", \"fetcher:hitByTimeLimit\", \"CC-MAIN-2023-14\"]\t7165432\n[\"crawl_status\", \"fetcher:AboveExceptionThresholdInQueue\", \"CC-MAIN-2023-14\"]\t186069037\n[\"crawl_status\", \"fetcher:bytes_downloaded\", \"CC-MAIN-2023-14\"]\t443152580006808\n[\"crawl_status\", \"crawldb:size\", \"CC-MAIN-2023-14\"]\t23193639650\n[\"crawl_status\", \"crawldb:status:db_unfetched\", \"CC-MAIN-2023-14\"]\t4598631745\n[\"crawl_status\", \"crawldb:status:db_fetched\", \"CC-MAIN-2023-14\"]\t12702799327\n[\"crawl_status\", \"crawldb:status:db_gone\", \"CC-MAIN-2023-14\"]\t1243492777\n[\"crawl_status\", \"crawldb:status:db_redir_temp\", \"CC-MAIN-2023-14\"]\t273681679\n[\"crawl_status\", \"crawldb:status:db_redir_perm\", \"CC-MAIN-2023-14\"]\t439165609\n[\"crawl_status\", \"crawldb:status:db_notmodified\", \"CC-MAIN-2023-14\"]\t697347843\n[\"crawl_status\", \"crawldb:status:db_duplicate\", \"CC-MAIN-2023-14\"]\t1097446640\n[\"crawl_status\", \"crawldb:status:db_orphan\", \"CC-MAIN-2023-14\"]\t2141074030\n"
  },
  {
    "path": "stats/crawler/CC-MAIN-2023-23.json",
    "content": "[\"crawl_status\", \"generator:crawldb_size\", \"CC-MAIN-2023-23\"]\t23471797837\n[\"crawl_status\", \"generator:fetch_list\", \"CC-MAIN-2023-23\"]\t3967407732\n[\"crawl_status\", \"generator:selected:db_duplicate\", \"CC-MAIN-2023-23\"]\t7325696\n[\"crawl_status\", \"generator:selected:db_fetched\", \"CC-MAIN-2023-23\"]\t2174608895\n[\"crawl_status\", \"generator:selected:db_gone\", \"CC-MAIN-2023-23\"]\t4468462\n[\"crawl_status\", \"generator:selected:db_notmodified\", \"CC-MAIN-2023-23\"]\t47769410\n[\"crawl_status\", \"generator:selected:db_orphan\", \"CC-MAIN-2023-23\"]\t20478\n[\"crawl_status\", \"generator:selected:db_redir_perm\", \"CC-MAIN-2023-23\"]\t24124686\n[\"crawl_status\", \"generator:selected:db_redir_temp\", \"CC-MAIN-2023-23\"]\t10619993\n[\"crawl_status\", \"generator:selected:db_unfetched\", \"CC-MAIN-2023-23\"]\t1698470112\n[\"crawl_status\", \"generator:skipped_domains_overflow\", \"CC-MAIN-2023-23\"]\t61042\n[\"crawl_status\", \"fetcher:total\", \"CC-MAIN-2023-23\"]\t4230515300\n[\"crawl_status\", \"fetcher:success\", \"CC-MAIN-2023-23\"]\t3147083566\n[\"crawl_status\", \"fetcher:notmodified\", \"CC-MAIN-2023-23\"]\t17515925\n[\"crawl_status\", \"fetcher:temp_moved\", \"CC-MAIN-2023-23\"]\t99348083\n[\"crawl_status\", \"fetcher:moved\", \"CC-MAIN-2023-23\"]\t190333842\n[\"crawl_status\", \"fetcher:notfound\", \"CC-MAIN-2023-23\"]\t125615263\n[\"crawl_status\", \"fetcher:access_denied\", \"CC-MAIN-2023-23\"]\t1076884\n[\"crawl_status\", \"fetcher:gone\", \"CC-MAIN-2023-23\"]\t5382671\n[\"crawl_status\", \"fetcher:exception\", \"CC-MAIN-2023-23\"]\t47084544\n[\"crawl_status\", \"fetcher:robots_denied\", \"CC-MAIN-2023-23\"]\t108407428\n[\"crawl_status\", \"fetcher:robots_denied_maxcrawldelay\", \"CC-MAIN-2023-23\"]\t29915\n[\"crawl_status\", \"fetcher:robots_defer_visits_dropped\", \"CC-MAIN-2023-23\"]\t60900\n[\"crawl_status\", \"fetcher:filtered\", \"CC-MAIN-2023-23\"]\t113919547\n[\"crawl_status\", 
\"fetcher:redirect_count_exceeded\", \"CC-MAIN-2023-23\"]\t604713\n[\"crawl_status\", \"fetcher:redirect_deduplicated\", \"CC-MAIN-2023-23\"]\t41587219\n[\"crawl_status\", \"fetcher:hitByThrougputThreshold\", \"CC-MAIN-2023-23\"]\t33639145\n[\"crawl_status\", \"fetcher:hitByTimeLimit\", \"CC-MAIN-2023-23\"]\t31572460\n[\"crawl_status\", \"fetcher:AboveExceptionThresholdInQueue\", \"CC-MAIN-2023-23\"]\t267253195\n[\"crawl_status\", \"fetcher:bytes_downloaded\", \"CC-MAIN-2023-23\"]\t437813059556665\n[\"crawl_status\", \"crawldb:size\", \"CC-MAIN-2023-23\"]\t23471797837\n[\"crawl_status\", \"crawldb:status:db_unfetched\", \"CC-MAIN-2023-23\"]\t4378716292\n[\"crawl_status\", \"crawldb:status:db_fetched\", \"CC-MAIN-2023-23\"]\t13905851362\n[\"crawl_status\", \"crawldb:status:db_gone\", \"CC-MAIN-2023-23\"]\t1025231960\n[\"crawl_status\", \"crawldb:status:db_redir_temp\", \"CC-MAIN-2023-23\"]\t189625402\n[\"crawl_status\", \"crawldb:status:db_redir_perm\", \"CC-MAIN-2023-23\"]\t348943229\n[\"crawl_status\", \"crawldb:status:db_notmodified\", \"CC-MAIN-2023-23\"]\t740766193\n[\"crawl_status\", \"crawldb:status:db_duplicate\", \"CC-MAIN-2023-23\"]\t922946681\n[\"crawl_status\", \"crawldb:status:db_orphan\", \"CC-MAIN-2023-23\"]\t1959716718\n"
  },
  {
    "path": "stats/crawler/CC-MAIN-2023-40.json",
    "content": "[\"crawl_status\", \"generator:crawldb_size\", \"CC-MAIN-2023-40\"]\t24130374695\n[\"crawl_status\", \"generator:fetch_list\", \"CC-MAIN-2023-40\"]\t4260222260\n[\"crawl_status\", \"generator:selected:db_duplicate\", \"CC-MAIN-2023-40\"]\t9746225\n[\"crawl_status\", \"generator:selected:db_fetched\", \"CC-MAIN-2023-40\"]\t2331086389\n[\"crawl_status\", \"generator:selected:db_gone\", \"CC-MAIN-2023-40\"]\t7057217\n[\"crawl_status\", \"generator:selected:db_notmodified\", \"CC-MAIN-2023-40\"]\t40989544\n[\"crawl_status\", \"generator:selected:db_orphan\", \"CC-MAIN-2023-40\"]\t14501\n[\"crawl_status\", \"generator:selected:db_redir_perm\", \"CC-MAIN-2023-40\"]\t20126165\n[\"crawl_status\", \"generator:selected:db_redir_temp\", \"CC-MAIN-2023-40\"]\t11965490\n[\"crawl_status\", \"generator:selected:db_unfetched\", \"CC-MAIN-2023-40\"]\t1839236729\n[\"crawl_status\", \"generator:skipped_domains_overflow\", \"CC-MAIN-2023-40\"]\t75895\n[\"crawl_status\", \"fetcher:total\", \"CC-MAIN-2023-40\"]\t4600561579\n[\"crawl_status\", \"fetcher:success\", \"CC-MAIN-2023-40\"]\t3460550562\n[\"crawl_status\", \"fetcher:notmodified\", \"CC-MAIN-2023-40\"]\t20378958\n[\"crawl_status\", \"fetcher:temp_moved\", \"CC-MAIN-2023-40\"]\t118420004\n[\"crawl_status\", \"fetcher:moved\", \"CC-MAIN-2023-40\"]\t229681445\n[\"crawl_status\", \"fetcher:notfound\", \"CC-MAIN-2023-40\"]\t166377343\n[\"crawl_status\", \"fetcher:access_denied\", \"CC-MAIN-2023-40\"]\t1107477\n[\"crawl_status\", \"fetcher:gone\", \"CC-MAIN-2023-40\"]\t5881194\n[\"crawl_status\", \"fetcher:exception\", \"CC-MAIN-2023-40\"]\t46464439\n[\"crawl_status\", \"fetcher:robots_denied\", \"CC-MAIN-2023-40\"]\t218645610\n[\"crawl_status\", \"fetcher:robots_denied_maxcrawldelay\", \"CC-MAIN-2023-40\"]\t54943\n[\"crawl_status\", \"fetcher:robots_defer_visits_dropped\", \"CC-MAIN-2023-40\"]\t64733\n[\"crawl_status\", \"fetcher:filtered\", \"CC-MAIN-2023-40\"]\t6036130\n[\"crawl_status\", 
\"fetcher:redirect_count_exceeded\", \"CC-MAIN-2023-40\"]\t730490\n[\"crawl_status\", \"fetcher:redirect_deduplicated\", \"CC-MAIN-2023-40\"]\t54161502\n[\"crawl_status\", \"fetcher:hitByThrougputThreshold\", \"CC-MAIN-2023-40\"]\t9850098\n[\"crawl_status\", \"fetcher:hitByTimeLimit\", \"CC-MAIN-2023-40\"]\t62916955\n[\"crawl_status\", \"fetcher:AboveExceptionThresholdInQueue\", \"CC-MAIN-2023-40\"]\t199239696\n[\"crawl_status\", \"fetcher:bytes_downloaded\", \"CC-MAIN-2023-40\"]\t501577265652400\n[\"crawl_status\", \"crawldb:size\", \"CC-MAIN-2023-40\"]\t24130374695\n[\"crawl_status\", \"crawldb:status:db_unfetched\", \"CC-MAIN-2023-40\"]\t3884665696\n[\"crawl_status\", \"crawldb:status:db_fetched\", \"CC-MAIN-2023-40\"]\t11114553064\n[\"crawl_status\", \"crawldb:status:db_gone\", \"CC-MAIN-2023-40\"]\t775024933\n[\"crawl_status\", \"crawldb:status:db_redir_temp\", \"CC-MAIN-2023-40\"]\t165681918\n[\"crawl_status\", \"crawldb:status:db_redir_perm\", \"CC-MAIN-2023-40\"]\t326114894\n[\"crawl_status\", \"crawldb:status:db_notmodified\", \"CC-MAIN-2023-40\"]\t606467644\n[\"crawl_status\", \"crawldb:status:db_duplicate\", \"CC-MAIN-2023-40\"]\t756036014\n[\"crawl_status\", \"crawldb:status:db_orphan\", \"CC-MAIN-2023-40\"]\t6501830532\n"
  },
  {
    "path": "stats/crawler/CC-MAIN-2023-50.json",
    "content": "[\"crawl_status\", \"generator:crawldb_size\", \"CC-MAIN-2023-50\"]\t20650993966\n[\"crawl_status\", \"generator:fetch_list\", \"CC-MAIN-2023-50\"]\t4201814495\n[\"crawl_status\", \"generator:selected:db_duplicate\", \"CC-MAIN-2023-50\"]\t9318432\n[\"crawl_status\", \"generator:selected:db_fetched\", \"CC-MAIN-2023-50\"]\t1999533261\n[\"crawl_status\", \"generator:selected:db_gone\", \"CC-MAIN-2023-50\"]\t6335982\n[\"crawl_status\", \"generator:selected:db_notmodified\", \"CC-MAIN-2023-50\"]\t33822098\n[\"crawl_status\", \"generator:selected:db_orphan\", \"CC-MAIN-2023-50\"]\t18686\n[\"crawl_status\", \"generator:selected:db_redir_perm\", \"CC-MAIN-2023-50\"]\t18620453\n[\"crawl_status\", \"generator:selected:db_redir_temp\", \"CC-MAIN-2023-50\"]\t12487229\n[\"crawl_status\", \"generator:selected:db_unfetched\", \"CC-MAIN-2023-50\"]\t2121678354\n[\"crawl_status\", \"generator:skipped_domains_overflow\", \"CC-MAIN-2023-50\"]\t79851\n[\"crawl_status\", \"fetcher:total\", \"CC-MAIN-2023-50\"]\t4545962671\n[\"crawl_status\", \"fetcher:success\", \"CC-MAIN-2023-50\"]\t3370910459\n[\"crawl_status\", \"fetcher:notmodified\", \"CC-MAIN-2023-50\"]\t17677519\n[\"crawl_status\", \"fetcher:temp_moved\", \"CC-MAIN-2023-50\"]\t124878530\n[\"crawl_status\", \"fetcher:moved\", \"CC-MAIN-2023-50\"]\t242337459\n[\"crawl_status\", \"fetcher:notfound\", \"CC-MAIN-2023-50\"]\t175486919\n[\"crawl_status\", \"fetcher:access_denied\", \"CC-MAIN-2023-50\"]\t1192486\n[\"crawl_status\", \"fetcher:gone\", \"CC-MAIN-2023-50\"]\t5915502\n[\"crawl_status\", \"fetcher:exception\", \"CC-MAIN-2023-50\"]\t50821465\n[\"crawl_status\", \"fetcher:robots_denied\", \"CC-MAIN-2023-50\"]\t196769532\n[\"crawl_status\", \"fetcher:robots_denied_maxcrawldelay\", \"CC-MAIN-2023-50\"]\t49488\n[\"crawl_status\", \"fetcher:robots_defer_visits_dropped\", \"CC-MAIN-2023-50\"]\t101213\n[\"crawl_status\", \"fetcher:filtered\", \"CC-MAIN-2023-50\"]\t284260\n[\"crawl_status\", 
\"fetcher:redirect_count_exceeded\", \"CC-MAIN-2023-50\"]\t785557\n[\"crawl_status\", \"fetcher:redirect_deduplicated\", \"CC-MAIN-2023-50\"]\t57029567\n[\"crawl_status\", \"fetcher:hitByThrougputThreshold\", \"CC-MAIN-2023-50\"]\t46515075\n[\"crawl_status\", \"fetcher:hitByTimeLimit\", \"CC-MAIN-2023-50\"]\t28829893\n[\"crawl_status\", \"fetcher:AboveExceptionThresholdInQueue\", \"CC-MAIN-2023-50\"]\t226377747\n[\"crawl_status\", \"fetcher:bytes_downloaded\", \"CC-MAIN-2023-50\"]\t500270929196590\n[\"crawl_status\", \"crawldb:size\", \"CC-MAIN-2023-50\"]\t20650993966\n[\"crawl_status\", \"crawldb:status:db_unfetched\", \"CC-MAIN-2023-50\"]\t4244004287\n[\"crawl_status\", \"crawldb:status:db_fetched\", \"CC-MAIN-2023-50\"]\t10979486761\n[\"crawl_status\", \"crawldb:status:db_gone\", \"CC-MAIN-2023-50\"]\t869072677\n[\"crawl_status\", \"crawldb:status:db_redir_temp\", \"CC-MAIN-2023-50\"]\t131102870\n[\"crawl_status\", \"crawldb:status:db_redir_perm\", \"CC-MAIN-2023-50\"]\t265349548\n[\"crawl_status\", \"crawldb:status:db_notmodified\", \"CC-MAIN-2023-50\"]\t595764652\n[\"crawl_status\", \"crawldb:status:db_duplicate\", \"CC-MAIN-2023-50\"]\t742898916\n[\"crawl_status\", \"crawldb:status:db_orphan\", \"CC-MAIN-2023-50\"]\t2823314255\n"
  },
  {
    "path": "stats/crawler/CC-MAIN-2024-10.json",
    "content": "[\"crawl_status\", \"generator:crawldb_size\", \"CC-MAIN-2024-10\"]\t20599819450\n[\"crawl_status\", \"generator:fetch_list\", \"CC-MAIN-2024-10\"]\t3984507663\n[\"crawl_status\", \"generator:selected:db_duplicate\", \"CC-MAIN-2024-10\"]\t9759116\n[\"crawl_status\", \"generator:selected:db_fetched\", \"CC-MAIN-2024-10\"]\t1945861517\n[\"crawl_status\", \"generator:selected:db_gone\", \"CC-MAIN-2024-10\"]\t5847564\n[\"crawl_status\", \"generator:selected:db_notmodified\", \"CC-MAIN-2024-10\"]\t29218976\n[\"crawl_status\", \"generator:selected:db_orphan\", \"CC-MAIN-2024-10\"]\t11564\n[\"crawl_status\", \"generator:selected:db_redir_perm\", \"CC-MAIN-2024-10\"]\t15407344\n[\"crawl_status\", \"generator:selected:db_redir_temp\", \"CC-MAIN-2024-10\"]\t10039167\n[\"crawl_status\", \"generator:selected:db_unfetched\", \"CC-MAIN-2024-10\"]\t1968362415\n[\"crawl_status\", \"generator:skipped_domains_overflow\", \"CC-MAIN-2024-10\"]\t69280\n[\"crawl_status\", \"fetcher:total\", \"CC-MAIN-2024-10\"]\t4326140264\n[\"crawl_status\", \"fetcher:success\", \"CC-MAIN-2024-10\"]\t3128032551\n[\"crawl_status\", \"fetcher:notmodified\", \"CC-MAIN-2024-10\"]\t16903617\n[\"crawl_status\", \"fetcher:temp_moved\", \"CC-MAIN-2024-10\"]\t120203589\n[\"crawl_status\", \"fetcher:moved\", \"CC-MAIN-2024-10\"]\t233699835\n[\"crawl_status\", \"fetcher:notfound\", \"CC-MAIN-2024-10\"]\t171551229\n[\"crawl_status\", \"fetcher:access_denied\", \"CC-MAIN-2024-10\"]\t1533000\n[\"crawl_status\", \"fetcher:gone\", \"CC-MAIN-2024-10\"]\t5153976\n[\"crawl_status\", \"fetcher:exception\", \"CC-MAIN-2024-10\"]\t52059083\n[\"crawl_status\", \"fetcher:robots_denied\", \"CC-MAIN-2024-10\"]\t165875440\n[\"crawl_status\", \"fetcher:robots_denied_maxcrawldelay\", \"CC-MAIN-2024-10\"]\t66802\n[\"crawl_status\", \"fetcher:robots_defer_visits_dropped\", \"CC-MAIN-2024-10\"]\t108466\n[\"crawl_status\", \"fetcher:filtered\", \"CC-MAIN-2024-10\"]\t20853041\n[\"crawl_status\", 
\"fetcher:redirect_count_exceeded\", \"CC-MAIN-2024-10\"]\t721168\n[\"crawl_status\", \"fetcher:redirect_deduplicated\", \"CC-MAIN-2024-10\"]\t55921796\n[\"crawl_status\", \"fetcher:hitByThrougputThreshold\", \"CC-MAIN-2024-10\"]\t10468954\n[\"crawl_status\", \"fetcher:hitByTimeLimit\", \"CC-MAIN-2024-10\"]\t109331721\n[\"crawl_status\", \"fetcher:AboveExceptionThresholdInQueue\", \"CC-MAIN-2024-10\"]\t233655996\n[\"crawl_status\", \"fetcher:bytes_downloaded\", \"CC-MAIN-2024-10\"]\t467015596332470\n[\"crawl_status\", \"crawldb:size\", \"CC-MAIN-2024-10\"]\t20599819450\n[\"crawl_status\", \"crawldb:status:db_unfetched\", \"CC-MAIN-2024-10\"]\t4107295999\n[\"crawl_status\", \"crawldb:status:db_fetched\", \"CC-MAIN-2024-10\"]\t11001427792\n[\"crawl_status\", \"crawldb:status:db_gone\", \"CC-MAIN-2024-10\"]\t940768266\n[\"crawl_status\", \"crawldb:status:db_redir_temp\", \"CC-MAIN-2024-10\"]\t126856377\n[\"crawl_status\", \"crawldb:status:db_redir_perm\", \"CC-MAIN-2024-10\"]\t265841871\n[\"crawl_status\", \"crawldb:status:db_notmodified\", \"CC-MAIN-2024-10\"]\t575294289\n[\"crawl_status\", \"crawldb:status:db_duplicate\", \"CC-MAIN-2024-10\"]\t774783620\n[\"crawl_status\", \"crawldb:status:db_orphan\", \"CC-MAIN-2024-10\"]\t2807551236\n"
  },
  {
    "path": "stats/crawler/CC-MAIN-2024-18.json",
    "content": "[\"crawl_status\", \"generator:crawldb_size\", \"CC-MAIN-2024-18\"]\t20216718958\n[\"crawl_status\", \"generator:fetch_list\", \"CC-MAIN-2024-18\"]\t3565682499\n[\"crawl_status\", \"generator:selected:db_duplicate\", \"CC-MAIN-2024-18\"]\t8643721\n[\"crawl_status\", \"generator:selected:db_fetched\", \"CC-MAIN-2024-18\"]\t1785578970\n[\"crawl_status\", \"generator:selected:db_gone\", \"CC-MAIN-2024-18\"]\t4778023\n[\"crawl_status\", \"generator:selected:db_notmodified\", \"CC-MAIN-2024-18\"]\t24142941\n[\"crawl_status\", \"generator:selected:db_orphan\", \"CC-MAIN-2024-18\"]\t2800\n[\"crawl_status\", \"generator:selected:db_redir_perm\", \"CC-MAIN-2024-18\"]\t15101186\n[\"crawl_status\", \"generator:selected:db_redir_temp\", \"CC-MAIN-2024-18\"]\t8160640\n[\"crawl_status\", \"generator:selected:db_unfetched\", \"CC-MAIN-2024-18\"]\t1719274218\n[\"crawl_status\", \"generator:skipped_domains_overflow\", \"CC-MAIN-2024-18\"]\t58569\n[\"crawl_status\", \"fetcher:total\", \"CC-MAIN-2024-18\"]\t3848217167\n[\"crawl_status\", \"fetcher:success\", \"CC-MAIN-2024-18\"]\t2803116264\n[\"crawl_status\", \"fetcher:notmodified\", \"CC-MAIN-2024-18\"]\t15520472\n[\"crawl_status\", \"fetcher:temp_moved\", \"CC-MAIN-2024-18\"]\t100520754\n[\"crawl_status\", \"fetcher:moved\", \"CC-MAIN-2024-18\"]\t200644602\n[\"crawl_status\", \"fetcher:notfound\", \"CC-MAIN-2024-18\"]\t142535087\n[\"crawl_status\", \"fetcher:access_denied\", \"CC-MAIN-2024-18\"]\t1391977\n[\"crawl_status\", \"fetcher:gone\", \"CC-MAIN-2024-18\"]\t4573419\n[\"crawl_status\", \"fetcher:exception\", \"CC-MAIN-2024-18\"]\t48663897\n[\"crawl_status\", \"fetcher:robots_denied\", \"CC-MAIN-2024-18\"]\t150646294\n[\"crawl_status\", \"fetcher:robots_denied_maxcrawldelay\", \"CC-MAIN-2024-18\"]\t94782\n[\"crawl_status\", \"fetcher:robots_defer_visits_dropped\", \"CC-MAIN-2024-18\"]\t109552\n[\"crawl_status\", \"fetcher:filtered\", \"CC-MAIN-2024-18\"]\t9036123\n[\"crawl_status\", 
\"fetcher:redirect_count_exceeded\", \"CC-MAIN-2024-18\"]\t663875\n[\"crawl_status\", \"fetcher:redirect_deduplicated\", \"CC-MAIN-2024-18\"]\t46982558\n[\"crawl_status\", \"fetcher:hitByThrougputThreshold\", \"CC-MAIN-2024-18\"]\t76767431\n[\"crawl_status\", \"fetcher:hitByTimeLimit\", \"CC-MAIN-2024-18\"]\t27088554\n[\"crawl_status\", \"fetcher:AboveExceptionThresholdInQueue\", \"CC-MAIN-2024-18\"]\t219861526\n[\"crawl_status\", \"fetcher:bytes_downloaded\", \"CC-MAIN-2024-18\"]\t424724693645771\n[\"crawl_status\", \"crawldb:size\", \"CC-MAIN-2024-18\"]\t20216718958\n[\"crawl_status\", \"crawldb:status:db_unfetched\", \"CC-MAIN-2024-18\"]\t3753696678\n[\"crawl_status\", \"crawldb:status:db_fetched\", \"CC-MAIN-2024-18\"]\t10999688998\n[\"crawl_status\", \"crawldb:status:db_gone\", \"CC-MAIN-2024-18\"]\t950860825\n[\"crawl_status\", \"crawldb:status:db_redir_temp\", \"CC-MAIN-2024-18\"]\t165836046\n[\"crawl_status\", \"crawldb:status:db_redir_perm\", \"CC-MAIN-2024-18\"]\t338372824\n[\"crawl_status\", \"crawldb:status:db_notmodified\", \"CC-MAIN-2024-18\"]\t551656353\n[\"crawl_status\", \"crawldb:status:db_duplicate\", \"CC-MAIN-2024-18\"]\t790305356\n[\"crawl_status\", \"crawldb:status:db_orphan\", \"CC-MAIN-2024-18\"]\t2666301878\n"
  },
  {
    "path": "stats/crawler/CC-MAIN-2024-22.json",
    "content": "[\"crawl_status\", \"generator:crawldb_size\", \"CC-MAIN-2024-22\"]\t19759133480\n[\"crawl_status\", \"generator:fetch_list\", \"CC-MAIN-2024-22\"]\t3468459881\n[\"crawl_status\", \"generator:selected:db_duplicate\", \"CC-MAIN-2024-22\"]\t8887773\n[\"crawl_status\", \"generator:selected:db_fetched\", \"CC-MAIN-2024-22\"]\t1807529312\n[\"crawl_status\", \"generator:selected:db_gone\", \"CC-MAIN-2024-22\"]\t4376319\n[\"crawl_status\", \"generator:selected:db_notmodified\", \"CC-MAIN-2024-22\"]\t24954745\n[\"crawl_status\", \"generator:selected:db_orphan\", \"CC-MAIN-2024-22\"]\t1355\n[\"crawl_status\", \"generator:selected:db_redir_perm\", \"CC-MAIN-2024-22\"]\t16667673\n[\"crawl_status\", \"generator:selected:db_redir_temp\", \"CC-MAIN-2024-22\"]\t10751613\n[\"crawl_status\", \"generator:selected:db_unfetched\", \"CC-MAIN-2024-22\"]\t1595291091\n[\"crawl_status\", \"generator:skipped_domains_overflow\", \"CC-MAIN-2024-22\"]\t55812\n[\"crawl_status\", \"fetcher:total\", \"CC-MAIN-2024-22\"]\t3746403860\n[\"crawl_status\", \"fetcher:success\", \"CC-MAIN-2024-22\"]\t2724733199\n[\"crawl_status\", \"fetcher:notmodified\", \"CC-MAIN-2024-22\"]\t17254235\n[\"crawl_status\", \"fetcher:temp_moved\", \"CC-MAIN-2024-22\"]\t98096133\n[\"crawl_status\", \"fetcher:moved\", \"CC-MAIN-2024-22\"]\t190055008\n[\"crawl_status\", \"fetcher:notfound\", \"CC-MAIN-2024-22\"]\t136016945\n[\"crawl_status\", \"fetcher:access_denied\", \"CC-MAIN-2024-22\"]\t1732968\n[\"crawl_status\", \"fetcher:gone\", \"CC-MAIN-2024-22\"]\t4165255\n[\"crawl_status\", \"fetcher:exception\", \"CC-MAIN-2024-22\"]\t49281074\n[\"crawl_status\", \"fetcher:robots_denied\", \"CC-MAIN-2024-22\"]\t145180193\n[\"crawl_status\", \"fetcher:robots_denied_maxcrawldelay\", \"CC-MAIN-2024-22\"]\t45328\n[\"crawl_status\", \"fetcher:robots_defer_visits_dropped\", \"CC-MAIN-2024-22\"]\t99916\n[\"crawl_status\", \"fetcher:filtered\", \"CC-MAIN-2024-22\"]\t7559738\n[\"crawl_status\", 
\"fetcher:redirect_count_exceeded\", \"CC-MAIN-2024-22\"]\t757830\n[\"crawl_status\", \"fetcher:redirect_deduplicated\", \"CC-MAIN-2024-22\"]\t43824652\n[\"crawl_status\", \"fetcher:hitByThrougputThreshold\", \"CC-MAIN-2024-22\"]\t101035770\n[\"crawl_status\", \"fetcher:hitByTimeLimit\", \"CC-MAIN-2024-22\"]\t7260546\n[\"crawl_status\", \"fetcher:AboveExceptionThresholdInQueue\", \"CC-MAIN-2024-22\"]\t219305070\n[\"crawl_status\", \"fetcher:bytes_downloaded\", \"CC-MAIN-2024-22\"]\t414783369380256\n[\"crawl_status\", \"crawldb:size\", \"CC-MAIN-2024-22\"]\t19759133480\n[\"crawl_status\", \"crawldb:status:db_unfetched\", \"CC-MAIN-2024-22\"]\t4405838379\n[\"crawl_status\", \"crawldb:status:db_fetched\", \"CC-MAIN-2024-22\"]\t10956834122\n[\"crawl_status\", \"crawldb:status:db_gone\", \"CC-MAIN-2024-22\"]\t1165878995\n[\"crawl_status\", \"crawldb:status:db_redir_temp\", \"CC-MAIN-2024-22\"]\t201942741\n[\"crawl_status\", \"crawldb:status:db_redir_perm\", \"CC-MAIN-2024-22\"]\t404174362\n[\"crawl_status\", \"crawldb:status:db_notmodified\", \"CC-MAIN-2024-22\"]\t532280803\n[\"crawl_status\", \"crawldb:status:db_duplicate\", \"CC-MAIN-2024-22\"]\t940322959\n[\"crawl_status\", \"crawldb:status:db_orphan\", \"CC-MAIN-2024-22\"]\t1151861119\n"
  },
  {
    "path": "stats/crawler/CC-MAIN-2024-26.json",
    "content": "[\"crawl_status\", \"generator:crawldb_size\", \"CC-MAIN-2024-26\"]\t20635672053\n[\"crawl_status\", \"generator:fetch_list\", \"CC-MAIN-2024-26\"]\t3697574228\n[\"crawl_status\", \"generator:selected:db_duplicate\", \"CC-MAIN-2024-26\"]\t10250906\n[\"crawl_status\", \"generator:selected:db_fetched\", \"CC-MAIN-2024-26\"]\t2077172808\n[\"crawl_status\", \"generator:selected:db_gone\", \"CC-MAIN-2024-26\"]\t4782313\n[\"crawl_status\", \"generator:selected:db_notmodified\", \"CC-MAIN-2024-26\"]\t29540613\n[\"crawl_status\", \"generator:selected:db_orphan\", \"CC-MAIN-2024-26\"]\t7899\n[\"crawl_status\", \"generator:selected:db_redir_perm\", \"CC-MAIN-2024-26\"]\t15071329\n[\"crawl_status\", \"generator:selected:db_redir_temp\", \"CC-MAIN-2024-26\"]\t11605301\n[\"crawl_status\", \"generator:selected:db_unfetched\", \"CC-MAIN-2024-26\"]\t1549143059\n[\"crawl_status\", \"generator:skipped_domains_overflow\", \"CC-MAIN-2024-26\"]\t69096\n[\"crawl_status\", \"fetcher:total\", \"CC-MAIN-2024-26\"]\t3986216346\n[\"crawl_status\", \"fetcher:success\", \"CC-MAIN-2024-26\"]\t2813450427\n[\"crawl_status\", \"fetcher:notmodified\", \"CC-MAIN-2024-26\"]\t22419628\n[\"crawl_status\", \"fetcher:temp_moved\", \"CC-MAIN-2024-26\"]\t100753785\n[\"crawl_status\", \"fetcher:moved\", \"CC-MAIN-2024-26\"]\t195851429\n[\"crawl_status\", \"fetcher:notfound\", \"CC-MAIN-2024-26\"]\t163171446\n[\"crawl_status\", \"fetcher:access_denied\", \"CC-MAIN-2024-26\"]\t2597885\n[\"crawl_status\", \"fetcher:gone\", \"CC-MAIN-2024-26\"]\t4701171\n[\"crawl_status\", \"fetcher:exception\", \"CC-MAIN-2024-26\"]\t56765062\n[\"crawl_status\", \"fetcher:robots_denied\", \"CC-MAIN-2024-26\"]\t157638112\n[\"crawl_status\", \"fetcher:robots_denied_maxcrawldelay\", \"CC-MAIN-2024-26\"]\t42739\n[\"crawl_status\", \"fetcher:robots_defer_visits_dropped\", \"CC-MAIN-2024-26\"]\t127984\n[\"crawl_status\", \"fetcher:filtered\", \"CC-MAIN-2024-26\"]\t1085293\n[\"crawl_status\", 
\"fetcher:redirect_count_exceeded\", \"CC-MAIN-2024-26\"]\t714455\n[\"crawl_status\", \"fetcher:redirect_deduplicated\", \"CC-MAIN-2024-26\"]\t48339027\n[\"crawl_status\", \"fetcher:hitByThrougputThreshold\", \"CC-MAIN-2024-26\"]\t90681275\n[\"crawl_status\", \"fetcher:hitByTimeLimit\", \"CC-MAIN-2024-26\"]\t48354595\n[\"crawl_status\", \"fetcher:AboveExceptionThresholdInQueue\", \"CC-MAIN-2024-26\"]\t279521399\n[\"crawl_status\", \"fetcher:hungThreads\", \"CC-MAIN-2024-26\"]\t634\n[\"crawl_status\", \"fetcher:hitByTimeout\", \"CC-MAIN-2024-26\"]\t0\n[\"crawl_status\", \"fetcher:bytes_downloaded\", \"CC-MAIN-2024-26\"]\t420066803999131\n[\"crawl_status\", \"crawldb:size\", \"CC-MAIN-2024-26\"]\t20635672053\n[\"crawl_status\", \"crawldb:status:db_unfetched\", \"CC-MAIN-2024-26\"]\t4987535364\n[\"crawl_status\", \"crawldb:status:db_fetched\", \"CC-MAIN-2024-26\"]\t11824566917\n[\"crawl_status\", \"crawldb:status:db_gone\", \"CC-MAIN-2024-26\"]\t1387536079\n[\"crawl_status\", \"crawldb:status:db_redir_temp\", \"CC-MAIN-2024-26\"]\t199692137\n[\"crawl_status\", \"crawldb:status:db_redir_perm\", \"CC-MAIN-2024-26\"]\t375883539\n[\"crawl_status\", \"crawldb:status:db_notmodified\", \"CC-MAIN-2024-26\"]\t570548292\n[\"crawl_status\", \"crawldb:status:db_duplicate\", \"CC-MAIN-2024-26\"]\t1084411923\n[\"crawl_status\", \"crawldb:status:db_orphan\", \"CC-MAIN-2024-26\"]\t205497802\n"
  },
  {
    "path": "stats/crawler/CC-MAIN-2024-30.json",
    "content": "[\"crawl_status\", \"generator:crawldb_size\", \"CC-MAIN-2024-30\"]\t22484038777\n[\"crawl_status\", \"generator:fetch_list\", \"CC-MAIN-2024-30\"]\t3353545118\n[\"crawl_status\", \"generator:selected:db_duplicate\", \"CC-MAIN-2024-30\"]\t8691353\n[\"crawl_status\", \"generator:selected:db_fetched\", \"CC-MAIN-2024-30\"]\t1704905039\n[\"crawl_status\", \"generator:selected:db_gone\", \"CC-MAIN-2024-30\"]\t3928722\n[\"crawl_status\", \"generator:selected:db_notmodified\", \"CC-MAIN-2024-30\"]\t26741213\n[\"crawl_status\", \"generator:selected:db_orphan\", \"CC-MAIN-2024-30\"]\t1952\n[\"crawl_status\", \"generator:selected:db_redir_perm\", \"CC-MAIN-2024-30\"]\t13452427\n[\"crawl_status\", \"generator:selected:db_redir_temp\", \"CC-MAIN-2024-30\"]\t9977134\n[\"crawl_status\", \"generator:selected:db_unfetched\", \"CC-MAIN-2024-30\"]\t1585847278\n[\"crawl_status\", \"generator:skipped_domains_overflow\", \"CC-MAIN-2024-30\"]\t59181\n[\"crawl_status\", \"fetcher:total\", \"CC-MAIN-2024-30\"]\t3579486425\n[\"crawl_status\", \"fetcher:success\", \"CC-MAIN-2024-30\"]\t2560559486\n[\"crawl_status\", \"fetcher:notmodified\", \"CC-MAIN-2024-30\"]\t18632553\n[\"crawl_status\", \"fetcher:temp_moved\", \"CC-MAIN-2024-30\"]\t90339818\n[\"crawl_status\", \"fetcher:moved\", \"CC-MAIN-2024-30\"]\t167561389\n[\"crawl_status\", \"fetcher:notfound\", \"CC-MAIN-2024-30\"]\t127011828\n[\"crawl_status\", \"fetcher:access_denied\", \"CC-MAIN-2024-30\"]\t1529787\n[\"crawl_status\", \"fetcher:gone\", \"CC-MAIN-2024-30\"]\t6553235\n[\"crawl_status\", \"fetcher:exception\", \"CC-MAIN-2024-30\"]\t62658807\n[\"crawl_status\", \"fetcher:robots_denied\", \"CC-MAIN-2024-30\"]\t152654706\n[\"crawl_status\", \"fetcher:robots_denied_maxcrawldelay\", \"CC-MAIN-2024-30\"]\t36358\n[\"crawl_status\", \"fetcher:robots_defer_visits_dropped\", \"CC-MAIN-2024-30\"]\t115372\n[\"crawl_status\", \"fetcher:redirect_count_exceeded\", \"CC-MAIN-2024-30\"]\t794196\n[\"crawl_status\", 
\"fetcher:redirect_deduplicated\", \"CC-MAIN-2024-30\"]\t41078337\n[\"crawl_status\", \"fetcher:hitByThrougputThreshold\", \"CC-MAIN-2024-30\"]\t92887154\n[\"crawl_status\", \"fetcher:hitByTimeLimit\", \"CC-MAIN-2024-30\"]\t24096916\n[\"crawl_status\", \"fetcher:AboveExceptionThresholdInQueue\", \"CC-MAIN-2024-30\"]\t232975313\n[\"crawl_status\", \"fetcher:hungThreads\", \"CC-MAIN-2024-30\"]\t1169\n[\"crawl_status\", \"fetcher:hitByTimeout\", \"CC-MAIN-2024-30\"]\t1\n[\"crawl_status\", \"fetcher:bytes_downloaded\", \"CC-MAIN-2024-30\"]\t395080246061810\n[\"crawl_status\", \"crawldb:size\", \"CC-MAIN-2024-30\"]\t22484038777\n[\"crawl_status\", \"crawldb:status:db_unfetched\", \"CC-MAIN-2024-30\"]\t4815380051\n[\"crawl_status\", \"crawldb:status:db_fetched\", \"CC-MAIN-2024-30\"]\t11619101762\n[\"crawl_status\", \"crawldb:status:db_gone\", \"CC-MAIN-2024-30\"]\t1270554557\n[\"crawl_status\", \"crawldb:status:db_redir_temp\", \"CC-MAIN-2024-30\"]\t230323490\n[\"crawl_status\", \"crawldb:status:db_redir_perm\", \"CC-MAIN-2024-30\"]\t428264449\n[\"crawl_status\", \"crawldb:status:db_notmodified\", \"CC-MAIN-2024-30\"]\t569650215\n[\"crawl_status\", \"crawldb:status:db_duplicate\", \"CC-MAIN-2024-30\"]\t1061451208\n[\"crawl_status\", \"crawldb:status:db_orphan\", \"CC-MAIN-2024-30\"]\t2489313045\n"
  },
  {
    "path": "stats/crawler/CC-MAIN-2024-33.json",
    "content": "[\"crawl_status\", \"generator:crawldb_size\", \"CC-MAIN-2024-33\"]\t21902542885\n[\"crawl_status\", \"generator:fetch_list\", \"CC-MAIN-2024-33\"]\t3057831348\n[\"crawl_status\", \"generator:selected:db_duplicate\", \"CC-MAIN-2024-33\"]\t7682540\n[\"crawl_status\", \"generator:selected:db_fetched\", \"CC-MAIN-2024-33\"]\t1520560022\n[\"crawl_status\", \"generator:selected:db_gone\", \"CC-MAIN-2024-33\"]\t3456377\n[\"crawl_status\", \"generator:selected:db_notmodified\", \"CC-MAIN-2024-33\"]\t24429362\n[\"crawl_status\", \"generator:selected:db_orphan\", \"CC-MAIN-2024-33\"]\t6357\n[\"crawl_status\", \"generator:selected:db_redir_perm\", \"CC-MAIN-2024-33\"]\t12736865\n[\"crawl_status\", \"generator:selected:db_redir_temp\", \"CC-MAIN-2024-33\"]\t8716010\n[\"crawl_status\", \"generator:selected:db_unfetched\", \"CC-MAIN-2024-33\"]\t1480243815\n[\"crawl_status\", \"generator:skipped_domains_overflow\", \"CC-MAIN-2024-33\"]\t54148\n[\"crawl_status\", \"fetcher:total\", \"CC-MAIN-2024-33\"]\t3290059251\n[\"crawl_status\", \"fetcher:success\", \"CC-MAIN-2024-33\"]\t2328003168\n[\"crawl_status\", \"fetcher:notmodified\", \"CC-MAIN-2024-33\"]\t17106553\n[\"crawl_status\", \"fetcher:temp_moved\", \"CC-MAIN-2024-33\"]\t83486145\n[\"crawl_status\", \"fetcher:moved\", \"CC-MAIN-2024-33\"]\t154976267\n[\"crawl_status\", \"fetcher:notfound\", \"CC-MAIN-2024-33\"]\t113724057\n[\"crawl_status\", \"fetcher:access_denied\", \"CC-MAIN-2024-33\"]\t1613472\n[\"crawl_status\", \"fetcher:gone\", \"CC-MAIN-2024-33\"]\t5370806\n[\"crawl_status\", \"fetcher:exception\", \"CC-MAIN-2024-33\"]\t49390776\n[\"crawl_status\", \"fetcher:robots_denied\", \"CC-MAIN-2024-33\"]\t146820848\n[\"crawl_status\", \"fetcher:robots_denied_maxcrawldelay\", \"CC-MAIN-2024-33\"]\t33374\n[\"crawl_status\", \"fetcher:robots_defer_visits_dropped\", \"CC-MAIN-2024-33\"]\t151898\n[\"crawl_status\", \"fetcher:redirect_count_exceeded\", \"CC-MAIN-2024-33\"]\t772999\n[\"crawl_status\", 
\"fetcher:redirect_deduplicated\", \"CC-MAIN-2024-33\"]\t38516158\n[\"crawl_status\", \"fetcher:hitByThrougputThreshold\", \"CC-MAIN-2024-33\"]\t96730017\n[\"crawl_status\", \"fetcher:hitByTimeLimit\", \"CC-MAIN-2024-33\"]\t182046\n[\"crawl_status\", \"fetcher:AboveExceptionThresholdInQueue\", \"CC-MAIN-2024-33\"]\t253180000\n[\"crawl_status\", \"fetcher:hungThreads\", \"CC-MAIN-2024-33\"]\t666\n[\"crawl_status\", \"fetcher:hitByTimeout\", \"CC-MAIN-2024-33\"]\t1\n[\"crawl_status\", \"fetcher:bytes_downloaded\", \"CC-MAIN-2024-33\"]\t360013918508070\n[\"crawl_status\", \"crawldb:size\", \"CC-MAIN-2024-33\"]\t21902542885\n[\"crawl_status\", \"crawldb:status:db_unfetched\", \"CC-MAIN-2024-33\"]\t5315880834\n[\"crawl_status\", \"crawldb:status:db_fetched\", \"CC-MAIN-2024-33\"]\t12446913533\n[\"crawl_status\", \"crawldb:status:db_gone\", \"CC-MAIN-2024-33\"]\t1505010789\n[\"crawl_status\", \"crawldb:status:db_redir_temp\", \"CC-MAIN-2024-33\"]\t227573613\n[\"crawl_status\", \"crawldb:status:db_redir_perm\", \"CC-MAIN-2024-33\"]\t405721294\n[\"crawl_status\", \"crawldb:status:db_notmodified\", \"CC-MAIN-2024-33\"]\t617892977\n[\"crawl_status\", \"crawldb:status:db_duplicate\", \"CC-MAIN-2024-33\"]\t1193245940\n[\"crawl_status\", \"crawldb:status:db_orphan\", \"CC-MAIN-2024-33\"]\t190303905\n"
  },
  {
    "path": "stats/crawler/CC-MAIN-2024-38.json",
    "content": "[\"crawl_status\", \"generator:crawldb_size\", \"CC-MAIN-2024-38\"]\t23533999592\n[\"crawl_status\", \"generator:fetch_list\", \"CC-MAIN-2024-38\"]\t3670177067\n[\"crawl_status\", \"generator:selected:db_duplicate\", \"CC-MAIN-2024-38\"]\t7416622\n[\"crawl_status\", \"generator:selected:db_fetched\", \"CC-MAIN-2024-38\"]\t2196208122\n[\"crawl_status\", \"generator:selected:db_gone\", \"CC-MAIN-2024-38\"]\t3232726\n[\"crawl_status\", \"generator:selected:db_notmodified\", \"CC-MAIN-2024-38\"]\t25013686\n[\"crawl_status\", \"generator:selected:db_orphan\", \"CC-MAIN-2024-38\"]\t1400\n[\"crawl_status\", \"generator:selected:db_redir_perm\", \"CC-MAIN-2024-38\"]\t12023407\n[\"crawl_status\", \"generator:selected:db_redir_temp\", \"CC-MAIN-2024-38\"]\t8994921\n[\"crawl_status\", \"generator:selected:db_unfetched\", \"CC-MAIN-2024-38\"]\t1417286183\n[\"crawl_status\", \"generator:skipped_domains_overflow\", \"CC-MAIN-2024-38\"]\t62181\n[\"crawl_status\", \"fetcher:total\", \"CC-MAIN-2024-38\"]\t3906633226\n[\"crawl_status\", \"fetcher:success\", \"CC-MAIN-2024-38\"]\t2814337832\n[\"crawl_status\", \"fetcher:notmodified\", \"CC-MAIN-2024-38\"]\t22219235\n[\"crawl_status\", \"fetcher:temp_moved\", \"CC-MAIN-2024-38\"]\t83061425\n[\"crawl_status\", \"fetcher:moved\", \"CC-MAIN-2024-38\"]\t159498201\n[\"crawl_status\", \"fetcher:notfound\", \"CC-MAIN-2024-38\"]\t128607565\n[\"crawl_status\", \"fetcher:access_denied\", \"CC-MAIN-2024-38\"]\t3612417\n[\"crawl_status\", \"fetcher:gone\", \"CC-MAIN-2024-38\"]\t5794636\n[\"crawl_status\", \"fetcher:exception\", \"CC-MAIN-2024-38\"]\t55494476\n[\"crawl_status\", \"fetcher:robots_denied\", \"CC-MAIN-2024-38\"]\t158606948\n[\"crawl_status\", \"fetcher:robots_denied_maxcrawldelay\", \"CC-MAIN-2024-38\"]\t45045\n[\"crawl_status\", \"fetcher:robots_defer_visits_dropped\", \"CC-MAIN-2024-38\"]\t136521\n[\"crawl_status\", \"fetcher:redirect_count_exceeded\", \"CC-MAIN-2024-38\"]\t658021\n[\"crawl_status\", 
\"fetcher:redirect_deduplicated\", \"CC-MAIN-2024-38\"]\t38837024\n[\"crawl_status\", \"fetcher:hitByThrougputThreshold\", \"CC-MAIN-2024-38\"]\t77871108\n[\"crawl_status\", \"fetcher:hitByTimeLimit\", \"CC-MAIN-2024-38\"]\t47815821\n[\"crawl_status\", \"fetcher:AboveExceptionThresholdInQueue\", \"CC-MAIN-2024-38\"]\t310036519\n[\"crawl_status\", \"fetcher:hungThreads\", \"CC-MAIN-2024-38\"]\t429\n[\"crawl_status\", \"fetcher:hitByTimeout\", \"CC-MAIN-2024-38\"]\t3\n[\"crawl_status\", \"fetcher:bytes_downloaded\", \"CC-MAIN-2024-38\"]\t451968999449777\n[\"crawl_status\", \"crawldb:size\", \"CC-MAIN-2024-38\"]\t23533999592\n[\"crawl_status\", \"crawldb:status:db_unfetched\", \"CC-MAIN-2024-38\"]\t5106119664\n[\"crawl_status\", \"crawldb:status:db_fetched\", \"CC-MAIN-2024-38\"]\t13241003714\n[\"crawl_status\", \"crawldb:status:db_gone\", \"CC-MAIN-2024-38\"]\t1419137622\n[\"crawl_status\", \"crawldb:status:db_redir_temp\", \"CC-MAIN-2024-38\"]\t253805791\n[\"crawl_status\", \"crawldb:status:db_redir_perm\", \"CC-MAIN-2024-38\"]\t449464374\n[\"crawl_status\", \"crawldb:status:db_notmodified\", \"CC-MAIN-2024-38\"]\t664116892\n[\"crawl_status\", \"crawldb:status:db_duplicate\", \"CC-MAIN-2024-38\"]\t1157710667\n[\"crawl_status\", \"crawldb:status:db_orphan\", \"CC-MAIN-2024-38\"]\t1242640868\n"
  },
  {
    "path": "stats/crawler/CC-MAIN-2024-42.json",
    "content": "[\"crawl_status\", \"generator:crawldb_size\", \"CC-MAIN-2024-42\"]\t24237973275\n[\"crawl_status\", \"generator:fetch_list\", \"CC-MAIN-2024-42\"]\t3292436854\n[\"crawl_status\", \"generator:selected:db_duplicate\", \"CC-MAIN-2024-42\"]\t6742974\n[\"crawl_status\", \"generator:selected:db_fetched\", \"CC-MAIN-2024-42\"]\t1774892279\n[\"crawl_status\", \"generator:selected:db_gone\", \"CC-MAIN-2024-42\"]\t2888958\n[\"crawl_status\", \"generator:selected:db_notmodified\", \"CC-MAIN-2024-42\"]\t22627937\n[\"crawl_status\", \"generator:selected:db_orphan\", \"CC-MAIN-2024-42\"]\t327\n[\"crawl_status\", \"generator:selected:db_redir_perm\", \"CC-MAIN-2024-42\"]\t11225341\n[\"crawl_status\", \"generator:selected:db_redir_temp\", \"CC-MAIN-2024-42\"]\t8902518\n[\"crawl_status\", \"generator:selected:db_unfetched\", \"CC-MAIN-2024-42\"]\t1465156520\n[\"crawl_status\", \"generator:skipped_domains_overflow\", \"CC-MAIN-2024-42\"]\t58261\n[\"crawl_status\", \"fetcher:total\", \"CC-MAIN-2024-42\"]\t3523794847\n[\"crawl_status\", \"fetcher:success\", \"CC-MAIN-2024-42\"]\t2507916084\n[\"crawl_status\", \"fetcher:notmodified\", \"CC-MAIN-2024-42\"]\t18756995\n[\"crawl_status\", \"fetcher:temp_moved\", \"CC-MAIN-2024-42\"]\t86224578\n[\"crawl_status\", \"fetcher:moved\", \"CC-MAIN-2024-42\"]\t152856477\n[\"crawl_status\", \"fetcher:notfound\", \"CC-MAIN-2024-42\"]\t118545289\n[\"crawl_status\", \"fetcher:access_denied\", \"CC-MAIN-2024-42\"]\t2443649\n[\"crawl_status\", \"fetcher:gone\", \"CC-MAIN-2024-42\"]\t6056729\n[\"crawl_status\", \"fetcher:exception\", \"CC-MAIN-2024-42\"]\t52260074\n[\"crawl_status\", \"fetcher:robots_denied\", \"CC-MAIN-2024-42\"]\t155472674\n[\"crawl_status\", \"fetcher:robots_denied_maxcrawldelay\", \"CC-MAIN-2024-42\"]\t47392\n[\"crawl_status\", \"fetcher:robots_defer_visits_dropped\", \"CC-MAIN-2024-42\"]\t128440\n[\"crawl_status\", \"fetcher:redirect_count_exceeded\", \"CC-MAIN-2024-42\"]\t654706\n[\"crawl_status\", 
\"fetcher:redirect_deduplicated\", \"CC-MAIN-2024-42\"]\t39256831\n[\"crawl_status\", \"fetcher:hitByThrougputThreshold\", \"CC-MAIN-2024-42\"]\t96186457\n[\"crawl_status\", \"fetcher:hitByTimeLimit\", \"CC-MAIN-2024-42\"]\t478914\n[\"crawl_status\", \"fetcher:AboveExceptionThresholdInQueue\", \"CC-MAIN-2024-42\"]\t286509247\n[\"crawl_status\", \"fetcher:hungThreads\", \"CC-MAIN-2024-42\"]\t311\n[\"crawl_status\", \"fetcher:hitByTimeout\", \"CC-MAIN-2024-42\"]\t0\n[\"crawl_status\", \"fetcher:bytes_downloaded\", \"CC-MAIN-2024-42\"]\t401984660089088\n[\"crawl_status\", \"crawldb:size\", \"CC-MAIN-2024-42\"]\t24237973275\n[\"crawl_status\", \"crawldb:status:db_unfetched\", \"CC-MAIN-2024-42\"]\t5152497140\n[\"crawl_status\", \"crawldb:status:db_fetched\", \"CC-MAIN-2024-42\"]\t13898419172\n[\"crawl_status\", \"crawldb:status:db_gone\", \"CC-MAIN-2024-42\"]\t1642409652\n[\"crawl_status\", \"crawldb:status:db_redir_temp\", \"CC-MAIN-2024-42\"]\t281783251\n[\"crawl_status\", \"crawldb:status:db_redir_perm\", \"CC-MAIN-2024-42\"]\t502068203\n[\"crawl_status\", \"crawldb:status:db_notmodified\", \"CC-MAIN-2024-42\"]\t729163712\n[\"crawl_status\", \"crawldb:status:db_duplicate\", \"CC-MAIN-2024-42\"]\t1285823315\n[\"crawl_status\", \"crawldb:status:db_orphan\", \"CC-MAIN-2024-42\"]\t745808830\n"
  },
  {
    "path": "stats/crawler/CC-MAIN-2024-46.json",
    "content": "[\"crawl_status\", \"generator:crawldb_size\", \"CC-MAIN-2024-46\"]\t25404964414\n[\"crawl_status\", \"generator:fetch_list\", \"CC-MAIN-2024-46\"]\t3512067777\n[\"crawl_status\", \"generator:selected:db_duplicate\", \"CC-MAIN-2024-46\"]\t6849308\n[\"crawl_status\", \"generator:selected:db_fetched\", \"CC-MAIN-2024-46\"]\t2005670110\n[\"crawl_status\", \"generator:selected:db_gone\", \"CC-MAIN-2024-46\"]\t2897199\n[\"crawl_status\", \"generator:selected:db_notmodified\", \"CC-MAIN-2024-46\"]\t21221965\n[\"crawl_status\", \"generator:selected:db_orphan\", \"CC-MAIN-2024-46\"]\t3389\n[\"crawl_status\", \"generator:selected:db_redir_perm\", \"CC-MAIN-2024-46\"]\t11175645\n[\"crawl_status\", \"generator:selected:db_redir_temp\", \"CC-MAIN-2024-46\"]\t9615362\n[\"crawl_status\", \"generator:selected:db_unfetched\", \"CC-MAIN-2024-46\"]\t1454634799\n[\"crawl_status\", \"generator:skipped_domains_overflow\", \"CC-MAIN-2024-46\"]\t60748\n[\"crawl_status\", \"fetcher:total\", \"CC-MAIN-2024-46\"]\t3738908543\n[\"crawl_status\", \"fetcher:success\", \"CC-MAIN-2024-46\"]\t2700111429\n[\"crawl_status\", \"fetcher:notmodified\", \"CC-MAIN-2024-46\"]\t20927775\n[\"crawl_status\", \"fetcher:temp_moved\", \"CC-MAIN-2024-46\"]\t85756414\n[\"crawl_status\", \"fetcher:moved\", \"CC-MAIN-2024-46\"]\t147889477\n[\"crawl_status\", \"fetcher:notfound\", \"CC-MAIN-2024-46\"]\t122772755\n[\"crawl_status\", \"fetcher:access_denied\", \"CC-MAIN-2024-46\"]\t2338501\n[\"crawl_status\", \"fetcher:gone\", \"CC-MAIN-2024-46\"]\t5893741\n[\"crawl_status\", \"fetcher:exception\", \"CC-MAIN-2024-46\"]\t53535084\n[\"crawl_status\", \"fetcher:robots_denied\", \"CC-MAIN-2024-46\"]\t151620445\n[\"crawl_status\", \"fetcher:robots_denied_maxcrawldelay\", \"CC-MAIN-2024-46\"]\t45845\n[\"crawl_status\", \"fetcher:robots_defer_visits_dropped\", \"CC-MAIN-2024-46\"]\t137503\n[\"crawl_status\", \"fetcher:filtered\", \"CC-MAIN-2024-46\"]\t1114798\n[\"crawl_status\", 
\"fetcher:redirect_count_exceeded\", \"CC-MAIN-2024-46\"]\t592057\n[\"crawl_status\", \"fetcher:redirect_deduplicated\", \"CC-MAIN-2024-46\"]\t39741414\n[\"crawl_status\", \"fetcher:hitByThrougputThreshold\", \"CC-MAIN-2024-46\"]\t75758429\n[\"crawl_status\", \"fetcher:hitByTimeLimit\", \"CC-MAIN-2024-46\"]\t16196074\n[\"crawl_status\", \"fetcher:AboveExceptionThresholdInQueue\", \"CC-MAIN-2024-46\"]\t311643790\n[\"crawl_status\", \"fetcher:hungThreads\", \"CC-MAIN-2024-46\"]\t610\n[\"crawl_status\", \"fetcher:hitByTimeout\", \"CC-MAIN-2024-46\"]\t0\n[\"crawl_status\", \"fetcher:bytes_downloaded\", \"CC-MAIN-2024-46\"]\t445559626171254\n[\"crawl_status\", \"crawldb:size\", \"CC-MAIN-2024-46\"]\t25404964414\n[\"crawl_status\", \"crawldb:status:db_unfetched\", \"CC-MAIN-2024-46\"]\t5121780466\n[\"crawl_status\", \"crawldb:status:db_fetched\", \"CC-MAIN-2024-46\"]\t13956219266\n[\"crawl_status\", \"crawldb:status:db_gone\", \"CC-MAIN-2024-46\"]\t1866571677\n[\"crawl_status\", \"crawldb:status:db_redir_temp\", \"CC-MAIN-2024-46\"]\t275776016\n[\"crawl_status\", \"crawldb:status:db_redir_perm\", \"CC-MAIN-2024-46\"]\t476792662\n[\"crawl_status\", \"crawldb:status:db_notmodified\", \"CC-MAIN-2024-46\"]\t728257961\n[\"crawl_status\", \"crawldb:status:db_duplicate\", \"CC-MAIN-2024-46\"]\t1417321521\n[\"crawl_status\", \"crawldb:status:db_orphan\", \"CC-MAIN-2024-46\"]\t1562244845\n"
  },
  {
    "path": "stats/crawler/CC-MAIN-2024-51.json",
    "content": "[\"crawl_status\", \"generator:crawldb_size\", \"CC-MAIN-2024-51\"]\t25915332801\n[\"crawl_status\", \"generator:fetch_list\", \"CC-MAIN-2024-51\"]\t3500310083\n[\"crawl_status\", \"generator:selected:db_duplicate\", \"CC-MAIN-2024-51\"]\t6557151\n[\"crawl_status\", \"generator:selected:db_fetched\", \"CC-MAIN-2024-51\"]\t1897558478\n[\"crawl_status\", \"generator:selected:db_gone\", \"CC-MAIN-2024-51\"]\t2692958\n[\"crawl_status\", \"generator:selected:db_notmodified\", \"CC-MAIN-2024-51\"]\t19405097\n[\"crawl_status\", \"generator:selected:db_orphan\", \"CC-MAIN-2024-51\"]\t634\n[\"crawl_status\", \"generator:selected:db_redir_perm\", \"CC-MAIN-2024-51\"]\t13011806\n[\"crawl_status\", \"generator:selected:db_redir_temp\", \"CC-MAIN-2024-51\"]\t11038630\n[\"crawl_status\", \"generator:selected:db_unfetched\", \"CC-MAIN-2024-51\"]\t1550045329\n[\"crawl_status\", \"generator:skipped_domains_overflow\", \"CC-MAIN-2024-51\"]\t67914\n[\"crawl_status\", \"fetcher:total\", \"CC-MAIN-2024-51\"]\t3740993208\n[\"crawl_status\", \"fetcher:success\", \"CC-MAIN-2024-51\"]\t2647896043\n[\"crawl_status\", \"fetcher:notmodified\", \"CC-MAIN-2024-51\"]\t18846576\n[\"crawl_status\", \"fetcher:temp_moved\", \"CC-MAIN-2024-51\"]\t91624691\n[\"crawl_status\", \"fetcher:moved\", \"CC-MAIN-2024-51\"]\t156560742\n[\"crawl_status\", \"fetcher:notfound\", \"CC-MAIN-2024-51\"]\t129557641\n[\"crawl_status\", \"fetcher:access_denied\", \"CC-MAIN-2024-51\"]\t2021905\n[\"crawl_status\", \"fetcher:gone\", \"CC-MAIN-2024-51\"]\t6036585\n[\"crawl_status\", \"fetcher:exception\", \"CC-MAIN-2024-51\"]\t53948375\n[\"crawl_status\", \"fetcher:robots_denied\", \"CC-MAIN-2024-51\"]\t170882396\n[\"crawl_status\", \"fetcher:robots_denied_maxcrawldelay\", \"CC-MAIN-2024-51\"]\t31812\n[\"crawl_status\", \"fetcher:robots_defer_visits_dropped\", \"CC-MAIN-2024-51\"]\t131038\n[\"crawl_status\", \"fetcher:redirect_count_exceeded\", \"CC-MAIN-2024-51\"]\t587568\n[\"crawl_status\", 
\"fetcher:redirect_deduplicated\", \"CC-MAIN-2024-51\"]\t42455390\n[\"crawl_status\", \"fetcher:hitByThrougputThreshold\", \"CC-MAIN-2024-51\"]\t86349929\n[\"crawl_status\", \"fetcher:hitByTimeLimit\", \"CC-MAIN-2024-51\"]\t8756973\n[\"crawl_status\", \"fetcher:AboveExceptionThresholdInQueue\", \"CC-MAIN-2024-51\"]\t325304199\n[\"crawl_status\", \"fetcher:hungThreads\", \"CC-MAIN-2024-51\"]\t1345\n[\"crawl_status\", \"fetcher:hitByTimeout\", \"CC-MAIN-2024-51\"]\t0\n[\"crawl_status\", \"fetcher:bytes_downloaded\", \"CC-MAIN-2024-51\"]\t433261745132066\n[\"crawl_status\", \"crawldb:size\", \"CC-MAIN-2024-51\"]\t25915332801\n[\"crawl_status\", \"crawldb:status:db_unfetched\", \"CC-MAIN-2024-51\"]\t5281987216\n[\"crawl_status\", \"crawldb:status:db_fetched\", \"CC-MAIN-2024-51\"]\t14665098080\n[\"crawl_status\", \"crawldb:status:db_gone\", \"CC-MAIN-2024-51\"]\t1803846525\n[\"crawl_status\", \"crawldb:status:db_redir_temp\", \"CC-MAIN-2024-51\"]\t303994365\n[\"crawl_status\", \"crawldb:status:db_redir_perm\", \"CC-MAIN-2024-51\"]\t527028820\n[\"crawl_status\", \"crawldb:status:db_notmodified\", \"CC-MAIN-2024-51\"]\t798249687\n[\"crawl_status\", \"crawldb:status:db_duplicate\", \"CC-MAIN-2024-51\"]\t1382571195\n[\"crawl_status\", \"crawldb:status:db_orphan\", \"CC-MAIN-2024-51\"]\t1152556913\n"
  },
  {
    "path": "stats/crawler/CC-MAIN-2025-05.json",
    "content": "[\"crawl_status\", \"generator:crawldb_size\", \"CC-MAIN-2025-05\"]\t26857631748\n[\"crawl_status\", \"generator:fetch_list\", \"CC-MAIN-2025-05\"]\t3969936359\n[\"crawl_status\", \"generator:selected:db_duplicate\", \"CC-MAIN-2025-05\"]\t7048847\n[\"crawl_status\", \"generator:selected:db_fetched\", \"CC-MAIN-2025-05\"]\t2391192098\n[\"crawl_status\", \"generator:selected:db_gone\", \"CC-MAIN-2025-05\"]\t2770975\n[\"crawl_status\", \"generator:selected:db_notmodified\", \"CC-MAIN-2025-05\"]\t18612116\n[\"crawl_status\", \"generator:selected:db_orphan\", \"CC-MAIN-2025-05\"]\t4333\n[\"crawl_status\", \"generator:selected:db_redir_perm\", \"CC-MAIN-2025-05\"]\t15011580\n[\"crawl_status\", \"generator:selected:db_redir_temp\", \"CC-MAIN-2025-05\"]\t12477127\n[\"crawl_status\", \"generator:selected:db_unfetched\", \"CC-MAIN-2025-05\"]\t1522819283\n[\"crawl_status\", \"generator:skipped_domains_overflow\", \"CC-MAIN-2025-05\"]\t74183\n[\"crawl_status\", \"fetcher:total\", \"CC-MAIN-2025-05\"]\t4226325712\n[\"crawl_status\", \"fetcher:success\", \"CC-MAIN-2025-05\"]\t3044851336\n[\"crawl_status\", \"fetcher:notmodified\", \"CC-MAIN-2025-05\"]\t21395704\n[\"crawl_status\", \"fetcher:temp_moved\", \"CC-MAIN-2025-05\"]\t94101595\n[\"crawl_status\", \"fetcher:moved\", \"CC-MAIN-2025-05\"]\t169875096\n[\"crawl_status\", \"fetcher:notfound\", \"CC-MAIN-2025-05\"]\t148517681\n[\"crawl_status\", \"fetcher:access_denied\", \"CC-MAIN-2025-05\"]\t2000487\n[\"crawl_status\", \"fetcher:gone\", \"CC-MAIN-2025-05\"]\t5595061\n[\"crawl_status\", \"fetcher:exception\", \"CC-MAIN-2025-05\"]\t56594924\n[\"crawl_status\", \"fetcher:robots_denied\", \"CC-MAIN-2025-05\"]\t176545258\n[\"crawl_status\", \"fetcher:robots_denied_maxcrawldelay\", \"CC-MAIN-2025-05\"]\t36098\n[\"crawl_status\", \"fetcher:robots_defer_visits_dropped\", \"CC-MAIN-2025-05\"]\t233685\n[\"crawl_status\", \"fetcher:redirect_count_exceeded\", \"CC-MAIN-2025-05\"]\t627283\n[\"crawl_status\", 
\"fetcher:redirect_deduplicated\", \"CC-MAIN-2025-05\"]\t46468592\n[\"crawl_status\", \"fetcher:hitByThrougputThreshold\", \"CC-MAIN-2025-05\"]\t19710199\n[\"crawl_status\", \"fetcher:hitByTimeLimit\", \"CC-MAIN-2025-05\"]\t89660690\n[\"crawl_status\", \"fetcher:AboveExceptionThresholdInQueue\", \"CC-MAIN-2025-05\"]\t350110057\n[\"crawl_status\", \"fetcher:hungThreads\", \"CC-MAIN-2025-05\"]\t1966\n[\"crawl_status\", \"fetcher:hitByTimeout\", \"CC-MAIN-2025-05\"]\t0\n[\"crawl_status\", \"fetcher:bytes_downloaded\", \"CC-MAIN-2025-05\"]\t511103974602780\n[\"crawl_status\", \"crawldb:size\", \"CC-MAIN-2025-05\"]\t26857631748\n[\"crawl_status\", \"crawldb:status:db_unfetched\", \"CC-MAIN-2025-05\"]\t4739528195\n[\"crawl_status\", \"crawldb:status:db_fetched\", \"CC-MAIN-2025-05\"]\t14798867981\n[\"crawl_status\", \"crawldb:status:db_gone\", \"CC-MAIN-2025-05\"]\t1802893497\n[\"crawl_status\", \"crawldb:status:db_redir_temp\", \"CC-MAIN-2025-05\"]\t301391293\n[\"crawl_status\", \"crawldb:status:db_redir_perm\", \"CC-MAIN-2025-05\"]\t517664635\n[\"crawl_status\", \"crawldb:status:db_notmodified\", \"CC-MAIN-2025-05\"]\t811352596\n[\"crawl_status\", \"crawldb:status:db_duplicate\", \"CC-MAIN-2025-05\"]\t1378616558\n[\"crawl_status\", \"crawldb:status:db_orphan\", \"CC-MAIN-2025-05\"]\t2507316993\n"
  },
  {
    "path": "stats/crawler/CC-MAIN-2025-08.json",
    "content": "[\"crawl_status\", \"generator:crawldb_size\", \"CC-MAIN-2025-08\"]\t26387970898\n[\"crawl_status\", \"generator:fetch_list\", \"CC-MAIN-2025-08\"]\t3634095214\n[\"crawl_status\", \"generator:selected:db_duplicate\", \"CC-MAIN-2025-08\"]\t7202838\n[\"crawl_status\", \"generator:selected:db_fetched\", \"CC-MAIN-2025-08\"]\t2107453831\n[\"crawl_status\", \"generator:selected:db_gone\", \"CC-MAIN-2025-08\"]\t2670474\n[\"crawl_status\", \"generator:selected:db_notmodified\", \"CC-MAIN-2025-08\"]\t16939086\n[\"crawl_status\", \"generator:selected:db_orphan\", \"CC-MAIN-2025-08\"]\t2493\n[\"crawl_status\", \"generator:selected:db_redir_perm\", \"CC-MAIN-2025-08\"]\t16791704\n[\"crawl_status\", \"generator:selected:db_redir_temp\", \"CC-MAIN-2025-08\"]\t12257849\n[\"crawl_status\", \"generator:selected:db_unfetched\", \"CC-MAIN-2025-08\"]\t1470776939\n[\"crawl_status\", \"generator:skipped_domains_overflow\", \"CC-MAIN-2025-08\"]\t71139\n[\"crawl_status\", \"fetcher:total\", \"CC-MAIN-2025-08\"]\t3887374247\n[\"crawl_status\", \"fetcher:success\", \"CC-MAIN-2025-08\"]\t2692264061\n[\"crawl_status\", \"fetcher:notmodified\", \"CC-MAIN-2025-08\"]\t19791265\n[\"crawl_status\", \"fetcher:temp_moved\", \"CC-MAIN-2025-08\"]\t90262665\n[\"crawl_status\", \"fetcher:moved\", \"CC-MAIN-2025-08\"]\t168565767\n[\"crawl_status\", \"fetcher:notfound\", \"CC-MAIN-2025-08\"]\t146493055\n[\"crawl_status\", \"fetcher:access_denied\", \"CC-MAIN-2025-08\"]\t1910573\n[\"crawl_status\", \"fetcher:gone\", \"CC-MAIN-2025-08\"]\t5864293\n[\"crawl_status\", \"fetcher:exception\", \"CC-MAIN-2025-08\"]\t55700117\n[\"crawl_status\", \"fetcher:robots_denied\", \"CC-MAIN-2025-08\"]\t186368376\n[\"crawl_status\", \"fetcher:robots_denied_maxcrawldelay\", \"CC-MAIN-2025-08\"]\t50324\n[\"crawl_status\", \"fetcher:robots_defer_visits_dropped\", \"CC-MAIN-2025-08\"]\t160671\n[\"crawl_status\", \"fetcher:filtered\", \"CC-MAIN-2025-08\"]\t62155\n[\"crawl_status\", 
\"fetcher:redirect_count_exceeded\", \"CC-MAIN-2025-08\"]\t583302\n[\"crawl_status\", \"fetcher:redirect_deduplicated\", \"CC-MAIN-2025-08\"]\t44927424\n[\"crawl_status\", \"fetcher:hitByThrougputThreshold\", \"CC-MAIN-2025-08\"]\t55602374\n[\"crawl_status\", \"fetcher:hitByTimeLimit\", \"CC-MAIN-2025-08\"]\t43608395\n[\"crawl_status\", \"fetcher:AboveExceptionThresholdInQueue\", \"CC-MAIN-2025-08\"]\t375157438\n[\"crawl_status\", \"fetcher:hungThreads\", \"CC-MAIN-2025-08\"]\t1992\n[\"crawl_status\", \"fetcher:hitByTimeout\", \"CC-MAIN-2025-08\"]\t0\n[\"crawl_status\", \"fetcher:bytes_downloaded\", \"CC-MAIN-2025-08\"]\t442803995079285\n[\"crawl_status\", \"crawldb:size\", \"CC-MAIN-2025-08\"]\t26387970898\n[\"crawl_status\", \"crawldb:status:db_unfetched\", \"CC-MAIN-2025-08\"]\t4772126983\n[\"crawl_status\", \"crawldb:status:db_fetched\", \"CC-MAIN-2025-08\"]\t15491343288\n[\"crawl_status\", \"crawldb:status:db_gone\", \"CC-MAIN-2025-08\"]\t2078247255\n[\"crawl_status\", \"crawldb:status:db_redir_temp\", \"CC-MAIN-2025-08\"]\t300226772\n[\"crawl_status\", \"crawldb:status:db_redir_perm\", \"CC-MAIN-2025-08\"]\t528602232\n[\"crawl_status\", \"crawldb:status:db_notmodified\", \"CC-MAIN-2025-08\"]\t873604787\n[\"crawl_status\", \"crawldb:status:db_duplicate\", \"CC-MAIN-2025-08\"]\t1520464156\n[\"crawl_status\", \"crawldb:status:db_orphan\", \"CC-MAIN-2025-08\"]\t823355425\n"
  },
  {
    "path": "stats/crawler/CC-MAIN-2025-13.json",
    "content": "[\"crawl_status\", \"generator:crawldb_size\", \"CC-MAIN-2025-13\"]\t27837493836\n[\"crawl_status\", \"generator:fetch_list\", \"CC-MAIN-2025-13\"]\t3762533233\n[\"crawl_status\", \"generator:selected:db_duplicate\", \"CC-MAIN-2025-13\"]\t7352740\n[\"crawl_status\", \"generator:selected:db_fetched\", \"CC-MAIN-2025-13\"]\t2175066839\n[\"crawl_status\", \"generator:selected:db_gone\", \"CC-MAIN-2025-13\"]\t2671042\n[\"crawl_status\", \"generator:selected:db_notmodified\", \"CC-MAIN-2025-13\"]\t17067603\n[\"crawl_status\", \"generator:selected:db_orphan\", \"CC-MAIN-2025-13\"]\t3047\n[\"crawl_status\", \"generator:selected:db_redir_perm\", \"CC-MAIN-2025-13\"]\t15918436\n[\"crawl_status\", \"generator:selected:db_redir_temp\", \"CC-MAIN-2025-13\"]\t11127234\n[\"crawl_status\", \"generator:selected:db_unfetched\", \"CC-MAIN-2025-13\"]\t1533326292\n[\"crawl_status\", \"generator:skipped_domains_overflow\", \"CC-MAIN-2025-13\"]\t78940\n[\"crawl_status\", \"fetcher:total\", \"CC-MAIN-2025-13\"]\t4020443907\n[\"crawl_status\", \"fetcher:success\", \"CC-MAIN-2025-13\"]\t2753538967\n[\"crawl_status\", \"fetcher:notmodified\", \"CC-MAIN-2025-13\"]\t21090585\n[\"crawl_status\", \"fetcher:temp_moved\", \"CC-MAIN-2025-13\"]\t89599285\n[\"crawl_status\", \"fetcher:moved\", \"CC-MAIN-2025-13\"]\t174585378\n[\"crawl_status\", \"fetcher:notfound\", \"CC-MAIN-2025-13\"]\t150360083\n[\"crawl_status\", \"fetcher:access_denied\", \"CC-MAIN-2025-13\"]\t2472593\n[\"crawl_status\", \"fetcher:gone\", \"CC-MAIN-2025-13\"]\t7134471\n[\"crawl_status\", \"fetcher:exception\", \"CC-MAIN-2025-13\"]\t59555454\n[\"crawl_status\", \"fetcher:robots_denied\", \"CC-MAIN-2025-13\"]\t169830613\n[\"crawl_status\", \"fetcher:robots_denied_maxcrawldelay\", \"CC-MAIN-2025-13\"]\t50243\n[\"crawl_status\", \"fetcher:robots_defer_visits_dropped\", \"CC-MAIN-2025-13\"]\t192917\n[\"crawl_status\", \"fetcher:filtered\", \"CC-MAIN-2025-13\"]\t174511\n[\"crawl_status\", 
\"fetcher:redirect_count_exceeded\", \"CC-MAIN-2025-13\"]\t642349\n[\"crawl_status\", \"fetcher:redirect_deduplicated\", \"CC-MAIN-2025-13\"]\t46851207\n[\"crawl_status\", \"fetcher:hitByThrougputThreshold\", \"CC-MAIN-2025-13\"]\t75320089\n[\"crawl_status\", \"fetcher:hitByTimeLimit\", \"CC-MAIN-2025-13\"]\t40630564\n[\"crawl_status\", \"fetcher:AboveExceptionThresholdInQueue\", \"CC-MAIN-2025-13\"]\t428413094\n[\"crawl_status\", \"fetcher:hungThreads\", \"CC-MAIN-2025-13\"]\t1504\n[\"crawl_status\", \"fetcher:hitByTimeout\", \"CC-MAIN-2025-13\"]\t0\n[\"crawl_status\", \"fetcher:bytes_downloaded\", \"CC-MAIN-2025-13\"]\t500840275974825\n[\"crawl_status\", \"crawldb:size\", \"CC-MAIN-2025-13\"]\t27837493836\n[\"crawl_status\", \"crawldb:status:db_unfetched\", \"CC-MAIN-2025-13\"]\t5086663863\n[\"crawl_status\", \"crawldb:status:db_fetched\", \"CC-MAIN-2025-13\"]\t15560968244\n[\"crawl_status\", \"crawldb:status:db_gone\", \"CC-MAIN-2025-13\"]\t1909299987\n[\"crawl_status\", \"crawldb:status:db_redir_temp\", \"CC-MAIN-2025-13\"]\t270210478\n[\"crawl_status\", \"crawldb:status:db_redir_perm\", \"CC-MAIN-2025-13\"]\t477359785\n[\"crawl_status\", \"crawldb:status:db_notmodified\", \"CC-MAIN-2025-13\"]\t886726630\n[\"crawl_status\", \"crawldb:status:db_duplicate\", \"CC-MAIN-2025-13\"]\t1427157028\n[\"crawl_status\", \"crawldb:status:db_orphan\", \"CC-MAIN-2025-13\"]\t2219107821\n"
  },
  {
    "path": "stats/crawler/CC-MAIN-2025-18.json",
    "content": "[\"crawl_status\", \"generator:crawldb_size\", \"CC-MAIN-2025-18\"]\t27638605242\n[\"crawl_status\", \"generator:fetch_list\", \"CC-MAIN-2025-18\"]\t3785072639\n[\"crawl_status\", \"generator:selected:db_duplicate\", \"CC-MAIN-2025-18\"]\t7413929\n[\"crawl_status\", \"generator:selected:db_fetched\", \"CC-MAIN-2025-18\"]\t2311831201\n[\"crawl_status\", \"generator:selected:db_gone\", \"CC-MAIN-2025-18\"]\t2619585\n[\"crawl_status\", \"generator:selected:db_notmodified\", \"CC-MAIN-2025-18\"]\t17053825\n[\"crawl_status\", \"generator:selected:db_orphan\", \"CC-MAIN-2025-18\"]\t3547\n[\"crawl_status\", \"generator:selected:db_redir_perm\", \"CC-MAIN-2025-18\"]\t17856708\n[\"crawl_status\", \"generator:selected:db_redir_temp\", \"CC-MAIN-2025-18\"]\t12238400\n[\"crawl_status\", \"generator:selected:db_unfetched\", \"CC-MAIN-2025-18\"]\t1416055444\n[\"crawl_status\", \"generator:skipped_domains_overflow\", \"CC-MAIN-2025-18\"]\t73807\n[\"crawl_status\", \"fetcher:total\", \"CC-MAIN-2025-18\"]\t4047863325\n[\"crawl_status\", \"fetcher:success\", \"CC-MAIN-2025-18\"]\t2760301059\n[\"crawl_status\", \"fetcher:notmodified\", \"CC-MAIN-2025-18\"]\t20491145\n[\"crawl_status\", \"fetcher:temp_moved\", \"CC-MAIN-2025-18\"]\t90978628\n[\"crawl_status\", \"fetcher:moved\", \"CC-MAIN-2025-18\"]\t177875606\n[\"crawl_status\", \"fetcher:notfound\", \"CC-MAIN-2025-18\"]\t150599016\n[\"crawl_status\", \"fetcher:access_denied\", \"CC-MAIN-2025-18\"]\t2372653\n[\"crawl_status\", \"fetcher:gone\", \"CC-MAIN-2025-18\"]\t7883330\n[\"crawl_status\", \"fetcher:exception\", \"CC-MAIN-2025-18\"]\t60052965\n[\"crawl_status\", \"fetcher:robots_denied\", \"CC-MAIN-2025-18\"]\t184069115\n[\"crawl_status\", \"fetcher:robots_denied_maxcrawldelay\", \"CC-MAIN-2025-18\"]\t42250\n[\"crawl_status\", \"fetcher:robots_defer_visits_dropped\", \"CC-MAIN-2025-18\"]\t198920\n[\"crawl_status\", \"fetcher:filtered\", \"CC-MAIN-2025-18\"]\t20682\n[\"crawl_status\", 
\"fetcher:redirect_count_exceeded\", \"CC-MAIN-2025-18\"]\t620823\n[\"crawl_status\", \"fetcher:redirect_deduplicated\", \"CC-MAIN-2025-18\"]\t48674329\n[\"crawl_status\", \"fetcher:hitByThrougputThreshold\", \"CC-MAIN-2025-18\"]\t71691306\n[\"crawl_status\", \"fetcher:hitByTimeLimit\", \"CC-MAIN-2025-18\"]\t26073754\n[\"crawl_status\", \"fetcher:AboveExceptionThresholdInQueue\", \"CC-MAIN-2025-18\"]\t445915512\n[\"crawl_status\", \"fetcher:hungThreads\", \"CC-MAIN-2025-18\"]\t2232\n[\"crawl_status\", \"fetcher:hitByTimeout\", \"CC-MAIN-2025-18\"]\t0\n[\"crawl_status\", \"fetcher:bytes_downloaded\", \"CC-MAIN-2025-18\"]\t514885469890832\n[\"crawl_status\", \"crawldb:size\", \"CC-MAIN-2025-18\"]\t27638605242\n[\"crawl_status\", \"crawldb:status:db_unfetched\", \"CC-MAIN-2025-18\"]\t5032944919\n[\"crawl_status\", \"crawldb:status:db_fetched\", \"CC-MAIN-2025-18\"]\t16247616732\n[\"crawl_status\", \"crawldb:status:db_gone\", \"CC-MAIN-2025-18\"]\t1937849738\n[\"crawl_status\", \"crawldb:status:db_redir_temp\", \"CC-MAIN-2025-18\"]\t270385602\n[\"crawl_status\", \"crawldb:status:db_redir_perm\", \"CC-MAIN-2025-18\"]\t483857741\n[\"crawl_status\", \"crawldb:status:db_notmodified\", \"CC-MAIN-2025-18\"]\t942179486\n[\"crawl_status\", \"crawldb:status:db_duplicate\", \"CC-MAIN-2025-18\"]\t1435727210\n[\"crawl_status\", \"crawldb:status:db_orphan\", \"CC-MAIN-2025-18\"]\t1288043814\n"
  },
  {
    "path": "stats/crawler/CC-MAIN-2025-21.json",
    "content": "[\"crawl_status\", \"generator:crawldb_size\", \"CC-MAIN-2025-21\"]\t27797066363\n[\"crawl_status\", \"generator:fetch_list\", \"CC-MAIN-2025-21\"]\t3443657988\n[\"crawl_status\", \"generator:selected:db_duplicate\", \"CC-MAIN-2025-21\"]\t7270073\n[\"crawl_status\", \"generator:selected:db_fetched\", \"CC-MAIN-2025-21\"]\t2289217178\n[\"crawl_status\", \"generator:selected:db_gone\", \"CC-MAIN-2025-21\"]\t2499189\n[\"crawl_status\", \"generator:selected:db_notmodified\", \"CC-MAIN-2025-21\"]\t16268706\n[\"crawl_status\", \"generator:selected:db_orphan\", \"CC-MAIN-2025-21\"]\t2651\n[\"crawl_status\", \"generator:selected:db_redir_perm\", \"CC-MAIN-2025-21\"]\t16428749\n[\"crawl_status\", \"generator:selected:db_redir_temp\", \"CC-MAIN-2025-21\"]\t11867807\n[\"crawl_status\", \"generator:selected:db_unfetched\", \"CC-MAIN-2025-21\"]\t1100103635\n[\"crawl_status\", \"generator:skipped_domains_overflow\", \"CC-MAIN-2025-21\"]\t65077\n[\"crawl_status\", \"fetcher:total\", \"CC-MAIN-2025-21\"]\t3674018218\n[\"crawl_status\", \"fetcher:success\", \"CC-MAIN-2025-21\"]\t2487165634\n[\"crawl_status\", \"fetcher:notmodified\", \"CC-MAIN-2025-21\"]\t19996738\n[\"crawl_status\", \"fetcher:temp_moved\", \"CC-MAIN-2025-21\"]\t76026213\n[\"crawl_status\", \"fetcher:moved\", \"CC-MAIN-2025-21\"]\t160218457\n[\"crawl_status\", \"fetcher:notfound\", \"CC-MAIN-2025-21\"]\t138392329\n[\"crawl_status\", \"fetcher:access_denied\", \"CC-MAIN-2025-21\"]\t2060851\n[\"crawl_status\", \"fetcher:gone\", \"CC-MAIN-2025-21\"]\t6732300\n[\"crawl_status\", \"fetcher:exception\", \"CC-MAIN-2025-21\"]\t58177852\n[\"crawl_status\", \"fetcher:robots_denied\", \"CC-MAIN-2025-21\"]\t152743792\n[\"crawl_status\", \"fetcher:robots_denied_maxcrawldelay\", \"CC-MAIN-2025-21\"]\t51776\n[\"crawl_status\", \"fetcher:robots_defer_visits_dropped\", \"CC-MAIN-2025-21\"]\t186639\n[\"crawl_status\", \"fetcher:filtered\", \"CC-MAIN-2025-21\"]\t25755\n[\"crawl_status\", 
\"fetcher:redirect_count_exceeded\", \"CC-MAIN-2025-21\"]\t512290\n[\"crawl_status\", \"fetcher:redirect_deduplicated\", \"CC-MAIN-2025-21\"]\t40562849\n[\"crawl_status\", \"fetcher:hitByThrougputThreshold\", \"CC-MAIN-2025-21\"]\t77150916\n[\"crawl_status\", \"fetcher:hitByTimeLimit\", \"CC-MAIN-2025-21\"]\t15236394\n[\"crawl_status\", \"fetcher:AboveExceptionThresholdInQueue\", \"CC-MAIN-2025-21\"]\t438775407\n[\"crawl_status\", \"fetcher:hungThreads\", \"CC-MAIN-2025-21\"]\t2026\n[\"crawl_status\", \"fetcher:hitByTimeout\", \"CC-MAIN-2025-21\"]\t0\n[\"crawl_status\", \"fetcher:bytes_downloaded\", \"CC-MAIN-2025-21\"]\t471735560659753\n[\"crawl_status\", \"crawldb:size\", \"CC-MAIN-2025-21\"]\t27797066363\n[\"crawl_status\", \"crawldb:status:db_unfetched\", \"CC-MAIN-2025-21\"]\t5238778343\n[\"crawl_status\", \"crawldb:status:db_fetched\", \"CC-MAIN-2025-21\"]\t16313799119\n[\"crawl_status\", \"crawldb:status:db_gone\", \"CC-MAIN-2025-21\"]\t1972269204\n[\"crawl_status\", \"crawldb:status:db_redir_temp\", \"CC-MAIN-2025-21\"]\t271890234\n[\"crawl_status\", \"crawldb:status:db_redir_perm\", \"CC-MAIN-2025-21\"]\t486492423\n[\"crawl_status\", \"crawldb:status:db_notmodified\", \"CC-MAIN-2025-21\"]\t963406334\n[\"crawl_status\", \"crawldb:status:db_duplicate\", \"CC-MAIN-2025-21\"]\t1449396642\n[\"crawl_status\", \"crawldb:status:db_orphan\", \"CC-MAIN-2025-21\"]\t1101034064\n"
  },
  {
    "path": "stats/crawler/CC-MAIN-2025-26.json",
    "content": "[\"crawl_status\", \"generator:crawldb_size\", \"CC-MAIN-2025-26\"]\t28167640016\n[\"crawl_status\", \"generator:fetch_list\", \"CC-MAIN-2025-26\"]\t3363003425\n[\"crawl_status\", \"generator:selected:db_duplicate\", \"CC-MAIN-2025-26\"]\t7253269\n[\"crawl_status\", \"generator:selected:db_fetched\", \"CC-MAIN-2025-26\"]\t2216574130\n[\"crawl_status\", \"generator:selected:db_gone\", \"CC-MAIN-2025-26\"]\t2472835\n[\"crawl_status\", \"generator:selected:db_notmodified\", \"CC-MAIN-2025-26\"]\t16599892\n[\"crawl_status\", \"generator:selected:db_orphan\", \"CC-MAIN-2025-26\"]\t5259\n[\"crawl_status\", \"generator:selected:db_redir_perm\", \"CC-MAIN-2025-26\"]\t16377700\n[\"crawl_status\", \"generator:selected:db_redir_temp\", \"CC-MAIN-2025-26\"]\t11523007\n[\"crawl_status\", \"generator:selected:db_unfetched\", \"CC-MAIN-2025-26\"]\t1092197333\n[\"crawl_status\", \"generator:skipped_domains_overflow\", \"CC-MAIN-2025-26\"]\t68213\n[\"crawl_status\", \"fetcher:total\", \"CC-MAIN-2025-26\"]\t3592271667\n[\"crawl_status\", \"fetcher:success\", \"CC-MAIN-2025-26\"]\t2395311332\n[\"crawl_status\", \"fetcher:notmodified\", \"CC-MAIN-2025-26\"]\t18578688\n[\"crawl_status\", \"fetcher:temp_moved\", \"CC-MAIN-2025-26\"]\t74194732\n[\"crawl_status\", \"fetcher:moved\", \"CC-MAIN-2025-26\"]\t160910513\n[\"crawl_status\", \"fetcher:notfound\", \"CC-MAIN-2025-26\"]\t139589318\n[\"crawl_status\", \"fetcher:access_denied\", \"CC-MAIN-2025-26\"]\t2165900\n[\"crawl_status\", \"fetcher:gone\", \"CC-MAIN-2025-26\"]\t5635575\n[\"crawl_status\", \"fetcher:exception\", \"CC-MAIN-2025-26\"]\t56169310\n[\"crawl_status\", \"fetcher:robots_denied\", \"CC-MAIN-2025-26\"]\t159227497\n[\"crawl_status\", \"fetcher:robots_denied_maxcrawldelay\", \"CC-MAIN-2025-26\"]\t45833\n[\"crawl_status\", \"fetcher:robots_defer_visits_dropped\", \"CC-MAIN-2025-26\"]\t78257\n[\"crawl_status\", \"fetcher:redirect_count_exceeded\", \"CC-MAIN-2025-26\"]\t463149\n[\"crawl_status\", 
\"fetcher:redirect_deduplicated\", \"CC-MAIN-2025-26\"]\t42597042\n[\"crawl_status\", \"fetcher:hitByThrougputThreshold\", \"CC-MAIN-2025-26\"]\t86703895\n[\"crawl_status\", \"fetcher:hitByTimeLimit\", \"CC-MAIN-2025-26\"]\t5021508\n[\"crawl_status\", \"fetcher:AboveExceptionThresholdInQueue\", \"CC-MAIN-2025-26\"]\t445577331\n[\"crawl_status\", \"fetcher:hungThreads\", \"CC-MAIN-2025-26\"]\t1787\n[\"crawl_status\", \"fetcher:hitByTimeout\", \"CC-MAIN-2025-26\"]\t0\n[\"crawl_status\", \"fetcher:bytes_downloaded\", \"CC-MAIN-2025-26\"]\t428137350317750\n[\"crawl_status\", \"crawldb:size\", \"CC-MAIN-2025-26\"]\t28167640016\n[\"crawl_status\", \"crawldb:status:db_unfetched\", \"CC-MAIN-2025-26\"]\t4277079078\n[\"crawl_status\", \"crawldb:status:db_fetched\", \"CC-MAIN-2025-26\"]\t16669245033\n[\"crawl_status\", \"crawldb:status:db_gone\", \"CC-MAIN-2025-26\"]\t1970949239\n[\"crawl_status\", \"crawldb:status:db_redir_temp\", \"CC-MAIN-2025-26\"]\t265149106\n[\"crawl_status\", \"crawldb:status:db_redir_perm\", \"CC-MAIN-2025-26\"]\t483470947\n[\"crawl_status\", \"crawldb:status:db_notmodified\", \"CC-MAIN-2025-26\"]\t1025874569\n[\"crawl_status\", \"crawldb:status:db_duplicate\", \"CC-MAIN-2025-26\"]\t1446273819\n[\"crawl_status\", \"crawldb:status:db_orphan\", \"CC-MAIN-2025-26\"]\t2029598225\n"
  },
  {
    "path": "stats/crawler/CC-MAIN-2025-30.json",
    "content": "[\"crawl_status\", \"generator:crawldb_size\", \"CC-MAIN-2025-30\"]\t27783766888\n[\"crawl_status\", \"generator:fetch_list\", \"CC-MAIN-2025-30\"]\t3394507444\n[\"crawl_status\", \"generator:selected:db_duplicate\", \"CC-MAIN-2025-30\"]\t7003564\n[\"crawl_status\", \"generator:selected:db_fetched\", \"CC-MAIN-2025-30\"]\t2135526545\n[\"crawl_status\", \"generator:selected:db_gone\", \"CC-MAIN-2025-30\"]\t2343832\n[\"crawl_status\", \"generator:selected:db_notmodified\", \"CC-MAIN-2025-30\"]\t15854999\n[\"crawl_status\", \"generator:selected:db_orphan\", \"CC-MAIN-2025-30\"]\t5094\n[\"crawl_status\", \"generator:selected:db_redir_perm\", \"CC-MAIN-2025-30\"]\t14649702\n[\"crawl_status\", \"generator:selected:db_redir_temp\", \"CC-MAIN-2025-30\"]\t10635735\n[\"crawl_status\", \"generator:selected:db_unfetched\", \"CC-MAIN-2025-30\"]\t1208487973\n[\"crawl_status\", \"generator:skipped_domains_overflow\", \"CC-MAIN-2025-30\"]\t69149\n[\"crawl_status\", \"fetcher:total\", \"CC-MAIN-2025-30\"]\t3619679510\n[\"crawl_status\", \"fetcher:success\", \"CC-MAIN-2025-30\"]\t2432783351\n[\"crawl_status\", \"fetcher:notmodified\", \"CC-MAIN-2025-30\"]\t17466320\n[\"crawl_status\", \"fetcher:temp_moved\", \"CC-MAIN-2025-30\"]\t75424696\n[\"crawl_status\", \"fetcher:moved\", \"CC-MAIN-2025-30\"]\t154513597\n[\"crawl_status\", \"fetcher:notfound\", \"CC-MAIN-2025-30\"]\t133132620\n[\"crawl_status\", \"fetcher:access_denied\", \"CC-MAIN-2025-30\"]\t2161015\n[\"crawl_status\", \"fetcher:gone\", \"CC-MAIN-2025-30\"]\t5791456\n[\"crawl_status\", \"fetcher:exception\", \"CC-MAIN-2025-30\"]\t56044041\n[\"crawl_status\", \"fetcher:robots_denied\", \"CC-MAIN-2025-30\"]\t181114878\n[\"crawl_status\", \"fetcher:robots_denied_maxcrawldelay\", \"CC-MAIN-2025-30\"]\t26605\n[\"crawl_status\", \"fetcher:robots_defer_visits_dropped\", \"CC-MAIN-2025-30\"]\t84324\n[\"crawl_status\", \"fetcher:redirect_count_exceeded\", \"CC-MAIN-2025-30\"]\t482772\n[\"crawl_status\", 
\"fetcher:redirect_deduplicated\", \"CC-MAIN-2025-30\"]\t42326207\n[\"crawl_status\", \"fetcher:hitByThrougputThreshold\", \"CC-MAIN-2025-30\"]\t86255499\n[\"crawl_status\", \"fetcher:hitByTimeLimit\", \"CC-MAIN-2025-30\"]\t2162989\n[\"crawl_status\", \"fetcher:AboveExceptionThresholdInQueue\", \"CC-MAIN-2025-30\"]\t429906202\n[\"crawl_status\", \"fetcher:hungThreads\", \"CC-MAIN-2025-30\"]\t2938\n[\"crawl_status\", \"fetcher:hitByTimeout\", \"CC-MAIN-2025-30\"]\t0\n[\"crawl_status\", \"fetcher:bytes_downloaded\", \"CC-MAIN-2025-30\"]\t461077262212150\n[\"crawl_status\", \"crawldb:size\", \"CC-MAIN-2025-30\"]\t27783766888\n[\"crawl_status\", \"crawldb:status:db_unfetched\", \"CC-MAIN-2025-30\"]\t4972693531\n[\"crawl_status\", \"crawldb:status:db_fetched\", \"CC-MAIN-2025-30\"]\t16561529486\n[\"crawl_status\", \"crawldb:status:db_gone\", \"CC-MAIN-2025-30\"]\t1954656400\n[\"crawl_status\", \"crawldb:status:db_redir_temp\", \"CC-MAIN-2025-30\"]\t258395300\n[\"crawl_status\", \"crawldb:status:db_redir_perm\", \"CC-MAIN-2025-30\"]\t480357829\n[\"crawl_status\", \"crawldb:status:db_notmodified\", \"CC-MAIN-2025-30\"]\t1050573338\n[\"crawl_status\", \"crawldb:status:db_duplicate\", \"CC-MAIN-2025-30\"]\t1430279210\n[\"crawl_status\", \"crawldb:status:db_orphan\", \"CC-MAIN-2025-30\"]\t1075281794\n"
  },
  {
    "path": "stats/crawler/CC-MAIN-2025-33.json",
    "content": "[\"crawl_status\", \"generator:crawldb_size\", \"CC-MAIN-2025-33\"]\t28259545744\n[\"crawl_status\", \"generator:fetch_list\", \"CC-MAIN-2025-33\"]\t3363397721\n[\"crawl_status\", \"generator:selected:db_duplicate\", \"CC-MAIN-2025-33\"]\t6928253\n[\"crawl_status\", \"generator:selected:db_fetched\", \"CC-MAIN-2025-33\"]\t2175111394\n[\"crawl_status\", \"generator:selected:db_gone\", \"CC-MAIN-2025-33\"]\t2320407\n[\"crawl_status\", \"generator:selected:db_notmodified\", \"CC-MAIN-2025-33\"]\t16122547\n[\"crawl_status\", \"generator:selected:db_orphan\", \"CC-MAIN-2025-33\"]\t5227\n[\"crawl_status\", \"generator:selected:db_redir_perm\", \"CC-MAIN-2025-33\"]\t14572988\n[\"crawl_status\", \"generator:selected:db_redir_temp\", \"CC-MAIN-2025-33\"]\t10471845\n[\"crawl_status\", \"generator:selected:db_unfetched\", \"CC-MAIN-2025-33\"]\t1137865060\n[\"crawl_status\", \"generator:skipped_domains_overflow\", \"CC-MAIN-2025-33\"]\t69898\n[\"crawl_status\", \"fetcher:total\", \"CC-MAIN-2025-33\"]\t3579195444\n[\"crawl_status\", \"fetcher:success\", \"CC-MAIN-2025-33\"]\t2452395752\n[\"crawl_status\", \"fetcher:notmodified\", \"CC-MAIN-2025-33\"]\t17327821\n[\"crawl_status\", \"fetcher:temp_moved\", \"CC-MAIN-2025-33\"]\t72004210\n[\"crawl_status\", \"fetcher:moved\", \"CC-MAIN-2025-33\"]\t148502329\n[\"crawl_status\", \"fetcher:notfound\", \"CC-MAIN-2025-33\"]\t129847107\n[\"crawl_status\", \"fetcher:access_denied\", \"CC-MAIN-2025-33\"]\t1438379\n[\"crawl_status\", \"fetcher:gone\", \"CC-MAIN-2025-33\"]\t5567004\n[\"crawl_status\", \"fetcher:exception\", \"CC-MAIN-2025-33\"]\t53899641\n[\"crawl_status\", \"fetcher:robots_denied\", \"CC-MAIN-2025-33\"]\t175894025\n[\"crawl_status\", \"fetcher:robots_denied_maxcrawldelay\", \"CC-MAIN-2025-33\"]\t38588\n[\"crawl_status\", \"fetcher:robots_defer_visits_dropped\", \"CC-MAIN-2025-33\"]\t117440\n[\"crawl_status\", \"fetcher:filtered\", \"CC-MAIN-2025-33\"]\t90454\n[\"crawl_status\", 
\"fetcher:redirect_count_exceeded\", \"CC-MAIN-2025-33\"]\t431317\n[\"crawl_status\", \"fetcher:redirect_deduplicated\", \"CC-MAIN-2025-33\"]\t40259210\n[\"crawl_status\", \"fetcher:hitByThrougputThreshold\", \"CC-MAIN-2025-33\"]\t70162662\n[\"crawl_status\", \"fetcher:hitByTimeLimit\", \"CC-MAIN-2025-33\"]\t2296111\n[\"crawl_status\", \"fetcher:AboveExceptionThresholdInQueue\", \"CC-MAIN-2025-33\"]\t408920539\n[\"crawl_status\", \"fetcher:hungThreads\", \"CC-MAIN-2025-33\"]\t2855\n[\"crawl_status\", \"fetcher:hitByTimeout\", \"CC-MAIN-2025-33\"]\t0\n[\"crawl_status\", \"fetcher:bytes_downloaded\", \"CC-MAIN-2025-33\"]\t466546501448057\n[\"crawl_status\", \"crawldb:size\", \"CC-MAIN-2025-33\"]\t28259545744\n[\"crawl_status\", \"crawldb:status:db_unfetched\", \"CC-MAIN-2025-33\"]\t4665438474\n[\"crawl_status\", \"crawldb:status:db_fetched\", \"CC-MAIN-2025-33\"]\t16531170261\n[\"crawl_status\", \"crawldb:status:db_gone\", \"CC-MAIN-2025-33\"]\t1951622924\n[\"crawl_status\", \"crawldb:status:db_redir_temp\", \"CC-MAIN-2025-33\"]\t248743983\n[\"crawl_status\", \"crawldb:status:db_redir_perm\", \"CC-MAIN-2025-33\"]\t464602177\n[\"crawl_status\", \"crawldb:status:db_notmodified\", \"CC-MAIN-2025-33\"]\t1071233903\n[\"crawl_status\", \"crawldb:status:db_duplicate\", \"CC-MAIN-2025-33\"]\t1413019452\n[\"crawl_status\", \"crawldb:status:db_orphan\", \"CC-MAIN-2025-33\"]\t1913714570\n"
  },
  {
    "path": "stats/crawler/CC-MAIN-2025-38.json",
    "content": "[\"crawl_status\", \"generator:crawldb_size\", \"CC-MAIN-2025-38\"]\t27837059074\n[\"crawl_status\", \"generator:fetch_list\", \"CC-MAIN-2025-38\"]\t3268835843\n[\"crawl_status\", \"generator:selected:db_duplicate\", \"CC-MAIN-2025-38\"]\t6984498\n[\"crawl_status\", \"generator:selected:db_fetched\", \"CC-MAIN-2025-38\"]\t2103527775\n[\"crawl_status\", \"generator:selected:db_gone\", \"CC-MAIN-2025-38\"]\t2258297\n[\"crawl_status\", \"generator:selected:db_notmodified\", \"CC-MAIN-2025-38\"]\t17076978\n[\"crawl_status\", \"generator:selected:db_orphan\", \"CC-MAIN-2025-38\"]\t2089\n[\"crawl_status\", \"generator:selected:db_redir_perm\", \"CC-MAIN-2025-38\"]\t15538066\n[\"crawl_status\", \"generator:selected:db_redir_temp\", \"CC-MAIN-2025-38\"]\t11414994\n[\"crawl_status\", \"generator:selected:db_unfetched\", \"CC-MAIN-2025-38\"]\t1112033146\n[\"crawl_status\", \"generator:skipped_domains_overflow\", \"CC-MAIN-2025-38\"]\t67022\n[\"crawl_status\", \"fetcher:total\", \"CC-MAIN-2025-38\"]\t3481594608\n[\"crawl_status\", \"fetcher:success\", \"CC-MAIN-2025-38\"]\t2395594531\n[\"crawl_status\", \"fetcher:notmodified\", \"CC-MAIN-2025-38\"]\t15961233\n[\"crawl_status\", \"fetcher:temp_moved\", \"CC-MAIN-2025-38\"]\t85244275\n[\"crawl_status\", \"fetcher:moved\", \"CC-MAIN-2025-38\"]\t146744789\n[\"crawl_status\", \"fetcher:notfound\", \"CC-MAIN-2025-38\"]\t133986063\n[\"crawl_status\", \"fetcher:access_denied\", \"CC-MAIN-2025-38\"]\t1674193\n[\"crawl_status\", \"fetcher:gone\", \"CC-MAIN-2025-38\"]\t5158753\n[\"crawl_status\", \"fetcher:exception\", \"CC-MAIN-2025-38\"]\t51850624\n[\"crawl_status\", \"fetcher:robots_denied\", \"CC-MAIN-2025-38\"]\t187537000\n[\"crawl_status\", \"fetcher:robots_denied_maxcrawldelay\", \"CC-MAIN-2025-38\"]\t35669\n[\"crawl_status\", \"fetcher:robots_defer_visits_dropped\", \"CC-MAIN-2025-38\"]\t100007\n[\"crawl_status\", \"fetcher:filtered\", \"CC-MAIN-2025-38\"]\t69735\n[\"crawl_status\", 
\"fetcher:redirect_count_exceeded\", \"CC-MAIN-2025-38\"]\t378269\n[\"crawl_status\", \"fetcher:redirect_deduplicated\", \"CC-MAIN-2025-38\"]\t39008806\n[\"crawl_status\", \"fetcher:hitByThrougputThreshold\", \"CC-MAIN-2025-38\"]\t62843100\n[\"crawl_status\", \"fetcher:hitByTimeLimit\", \"CC-MAIN-2025-38\"]\t1112314\n[\"crawl_status\", \"fetcher:AboveExceptionThresholdInQueue\", \"CC-MAIN-2025-38\"]\t354293107\n[\"crawl_status\", \"fetcher:hungThreads\", \"CC-MAIN-2025-38\"]\t2140\n[\"crawl_status\", \"fetcher:hitByTimeout\", \"CC-MAIN-2025-38\"]\t0\n[\"crawl_status\", \"fetcher:bytes_downloaded\", \"CC-MAIN-2025-38\"]\t463347395390320\n[\"crawl_status\", \"crawldb:size\", \"CC-MAIN-2025-38\"]\t27837059074\n[\"crawl_status\", \"crawldb:status:db_unfetched\", \"CC-MAIN-2025-38\"]\t4434486804\n[\"crawl_status\", \"crawldb:status:db_fetched\", \"CC-MAIN-2025-38\"]\t15847038068\n[\"crawl_status\", \"crawldb:status:db_gone\", \"CC-MAIN-2025-38\"]\t1891499398\n[\"crawl_status\", \"crawldb:status:db_redir_temp\", \"CC-MAIN-2025-38\"]\t269137349\n[\"crawl_status\", \"crawldb:status:db_redir_perm\", \"CC-MAIN-2025-38\"]\t506898260\n[\"crawl_status\", \"crawldb:status:db_notmodified\", \"CC-MAIN-2025-38\"]\t1036694168\n[\"crawl_status\", \"crawldb:status:db_duplicate\", \"CC-MAIN-2025-38\"]\t1369780536\n[\"crawl_status\", \"crawldb:status:db_orphan\", \"CC-MAIN-2025-38\"]\t2481524491\n"
  },
  {
    "path": "stats/crawler/CC-MAIN-2025-43.json",
    "content": "[\"crawl_status\", \"generator:crawldb_size\", \"CC-MAIN-2025-43\"]\t26899650260\n[\"crawl_status\", \"generator:fetch_list\", \"CC-MAIN-2025-43\"]\t3501327345\n[\"crawl_status\", \"generator:selected:db_duplicate\", \"CC-MAIN-2025-43\"]\t6932927\n[\"crawl_status\", \"generator:selected:db_fetched\", \"CC-MAIN-2025-43\"]\t2276506498\n[\"crawl_status\", \"generator:selected:db_gone\", \"CC-MAIN-2025-43\"]\t2262833\n[\"crawl_status\", \"generator:selected:db_notmodified\", \"CC-MAIN-2025-43\"]\t19304947\n[\"crawl_status\", \"generator:selected:db_orphan\", \"CC-MAIN-2025-43\"]\t3736\n[\"crawl_status\", \"generator:selected:db_redir_perm\", \"CC-MAIN-2025-43\"]\t17620085\n[\"crawl_status\", \"generator:selected:db_redir_temp\", \"CC-MAIN-2025-43\"]\t12439636\n[\"crawl_status\", \"generator:selected:db_unfetched\", \"CC-MAIN-2025-43\"]\t1166256683\n[\"crawl_status\", \"generator:skipped_domains_overflow\", \"CC-MAIN-2025-43\"]\t66950\n[\"crawl_status\", \"fetcher:total\", \"CC-MAIN-2025-43\"]\t3720822711\n[\"crawl_status\", \"fetcher:success\", \"CC-MAIN-2025-43\"]\t2627342431\n[\"crawl_status\", \"fetcher:notmodified\", \"CC-MAIN-2025-43\"]\t16646387\n[\"crawl_status\", \"fetcher:temp_moved\", \"CC-MAIN-2025-43\"]\t73093813\n[\"crawl_status\", \"fetcher:moved\", \"CC-MAIN-2025-43\"]\t151238189\n[\"crawl_status\", \"fetcher:notfound\", \"CC-MAIN-2025-43\"]\t132229979\n[\"crawl_status\", \"fetcher:access_denied\", \"CC-MAIN-2025-43\"]\t1668899\n[\"crawl_status\", \"fetcher:gone\", \"CC-MAIN-2025-43\"]\t7351980\n[\"crawl_status\", \"fetcher:exception\", \"CC-MAIN-2025-43\"]\t51472017\n[\"crawl_status\", \"fetcher:robots_denied\", \"CC-MAIN-2025-43\"]\t191204170\n[\"crawl_status\", \"fetcher:robots_denied_maxcrawldelay\", \"CC-MAIN-2025-43\"]\t47834\n[\"crawl_status\", \"fetcher:robots_defer_visits_dropped\", \"CC-MAIN-2025-43\"]\t101306\n[\"crawl_status\", \"fetcher:filtered\", \"CC-MAIN-2025-43\"]\t28697\n[\"crawl_status\", 
\"fetcher:redirect_count_exceeded\", \"CC-MAIN-2025-43\"]\t407966\n[\"crawl_status\", \"fetcher:redirect_deduplicated\", \"CC-MAIN-2025-43\"]\t41111433\n[\"crawl_status\", \"fetcher:hitByThrougputThreshold\", \"CC-MAIN-2025-43\"]\t63259462\n[\"crawl_status\", \"fetcher:hitByTimeLimit\", \"CC-MAIN-2025-43\"]\t1587596\n[\"crawl_status\", \"fetcher:AboveExceptionThresholdInQueue\", \"CC-MAIN-2025-43\"]\t362028640\n[\"crawl_status\", \"fetcher:hungThreads\", \"CC-MAIN-2025-43\"]\t1912\n[\"crawl_status\", \"fetcher:hitByTimeout\", \"CC-MAIN-2025-43\"]\t0\n[\"crawl_status\", \"fetcher:bytes_downloaded\", \"CC-MAIN-2025-43\"]\t515301270615394\n[\"crawl_status\", \"crawldb:size\", \"CC-MAIN-2025-43\"]\t26899650260\n[\"crawl_status\", \"crawldb:status:db_unfetched\", \"CC-MAIN-2025-43\"]\t4473079912\n[\"crawl_status\", \"crawldb:status:db_fetched\", \"CC-MAIN-2025-43\"]\t15711750468\n[\"crawl_status\", \"crawldb:status:db_gone\", \"CC-MAIN-2025-43\"]\t2140147387\n[\"crawl_status\", \"crawldb:status:db_redir_temp\", \"CC-MAIN-2025-43\"]\t272380440\n[\"crawl_status\", \"crawldb:status:db_redir_perm\", \"CC-MAIN-2025-43\"]\t497072187\n[\"crawl_status\", \"crawldb:status:db_notmodified\", \"CC-MAIN-2025-43\"]\t1043804905\n[\"crawl_status\", \"crawldb:status:db_duplicate\", \"CC-MAIN-2025-43\"]\t1468230036\n[\"crawl_status\", \"crawldb:status:db_orphan\", \"CC-MAIN-2025-43\"]\t1293184925\n"
  },
  {
    "path": "stats/crawler/CC-MAIN-2025-47.json",
    "content": "[\"crawl_status\", \"generator:crawldb_size\", \"CC-MAIN-2025-47\"]\t27080086217\n[\"crawl_status\", \"generator:fetch_list\", \"CC-MAIN-2025-47\"]\t3376418359\n[\"crawl_status\", \"generator:selected:db_duplicate\", \"CC-MAIN-2025-47\"]\t6733895\n[\"crawl_status\", \"generator:selected:db_fetched\", \"CC-MAIN-2025-47\"]\t2191608275\n[\"crawl_status\", \"generator:selected:db_gone\", \"CC-MAIN-2025-47\"]\t2184826\n[\"crawl_status\", \"generator:selected:db_notmodified\", \"CC-MAIN-2025-47\"]\t21534450\n[\"crawl_status\", \"generator:selected:db_orphan\", \"CC-MAIN-2025-47\"]\t4833\n[\"crawl_status\", \"generator:selected:db_redir_perm\", \"CC-MAIN-2025-47\"]\t16854578\n[\"crawl_status\", \"generator:selected:db_redir_temp\", \"CC-MAIN-2025-47\"]\t11912263\n[\"crawl_status\", \"generator:selected:db_unfetched\", \"CC-MAIN-2025-47\"]\t1125585239\n[\"crawl_status\", \"generator:skipped_domains_overflow\", \"CC-MAIN-2025-47\"]\t66547\n[\"crawl_status\", \"fetcher:total\", \"CC-MAIN-2025-47\"]\t3585452894\n[\"crawl_status\", \"fetcher:success\", \"CC-MAIN-2025-47\"]\t2304233783\n[\"crawl_status\", \"fetcher:notmodified\", \"CC-MAIN-2025-47\"]\t16179210\n[\"crawl_status\", \"fetcher:temp_moved\", \"CC-MAIN-2025-47\"]\t70494729\n[\"crawl_status\", \"fetcher:moved\", \"CC-MAIN-2025-47\"]\t143359435\n[\"crawl_status\", \"fetcher:notfound\", \"CC-MAIN-2025-47\"]\t118543350\n[\"crawl_status\", \"fetcher:access_denied\", \"CC-MAIN-2025-47\"]\t1997699\n[\"crawl_status\", \"fetcher:gone\", \"CC-MAIN-2025-47\"]\t5410385\n[\"crawl_status\", \"fetcher:exception\", \"CC-MAIN-2025-47\"]\t56522498\n[\"crawl_status\", \"fetcher:robots_denied\", \"CC-MAIN-2025-47\"]\t219573638\n[\"crawl_status\", \"fetcher:robots_denied_maxcrawldelay\", \"CC-MAIN-2025-47\"]\t38456\n[\"crawl_status\", \"fetcher:robots_defer_visits_dropped\", \"CC-MAIN-2025-47\"]\t110747\n[\"crawl_status\", \"fetcher:redirect_count_exceeded\", \"CC-MAIN-2025-47\"]\t355119\n[\"crawl_status\", 
\"fetcher:redirect_deduplicated\", \"CC-MAIN-2025-47\"]\t37162883\n[\"crawl_status\", \"fetcher:hitByThrougputThreshold\", \"CC-MAIN-2025-47\"]\t193832962\n[\"crawl_status\", \"fetcher:hitByTimeLimit\", \"CC-MAIN-2025-47\"]\t1767403\n[\"crawl_status\", \"fetcher:AboveExceptionThresholdInQueue\", \"CC-MAIN-2025-47\"]\t415869274\n[\"crawl_status\", \"fetcher:hungThreads\", \"CC-MAIN-2025-47\"]\t1323\n[\"crawl_status\", \"fetcher:hitByTimeout\", \"CC-MAIN-2025-47\"]\t0\n[\"crawl_status\", \"fetcher:bytes_downloaded\", \"CC-MAIN-2025-47\"]\t416203443769796\n[\"crawl_status\", \"crawldb:size\", \"CC-MAIN-2025-47\"]\t27080086217\n[\"crawl_status\", \"crawldb:status:db_unfetched\", \"CC-MAIN-2025-47\"]\t4363489279\n[\"crawl_status\", \"crawldb:status:db_fetched\", \"CC-MAIN-2025-47\"]\t15601802741\n[\"crawl_status\", \"crawldb:status:db_gone\", \"CC-MAIN-2025-47\"]\t1829714737\n[\"crawl_status\", \"crawldb:status:db_redir_temp\", \"CC-MAIN-2025-47\"]\t259491364\n[\"crawl_status\", \"crawldb:status:db_redir_perm\", \"CC-MAIN-2025-47\"]\t479403112\n[\"crawl_status\", \"crawldb:status:db_notmodified\", \"CC-MAIN-2025-47\"]\t1044238440\n[\"crawl_status\", \"crawldb:status:db_duplicate\", \"CC-MAIN-2025-47\"]\t1283427146\n[\"crawl_status\", \"crawldb:status:db_orphan\", \"CC-MAIN-2025-47\"]\t2218519398\n"
  },
  {
    "path": "stats/crawler/CC-MAIN-2025-51.json",
    "content": "[\"crawl_status\", \"generator:crawldb_size\", \"CC-MAIN-2025-51\"]\t26268339705\n[\"crawl_status\", \"generator:fetch_list\", \"CC-MAIN-2025-51\"]\t3206111434\n[\"crawl_status\", \"generator:selected:db_duplicate\", \"CC-MAIN-2025-51\"]\t6604193\n[\"crawl_status\", \"generator:selected:db_fetched\", \"CC-MAIN-2025-51\"]\t2080194507\n[\"crawl_status\", \"generator:selected:db_gone\", \"CC-MAIN-2025-51\"]\t2194087\n[\"crawl_status\", \"generator:selected:db_notmodified\", \"CC-MAIN-2025-51\"]\t23381454\n[\"crawl_status\", \"generator:selected:db_orphan\", \"CC-MAIN-2025-51\"]\t3620\n[\"crawl_status\", \"generator:selected:db_redir_perm\", \"CC-MAIN-2025-51\"]\t17751763\n[\"crawl_status\", \"generator:selected:db_redir_temp\", \"CC-MAIN-2025-51\"]\t11543382\n[\"crawl_status\", \"generator:selected:db_unfetched\", \"CC-MAIN-2025-51\"]\t1064438428\n[\"crawl_status\", \"generator:skipped_domains_overflow\", \"CC-MAIN-2025-51\"]\t61025\n[\"crawl_status\", \"fetcher:total\", \"CC-MAIN-2025-51\"]\t3409457525\n[\"crawl_status\", \"fetcher:success\", \"CC-MAIN-2025-51\"]\t2178742256\n[\"crawl_status\", \"fetcher:notmodified\", \"CC-MAIN-2025-51\"]\t14592026\n[\"crawl_status\", \"fetcher:temp_moved\", \"CC-MAIN-2025-51\"]\t68371610\n[\"crawl_status\", \"fetcher:moved\", \"CC-MAIN-2025-51\"]\t139802134\n[\"crawl_status\", \"fetcher:notfound\", \"CC-MAIN-2025-51\"]\t113042790\n[\"crawl_status\", \"fetcher:access_denied\", \"CC-MAIN-2025-51\"]\t1432142\n[\"crawl_status\", \"fetcher:gone\", \"CC-MAIN-2025-51\"]\t3761121\n[\"crawl_status\", \"fetcher:exception\", \"CC-MAIN-2025-51\"]\t56884058\n[\"crawl_status\", \"fetcher:robots_denied\", \"CC-MAIN-2025-51\"]\t196266083\n[\"crawl_status\", \"fetcher:robots_denied_maxcrawldelay\", \"CC-MAIN-2025-51\"]\t38834\n[\"crawl_status\", \"fetcher:robots_defer_visits_dropped\", \"CC-MAIN-2025-51\"]\t93484\n[\"crawl_status\", \"fetcher:redirect_count_exceeded\", \"CC-MAIN-2025-51\"]\t333114\n[\"crawl_status\", 
\"fetcher:redirect_deduplicated\", \"CC-MAIN-2025-51\"]\t35865702\n[\"crawl_status\", \"fetcher:hitByThrougputThreshold\", \"CC-MAIN-2025-51\"]\t197944064\n[\"crawl_status\", \"fetcher:hitByTimeLimit\", \"CC-MAIN-2025-51\"]\t97589\n[\"crawl_status\", \"fetcher:AboveExceptionThresholdInQueue\", \"CC-MAIN-2025-51\"]\t402190105\n[\"crawl_status\", \"fetcher:hungThreads\", \"CC-MAIN-2025-51\"]\t413\n[\"crawl_status\", \"fetcher:hitByTimeout\", \"CC-MAIN-2025-51\"]\t0\n[\"crawl_status\", \"fetcher:bytes_downloaded\", \"CC-MAIN-2025-51\"]\t400430094915628\n[\"crawl_status\", \"crawldb:size\", \"CC-MAIN-2025-51\"]\t26268339705\n[\"crawl_status\", \"crawldb:status:db_unfetched\", \"CC-MAIN-2025-51\"]\t3641980000\n[\"crawl_status\", \"crawldb:status:db_fetched\", \"CC-MAIN-2025-51\"]\t15391675183\n[\"crawl_status\", \"crawldb:status:db_gone\", \"CC-MAIN-2025-51\"]\t2089753583\n[\"crawl_status\", \"crawldb:status:db_redir_temp\", \"CC-MAIN-2025-51\"]\t246877754\n[\"crawl_status\", \"crawldb:status:db_redir_perm\", \"CC-MAIN-2025-51\"]\t463748511\n[\"crawl_status\", \"crawldb:status:db_notmodified\", \"CC-MAIN-2025-51\"]\t1036957527\n[\"crawl_status\", \"crawldb:status:db_duplicate\", \"CC-MAIN-2025-51\"]\t1382355116\n[\"crawl_status\", \"crawldb:status:db_orphan\", \"CC-MAIN-2025-51\"]\t2014992031\n"
  },
  {
    "path": "stats/crawler/CC-MAIN-2026-04.json",
    "content": "[\"crawl_status\", \"generator:crawldb_size\", \"CC-MAIN-2026-04\"]\t25612258765\n[\"crawl_status\", \"generator:fetch_list\", \"CC-MAIN-2026-04\"]\t3410010503\n[\"crawl_status\", \"generator:selected:db_duplicate\", \"CC-MAIN-2026-04\"]\t6765440\n[\"crawl_status\", \"generator:selected:db_fetched\", \"CC-MAIN-2026-04\"]\t2321441825\n[\"crawl_status\", \"generator:selected:db_gone\", \"CC-MAIN-2026-04\"]\t2255706\n[\"crawl_status\", \"generator:selected:db_notmodified\", \"CC-MAIN-2026-04\"]\t26984393\n[\"crawl_status\", \"generator:selected:db_orphan\", \"CC-MAIN-2026-04\"]\t5327\n[\"crawl_status\", \"generator:selected:db_redir_perm\", \"CC-MAIN-2026-04\"]\t17383455\n[\"crawl_status\", \"generator:selected:db_redir_temp\", \"CC-MAIN-2026-04\"]\t10944978\n[\"crawl_status\", \"generator:selected:db_unfetched\", \"CC-MAIN-2026-04\"]\t1024229379\n[\"crawl_status\", \"generator:skipped_domains_overflow\", \"CC-MAIN-2026-04\"]\t59717\n[\"crawl_status\", \"fetcher:total\", \"CC-MAIN-2026-04\"]\t3616559010\n[\"crawl_status\", \"fetcher:success\", \"CC-MAIN-2026-04\"]\t2339673995\n[\"crawl_status\", \"fetcher:notmodified\", \"CC-MAIN-2026-04\"]\t16203549\n[\"crawl_status\", \"fetcher:temp_moved\", \"CC-MAIN-2026-04\"]\t67701410\n[\"crawl_status\", \"fetcher:moved\", \"CC-MAIN-2026-04\"]\t143288112\n[\"crawl_status\", \"fetcher:notfound\", \"CC-MAIN-2026-04\"]\t122908001\n[\"crawl_status\", \"fetcher:access_denied\", \"CC-MAIN-2026-04\"]\t1624372\n[\"crawl_status\", \"fetcher:gone\", \"CC-MAIN-2026-04\"]\t4065355\n[\"crawl_status\", \"fetcher:exception\", \"CC-MAIN-2026-04\"]\t56991730\n[\"crawl_status\", \"fetcher:robots_denied\", \"CC-MAIN-2026-04\"]\t192151953\n[\"crawl_status\", \"fetcher:robots_denied_maxcrawldelay\", \"CC-MAIN-2026-04\"]\t52884\n[\"crawl_status\", \"fetcher:robots_defer_visits_dropped\", \"CC-MAIN-2026-04\"]\t148601\n[\"crawl_status\", \"fetcher:filtered\", \"CC-MAIN-2026-04\"]\t45034\n[\"crawl_status\", 
\"fetcher:redirect_count_exceeded\", \"CC-MAIN-2026-04\"]\t355429\n[\"crawl_status\", \"fetcher:redirect_deduplicated\", \"CC-MAIN-2026-04\"]\t36951268\n[\"crawl_status\", \"fetcher:hitByThrougputThreshold\", \"CC-MAIN-2026-04\"]\t231443181\n[\"crawl_status\", \"fetcher:hitByTimeLimit\", \"CC-MAIN-2026-04\"]\t4548522\n[\"crawl_status\", \"fetcher:AboveExceptionThresholdInQueue\", \"CC-MAIN-2026-04\"]\t398404649\n[\"crawl_status\", \"fetcher:hungThreads\", \"CC-MAIN-2026-04\"]\t965\n[\"crawl_status\", \"fetcher:hitByTimeout\", \"CC-MAIN-2026-04\"]\t0\n[\"crawl_status\", \"fetcher:bytes_downloaded\", \"CC-MAIN-2026-04\"]\t437932873289353\n[\"crawl_status\", \"crawldb:size\", \"CC-MAIN-2026-04\"]\t25612258765\n[\"crawl_status\", \"crawldb:status:db_unfetched\", \"CC-MAIN-2026-04\"]\t3506980105\n[\"crawl_status\", \"crawldb:status:db_fetched\", \"CC-MAIN-2026-04\"]\t15124965425\n[\"crawl_status\", \"crawldb:status:db_gone\", \"CC-MAIN-2026-04\"]\t2022383472\n[\"crawl_status\", \"crawldb:status:db_redir_temp\", \"CC-MAIN-2026-04\"]\t214328249\n[\"crawl_status\", \"crawldb:status:db_redir_perm\", \"CC-MAIN-2026-04\"]\t406017921\n[\"crawl_status\", \"crawldb:status:db_notmodified\", \"CC-MAIN-2026-04\"]\t1011144017\n[\"crawl_status\", \"crawldb:status:db_duplicate\", \"CC-MAIN-2026-04\"]\t1329279168\n[\"crawl_status\", \"crawldb:status:db_orphan\", \"CC-MAIN-2026-04\"]\t1997160408\n"
  },
  {
    "path": "stats/crawler/CC-MAIN-2026-08.json",
    "content": "[\"crawl_status\", \"generator:crawldb_size\", \"CC-MAIN-2026-08\"]\t24938307108\n[\"crawl_status\", \"generator:fetch_list\", \"CC-MAIN-2026-08\"]\t3275516979\n[\"crawl_status\", \"generator:selected:db_duplicate\", \"CC-MAIN-2026-08\"]\t6775762\n[\"crawl_status\", \"generator:selected:db_fetched\", \"CC-MAIN-2026-08\"]\t2192445208\n[\"crawl_status\", \"generator:selected:db_gone\", \"CC-MAIN-2026-08\"]\t2129895\n[\"crawl_status\", \"generator:selected:db_notmodified\", \"CC-MAIN-2026-08\"]\t27770540\n[\"crawl_status\", \"generator:selected:db_orphan\", \"CC-MAIN-2026-08\"]\t1243\n[\"crawl_status\", \"generator:selected:db_redir_perm\", \"CC-MAIN-2026-08\"]\t17969328\n[\"crawl_status\", \"generator:selected:db_redir_temp\", \"CC-MAIN-2026-08\"]\t11413466\n[\"crawl_status\", \"generator:selected:db_unfetched\", \"CC-MAIN-2026-08\"]\t1017011537\n[\"crawl_status\", \"generator:skipped_domains_overflow\", \"CC-MAIN-2026-08\"]\t58804\n[\"crawl_status\", \"fetcher:total\", \"CC-MAIN-2026-08\"]\t3483275559\n[\"crawl_status\", \"fetcher:success\", \"CC-MAIN-2026-08\"]\t2176942448\n[\"crawl_status\", \"fetcher:notmodified\", \"CC-MAIN-2026-08\"]\t14669187\n[\"crawl_status\", \"fetcher:temp_moved\", \"CC-MAIN-2026-08\"]\t67516643\n[\"crawl_status\", \"fetcher:moved\", \"CC-MAIN-2026-08\"]\t144873930\n[\"crawl_status\", \"fetcher:notfound\", \"CC-MAIN-2026-08\"]\t118974866\n[\"crawl_status\", \"fetcher:access_denied\", \"CC-MAIN-2026-08\"]\t1854416\n[\"crawl_status\", \"fetcher:gone\", \"CC-MAIN-2026-08\"]\t3472737\n[\"crawl_status\", \"fetcher:exception\", \"CC-MAIN-2026-08\"]\t58775412\n[\"crawl_status\", \"fetcher:robots_denied\", \"CC-MAIN-2026-08\"]\t197522208\n[\"crawl_status\", \"fetcher:robots_denied_maxcrawldelay\", \"CC-MAIN-2026-08\"]\t50363\n[\"crawl_status\", \"fetcher:robots_defer_visits_dropped\", \"CC-MAIN-2026-08\"]\t121130\n[\"crawl_status\", \"fetcher:filtered\", \"CC-MAIN-2026-08\"]\t658\n[\"crawl_status\", 
\"fetcher:redirect_count_exceeded\", \"CC-MAIN-2026-08\"]\t338160\n[\"crawl_status\", \"fetcher:redirect_deduplicated\", \"CC-MAIN-2026-08\"]\t35740340\n[\"crawl_status\", \"fetcher:hitByThrougputThreshold\", \"CC-MAIN-2026-08\"]\t256534874\n[\"crawl_status\", \"fetcher:hitByTimeLimit\", \"CC-MAIN-2026-08\"]\t2198180\n[\"crawl_status\", \"fetcher:AboveExceptionThresholdInQueue\", \"CC-MAIN-2026-08\"]\t403688416\n[\"crawl_status\", \"fetcher:hungThreads\", \"CC-MAIN-2026-08\"]\t1533\n[\"crawl_status\", \"fetcher:hitByTimeout\", \"CC-MAIN-2026-08\"]\t58\n[\"crawl_status\", \"fetcher:bytes_downloaded\", \"CC-MAIN-2026-08\"]\t399711354104042\n[\"crawl_status\", \"crawldb:size\", \"CC-MAIN-2026-08\"]\t24938307108\n[\"crawl_status\", \"crawldb:status:db_unfetched\", \"CC-MAIN-2026-08\"]\t3366817867\n[\"crawl_status\", \"crawldb:status:db_fetched\", \"CC-MAIN-2026-08\"]\t15440733660\n[\"crawl_status\", \"crawldb:status:db_gone\", \"CC-MAIN-2026-08\"]\t1982959537\n[\"crawl_status\", \"crawldb:status:db_redir_temp\", \"CC-MAIN-2026-08\"]\t231718496\n[\"crawl_status\", \"crawldb:status:db_redir_perm\", \"CC-MAIN-2026-08\"]\t448373364\n[\"crawl_status\", \"crawldb:status:db_notmodified\", \"CC-MAIN-2026-08\"]\t1044327468\n[\"crawl_status\", \"crawldb:status:db_duplicate\", \"CC-MAIN-2026-08\"]\t1288190581\n[\"crawl_status\", \"crawldb:status:db_orphan\", \"CC-MAIN-2026-08\"]\t1135186135\n"
  },
  {
    "path": "stats/crawler/CC-MAIN-2026-12.json",
    "content": "[\"crawl_status\", \"generator:crawldb_size\", \"CC-MAIN-2026-12\"]\t25055505905\n[\"crawl_status\", \"generator:fetch_list\", \"CC-MAIN-2026-12\"]\t3086297054\n[\"crawl_status\", \"generator:selected:db_duplicate\", \"CC-MAIN-2026-12\"]\t6932438\n[\"crawl_status\", \"generator:selected:db_fetched\", \"CC-MAIN-2026-12\"]\t2036957679\n[\"crawl_status\", \"generator:selected:db_gone\", \"CC-MAIN-2026-12\"]\t2177735\n[\"crawl_status\", \"generator:selected:db_notmodified\", \"CC-MAIN-2026-12\"]\t28180900\n[\"crawl_status\", \"generator:selected:db_orphan\", \"CC-MAIN-2026-12\"]\t3935\n[\"crawl_status\", \"generator:selected:db_redir_perm\", \"CC-MAIN-2026-12\"]\t16451781\n[\"crawl_status\", \"generator:selected:db_redir_temp\", \"CC-MAIN-2026-12\"]\t11685260\n[\"crawl_status\", \"generator:selected:db_unfetched\", \"CC-MAIN-2026-12\"]\t983907326\n[\"crawl_status\", \"generator:skipped_domains_overflow\", \"CC-MAIN-2026-12\"]\t56007\n[\"crawl_status\", \"fetcher:total\", \"CC-MAIN-2026-12\"]\t3282647598\n[\"crawl_status\", \"fetcher:success\", \"CC-MAIN-2026-12\"]\t1984198830\n[\"crawl_status\", \"fetcher:notmodified\", \"CC-MAIN-2026-12\"]\t14000166\n[\"crawl_status\", \"fetcher:temp_moved\", \"CC-MAIN-2026-12\"]\t64923556\n[\"crawl_status\", \"fetcher:moved\", \"CC-MAIN-2026-12\"]\t136175302\n[\"crawl_status\", \"fetcher:notfound\", \"CC-MAIN-2026-12\"]\t114367812\n[\"crawl_status\", \"fetcher:access_denied\", \"CC-MAIN-2026-12\"]\t1174162\n[\"crawl_status\", \"fetcher:gone\", \"CC-MAIN-2026-12\"]\t3614611\n[\"crawl_status\", \"fetcher:exception\", \"CC-MAIN-2026-12\"]\t61854875\n[\"crawl_status\", \"fetcher:robots_denied_total\", \"CC-MAIN-2026-12\"]\t188473300\n[\"crawl_status\", \"fetcher:robots_denied_maxcrawldelay_total\", \"CC-MAIN-2026-12\"]\t40973\n[\"crawl_status\", \"fetcher:robots_defer_visits_dropped_total\", \"CC-MAIN-2026-12\"]\t112107\n[\"crawl_status\", \"fetcher:filtered_total\", \"CC-MAIN-2026-12\"]\t0\n[\"crawl_status\", 
\"fetcher:redirect_count_exceeded_total\", \"CC-MAIN-2026-12\"]\t338652\n[\"crawl_status\", \"fetcher:redirect_deduplicated_total\", \"CC-MAIN-2026-12\"]\t33718403\n[\"crawl_status\", \"fetcher:redirect_not_created_total\", \"CC-MAIN-2026-12\"]\t0\n[\"crawl_status\", \"fetcher:errors_url_total\", \"CC-MAIN-2026-12\"]\t1079\n[\"crawl_status\", \"fetcher:errors_other_total\", \"CC-MAIN-2026-12\"]\t61711647\n[\"crawl_status\", \"fetcher:hit_by_throughput_threshold_total\", \"CC-MAIN-2026-12\"]\t240603395\n[\"crawl_status\", \"fetcher:hit_by_timelimit_total\", \"CC-MAIN-2026-12\"]\t3684705\n[\"crawl_status\", \"fetcher:above_exception_threshold_total\", \"CC-MAIN-2026-12\"]\t435364712\n[\"crawl_status\", \"fetcher:hung_threads_total\", \"CC-MAIN-2026-12\"]\t2037\n[\"crawl_status\", \"fetcher:hit_by_timeout_total\", \"CC-MAIN-2026-12\"]\t0\n[\"crawl_status\", \"fetcher:bytes_downloaded_total\", \"CC-MAIN-2026-12\"]\t378940564215016\n[\"crawl_status\", \"crawldb:size\", \"CC-MAIN-2026-12\"]\t25055505905\n[\"crawl_status\", \"crawldb:status:db_unfetched\", \"CC-MAIN-2026-12\"]\t3748190173\n[\"crawl_status\", \"crawldb:status:db_fetched\", \"CC-MAIN-2026-12\"]\t14528798325\n[\"crawl_status\", \"crawldb:status:db_gone\", \"CC-MAIN-2026-12\"]\t2014792439\n[\"crawl_status\", \"crawldb:status:db_redir_temp\", \"CC-MAIN-2026-12\"]\t230099887\n[\"crawl_status\", \"crawldb:status:db_redir_perm\", \"CC-MAIN-2026-12\"]\t446868594\n[\"crawl_status\", \"crawldb:status:db_notmodified\", \"CC-MAIN-2026-12\"]\t958555154\n[\"crawl_status\", \"crawldb:status:db_duplicate\", \"CC-MAIN-2026-12\"]\t1294847633\n[\"crawl_status\", \"crawldb:status:db_orphan\", \"CC-MAIN-2026-12\"]\t1833353700\n"
  },
  {
    "path": "stats/crawler/CC-MAIN-2026-17.json",
    "content": "[\"crawl_status\", \"generator:crawldb_size\", \"CC-MAIN-2026-17\"]\t24642277769\n[\"crawl_status\", \"generator:fetch_list\", \"CC-MAIN-2026-17\"]\t3371549557\n[\"crawl_status\", \"generator:selected:db_duplicate\", \"CC-MAIN-2026-17\"]\t7023432\n[\"crawl_status\", \"generator:selected:db_fetched\", \"CC-MAIN-2026-17\"]\t2219152147\n[\"crawl_status\", \"generator:selected:db_gone\", \"CC-MAIN-2026-17\"]\t2174152\n[\"crawl_status\", \"generator:selected:db_notmodified\", \"CC-MAIN-2026-17\"]\t30621825\n[\"crawl_status\", \"generator:selected:db_orphan\", \"CC-MAIN-2026-17\"]\t5464\n[\"crawl_status\", \"generator:selected:db_redir_perm\", \"CC-MAIN-2026-17\"]\t17904788\n[\"crawl_status\", \"generator:selected:db_redir_temp\", \"CC-MAIN-2026-17\"]\t12726515\n[\"crawl_status\", \"generator:selected:db_unfetched\", \"CC-MAIN-2026-17\"]\t1081941234\n[\"crawl_status\", \"generator:skipped_domains_overflow\", \"CC-MAIN-2026-17\"]\t62761\n[\"crawl_status\", \"fetcher:total\", \"CC-MAIN-2026-17\"]\t3585327457\n[\"crawl_status\", \"fetcher:success\", \"CC-MAIN-2026-17\"]\t2202695211\n[\"crawl_status\", \"fetcher:notmodified\", \"CC-MAIN-2026-17\"]\t14985960\n[\"crawl_status\", \"fetcher:temp_moved\", \"CC-MAIN-2026-17\"]\t70451334\n[\"crawl_status\", \"fetcher:moved\", \"CC-MAIN-2026-17\"]\t149352840\n[\"crawl_status\", \"fetcher:notfound\", \"CC-MAIN-2026-17\"]\t126147600\n[\"crawl_status\", \"fetcher:access_denied\", \"CC-MAIN-2026-17\"]\t1323550\n[\"crawl_status\", \"fetcher:gone\", \"CC-MAIN-2026-17\"]\t4479150\n[\"crawl_status\", \"fetcher:exception\", \"CC-MAIN-2026-17\"]\t61007202\n[\"crawl_status\", \"fetcher:robots_denied_total\", \"CC-MAIN-2026-17\"]\t217210179\n[\"crawl_status\", \"fetcher:robots_denied_maxcrawldelay_total\", \"CC-MAIN-2026-17\"]\t39081\n[\"crawl_status\", \"fetcher:robots_defer_visits_dropped_total\", \"CC-MAIN-2026-17\"]\t95851\n[\"crawl_status\", \"fetcher:filtered_total\", \"CC-MAIN-2026-17\"]\t125727\n[\"crawl_status\", 
\"fetcher:redirect_count_exceeded_total\", \"CC-MAIN-2026-17\"]\t360395\n[\"crawl_status\", \"fetcher:redirect_deduplicated_total\", \"CC-MAIN-2026-17\"]\t37255193\n[\"crawl_status\", \"fetcher:redirect_not_created_total\", \"CC-MAIN-2026-17\"]\t0\n[\"crawl_status\", \"fetcher:errors_url_total\", \"CC-MAIN-2026-17\"]\t1396\n[\"crawl_status\", \"fetcher:errors_other_total\", \"CC-MAIN-2026-17\"]\t60868565\n[\"crawl_status\", \"fetcher:hit_by_throughput_threshold_total\", \"CC-MAIN-2026-17\"]\t257381694\n[\"crawl_status\", \"fetcher:hit_by_timelimit_total\", \"CC-MAIN-2026-17\"]\t19625672\n[\"crawl_status\", \"fetcher:above_exception_threshold_total\", \"CC-MAIN-2026-17\"]\t422787345\n[\"crawl_status\", \"fetcher:hung_threads_total\", \"CC-MAIN-2026-17\"]\t2895\n[\"crawl_status\", \"fetcher:hit_by_timeout_total\", \"CC-MAIN-2026-17\"]\t578\n[\"crawl_status\", \"fetcher:bytes_downloaded_total\", \"CC-MAIN-2026-17\"]\t416956151754369\n[\"crawl_status\", \"crawldb:size\", \"CC-MAIN-2026-17\"]\t24642277769\n[\"crawl_status\", \"crawldb:status:db_unfetched\", \"CC-MAIN-2026-17\"]\t3297370708\n[\"crawl_status\", \"crawldb:status:db_fetched\", \"CC-MAIN-2026-17\"]\t14792539087\n[\"crawl_status\", \"crawldb:status:db_gone\", \"CC-MAIN-2026-17\"]\t1796708613\n[\"crawl_status\", \"crawldb:status:db_redir_temp\", \"CC-MAIN-2026-17\"]\t205870956\n[\"crawl_status\", \"crawldb:status:db_redir_perm\", \"CC-MAIN-2026-17\"]\t402958862\n[\"crawl_status\", \"crawldb:status:db_notmodified\", \"CC-MAIN-2026-17\"]\t978689541\n[\"crawl_status\", \"crawldb:status:db_duplicate\", \"CC-MAIN-2026-17\"]\t1173128233\n[\"crawl_status\", \"crawldb:status:db_orphan\", \"CC-MAIN-2026-17\"]\t1995011769\n"
  },
  {
    "path": "stats/crawler/README.md",
    "content": "Crawler-Related Metrics\n=======================\n\nJSON files in this folder contain metrics\n- written by the crawler ([Apache Nutch](http://nutch.apache.org/) in a [modified version](https://github.com/commoncrawl/nutch/) adapted for Common Crawl) as Hadoop job counters,\n- extracted from crawler log files, and\n- saved in the JSON-based, tab-separated key-value output format used by [mrjob](https://pythonhosted.org/mrjob/)"
  },
  {
    "path": "stats/tld_alexa_top_1m.py",
    "content": "# derived from\n#   http://s3.amazonaws.com/alexa-static/top-1m.csv.zip\n# fetched 2019-02-06, see also\n#   https://support.alexa.com/hc/en-us/sections/200063274-Top-Sites\n\nalexa_top_1m_tlds_about = {\n  'date': '2019-02-06',\n  'source': 'http://s3.amazonaws.com/alexa-static/top-1m.csv.zip'\n}\n\nalexa_top_1m_tlds = {\n  # zcat top-1m.csv.zip \\\n  #  | perl -ne 'chomp; s/.+\\.//; $h{$_}++;\n  #              END {\n  #                for (sort { $h{$b} <=> $h{$a} } keys %h) {\n  #                  print \"\\047\", $_, \"\\047:\", $h{$_}, \", \";\n  #                }\n  #              }' \\\n  #  | fold --width=70 -s | perl -lpe 's/^/  /; s/:/: /g; s/\\s+$//'\n  'com': 477407, 'org': 48692, 'ru': 44928, 'net': 40595, 'de': 31039,\n  'br': 24140, 'uk': 16820, 'pl': 15490, 'in': 14051, 'ir': 12913,\n  'it': 11283, 'au': 11085, 'jp': 10723, 'fr': 9673, 'info': 8625,\n  'cz': 7787, 'es': 6967, 'co': 6967, 'ca': 6813, 'gr': 6548, 'mx': 6325,\n  'io': 6249, 'ua': 5918, 'ro': 5885, 'nl': 5677, 'eu': 5001, 'ar': 4800,\n  'ch': 4616, 'se': 4053, 'za': 3855, 'sk': 3791, 'hu': 3671, 'no': 3640,\n  'me': 3587, 'us': 3343, 'be': 3303, 'tr': 3254, 'tv': 3242, 'tw': 3228,\n  'dk': 3165, 'cl': 3111, 'at': 3097, 'edu': 3055, 'cn': 2644, 'kr': 2573,\n  'xyz': 2209, 'biz': 2191, 'pt': 2127, 'fi': 2074, 'id': 1982, 'club': 1876,\n  'ie': 1770, 'online': 1686, 'pro': 1666, 'az': 1630, 'vn': 1615,\n  'il': 1570, 'by': 1406, 'th': 1404, 'cc': 1382, 'nz': 1372, 'kz': 1287,\n  'pe': 1240, 'lt': 1153, 'su': 1116, 'hr': 1102, 'bg': 1081,\n  'xn--p1ai': 1076, 'pk': 1075, 'gov': 1065, 'my': 1053, 'site': 1033,\n  'ng': 1010, 'rs': 1008, 'sg': 978, 'hk': 967, 'si': 955, 'sa': 821,\n  'ae': 812, 'top': 793, 'pw': 747, 'uz': 730, 'ph': 668, 'lv': 576,\n  'live': 569, 'to': 566, 'tk': 537, 'cat': 512, 'mobi': 491, 've': 488,\n  'lk': 483, 'ee': 475, 'ws': 461, 'bd': 454, 'ma': 438, 'do': 421, 'is': 406,\n  'fm': 377, 'ge': 364, 'news': 364, 'ba': 362, 'space': 356, 'ec': 353,\n 
 'life': 353, 'tn': 352, 'uy': 347, 'xxx': 335, 'ml': 322, 'eg': 321,\n  'ai': 315, 'nu': 313, 'am': 311, 'blog': 310, 'ga': 310, 'guru': 308,\n  'ke': 306, 'fun': 296, 'cr': 292, 'shop': 290, 'mk': 285, 'cf': 284,\n  'website': 280, 'app': 276, 'asia': 272, 'lu': 272, 'tech': 271,\n  'cloud': 258, 'md': 257, 'today': 253, 'ly': 246, 'gg': 243, 'icu': 232,\n  'media': 230, 'store': 230, 'dz': 229, 'one': 226, 'qa': 212, 'host': 210,\n  'link': 204, 'py': 202, 'la': 198, 'al': 198, 'win': 193, 'tz': 189,\n  'world': 186, 'work': 186, 'name': 184, 'travel': 172, 'af': 172,\n  'vip': 172, 'rocks': 163, 'cu': 161, 'bo': 159, 'kg': 156, 'bz': 153,\n  'im': 152, 'ug': 150, 'gt': 150, 'aero': 148, 'pa': 148, 'kw': 146,\n  'cy': 142, 'video': 141, 'network': 140, 'coop': 135, 'mm': 134, 'ao': 131,\n  'tj': 131, 'sv': 130, 'global': 130, 'om': 129, 'eus': 128,\n  'download': 127, 'digital': 126, 'tokyo': 126, 'design': 117, 'jobs': 116,\n  'gq': 112, 'vc': 109, 'mn': 108, 'np': 107, 'stream': 106, 'ag': 105,\n  'wiki': 105, 'jo': 105, 'sy': 102, 'click': 100, 'int': 99, 'center': 99,\n  'zone': 98, 'cm': 92, 'academy': 91, 'plus': 90, 'agency': 89, 'sh': 87,\n  'ni': 87, 'mz': 86, 'li': 83, 'moe': 83, 'gh': 82, 'lb': 81, 'nyc': 79,\n  'company': 79, 'ninja': 78, 'ci': 76, 'tools': 76, 'ac': 75, 'games': 74,\n  'city': 74, 'bid': 73, 'sd': 73, 'education': 71, 'studio': 71, 'ovh': 71,\n  'zw': 70, 'st': 69, 'porn': 69, 'ps': 69, 'tm': 69, 'rw': 68, 'mg': 68,\n  'et': 68, 'hn': 66, 'press': 66, 'group': 64, 're': 63, 'iq': 62,\n  'expert': 62, 'red': 62, 'ooo': 62, 'london': 61, 'bh': 61,\n  'solutions': 61, 'school': 61, 'bank': 60, 'services': 60, 'sn': 60,\n  'mu': 60, 'bet': 59, 'guide': 59, 'tips': 58, 'market': 57, 'cool': 57,\n  'trade': 56, 'cd': 56, 'cx': 55, 'kh': 55, 'ink': 54, 'mil': 54,\n  'community': 53, 'ms': 53, 'pub': 53, 'help': 52, 'art': 51, 'bw': 51,\n  'cash': 51, 'mt': 50, 'pics': 50, 'gratis': 50, 'chat': 49, 'email': 49,\n  'sc': 49, 'sexy': 48, 
'social': 48, 'land': 47, 'tt': 47, 'zm': 47,\n  'team': 46, 'pg': 46, 'berlin': 46, 'systems': 45, 'events': 45, 'ltd': 45,\n  'watch': 44, 'works': 42, 'review': 42, 'so': 42, 'support': 41,\n  'church': 41, 'bn': 40, 'men': 39, 'ad': 39, 'na': 38, 'gs': 37, 'run': 36,\n  'pr': 36, 'gal': 35, 'bt': 35, 'swiss': 35, 'paris': 35, 'gdn': 35,\n  'kim': 34, 'love': 34, 'exchange': 34, 'marketing': 34, 'bike': 34,\n  'tf': 33, 'mw': 33, 'bio': 33, 'software': 33, 'tube': 32, 'training': 32,\n  'istanbul': 31, 'wtf': 31, 'money': 31, 'fo': 31, 'sex': 30, 'moscow': 30,\n  'bf': 30, 'mo': 30, 'pf': 30, 'farm': 29, 'lol': 29, 'fit': 29, 'pm': 29,\n  'energy': 29, 'coffee': 28, 'party': 28, 'codes': 28, 'ht': 28,\n  'audio': 28, 'capital': 28, 'as': 28, 'report': 28, 'deals': 28,\n  'technology': 27, 'jm': 27, 'scot': 27, 'nc': 27, 'blue': 26, 'gl': 26,\n  'sx': 26, 'africa': 26, 'care': 25, 'careers': 25, 'xn--80asehdb': 24,\n  'uno': 24, 'tl': 24, 'tc': 24, 'photography': 23, 'movie': 23, 'wales': 23,\n  'cafe': 23, 'bar': 23, 'direct': 22, 'nrw': 22, 'house': 22, 'science': 22,\n  'film': 21, 'date': 21, 'institute': 21, 'buzz': 20, 'xn--j1amh': 20,\n  'express': 20, 'bi': 20, 'bm': 20, 'xn--p1acf': 20, 'brussels': 19,\n  'gold': 19, 'vision': 19, 'fyi': 19, 'dev': 19, 'taipei': 19, 'sale': 19,\n  'show': 19, 'dating': 18, 'gallery': 18, 'business': 18, 'style': 18,\n  'university': 18, 'yt': 18, 'gy': 18, 'fj': 18, 'game': 18, 'je': 18,\n  'pink': 18, 'webcam': 18, 'mv': 17, 'tel': 17, 'fund': 17, 'vg': 17,\n  'build': 17, 'bj': 17, 'directory': 17, 'photos': 17, 'lat': 17,\n  'clinic': 16, 'museum': 16, 'wang': 16, 'vet': 16, 'gi': 16, 'menu': 16,\n  'sm': 16, 'pet': 16, 'rip': 16, 'dj': 16, 'legal': 16, 'cg': 15,\n  'partners': 15, 'lc': 15, 'earth': 15, 'desi': 14, 'gd': 14, 'cam': 14,\n  'engineering': 14, 'bzh': 14, 'cv': 14, 'graphics': 14, 'hosting': 14,\n  'canon': 14, 'ye': 14, 'ky': 14, 'photo': 13, 'place': 13, 'pizza': 13,\n  'ist': 13, 'va': 13, 
'international': 13, 'best': 13, 'reviews': 13,\n  'onl': 13, 'mr': 13, 'law': 13, 'health': 12, 'rest': 12, 'how': 12,\n  'xn--90ais': 12, 'tours': 12, 'beer': 12, 'bb': 12, 'kp': 12, 'ngo': 12,\n  'restaurant': 11, 'finance': 11, 'sz': 11, 'delivery': 11,\n  'xn--d1acj3b': 11, 'dog': 11, 'bs': 11, 'foundation': 11,\n  'management': 11, 'black': 11, 'kiwi': 11, 'leclerc': 11, 'sb': 11,\n  'eco': 10, 'sl': 10, 'tg': 10, 'ventures': 10, 'dance': 10, 'parts': 10,\n  'abbott': 10, 'fitness': 10, 'radio': 10, 'wien': 10, 'boutique': 10,\n  'vu': 10, 'loan': 10, 'google': 10, 'town': 10, 'college': 10, 'bayern': 9,\n  'toys': 9, 'shoes': 9, 'tax': 9, 'ls': 9, 'band': 9, 'immo': 9, 'coach': 9,\n  'ne': 9, 'gm': 9, 'box': 9, 'hamburg': 9, 'mba': 9, 'promo': 9, 'koeln': 9,\n  'football': 9, 'green': 9, 'pictures': 9, 'cards': 9, 'vin': 9, 'mc': 9,\n  'cw': 8, 'dental': 8, 'yoga': 8, 'schule': 8, 'amsterdam': 8,\n  'bnpparibas': 8, 'wedding': 8, 'camp': 8, 'sap': 8, 'ax': 8, 'casa': 8,\n  'ski': 8, 'xn--80adxhks': 8, 'domains': 8, 'camera': 8, 'supply': 8,\n  'garden': 8, 'krd': 7, 'vegas': 7, 'bot': 7, 'sr': 7, 'page': 7, 'army': 7,\n  'jetzt': 7, 'barcelona': 7, 'cab': 7, 'quebec': 7, 'horse': 7, 'aws': 7,\n  'clothing': 7, 'casino': 7, 'bradesco': 7, 'taxi': 6, 'cymru': 6,\n  'exposed': 6, 'weber': 6, 'post': 6, 'tirol': 6, 'soy': 6, 'wine': 6,\n  'basketball': 6, 'builders': 6, 'fish': 6, 'recipes': 6, 'audi': 6,\n  'td': 6, 'diet': 6, 'realtor': 6, 'haus': 6, 'ads': 6, 'rentals': 6,\n  'pharmacy': 6, 'mp': 6, 'xn--80aswg': 5, 'cricket': 5, 'miami': 5,\n  'vote': 5, 'prod': 5, 'productions': 5, 'kitchen': 5, 'racing': 5, 'dm': 5,\n  'lighting': 5, 'xn--c1avg': 5, 'computer': 5, 'wf': 5, 'solar': 5,\n  'credit': 5, 'bible': 5, 'consulting': 5, 'gent': 5, 'equipment': 5,\n  'family': 5, 'jewelry': 5, 'auction': 5, 'forsale': 5, 'poker': 5,\n  'rio': 5, 'barclays': 5, 'shiksha': 4, 'gift': 4, 'office': 4, 'nagoya': 4,\n  'shopping': 4, 'discount': 4, 'lawyer': 4, 
'flights': 4, 'aw': 4,\n  'sydney': 4, 'srl': 4, 'golf': 4, 'rent': 4, 'surf': 4, 'gn': 4, 'hm': 4,\n  'observer': 4, 'corsica': 4, 'singles': 4, 'estate': 4, 'fashion': 4,\n  'sport': 4, 'vi': 4, 'fail': 4, 'trading': 4, 'nico': 4, 'limited': 4,\n  'ruhr': 4, 'adult': 4, 'nf': 4, 'tattoo': 4, 'sbi': 4, 'apartments': 4,\n  'insure': 4, 'cern': 3, 'neustar': 3, 'salon': 3, 'gp': 3, 'tatar': 3,\n  'lr': 3, 'med': 3, 'frl': 3, 'repair': 3, 'moda': 3, 'theater': 3,\n  'here': 3, 'xn--90ae': 3, 'fans': 3, 'yokohama': 3, 'forex': 3, 'pn': 3,\n  'sener': 3, 'gifts': 3, 'ipiranga': 3, 'gf': 3, 'holdings': 3, 'auto': 3,\n  'xn--3e0b707e': 3, 'cooking': 3, 'contractors': 3, 'futbol': 3,\n  'edeka': 3, 'cheap': 3, 'flowers': 3, 'study': 3, 'gmbh': 3, 'fishing': 3,\n  'healthcare': 3, 'hockey': 3, 'stockholm': 3, 'kn': 3, 'hot': 3, 'cars': 3,\n  'car': 3, 'archi': 3, 'telefonica': 3, 'vlaanderen': 3, 'industries': 3,\n  'claims': 2, 'vodka': 2, 'mom': 2, 'abudhabi': 2, 'faith': 2, 'career': 2,\n  'xin': 2, 'attorney': 2, 'bv': 2, 'ong': 2, 'sncf': 2, 'ricoh': 2,\n  'teva': 2, 'pioneer': 2, 'yandex': 2, 'lease': 2, 'investments': 2,\n  'security': 2, 'gop': 2, 'immobilien': 2, 'okinawa': 2, 'pictet': 2,\n  'goog': 2, 'tienda': 2, 'fan': 2, 'abc': 2, 'coupons': 2, 'sandvik': 2,\n  'monash': 2, 'ki': 2, 'inc': 2, 'country': 2, 'alsace': 2,\n  'barclaycard': 2, 'sony': 2, 'melbourne': 2, 'dhl': 2, 'brother': 2,\n  'glass': 2, 'ceb': 2, 'dentist': 2, 'aq': 2, 'mortgage': 2, 'sharp': 2,\n  'associates': 2, 'kpmg': 2, 'gw': 2, 'luxury': 2, 'afl': 2, 'mq': 2,\n  'sky': 2, 'total': 2, 'kaufen': 1, 'rwe': 1, 'woodside': 1, 'crs': 1,\n  'voyage': 1, 'tickets': 1, 'kpn': 1, 'xn--wgbl6a': 1, 'epson': 1,\n  'financial': 1, 'honda': 1, 'llc': 1, 'markets': 1, 'xn--90a3ac': 1,\n  'reisen': 1, 'reit': 1, 'courses': 1, 'ren': 1, 'drive': 1, 'nr': 1,\n  'xn--h2brj9c': 1, 'xn--tckwe': 1, 'gives': 1, 'sarl': 1, 'seat': 1,\n  'kred': 1, 'java': 1, 'fox': 1, 'komatsu': 1, 'abb': 1, 'gripe': 1,\n  
'osaka': 1, 'property': 1, 'insurance': 1, 'chrome': 1, 'hiphop': 1,\n  'crown': 1, 'actor': 1, 'zip': 1, 'rmit': 1, 'ceo': 1, 'limo': 1, 'luxe': 1,\n  'properties': 1, 'mango': 1, 'rodeo': 1, 'versicherung': 1, 'orange': 1,\n  'jcb': 1, 'xn--fiqs8s': 1, 'goo': 1, 'ryukyu': 1, 'xn--pgbs0dh': 1,\n  'off': 1, 'ck': 1, 'scb': 1, 'enterprises': 1, 'star': 1, 'capetown': 1,\n  'dvag': 1, 'ismaili': 1, 'spot': 1, 'uol': 1, 'vanguard': 1, 'axa': 1,\n  'accountant': 1, 'soccer': 1, 'cologne': 1, 'bargains': 1, 'juegos': 1,\n  'lamborghini': 1, 'cruises': 1, 'vacations': 1, 'stada': 1, 'skype': 1,\n  'hospital': 1, 'xn--54b7fta0cc': 1, 'xn--q9jyb4c': 1, 'weir': 1,\n  'guitars': 1, 'tires': 1, 'vivo': 1, 'madrid': 1, 'globo': 1, 'trv': 1,\n  'loans': 1, 'holiday': 1, 'rugby': 1, 'storage': 1, 'joburg': 1, 'ses': 1,\n  'creditcard': 1, 'degree': 1, 'surgery': 1, 'saxo': 1, 'softbank': 1,\n  'accountants': 1, 'cbn': 1, 'lundbeck': 1, 'physio': 1, 'organic': 1,\n  'you': 1, 'doctor': 1, 'kyoto': 1, 'realty': 1, 'cba': 1, 'praxi': 1,\n  'broker': 1, 'tennis': 1, 'qvc': 1, 'gmail': 1, 'viajes': 1,\n}\n"
  },
  {
    "path": "stats/tld_cisco_umbrella_top_1m.py",
    "content": "# derived from\n#   http://s3-us-west-1.amazonaws.com/umbrella-static/top-1m.csv.zip\n# fetched 2019-02-06, see also\n#   http://s3-us-west-1.amazonaws.com/umbrella-static/index.html\n#\n# \"The popularity list contains our most queried domains based on\n# passive DNS usage across our Umbrella global network of more than\n# 100 Billion requests per day with 65 million unique active users, in\n# more than 165 countries. Unlike Alexa, the metric is not based on\n# only browser based 'http' requests from users but rather takes into\n# account the number of unique client IPs invoking this domain\n# relative to the sum of all requests to all domains. In other words,\n# our popularity ranking reflects the domain’s relative internet\n# activity agnostic to the invocation protocols and applications where\n# as ’site ranking’ models (such as Alexa) focus on the web activity\n# over port 80 mainly from browsers.\n#\n# As for Alexa, the site’s rank is based on combined measure of unique\n# visitors (Alexa users who visit the site per day) and page views\n# (total URL requests from Alexa users for a site). Umbrella\n# popularity lists are generated on a daily basis reflecting the\n# actual world-wide usage of domains by Umbrella global network users\n# and includes root domains, subdomains in addition to TLDs (Alexa\n# list has only this). In addition, Umbrella popularity algorithm also\n# applies data normalization methodologies to smoothen potential\n# biases that may occur in the data due to sampling of the DNS usage\n# data.\"\n#\n#\n# NOTE: The list contains also domain names from intranets - 'localhost',\n#       'belkin', 'dlinkrouter', 'dmz', etc.  
These are filtered out by\n#       allowing only IANA-registered domain name suffixes.\n#\n\ncisco_umbrella_top_1m_tlds_about = {\n  'date': '2019-02-06',\n  'source': 'http://s3-us-west-1.amazonaws.com/umbrella-static/top-1m.csv.zip'\n}\n\ncisco_umbrella_top_1m_tlds = {\n  # zcat top-1m.csv.zip \\\n  #  | perl -ne 'chomp; s/^\\d+,//; s/.+\\.//; $h{$_}++;\n  #              END {\n  #                for (sort { $h{$b} <=> $h{$a} } keys %h) {\n  #                  print \"\\047\", $_, \"\\047:\", $h{$_}, \", \";\n  #                }\n  #              }' \\\n  #  | fold --width=70 -s | perl -lpe 's/^/  /; s/:/: /g; s/\\s+$//'\n  'com': 579421, 'net': 155319, 'org': 41951, 'ru': 14293, 'uk': 11216,\n  'edu': 10324, 'biz': 9884, 'io': 9316, 'de': 9179, 'me': 7807,\n  'info': 7483, 'cn': 6274, 'in': 6267, 'cc': 5401, 'co': 5352, 'gov': 5068,\n  'br': 4846, 'fr': 4752, 'nl': 4499, 'it': 4251, 'us': 3929, 'tv': 3813,\n  'eu': 3689, 'ca': 3585, 'jp': 3570, 'pl': 3361, 'vn': 2666, 'ua': 2572,\n  'es': 2249, 'au': 1901, 'mx': 1504, 'ch': 1462, 'be': 1455, 'id': 1386,\n  'se': 1253, 'dk': 1236, 'il': 1198, 'pt': 1180, 'link': 1153, 'cz': 1133,\n  'xyz': 1078, 'email': 1065, 'no': 1054, 'tr': 1044, 'kr': 996, 'club': 962,\n  'hu': 898, 'tw': 890, 'at': 866, 'mobi': 861, 'gr': 801, 'ir': 778,\n  'nz': 740, 'to': 735, 'pro': 707, 'cloud': 656, 'ro': 645, 'ar': 633,\n  'my': 631, 'hk': 612, 'online': 600, 'cl': 561, 'top': 540, 'za': 536,\n  'fi': 534, 'th': 526, 'mil': 489, 'sg': 488, 'sk': 486, 'pw': 463,\n  'name': 447, 'ie': 438, 'ng': 431, 'by': 419, 'ms': 402, 'st': 376,\n  'ec': 369, 'fm': 364, 'site': 362, 'ai': 361, 'ws': 357, 'is': 333,\n  'ph': 330, 'live': 326, 'pk': 325, 'im': 318, 'pe': 317, 'icu': 282,\n  've': 269, 'ae': 269, 'su': 264, 'media': 256, 'bg': 254, 'ly': 250,\n  'lt': 248, 'kz': 228, 'xxx': 227, 'gg': 223, 'do': 218, 'space': 216,\n  'hr': 211, 'services': 207, 'app': 202, 'cr': 198, 'tech': 196,\n  'systems': 182, 'gl': 175, 'ga': 172, 'rs': 166, 
'host': 163, 'news': 162,\n  'video': 154, 'box': 154, 'network': 148, 'bz': 142, 'md': 142, 'sh': 140,\n  'ee': 138, 'lv': 138, 'tc': 137, 'eg': 131, 'tk': 131, 'la': 128,\n  'asia': 128, 'solutions': 127, 'life': 127, 'si': 126, 'lk': 125,\n  'nu': 124, 'one': 123, 'fun': 122, 'int': 122, 'stream': 122, 'world': 121,\n  'zone': 118, 'bid': 118, 'uy': 113, 'gt': 113, 'rocks': 113, 'bd': 112,\n  'lu': 111, 'am': 110, 'ag': 109, 'cat': 108, 'today': 108, 'sa': 105,\n  'store': 102, 'click': 102, 'ninja': 101, 'digital': 100, 'website': 94,\n  'aero': 94, 'win': 92, 'li': 85, 're': 85, 'ba': 84, 'ke': 82, 'work': 78,\n  'pa': 77, 'ovh': 76, 'games': 74, 'support': 73, 'hn': 70, 'dz': 69,\n  'vip': 68, 'sc': 67, 'al': 66, 'arpa': 65, 'sex': 63, 'tools': 63,\n  'guru': 60, 'ml': 60, 'az': 59, 'global': 59, 'py': 58, 'management': 58,\n  'download': 57, 'travel': 57, 'ma': 56, 'coop': 56, 'cm': 55, 'cu': 54,\n  'aws': 54, 'works': 54, 'vc': 53, 'sv': 53, 'cy': 53, 'cool': 51,\n  'jobs': 51, 'chat': 51, 'so': 50, 'kh': 50, 'plus': 50, 'np': 50, 'cf': 49,\n  'kg': 47, 'technology': 47, 'uz': 47, 'gs': 47, 'qa': 46, 'date': 46,\n  'bo': 46, 'lb': 46, 'pub': 45, 'ge': 45, 'ac': 43, 'ni': 42, 'blog': 41,\n  'bet': 41, 'tf': 41, 'ad': 40, 'sx': 39, 'af': 39, 'cx': 37, 'money': 37,\n  'ps': 36, 'gh': 33, 'tn': 33, 'goog': 32, 'xn--p1ai': 32, 'agency': 32,\n  'zw': 32, 'as': 31, 'tt': 31, 'mn': 30, 'mk': 30, 'pm': 30, 'press': 29,\n  'shop': 29, 'events': 29, 'run': 29, 'mt': 29, 'wiki': 28, 'trade': 28,\n  'porn': 28, 'pr': 27, 'tl': 27, 'tube': 26, 'om': 26, 'studio': 26,\n  'sn': 24, 'ci': 24, 'mm': 23, 'gdn': 23, 'ug': 23, 'team': 23, 'moe': 23,\n  'sexy': 23, 'software': 22, 'pics': 21, 'tips': 21, 'vg': 21, 'review': 20,\n  'iq': 20, 'tz': 20, 'sap': 20, 'mg': 20, 'science': 20, 'land': 20,\n  'na': 20, 'party': 19, 'gq': 19, 'google': 19, 'help': 19, 'lol': 19,\n  'wtf': 19, 'center': 19, 'mu': 18, 'company': 18, 'cd': 17, 'gy': 17,\n  'ink': 17, 'jm': 17, 'sncf': 17, 
'fyi': 17, 'engineering': 17, 'group': 17,\n  'va': 17, 'market': 17, 'eus': 17, 'tm': 16, 'cash': 16, 'cricket': 16,\n  'care': 16, 'guide': 15, 'film': 15, 'mv': 15, 'bm': 15, 'buzz': 15,\n  'pg': 15, 'ne': 15, 'ooo': 15, 'direct': 15, 'bn': 14, 'expert': 14,\n  'lat': 14, 'game': 14, 'watch': 14, 'scot': 14, 'photos': 13, 'ao': 13,\n  'love': 13, 'bh': 13, 'uno': 13, 'design': 13, 'ky': 13, 'report': 13,\n  'menu': 13, 'ltd': 12, 'bank': 12, 'moscow': 12, 'movie': 12, 'bs': 12,\n  'bw': 12, 'mz': 12, 'nyc': 12, 'ht': 11, 'tj': 11, 'sm': 11, 'leclerc': 11,\n  'jo': 11, 'yandex': 11, 'dj': 11, 'show': 11, 'gd': 11, 'london': 11,\n  'nc': 10, 'rw': 10, 'training': 10, 'et': 10, 'social': 10, 'express': 10,\n  'gift': 10, 'church': 10, 'ye': 10, 'health': 10, 'dm': 10, 'bike': 10,\n  'fj': 10, 'school': 10, 'city': 10, 'hosting': 10, 'photo': 9, 'llc': 9,\n  'rip': 9, 'community': 9, 'recipes': 9, 'men': 9, 'domains': 9,\n  'supply': 9, 'education': 9, 'dev': 8, 'sky': 8, 'pn': 8, 'delivery': 8,\n  'law': 8, 'audio': 8, 'gratis': 8, 'kw': 8, 'cab': 8, 'gm': 8, 'pet': 8,\n  'rest': 8, 'build': 8, 'tel': 8, 'loan': 7, 'energy': 7, 'farm': 7, 'lc': 7,\n  'museum': 7, 'cv': 7, 'red': 7, 'vision': 7, 'ist': 7, 'ki': 7, 'fit': 7,\n  'je': 7, 'onl': 7, 'art': 7, 'pictures': 7, 'wf': 7, 'webcam': 7, 'pink': 7,\n  'vu': 7, 'zm': 7, 'supplies': 6, 'codes': 6, 'faith': 6, 'marketing': 6,\n  'pharmacy': 6, 'academy': 6, 'wang': 6, 'gold': 6, 'blue': 6, 'fail': 6,\n  'football': 6, 'business': 6, 'gi': 6, 'sl': 6, 'bio': 6, 'exchange': 6,\n  'post': 6, 'fo': 6, 'style': 6, 'army': 6, 'gp': 6, 'cafe': 6, 'paris': 6,\n  'hm': 6, 'gal': 6, 'cisco': 5, 'uol': 5, 'here': 5, 'nf': 5, 'house': 5,\n  'dog': 5, 'taxi': 5, 'bi': 5, 'sb': 5, 'schwarz': 5, 'sr': 5, 'careers': 5,\n  'kim': 5, 'bt': 5, 'canon': 5, 'pf': 5, 'sy': 5, 'yt': 5, 'ads': 4,\n  'tokyo': 4, 'international': 4, 'realtor': 4, 'earth': 4, 'legal': 4,\n  'nr': 4, 'dhl': 4, 'garden': 4, 'meet': 4, 'consulting': 4, 
'abbott': 4,\n  'weir': 4, 'toys': 4, 'ski': 4, 'bb': 4, 'deals': 4, 'bradesco': 4,\n  'fitness': 4, 'bot': 4, 'golf': 4, 'cw': 4, 'fish': 4, 'kpmg': 4, 'bj': 4,\n  'best': 4, 'cam': 4, 'boutique': 4, 'diet': 3, 'sd': 3, 'cheap': 3, 'td': 3,\n  'mo': 3, 'ck': 3, 'tours': 3, 'bnpparibas': 3, 'tax': 3, 'bzh': 3,\n  'directory': 3, 'adult': 3, 'fashion': 3, 'new': 3, 'istanbul': 3,\n  'neustar': 3, 'band': 3, 'bar': 3, 'vacations': 3, 'bf': 3, 'tg': 3,\n  'inc': 3, 'limited': 3, 'koeln': 3, 'barclays': 3, 'wales': 3, 'ren': 3,\n  'camera': 3, 'kiwi': 3, 'vet': 3, 'solar': 3, 'discount': 3, 'partners': 3,\n  'haus': 3, 'lease': 3, 'glass': 3, 'forsale': 3, 'radio': 3, 'builders': 3,\n  'hsbc': 3, 'racing': 3, 'shopping': 3, 'ax': 3, 'vi': 3, 'coffee': 2,\n  'nrw': 2, 'bingo': 2, 'cars': 2, 'saxo': 2, 'crs': 2, 'beer': 2,\n  'brother': 2, 'pizza': 2, 'chrome': 2, 'dance': 2, 'fans': 2, 'town': 2,\n  'flights': 2, 'car': 2, 'storage': 2, 'nra': 2, 'sony': 2, 'mc': 2,\n  'nico': 2, 'coach': 2, 'mp': 2, 'degree': 2, 'camp': 2, 'trust': 2,\n  'graphics': 2, 'miami': 2, 'sale': 2, 'reviews': 2, 'mw': 2, 'rugby': 2,\n  'ls': 2, 'finance': 2, 'cards': 2, 'how': 2, 'moda': 2, 'madrid': 2,\n  'quebec': 2, 'office': 2, 'xn--9dbq2a': 2, 'dating': 2, 'gallery': 2,\n  'kn': 2, 'basketball': 2, 'tattoo': 2, 'cg': 2, 'lgbt': 2, 'foundation': 2,\n  'africa': 2, 'barclaycard': 2, 'baby': 1, 'bing': 1, 'hitachi': 1,\n  'vin': 1, 'goo': 1, 'hockey': 1, 'insure': 1, 'actor': 1, 'saarland': 1,\n  'java': 1, 'gmail': 1, 'youtube': 1, 'ltda': 1, 'brussels': 1, 'navy': 1,\n  'xn--54b7fta0cc': 1, 'institute': 1, 'green': 1, 'prod': 1, 'diamonds': 1,\n  'ice': 1, 'cern': 1, 'itau': 1, 'seven': 1, 'associates': 1,\n  'williamhill': 1, 'auction': 1, 'abc': 1, 'xn--j1amh': 1, 'holiday': 1,\n  'xn--c1avg': 1, 'study': 1, 'tatar': 1, 'ss': 1, 'xn--d1acj3b': 1,\n  'vote': 1, 'docs': 1, 'amex': 1, 'page': 1, 'itv': 1, 'healthcare': 1,\n  'honda': 1, 'cymru': 1, 'place': 1, 'play': 1, 'dental': 1, 
'yahoo': 1,\n  'audible': 1, 'fage': 1, 'college': 1, 'eco': 1, 'aw': 1, 'gifts': 1,\n  'mr': 1, 'jaguar': 1, 'berlin': 1, 'photography': 1, 'secure': 1,\n  'xn--80asehdb': 1, 'crown': 1, 'gn': 1, 'landrover': 1, 'horse': 1,\n  'ventures': 1, 'kp': 1, 'vanguard': 1, 'casa': 1, 'luxury': 1,\n}\n"
  },
  {
    "path": "stats/tld_majestic_top_1m.py",
    "content": "# derived from\n#   http://downloads.majestic.com/majestic_million.csv\n# fetched 2019-02-06\n#\n# see also\n#\n#   https://majestic.com/reports/majestic-million\n#\n# The Majestic Million is a list of the top 1 million website in the\n# world, ordered by the number of referring subnets. A subnet is a bit\n# complex – but to a layman it is basically anything within an IP\n# range, ignoring the last three digits of the IP number.\n#\n#   https://majestic.com/support/faq#Where\n#\n# Where is the data coming from?\n#   Our data comes from the World Wide Web itself. The Majestic-12:\n#   Distributed Search Engine (http://www.majestic12.co.uk/) does not\n#   meta-search or otherwise query other search engines: we are the\n#   search engine! Over a long period of time we have developed\n#   software capable of crawling and indexing large amounts of web\n#   data. This index is a big stepping stone towards relevant\n#   full-text search. The purpose of the index is to allow relevancy\n#   research as well as to help fund continued activites in\n#   development of a competitive community-driven general-purpose\n#   web-scale search engine.\n#\n\nmajestic_top_1m_tlds_about = {\n  'date': '2019-02-06',\n  'source': 'http://downloads.majestic.com/majestic_million.csv'\n}\n\nmajestic_top_1m_tlds = {\n  # cut -d, -f4 majestic_million.csv | tail -n+2 \\\n  #  | perl -ne 'chomp; $h{$_}++;\n  #              END {\n  #                for (sort { $h{$b} <=> $h{$a} } keys %h) {\n  #                  print \"\\047\", $_, \"\\047:\", $h{$_}, \", \";\n  #                }\n  #              }' \\\n  #  | fold --width=70 -s | perl -lpe 's/^/  /; s/:/: /g; s/\\s+$//'\n  'com': 495190, 'org': 72365, 'net': 44704, 'ru': 43014, 'cn': 29361,\n  'uk': 25616, 'de': 23928, 'jp': 15220, 'pl': 11514, 'nl': 11167,\n  'info': 10601, 'it': 9829, 'fr': 9542, 'br': 8905, 'au': 8457,\n  'club': 8136, 'tw': 7140, 'us': 6584, 'ca': 6393, 'in': 6014, 'co': 5533,\n  'es': 5240, 'eu': 4791, 
'ua': 4010, 'edu': 3975, 'cz': 3689, 'se': 3549,\n  'ch': 3285, 'ir': 3220, 'vn': 3156, 'biz': 3050, 'be': 2827, 'ro': 2817,\n  'at': 2743, 'za': 2550, 'nu': 2428, 'dk': 2396, 'hu': 2252, 'tr': 2154,\n  'gr': 2110, 'top': 2105, 'io': 2064, 'me': 2057, 'tv': 2017, 'xyz': 1881,\n  'gov': 1721, 'xn--p1ai': 1715, 'site': 1668, 'mx': 1636, 'no': 1631,\n  'cc': 1559, 'fi': 1497, 'nz': 1481, 'ar': 1478, 'cl': 1463, 'kr': 1435,\n  'mobi': 1406, 'ie': 1322, 'pt': 1285, 'cf': 1258, 'by': 1157, 'il': 1133,\n  'id': 1109, 'my': 1085, 'sk': 1073, 'online': 1057, 'kz': 1014, 'tk': 1012,\n  'su': 904, 'hk': 877, 'store': 849, 'lt': 836, 'sg': 827, 'pro': 720,\n  'hr': 650, 'pw': 646, 'space': 602, 'pk': 568, 'ng': 566, 'th': 530,\n  'shop': 528, 'lv': 525, 'live': 514, 'gq': 505, 'ee': 504, 'doctor': 502,\n  'icu': 487, 'si': 487, 'cat': 480, 'world': 478, 'ph': 461, 'rs': 445,\n  'ae': 444, 'name': 443, 'bg': 432, 'to': 429, 'pe': 420, 'life': 403,\n  'ga': 401, 'ws': 367, 'is': 362, 'xn--fiqs8s': 355, 'ml': 353, 'fm': 326,\n  'ke': 317, 'fun': 296, 'sa': 279, 'win': 270, 'ma': 261, 'website': 260,\n  'video': 255, 'ge': 252, 'md': 251, 'bid': 247, 'stream': 232, 'uz': 232,\n  'ovh': 231, 'asia': 228, 'lk': 220, 'az': 220, 'am': 218, 'bd': 216,\n  'reisen': 207, 'ec': 206, 'tech': 206, 'news': 205, 've': 198, 'mk': 193,\n  'ba': 186, 'ooo': 185, 'np': 175, 'uy': 174, 'lu': 172, 'today': 169,\n  'vip': 167, 'science': 166, 'travel': 162, 'work': 160, 'ly': 150,\n  'men': 147, 'ai': 147, 'network': 144, 'im': 139, 'la': 138, 'review': 136,\n  'tn': 136, 'aero': 131, 'ltd': 129, 'bz': 127, 'ink': 127, 'do': 126,\n  'int': 123, 'coop': 123, 'st': 119, 'trade': 118, 'al': 117, 'guru': 116,\n  'press': 114, 'services': 114, 'eg': 113, 'mn': 112, 'host': 108,\n  'kg': 105, 'media': 104, 'cy': 98, 'li': 95, 'py': 93, 'webcam': 92,\n  'party': 92, 'zw': 90, 'link': 89, 'wiki': 89, 'one': 86, 'cx': 86,\n  'mil': 85, 'company': 81, 'eus': 80, 'mo': 80, 'global': 77, 'tz': 75,\n  'cu': 75, 
'gt': 74, 'tel': 73, 'blog': 72, 'gdn': 72, 'cr': 71, 'ms': 71,\n  'mt': 70, 'sh': 69, 'gs': 68, 'rocks': 67, 'gg': 67, 'vc': 66, 'jo': 66,\n  'lb': 65, 'zone': 65, 'bo': 65, 'ag': 63, 'cricket': 62, 'tips': 62,\n  'so': 62, 'ps': 60, 'team': 60, 'ug': 59, 'center': 57, 'qa': 57,\n  'accountant': 55, 'ninja': 55, 'pub': 55, 'agency': 55, 'dz': 54, 'tc': 53,\n  'vu': 53, 're': 52, 'tj': 51, 'city': 51, 'xxx': 50, 'blue': 47,\n  'moscow': 47, 'ac': 46, 'kh': 45, 'xn--p1acf': 45, 'london': 45,\n  'design': 45, 'gh': 45, 'tt': 44, 'group': 44, 'mu': 44, 'sc': 44,\n  'app': 43, 'cm': 42, 'studio': 41, 'click': 40, 'af': 40, 'nyc': 40,\n  'tokyo': 39, 'pet': 39, 'movie': 38, 'tools': 38, 'directory': 38,\n  'art': 38, 'promo': 37, 'as': 37, 'date': 36, 'social': 36, 'digital': 35,\n  'pink': 35, 'sn': 35, 'wang': 35, 'cloud': 35, 'wales': 35, 'vg': 35,\n  'pa': 34, 'scot': 33, 'college': 33, 'bio': 33, 'sv': 33, 'na': 33,\n  'download': 32, 'bt': 32, 'rent': 32, 'ni': 32, 'band': 31, 'mz': 31,\n  'kw': 31, 'toys': 31, 'museum': 30, 'cd': 30, 'jobs': 30, 'rw': 30,\n  'bw': 30, 'va': 29, 'education': 29, 'hn': 29, 'solutions': 29, 'gd': 29,\n  'actor': 29, 'mv': 29, 'systems': 28, 'om': 28, 'auction': 28,\n  'schule': 27, 'expert': 27, 'community': 27, 'guide': 27, 'gal': 27,\n  'love': 26, 'mg': 26, 'games': 26, 'ci': 26, 'tl': 26, 'mba': 26, 'gl': 26,\n  'plus': 26, 'nf': 25, 'works': 25, 'et': 25, 'bet': 25, 'mc': 25,\n  'paris': 25, 'loan': 24, 'zm': 24, 'yu': 24, 'berlin': 24, 'market': 24,\n  'fund': 24, 'sy': 24, 'ht': 23, 'help': 23, 'nrw': 23, 'bh': 22,\n  'events': 22, 'xn--80adxhks': 22, 'red': 22, 'gy': 21, 'support': 21,\n  'cash': 21, 'iq': 21, 'dj': 20, 'gm': 20, 'technology': 20, 'fj': 20,\n  'ao': 20, 'academy': 20, 'fail': 19, 'school': 19, 'ad': 19, 'faith': 19,\n  'swiss': 19, 'foundation': 19, 'run': 19, 'moe': 18, 'fo': 18, 'nc': 18,\n  'pn': 18, 'bzh': 18, 'pm': 18, 'racing': 17, 'xn--90ais': 17,\n  'reviews': 17, 'exchange': 17, 'cv': 17, 'land': 
17, 'gi': 16, 'ren': 16,\n  'jm': 16, 'google': 16, 'cars': 16, 'sm': 16, 'email': 16, 'tf': 16,\n  'ky': 16, 'mw': 15, 'sx': 15, 'coffee': 15, 'software': 15, 'cafe': 15,\n  'sd': 15, 'bb': 15, 'xn--j1amh': 15, 'pg': 15, 'pr': 15, 'gallery': 14,\n  'care': 14, 'poker': 14, 'bf': 14, 'xin': 14, 'amsterdam': 14, 'codes': 13,\n  'earth': 13, 'uno': 13, 'sr': 13, 'gp': 13, 'church': 13, 'pics': 13,\n  'brussels': 13, 'mm': 12, 'bm': 12, 'capital': 12, 'cool': 12,\n  'institute': 12, 'ls': 12, 'photo': 12, 'international': 12, 'tm': 12,\n  'je': 11, 'chat': 11, 'bike': 11, 'africa': 11, 'istanbul': 11,\n  'photos': 11, 'show': 11, 'money': 11, 'onl': 11, 'pf': 11, 'casino': 11,\n  'consulting': 11, 'camp': 11, 'report': 11, 'mr': 11, 'lc': 10,\n  'finance': 10, 'photography': 10, 'clinic': 10, 'tours': 10,\n  'graphics': 10, 'yt': 10, 'bi': 10, 'town': 10, 'legal': 10, 'bank': 9,\n  'marketing': 9, 'ngo': 9, 'farm': 9, 'bn': 9, 'kim': 9, 'dm': 9, 'ax': 9,\n  'abbott': 9, 'xn--80asehdb': 9, 'bayern': 9, 'tg': 9, 'energy': 9,\n  'porn': 8, 'sale': 8, 'lol': 8, 'bs': 8, 'nr': 8, 'pictures': 8, 'cymru': 8,\n  'fyi': 8, 'business': 8, 'ye': 8, 'deals': 8, 'audio': 8, 'rest': 7,\n  'ki': 7, 'game': 7, 'buzz': 7, 'sexy': 7, 'hm': 7, 'fit': 7, 'sex': 7,\n  'film': 7, 'domains': 7, 'ski': 7, 'coach': 7, 'best': 7, 'barcelona': 7,\n  'taipei': 7, 'style': 7, 'dev': 7, 'sz': 7, 'sl': 7, 'fitness': 7,\n  'house': 7, 'law': 7, 'place': 7, 'fish': 6, 'eco': 6, 'express': 6,\n  'basketball': 6, 'canon': 6, 'parts': 6, 'ne': 6, 'realtor': 6, 'green': 6,\n  'vi': 6, 'direct': 6, 'cg': 6, 'ist': 6, 'hosting': 6, 'recipes': 6,\n  'engineering': 6, 'wtf': 6, 'partners': 6, 'training': 6, 'engineer': 6,\n  'vision': 6, 'bj': 6, 'gratis': 6, 'mp': 6, 'kiwi': 6, 'gop': 5,\n  'properties': 5, 'delivery': 5, 'tirol': 5, 'watch': 5, 'cern': 5,\n  'careers': 5, 'sb': 5, 'estate': 5, 'joburg': 5, 'football': 5, 'koeln': 5,\n  'desi': 5, 'bar': 5, 'wien': 5, 'vote': 5, 'hamburg': 5, 'wf': 5,\n  
'camera': 5, 'neustar': 5, 'fashion': 5, 'weber': 5, 'mom': 5, 'taxi': 4,\n  'corsica': 4, 'university': 4, 'surf': 4, 'kp': 4, 'shoes': 4, 'wine': 4,\n  'dating': 4, 'kn': 4, 'lgbt': 4, 'health': 4, 'bnpparibas': 4, 'vegas': 4,\n  'beer': 4, 'rip': 4, 'repair': 4, 'productions': 4, 'vet': 4, 'gold': 4,\n  'family': 4, 'gift': 4, 'aq': 4, 'saarland': 4, 'srl': 4, 'dance': 4,\n  'dental': 4, 'supply': 4, 'how': 4, 'solar': 3, 'casa': 3, 'build': 3,\n  'tp': 3, 'pizza': 3, 'construction': 3, 'cab': 3, 'flowers': 3,\n  'credit': 3, 'jetzt': 3, 'xn--6qq986b3xl': 3, 'futbol': 3, 'garden': 3,\n  'boutique': 3, 'cheap': 3, 'pharmacy': 3, 'frl': 3, 'gifts': 3, 'yoga': 3,\n  'quebec': 3, 'auto': 3, 'builders': 3, 'xn--d1acj3b': 3, 'cards': 3,\n  'lat': 3, 'lighting': 3, 'sandvik': 3, 'villas': 3, 'krd': 3, 'ck': 3,\n  'tube': 3, 'sport': 3, 'xn--3ds443g': 3, 'sydney': 3, 'clothing': 3,\n  'lawyer': 3, 'archi': 3, 'brother': 2, 'army': 2, 'barclays': 2,\n  'discount': 2, 'aws': 2, 'hockey': 2, 'alsace': 2, 'an': 2, 'mortgage': 2,\n  'rio': 2, 'kpmg': 2, 'km': 2, 'restaurant': 2, 'dog': 2, 'menu': 2,\n  'cam': 2, 'catering': 2, 'moda': 2, 'active': 2, 'yokohama': 2,\n  'vlaanderen': 2, 'haus': 2, 'apple': 2, 'komatsu': 2, 'xn--6frz82g': 2,\n  'shiksha': 2, 'black': 2, 'kred': 2, 'bot': 2, 'tattoo': 2, 'gf': 2,\n  'golf': 2, 'miami': 2, 'hiv': 2, 'vin': 2, 'guitars': 2, 'physio': 2,\n  'post': 2, 'healthcare': 2, 'xn--80aswg': 2, 'tax': 2, 'kitchen': 2,\n  'tatar': 2, 'broker': 2, 'equipment': 2, 'nico': 2, 'xn--e1a4c': 2,\n  'nagoya': 2, 'forsale': 2, 'contractors': 2, 'kyoto': 2, 'diamonds': 2,\n  'immobilien': 2, 'page': 2, '\" \"': 2, 'industries': 2, 'radio': 2,\n  'horse': 2, 'okinawa': 2, 'holiday': 2, 'luxury': 2, 'loans': 2,\n  'citic': 1, 'enterprises': 1, 'vanguard': 1, 'kaufen': 1, 'sbi': 1,\n  'surgery': 1, 'yandex': 1, 'fast': 1, 'sony': 1, 'tickets': 1,\n  'dentist': 1, 'associates': 1, 'schmidt': 1, 'kpn': 1, 'bingo': 1,\n  'new': 1, 'glass': 1, 'security': 1, 
'property': 1, 'financial': 1,\n  'gu': 1, 'holdings': 1, 'diet': 1, 'gmail': 1, 'gw': 1, 'forum': 1,\n  'bible': 1, 'investments': 1, 'fans': 1, 'gent': 1, 'abc': 1,\n  'barclaycard': 1, 'fage': 1, 'here': 1, 'theater': 1, 'realestate': 1,\n  'attorney': 1, 'xn--3e0b707e': 1, 'markets': 1, 'mq': 1, 'goo': 1,\n  'reise': 1, 'box': 1, 'ismaili': 1, 'fan': 1, 'rentals': 1, 'irish': 1,\n  'gn': 1, 'florist': 1, 'td': 1, 'hitachi': 1, 'goog': 1, 'exposed': 1,\n  'flickr': 1, 'rehab': 1, 'monash': 1, 'voyage': 1, 'computer': 1, 'you': 1,\n  'uol': 1, 'cs': 1, 'pioneer': 1, 'limo': 1, 'bradesco': 1, 'madrid': 1,\n  'flights': 1, 'bbc': 1, 'dhl': 1, 'juegos': 1, 'free': 1, 'leclerc': 1,\n  'jll': 1, 'lidl': 1, 'cuisinella': 1, 'edeka': 1, 'cologne': 1, 'cw': 1,\n  'hot': 1, 'honda': 1, 'immo': 1, 'ipiranga': 1, 'youtube': 1, 'jewelry': 1,\n  'saxo': 1, 'sncf': 1, 'baidu': 1, 'charity': 1, 'softbank': 1, 'jcb': 1,\n  'audi': 1, 'bv': 1, 'rmit': 1, 'shopping': 1, 'java': 1, 'rwe': 1, 'ses': 1,\n  'fk': 1, 'ruhr': 1, 'xn--kpry57d': 1, 'gmbh': 1, 'weir': 1, 'pictet': 1,\n  'furniture': 1, 'melbourne': 1, 'rugby': 1, 'wedding': 1, 'ltda': 1,\n  'supplies': 1, 'trust': 1, 'vodka': 1, 'yahoo': 1, 'management': 1,\n  'microsoft': 1, 'big': 1, 'sener': 1, 'theatre': 1, 'mobile': 1,\n  'office': 1, 'soccer': 1, 'car': 1, 'qpon': 1, 'buy': 1, 'map': 1,\n  'lixil': 1, 'chrome': 1, 'hiphop': 1, 'study': 1, 'sky': 1, 'lr': 1,\n}\n"
  },
  {
    "path": "stats.Dockerfile",
    "content": "# Replicating pjox/cc-crawl-statistics\nFROM python:3.12\n\n# Install system dependencies\nRUN apt-get update && apt-get install -y \\\n    git \\\n    python3-rpy2 \\\n    r-cran-ggplot2 \\\n    graphviz-dev \\\n    r-base jq \\\n    awscli\n\n# Install Liberation Sans (Helvetica alternative) and other fonts\nRUN apt-get update && apt-get install -y \\\n    fontconfig \\\n    fonts-liberation \\\n    fonts-dejavu \\\n    && fc-cache -fv \\\n    && rm -rf /var/lib/apt/lists/*\n\n# Set working directory\nWORKDIR /app\n\n# Copy dependency config files (first for cache)\nCOPY requirements.txt .\nCOPY requirements_plot.txt .\n\n# Install Python dependencies\nRUN pip3 install -r requirements.txt\nRUN pip3 install -r requirements_plot.txt\n\n# Copy the remaining repository files\nCOPY stats/crawler ./stats/crawler\nCOPY plots/ ./plots/\nCOPY plot/ ./plot/\nCOPY tests/ ./tests/\n\nCOPY *.sh ./\nCOPY *.py ./\nCOPY _config.yml ./\n\n# Set environment variables\nENV PYTHONPATH=/app\n\n# Supported plotlibs: matplotlib, rpy2.ggplot2, ggplot (partially deprecated)\nENV PLOTLIB=matplotlib\n\n# ggplot2 is already installed via r-cran-ggplot2 system package above\n\n# Default command\nCMD [\"./get_stats_and_plot.sh\"]"
  },
  {
    "path": "tests/test_crawlstat.py",
    "content": "import json\nimport sys\n\nimport ujson\nimport jsonpickle\n\nfrom crawlstats import MonthlyCrawl, MonthlyCrawlSet\nfrom crawlstats import CrawlStatsJSONDecoder, CrawlStatsJSONEncoder\nfrom crawlstats import CST\nfrom crawlstats import MultiCount\nfrom hyperloglog import HyperLogLog\n\ncrawl1 = MonthlyCrawl.get_by_name('CC-MAIN-2014-52')\ncrawl2 = MonthlyCrawl.get_by_name('CC-MAIN-2015-06')\ncrawl3 = MonthlyCrawl.get_by_name('CC-MAIN-2016-26')\n\n\ndef test_monthly_crawl():\n    assert(crawl1 != crawl2)\n    assert(crawl1 < crawl2)\n    assert('{}'.format(crawl1) == json.dumps(crawl1))\n    assert('CC-MAIN-2014-52' == MonthlyCrawl.to_name(crawl1))\n\n\ndef test_monthly_crawl_set():\n    crawls = MonthlyCrawlSet()\n    assert('0' == json.dumps(crawls, cls=CrawlStatsJSONEncoder))\n\n    # add crawl 1 - CC-MAIN-2014-52\n    crawls.add(crawl1)\n    assert(crawl1 in crawls)\n    assert('1' == json.dumps(crawls, cls=CrawlStatsJSONEncoder))\n    assert(crawls.is_newest(crawl1))\n\n    # add crawl 2 - CC-MAIN-2015-06\n    crawls.add(crawl2)\n    assert(crawl2 in crawls)\n    assert(crawls.is_newest(crawl2))\n    assert(not crawls.is_newest(crawl1))\n\n    # create second crawl set and add crawl 3 - CC-MAIN-2016-26\n    crawls2 = MonthlyCrawlSet()\n    crawls2.add(crawl3)\n    assert(crawl3 in crawls2)\n\n    # merge the two crawl sets\n    crawls.update(crawls2)\n    assert(crawl3 in crawls)\n    assert(3 == len(crawls))\n\n    # check iterator over crawl set\n    for crawl in crawls.get_crawls():\n        assert(crawl in crawls)\n        assert((crawl == crawl1) or (crawl == crawl2) or (crawl == crawl3))\n        crawl = MonthlyCrawl.to_name(crawl)\n        assert((crawl == 'CC-MAIN-2014-52') or\n               (crawl == 'CC-MAIN-2015-06') or\n               (crawl == 'CC-MAIN-2016-26'))\n\n    # check is_newest in merged crawl set\n    assert(not crawls.is_newest(crawl2))\n    assert(crawls.is_newest(crawl3))\n\n    # check deletions from crawl set\n    
crawls.discard(crawl2)\n    assert(crawl2 not in crawls)\n    assert(crawl1 in crawls)\n\n    # check is_new\n    assert(not crawls.is_new(crawl2))\n    assert(not crawls.is_new(crawl3))\n    crawls.discard(crawl1)\n    assert(crawls.is_new(crawl3))\n    # although crawl2 is not in crawls there is no older crawl\n    assert(crawls.is_new(crawl2))\n\n\ndef test_crawlstatstype():\n    cst = CST.url\n    assert(cst.value == CST.url.value)\n\n\ndef test_json_hyperloglog():\n    hll1 = HyperLogLog(.01)\n    for i in range(0, 50):\n        hll1.add(i)\n    jsons = json.dumps(hll1, cls=CrawlStatsJSONEncoder)\n    hll2 = json.loads(jsons, cls=CrawlStatsJSONDecoder)\n    assert(hll1.card() == hll2.card())\n    # test jsonpickle serialization\n    jsonp = jsonpickle.encode(hll2)\n    hll3 = jsonpickle.decode(jsonp)\n    assert(hll1.card() == hll3.card())\n\n\ndef test_multicount():\n    cnt = MultiCount(2)\n    cnt.incr('a', 1, 1)\n    assert([1, 1] == cnt.get('a'))\n    assert(1 == cnt.get_compressed('a'))\n    cnt.incr('a', 2, 1)\n    assert([3, 2] == cnt.get_compressed('a'))\n    assert([3, 2] == MultiCount.sum_values([[2, 1], 1]))\n    assert([6, 4, 3] == MultiCount.sum_values([[3, 2, 1], [2, 1], 1]))\n    cnt.incr('b', *[2, 1])\n"
  },
  {
    "path": "top_level_domain.py",
    "content": "import fileinput\nimport idna\nimport re\n\n\nclass TopLevelDomain:\n    \"\"\"Classify top-level domains (TLDs) to provide the following information:\n- type: generic, country-code, ...\n- \"\"\"\n\n    tld_ccs = {}\n    tld_types = {}\n    short_types = {'generic': 'gTLD',\n                   'generic-restricted': 'grTLD',\n                   'infrastructure': 'ARPA',\n                   'country-code': 'ccTLD',\n                   'sponsored': 'sTLD',\n                   'test': 'tTLD',\n                   'internationalized generic': 'IDN gTLD',\n                   'internationalized country-code TLD': 'IDN ccTLD',\n                   'internationalized test TLD': 'IDN tTLD'\n                   }\n\n    def __init__(self, tld):\n        self.tld = tld = tld.lower()\n        self.first_level = self.tld\n        self.tld_type = None\n        self.sub_type = None\n        if tld in TopLevelDomain.tld_ccs:\n            self.first_level = TopLevelDomain.tld_ccs[tld]\n        elif tld.find('.'):\n            self.first_level = re.sub(r'^.+\\.', '', tld)\n        if tld in TopLevelDomain.tld_types:\n            self.tld_type = TopLevelDomain.tld_types[tld]\n        elif tld in TopLevelDomain.tld_ccs:\n            self.tld_type = 'country-code'\n            self.sub_type = 'internationalized'\n            self.first_level = TopLevelDomain.tld_ccs[tld]\n        elif self.first_level in TopLevelDomain.tld_types:\n            self.tld_type = TopLevelDomain.tld_types[self.first_level]\n            self.sub_type = 'second-level'\n\n    def __str__(self):\n        _str = self.tld + '('\n        if self.tld_type:\n            _str += self.tld_type\n        if self.sub_type:\n            _str += ', ' + self.sub_type\n        if self.first_level and self.first_level != self.tld:\n            _str += ' of ' + self.first_level\n        idn = idna.encode(self.tld).decode('utf-8')\n        if idn != self.tld:\n            _str += ', idn: ' + idn\n        _str += 
')'\n        return _str\n\n    @staticmethod\n    def _read_data():\n        state = ''\n        state_pattern = re.compile('^__([A-Z_]+)__$')\n        for line in TopLevelDomain.__DATA__.splitlines():\n            # print(line)\n            if len(line) == 0 or '#' == line[0]:\n                continue\n            m = state_pattern.match(line)\n            if m:\n                state = m.group(1)\n                continue\n            if state == 'IANA':\n                (tld, tld_type, _sponsoring_organization) = line.split('\\t')\n                tld = tld.strip('\\u200e\\u200f')\n                tld = tld.lstrip('.')\n                idn = idna.encode(tld).decode('utf-8')\n                if idn != tld:\n                    if tld_type == 'country-code':\n                        tld_type = 'internationalized country-code TLD'\n                    else:\n                        tld_type = 'internationalized ' + tld_type\n                    TopLevelDomain.tld_types[idn] = tld_type\n                TopLevelDomain.tld_types[tld] = tld_type\n            elif state == 'ICCTLD':\n                (dns, idn, _country, _lang, _script,\n                 _translit, _comment, cctld, _dnssec) = line.split('\\t')\n                dns = dns.lstrip('.')\n                cctld = cctld.lstrip('.')\n                idn = idn.lstrip('.')\n                if '[' in idn:\n                    # strip Wikipedia footnotes and links\n                    idn = re.sub(r'\\s*\\[.+?\\]\\s*$', '', idn)\n                for tld in (dns, idn):\n                    TopLevelDomain.tld_types[tld] \\\n                        = 'internationalized country-code TLD'\n                    TopLevelDomain.tld_ccs[tld] = cctld\n            elif state == 'INTERNATIONAL_BRAND_TLD':\n                (dns, idn, _entity, _script, _translit,\n                 _comments, _dnssec) = line.split('\\t')\n                dns = dns.lstrip('.')\n                idn = idn.lstrip('.')\n                
TopLevelDomain.tld_types[dns] = 'internationalized generic TLD'\n                TopLevelDomain.tld_types[idn] = 'internationalized generic TLD'\n            elif state == 'INTERNATIONAL_GEOGRAPHIC_TLD':\n                # geographic TLDs (not internationalized) are classified in IANA list as generic\n                (dns, idn, _entity, _script, _translit,\n                 _comments, _other_tld, _dnssec) = line.split('\\t')\n                dns = dns.lstrip('.')\n                idn = idn.lstrip('.')\n                TopLevelDomain.tld_types[dns] = 'internationalized generic TLD'\n                TopLevelDomain.tld_types[idn] = 'internationalized generic TLD'\n            elif state == 'INTERNATIONAL_TEST_TLD':\n                (dns, idn, _translit, _lang, _script, _test) = line.split('\\t')\n                dns = dns.lstrip('.')\n                idn = idn.lstrip('.')\n                TopLevelDomain.tld_types[dns] = 'internationalized test TLD'\n                TopLevelDomain.tld_types[idn] = 'internationalized test TLD'\n\n    @staticmethod\n    def short_type(name):\n        if name in TopLevelDomain.short_types:\n            return TopLevelDomain.short_types[name]\n        return name\n\n    __DATA__ = '''\\\n__IANA__\n# https://www.iana.org/domains/root/db\n# (update 2025-09-26)\n# Domain\tType\tTLD Manager\n.aaa\tgeneric\tAmerican Automobile Association, Inc.\n.aarp\tgeneric\tAARP\n.abarth\tgeneric\tNot assigned\n.abb\tgeneric\tABB Ltd\n.abbott\tgeneric\tAbbott Laboratories, Inc.\n.abbvie\tgeneric\tAbbVie Inc.\n.abc\tgeneric\tDisney Enterprises, Inc.\n.able\tgeneric\tAble Inc.\n.abogado\tgeneric\tRegistry Services, LLC\n.abudhabi\tgeneric\tAbu Dhabi Systems and Information Centre\n.ac\tcountry-code\tInternet Computer Bureau Limited\n.academy\tgeneric\tBinky Moon, LLC\n.accenture\tgeneric\tAccenture plc\n.accountant\tgeneric\tdot Accountant Limited\n.accountants\tgeneric\tBinky Moon, LLC\n.aco\tgeneric\tACO Severin Ahlmann GmbH & Co. 
KG\n.active\tgeneric\tNot assigned\n.actor\tgeneric\tDog Beach, LLC\n.ad\tcountry-code\tAndorra Telecom\n.adac\tgeneric\tNot assigned\n.ads\tgeneric\tCharleston Road Registry Inc.\n.adult\tgeneric\tICM Registry AD LLC\n.ae\tcountry-code\tTelecommunications and Digital Government Regulatory Authority (TDRA)\n.aeg\tgeneric\tAktiebolaget Electrolux\n.aero\tsponsored\tSociete Internationale de Telecommunications Aeronautique (SITA INC USA)\n.aetna\tgeneric\tAetna Life Insurance Company\n.af\tcountry-code\tMinistry of Communications and IT\n.afamilycompany\tgeneric\tNot assigned\n.afl\tgeneric\tAustralian Football League\n.africa\tgeneric\tZA Central Registry NPC trading as Registry.Africa\n.ag\tcountry-code\tUHSA School of Medicine\n.agakhan\tgeneric\tFondation Aga Khan (Aga Khan Foundation)\n.agency\tgeneric\tBinky Moon, LLC\n.ai\tcountry-code\tGovernment of Anguilla\n.aig\tgeneric\tAmerican International Group, Inc.\n.aigo\tgeneric\tNot assigned\n.airbus\tgeneric\tAirbus S.A.S.\n.airforce\tgeneric\tDog Beach, LLC\n.airtel\tgeneric\tBharti Airtel Limited\n.akdn\tgeneric\tFondation Aga Khan (Aga Khan Foundation)\n.al\tcountry-code\tElectronic and Postal Communications Authority - AKEP\n.alfaromeo\tgeneric\tNot assigned\n.alibaba\tgeneric\tAlibaba Group Holding Limited\n.alipay\tgeneric\tAlibaba Group Holding Limited\n.allfinanz\tgeneric\tAllfinanz Deutsche Vermögensberatung Aktiengesellschaft\n.allstate\tgeneric\tAllstate Fire and Casualty Insurance Company\n.ally\tgeneric\tAlly Financial Inc.\n.alsace\tgeneric\tREGION GRAND EST\n.alstom\tgeneric\tALSTOM\n.am\tcountry-code\t\"Internet Society\" Non-governmental Organization\n.amazon\tgeneric\tAmazon Registry Services, Inc.\n.americanexpress\tgeneric\tAmerican Express Travel Related Services Company, Inc.\n.americanfamily\tgeneric\tAmFam, Inc.\n.amex\tgeneric\tAmerican Express Travel Related Services Company, Inc.\n.amfam\tgeneric\tAmFam, Inc.\n.amica\tgeneric\tAmica Mutual Insurance 
Company\n.amsterdam\tgeneric\tGemeente Amsterdam\n.an\tcountry-code\tNot assigned\n.analytics\tgeneric\tCampus IP LLC\n.android\tgeneric\tCharleston Road Registry Inc.\n.anquan\tgeneric\tQIHOO 360 TECHNOLOGY CO. LTD.\n.anz\tgeneric\tAustralia and New Zealand Banking Group Limited\n.ao\tcountry-code\tMinistry of Telecommunications and Information Technologies (MTTI)\n.aol\tgeneric\tYahoo Inc.\n.apartments\tgeneric\tBinky Moon, LLC\n.app\tgeneric\tCharleston Road Registry Inc.\n.apple\tgeneric\tApple Inc.\n.aq\tcountry-code\tAntarctica Network Information Centre Limited\n.aquarelle\tgeneric\tAquarelle.com\n.ar\tcountry-code\tPresidencia de la Nación , Secretaría Legal y Técnica\n.arab\tgeneric\tLeague of Arab States\n.aramco\tgeneric\tAramco Services Company\n.archi\tgeneric\tIdentity Digital Limited\n.army\tgeneric\tDog Beach, LLC\n.arpa\tinfrastructure\tInternet Architecture Board (IAB)\n.art\tgeneric\tUK Creative Ideas Limited\n.arte\tgeneric\tAssociation Relative à la Télévision Européenne G.E.I.E.\n.as\tcountry-code\tAS Domain Registry\n.asda\tgeneric\tAsda Stores Limited\n.asia\tsponsored\tDotAsia Organisation Ltd.\n.associates\tgeneric\tBinky Moon, LLC\n.at\tcountry-code\tnic.at GmbH\n.athleta\tgeneric\tThe Gap, Inc.\n.attorney\tgeneric\tDog Beach, LLC\n.au\tcountry-code\t.au Domain Administration (auDA)\n.auction\tgeneric\tDog Beach, LLC\n.audi\tgeneric\tAUDI Aktiengesellschaft\n.audible\tgeneric\tAmazon Registry Services, Inc.\n.audio\tgeneric\tXYZ.COM LLC\n.auspost\tgeneric\tAustralian Postal Corporation\n.author\tgeneric\tAmazon Registry Services, Inc.\n.auto\tgeneric\tXYZ.COM LLC\n.autos\tgeneric\tXYZ.COM LLC\n.avianca\tgeneric\tNot assigned\n.aw\tcountry-code\tSETAR\n.aws\tgeneric\tAWS Registry LLC\n.ax\tcountry-code\tÅlands landskapsregering\n.axa\tgeneric\tAXA Group Operations SAS\n.az\tcountry-code\tIntraNS\n.azure\tgeneric\tMicrosoft Corporation\n.ba\tcountry-code\tUniverstiy Telinformatic Centre (UTIC)\n.baby\tgeneric\tXYZ.COM 
LLC\n.baidu\tgeneric\tBaidu, Inc.\n.banamex\tgeneric\tCitigroup Inc.\n.bananarepublic\tgeneric\tNot assigned\n.band\tgeneric\tDog Beach, LLC\n.bank\tgeneric\tfTLD Registry Services, LLC\n.bar\tgeneric\tPunto 2012 Sociedad Anonima Promotora de Inversion de Capital Variable\n.barcelona\tgeneric\tMunicipi de Barcelona\n.barclaycard\tgeneric\tBarclays Bank PLC\n.barclays\tgeneric\tBarclays Bank PLC\n.barefoot\tgeneric\tGallo Vineyards, Inc.\n.bargains\tgeneric\tBinky Moon, LLC\n.baseball\tgeneric\tMLB Advanced Media DH, LLC\n.basketball\tgeneric\tFédération Internationale de Basketball (FIBA)\n.bauhaus\tgeneric\tWerkhaus GmbH\n.bayern\tgeneric\tBayern Connect GmbH\n.bb\tcountry-code\tMinistry of Innovation, Science and Smart Technology\n.bbc\tgeneric\tBritish Broadcasting Corporation\n.bbt\tgeneric\tBB&T Corporation\n.bbva\tgeneric\tBANCO BILBAO VIZCAYA ARGENTARIA, S.A.\n.bcg\tgeneric\tThe Boston Consulting Group, Inc.\n.bcn\tgeneric\tMunicipi de Barcelona\n.bd\tcountry-code\tPosts and Telecommunications Division\n.be\tcountry-code\tDNS Belgium vzw/asbl\n.beats\tgeneric\tBeats Electronics, LLC\n.beauty\tgeneric\tXYZ.COM LLC\n.beer\tgeneric\tRegistry Services, LLC\n.bentley\tgeneric\tNot assigned\n.berlin\tgeneric\tdotBERLIN GmbH & Co. 
KG\n.best\tgeneric\tBestTLD Pty Ltd\n.bestbuy\tgeneric\tBBY Solutions, Inc.\n.bet\tgeneric\tIdentity Digital Limited\n.bf\tcountry-code\tAutorité de Régulation des Communications Electroniques et des Postes (ARCEP)\n.bg\tcountry-code\tRegister.BG\n.bh\tcountry-code\tTelecommunications Regulatory Authority (TRA)\n.bharti\tgeneric\tBharti Enterprises (Holding) Private Limited\n.bi\tcountry-code\tCentre National de l'Informatique\n.bible\tgeneric\tAmerican Bible Society\n.bid\tgeneric\tdot Bid Limited\n.bike\tgeneric\tBinky Moon, LLC\n.bing\tgeneric\tMicrosoft Corporation\n.bingo\tgeneric\tBinky Moon, LLC\n.bio\tgeneric\tIdentity Digital Limited\n.biz\tgeneric-restricted\tRegistry Services, LLC\n.bj\tcountry-code\tAutorité de Régulation des Communications Electroniques et de la Poste du Bénin (ARCEP BENIN)\n.bl\tcountry-code\tNot assigned\n.black\tgeneric\tIdentity Digital Limited\n.blackfriday\tgeneric\tRegistry Services, LLC\n.blanco\tgeneric\tNot assigned\n.blockbuster\tgeneric\tDish DBS Corporation\n.blog\tgeneric\tKnock Knock WHOIS There, LLC\n.bloomberg\tgeneric\tBloomberg IP Holdings LLC\n.blue\tgeneric\tIdentity Digital Limited\n.bm\tcountry-code\tRegistry General Department, Ministry of Home Affairs\n.bms\tgeneric\tBristol-Myers Squibb Company\n.bmw\tgeneric\tBayerische Motoren Werke Aktiengesellschaft\n.bn\tcountry-code\tAuthority for Info-communications Technology Industry of Brunei Darussalam (AITI)\n.bnl\tgeneric\tNot assigned\n.bnpparibas\tgeneric\tBNP Paribas\n.bo\tcountry-code\tAgencia para el Desarrollo de la Información de la Sociedad en Bolivia\n.boats\tgeneric\tXYZ.COM LLC\n.boehringer\tgeneric\tBoehringer Ingelheim International GmbH\n.bofa\tgeneric\tBank of America Corporation\n.bom\tgeneric\tNúcleo de Informação e Coordenação do Ponto BR - NIC.br\n.bond\tgeneric\tShortdot SA\n.boo\tgeneric\tCharleston Road Registry Inc.\n.book\tgeneric\tAmazon Registry Services, Inc.\n.booking\tgeneric\tBooking.com B.V.\n.boots\tgeneric\tNot 
assigned\n.bosch\tgeneric\tRobert Bosch GMBH\n.bostik\tgeneric\tBostik SA\n.boston\tgeneric\tRegistry Services, LLC\n.bot\tgeneric\tAmazon Registry Services, Inc.\n.boutique\tgeneric\tBinky Moon, LLC\n.box\tgeneric\tIntercap Registry Inc.\n.bq\tcountry-code\tNot assigned\n.br\tcountry-code\tComite Gestor da Internet no Brasil\n.bradesco\tgeneric\tBanco Bradesco S.A.\n.bridgestone\tgeneric\tBridgestone Corporation\n.broadway\tgeneric\tCelebrate Broadway, Inc.\n.broker\tgeneric\tDog Beach, LLC\n.brother\tgeneric\tBrother Industries, Ltd.\n.brussels\tgeneric\tDNS.be vzw\n.bs\tcountry-code\tUniversity of The Bahamas\n.bt\tcountry-code\tMinistry of Information and Communications\n.budapest\tgeneric\tNot assigned\n.bugatti\tgeneric\tNot assigned\n.build\tgeneric\tPlan Bee LLC\n.builders\tgeneric\tBinky Moon, LLC\n.business\tgeneric\tBinky Moon, LLC\n.buy\tgeneric\tAmazon Registry Services, INC\n.buzz\tgeneric\tDOTSTRATEGY CO.\n.bv\tcountry-code\tNorid A/S\n.bw\tcountry-code\tBotswana Communications Regulatory Authority (BOCRA)\n.by\tcountry-code\tBelarusian Cloud Technologies LLC\n.bz\tcountry-code\tUniversity of Belize\n.bzh\tgeneric\tAssociation www.bzh\n.ca\tcountry-code\tCanadian Internet Registration Authority (CIRA) Autorité Canadienne pour les enregistrements Internet (ACEI)\n.cab\tgeneric\tBinky Moon, LLC\n.cafe\tgeneric\tBinky Moon, LLC\n.cal\tgeneric\tCharleston Road Registry Inc.\n.call\tgeneric\tAmazon Registry Services, Inc.\n.calvinklein\tgeneric\tPVH gTLD Holdings LLC\n.cam\tgeneric\tCAM Connecting SARL\n.camera\tgeneric\tBinky Moon, LLC\n.camp\tgeneric\tBinky Moon, LLC\n.cancerresearch\tgeneric\tNot assigned\n.canon\tgeneric\tCanon Inc.\n.capetown\tgeneric\tZA Central Registry NPC trading as ZA Central Registry\n.capital\tgeneric\tBinky Moon, LLC\n.capitalone\tgeneric\tCapital One Financial Corporation\n.car\tgeneric\tXYZ.COM LLC\n.caravan\tgeneric\tCaravan International, Inc.\n.cards\tgeneric\tBinky Moon, LLC\n.care\tgeneric\tBinky Moon, 
LLC\n.career\tgeneric\tdotCareer LLC\n.careers\tgeneric\tBinky Moon, LLC\n.cars\tgeneric\tXYZ.COM LLC\n.cartier\tgeneric\tNot assigned\n.casa\tgeneric\tRegistry Services, LLC\n.case\tgeneric\tDigity, LLC\n.caseih\tgeneric\tNot assigned\n.cash\tgeneric\tBinky Moon, LLC\n.casino\tgeneric\tBinky Moon, LLC\n.cat\tsponsored\tFundacio puntCAT\n.catering\tgeneric\tBinky Moon, LLC\n.catholic\tgeneric\tPontificium Consilium de Comunicationibus Socialibus (PCCS) (Pontifical Council for Social Communication)\n.cba\tgeneric\tCOMMONWEALTH BANK OF AUSTRALIA\n.cbn\tgeneric\tThe Christian Broadcasting Network, Inc.\n.cbre\tgeneric\tCBRE, Inc.\n.cbs\tgeneric\tNot assigned\n.cc\tcountry-code\teNIC Cocos (Keeling) Islands Pty. Ltd. d/b/a Island Internet Services\n.cd\tcountry-code\tOffice Congolais des Postes et Télécommunications - OCPT\n.ceb\tgeneric\tNot assigned\n.center\tgeneric\tBinky Moon, LLC\n.ceo\tgeneric\tXYZ.COM LLC\n.cern\tgeneric\tEuropean Organization for Nuclear Research (\"CERN\")\n.cf\tcountry-code\tSociete Centrafricaine de Telecommunications (SOCATEL)\n.cfa\tgeneric\tCFA Institute\n.cfd\tgeneric\tShortdot SA\n.cg\tcountry-code\tInterpoint Switzerland\n.ch\tcountry-code\tSWITCH The Swiss Education & Research Network\n.chanel\tgeneric\tChanel International B.V.\n.channel\tgeneric\tCharleston Road Registry Inc.\n.charity\tgeneric\tPublic Interest Registry (PIR)\n.chase\tgeneric\tJPMorgan Chase Bank, National Association\n.chat\tgeneric\tBinky Moon, LLC\n.cheap\tgeneric\tBinky Moon, LLC\n.chintai\tgeneric\tCHINTAI Corporation\n.chloe\tgeneric\tNot assigned\n.christmas\tgeneric\tXYZ.COM LLC\n.chrome\tgeneric\tCharleston Road Registry Inc.\n.chrysler\tgeneric\tNot assigned\n.church\tgeneric\tBinky Moon, LLC\n.ci\tcountry-code\tAutorité de Régulation des Télécommunications/TIC de Côte d’lvoire (ARTCI)\n.cipriani\tgeneric\tHotel Cipriani Srl\n.circle\tgeneric\tAmazon Registry Services, Inc.\n.cisco\tgeneric\tCisco Technology, Inc.\n.citadel\tgeneric\tCitadel Domain 
LLC\n.citi\tgeneric\tCitigroup Inc.\n.citic\tgeneric\tCITIC Group Corporation\n.city\tgeneric\tBinky Moon, LLC\n.cityeats\tgeneric\tNot assigned\n.ck\tcountry-code\tTelecom Cook Islands Ltd.\n.cl\tcountry-code\tNIC Chile (University of Chile)\n.claims\tgeneric\tBinky Moon, LLC\n.cleaning\tgeneric\tBinky Moon, LLC\n.click\tgeneric\tInternet Naming Co.\n.clinic\tgeneric\tBinky Moon, LLC\n.clinique\tgeneric\tThe Estée Lauder Companies Inc.\n.clothing\tgeneric\tBinky Moon, LLC\n.cloud\tgeneric\tARUBA PEC S.p.A.\n.club\tgeneric\tRegistry Services, LLC\n.clubmed\tgeneric\tClub Méditerranée S.A.\n.cm\tcountry-code\tAgence Nationale des Technologies de l'Information et de la Communication (ANTIC)\n.cn\tcountry-code\tChina Internet Network Information Center (CNNIC)\n.co\tcountry-code\tMinistry of Information and Communications Technologies (MinTIC)\n.coach\tgeneric\tBinky Moon, LLC\n.codes\tgeneric\tBinky Moon, LLC\n.coffee\tgeneric\tBinky Moon, LLC\n.college\tgeneric\tXYZ.COM LLC\n.cologne\tgeneric\tdotKoeln GmbH\n.com\tgeneric\tVeriSign Global Registry Services\n.comcast\tgeneric\tNot assigned\n.commbank\tgeneric\tCOMMONWEALTH BANK OF AUSTRALIA\n.community\tgeneric\tBinky Moon, LLC\n.company\tgeneric\tBinky Moon, LLC\n.compare\tgeneric\tRegistry Services, LLC\n.computer\tgeneric\tBinky Moon, LLC\n.comsec\tgeneric\tVeriSign, Inc.\n.condos\tgeneric\tBinky Moon, LLC\n.construction\tgeneric\tBinky Moon, LLC\n.consulting\tgeneric\tDog Beach, LLC\n.contact\tgeneric\tDog Beach, LLC\n.contractors\tgeneric\tBinky Moon, LLC\n.cooking\tgeneric\tRegistry Services, LLC\n.cookingchannel\tgeneric\tNot assigned\n.cool\tgeneric\tBinky Moon, LLC\n.coop\tsponsored\tDotCooperation LLC\n.corsica\tgeneric\tCollectivité de Corse\n.country\tgeneric\tInternet Naming Co.\n.coupon\tgeneric\tAmazon Registry Services, Inc.\n.coupons\tgeneric\tBinky Moon, LLC\n.courses\tgeneric\tRegistry Services, LLC\n.cpa\tgeneric\tAmerican Institute of Certified Public Accountants\n.cr\tcountry-code\tNational 
Academy of Sciences (Academia Nacional de Ciencias)\n.credit\tgeneric\tBinky Moon, LLC\n.creditcard\tgeneric\tBinky Moon, LLC\n.creditunion\tgeneric\tDotCooperation, LLC\n.cricket\tgeneric\tdot Cricket Limited\n.crown\tgeneric\tCrown Equipment Corporation\n.crs\tgeneric\tFederated Co-operatives Limited\n.cruise\tgeneric\tViking River Cruises (Bermuda) Ltd.\n.cruises\tgeneric\tBinky Moon, LLC\n.csc\tgeneric\tNot assigned\n.cu\tcountry-code\tCENIAInternet\n.cuisinella\tgeneric\tSCHMIDT GROUPE S.A.S.\n.cv\tcountry-code\tAgência Reguladora Multissectorial da Economia (ARME)\n.cw\tcountry-code\tUniversity of Curacao\n.cx\tcountry-code\tChristmas Island Domain Administration Limited\n.cy\tcountry-code\tUniversity of Cyprus\n.cymru\tgeneric\tNominet UK\n.cyou\tgeneric\tShortdot SA\n.cz\tcountry-code\tCZ.NIC, z.s.p.o\n.dabur\tgeneric\tNot assigned\n.dad\tgeneric\tCharleston Road Registry Inc.\n.dance\tgeneric\tDog Beach, LLC\n.data\tgeneric\tDish DBS Corporation\n.date\tgeneric\tdot Date Limited\n.dating\tgeneric\tBinky Moon, LLC\n.datsun\tgeneric\tNISSAN MOTOR CO., LTD.\n.day\tgeneric\tCharleston Road Registry Inc.\n.dclk\tgeneric\tCharleston Road Registry Inc.\n.dds\tgeneric\tRegistry Services, LLC\n.de\tcountry-code\tDENIC eG\n.deal\tgeneric\tAmazon Registry Services, Inc.\n.dealer\tgeneric\tIntercap Registry Inc.\n.deals\tgeneric\tBinky Moon, LLC\n.degree\tgeneric\tDog Beach, LLC\n.delivery\tgeneric\tBinky Moon, LLC\n.dell\tgeneric\tDell Inc.\n.deloitte\tgeneric\tDeloitte Touche Tohmatsu\n.delta\tgeneric\tDelta Air Lines, Inc.\n.democrat\tgeneric\tDog Beach, LLC\n.dental\tgeneric\tBinky Moon, LLC\n.dentist\tgeneric\tDog Beach, LLC\n.desi\tgeneric\tEmergency Back-End Registry Operator Program - ICANN\n.design\tgeneric\tRegistry Services, LLC\n.dev\tgeneric\tCharleston Road Registry Inc.\n.dhl\tgeneric\tDeutsche Post AG\n.diamonds\tgeneric\tBinky Moon, LLC\n.diet\tgeneric\tXYZ.COM LLC\n.digital\tgeneric\tBinky Moon, LLC\n.direct\tgeneric\tBinky Moon, 
LLC\n.directory\tgeneric\tBinky Moon, LLC\n.discount\tgeneric\tBinky Moon, LLC\n.discover\tgeneric\tDiscover Financial Services\n.dish\tgeneric\tDish DBS Corporation\n.diy\tgeneric\tInternet Naming Co.\n.dj\tcountry-code\tDjibouti Telecom S.A\n.dk\tcountry-code\tDansk Internet Forum\n.dm\tcountry-code\tDotDM Corporation\n.dnp\tgeneric\tDai Nippon Printing Co., Ltd.\n.do\tcountry-code\tPontificia Universidad Catolica Madre y Maestra, Recinto Santo Tomas de Aquino\n.docs\tgeneric\tCharleston Road Registry Inc.\n.doctor\tgeneric\tBinky Moon, LLC\n.dodge\tgeneric\tNot assigned\n.dog\tgeneric\tBinky Moon, LLC\n.doha\tgeneric\tNot assigned\n.domains\tgeneric\tBinky Moon, LLC\n.doosan\tgeneric\tNot assigned\n.dot\tgeneric\tDish DBS Corporation\n.download\tgeneric\tdot Support Limited\n.drive\tgeneric\tCharleston Road Registry Inc.\n.dtv\tgeneric\tDish DBS Corporation\n.dubai\tgeneric\tDubai Smart Government Department\n.duck\tgeneric\tNot assigned\n.dunlop\tgeneric\tThe Goodyear Tire & Rubber Company\n.duns\tgeneric\tNot assigned\n.dupont\tgeneric\tDuPont Specialty Products USA, LLC\n.durban\tgeneric\tZA Central Registry NPC trading as ZA Central Registry\n.dvag\tgeneric\tDeutsche Vermögensberatung Aktiengesellschaft DVAG\n.dvr\tgeneric\tDISH Technologies L.L.C.\n.dz\tcountry-code\tCERIST\n.earth\tgeneric\tInterlink Systems Innovation Institute K.K.\n.eat\tgeneric\tCharleston Road Registry Inc.\n.ec\tcountry-code\tECUADORDOMAIN S.A.\n.eco\tgeneric\tBig Room Inc.\n.edeka\tgeneric\tEDEKA Verband kaufmännischer Genossenschaften e.V.\n.edu\tsponsored\tEDUCAUSE\n.education\tgeneric\tBinky Moon, LLC\n.ee\tcountry-code\tEesti Interneti Sihtasutus (EIS)\n.eg\tcountry-code\tEgyptian Universities Network (EUN), Supreme Council of Universities\n.eh\tcountry-code\tNot assigned\n.email\tgeneric\tBinky Moon, LLC\n.emerck\tgeneric\tMerck KGaA\n.emerson\tgeneric\tNot assigned\n.energy\tgeneric\tBinky Moon, LLC\n.engineer\tgeneric\tDog Beach, LLC\n.engineering\tgeneric\tBinky Moon, 
LLC\n.enterprises\tgeneric\tBinky Moon, LLC\n.epost\tgeneric\tNot assigned\n.epson\tgeneric\tSeiko Epson Corporation\n.equipment\tgeneric\tBinky Moon, LLC\n.er\tcountry-code\tEritrea Telecommunication Services Corporation (EriTel)\n.ericsson\tgeneric\tTelefonaktiebolaget L M Ericsson\n.erni\tgeneric\tERNI Group Holding AG\n.es\tcountry-code\tRed.es\n.esq\tgeneric\tCharleston Road Registry Inc.\n.estate\tgeneric\tBinky Moon, LLC\n.esurance\tgeneric\tNot assigned\n.et\tcountry-code\tEthio telecom\n.etisalat\tgeneric\tNot assigned\n.eu\tcountry-code\tEURid vzw/asbl\n.eurovision\tgeneric\tEuropean Broadcasting Union (EBU)\n.eus\tgeneric\tPuntueus Fundazioa\n.events\tgeneric\tBinky Moon, LLC\n.everbank\tgeneric\tNot assigned\n.exchange\tgeneric\tBinky Moon, LLC\n.expert\tgeneric\tBinky Moon, LLC\n.exposed\tgeneric\tBinky Moon, LLC\n.express\tgeneric\tBinky Moon, LLC\n.extraspace\tgeneric\tExtra Space Storage LLC\n.fage\tgeneric\tFage International S.A.\n.fail\tgeneric\tBinky Moon, LLC\n.fairwinds\tgeneric\tFairWinds Partners, LLC\n.faith\tgeneric\tdot Faith Limited\n.family\tgeneric\tDog Beach, LLC\n.fan\tgeneric\tDog Beach, LLC\n.fans\tgeneric\tZDNS International Limited\n.farm\tgeneric\tBinky Moon, LLC\n.farmers\tgeneric\tFarmers Insurance Exchange\n.fashion\tgeneric\tRegistry Services, LLC\n.fast\tgeneric\tAmazon Registry Services, Inc.\n.fedex\tgeneric\tFederal Express Corporation\n.feedback\tgeneric\tTop Level Spectrum, Inc.\n.ferrari\tgeneric\tFiat Chrysler Automobiles N.V.\n.ferrero\tgeneric\tFerrero Trading Lux S.A.\n.fi\tcountry-code\tFinnish Transport and Communications Agency Traficom\n.fiat\tgeneric\tNot assigned\n.fidelity\tgeneric\tFidelity Brokerage Services LLC\n.fido\tgeneric\tRogers Communications Canada Inc.\n.film\tgeneric\tMotion Picture Domain Registry Pty Ltd\n.final\tgeneric\tNúcleo de Informação e Coordenação do Ponto BR - NIC.br\n.finance\tgeneric\tBinky Moon, LLC\n.financial\tgeneric\tBinky Moon, LLC\n.fire\tgeneric\tAmazon Registry Services, 
Inc.\n.firestone\tgeneric\tBridgestone Licensing Services, Inc.\n.firmdale\tgeneric\tFirmdale Holdings Limited\n.fish\tgeneric\tBinky Moon, LLC\n.fishing\tgeneric\tRegistry Services, LLC\n.fit\tgeneric\tRegistry Services, LLC\n.fitness\tgeneric\tBinky Moon, LLC\n.fj\tcountry-code\tThe University of the South Pacific IT Services\n.fk\tcountry-code\tFalkland Islands Government\n.flickr\tgeneric\tFlickr, Inc.\n.flights\tgeneric\tBinky Moon, LLC\n.flir\tgeneric\tFLIR Systems, Inc.\n.florist\tgeneric\tBinky Moon, LLC\n.flowers\tgeneric\tXYZ.COM LLC\n.flsmidth\tgeneric\tNot assigned\n.fly\tgeneric\tCharleston Road Registry Inc.\n.fm\tcountry-code\tFSM Telecommunications Corporation\n.fo\tcountry-code\tFO Council\n.foo\tgeneric\tCharleston Road Registry Inc.\n.food\tgeneric\tInternet Naming Co.\n.foodnetwork\tgeneric\tNot assigned\n.football\tgeneric\tBinky Moon, LLC\n.ford\tgeneric\tFord Motor Company\n.forex\tgeneric\tDog Beach, LLC\n.forsale\tgeneric\tDog Beach, LLC\n.forum\tgeneric\tFegistry, LLC\n.foundation\tgeneric\tPublic Interest Registry (PIR)\n.fox\tgeneric\tFOX Registry, LLC\n.fr\tcountry-code\tAssociation Française pour le Nommage Internet en Coopération (A.F.N.I.C.)\n.free\tgeneric\tAmazon Registry Services, Inc.\n.fresenius\tgeneric\tFresenius Immobilien-Verwaltungs-GmbH\n.frl\tgeneric\tFRLregistry B.V.\n.frogans\tgeneric\tOP3FT\n.frontdoor\tgeneric\tNot assigned\n.frontier\tgeneric\tFrontier Communications Corporation\n.ftr\tgeneric\tFrontier Communications Corporation\n.fujitsu\tgeneric\tFujitsu Limited\n.fujixerox\tgeneric\tNot assigned\n.fun\tgeneric\tRadix Technologies Inc.\n.fund\tgeneric\tBinky Moon, LLC\n.furniture\tgeneric\tBinky Moon, LLC\n.futbol\tgeneric\tDog Beach, LLC\n.fyi\tgeneric\tBinky Moon, LLC\n.ga\tcountry-code\tAgence Nationale des Infrastructures Numériques et des Fréquences (ANINF)\n.gal\tgeneric\tAsociación puntoGAL\n.gallery\tgeneric\tBinky Moon, LLC\n.gallo\tgeneric\tGallo Vineyards, Inc.\n.gallup\tgeneric\tGallup, 
Inc.\n.game\tgeneric\tXYZ.COM LLC\n.games\tgeneric\tDog Beach, LLC\n.gap\tgeneric\tThe Gap, Inc.\n.garden\tgeneric\tRegistry Services, LLC\n.gay\tgeneric\tRegistry Services, LLC\n.gb\tcountry-code\tReserved Domain - IANA\n.gbiz\tgeneric\tCharleston Road Registry Inc.\n.gd\tcountry-code\tThe National Telecommunications Regulatory Commission (NTRC)\n.gdn\tgeneric\tJoint Stock Company \"Navigation-information systems\"\n.ge\tcountry-code\tCaucasus Online LLC\n.gea\tgeneric\tGEA Group Aktiengesellschaft\n.gent\tgeneric\tCombell nv\n.genting\tgeneric\tResorts World Inc. Pte. Ltd.\n.george\tgeneric\tWal-Mart Stores, Inc.\n.gf\tcountry-code\tCANAL+ TELECOM\n.gg\tcountry-code\tIsland Networks Ltd.\n.ggee\tgeneric\tGMO Internet, Inc.\n.gh\tcountry-code\tNetwork Computer Systems Limited\n.gi\tcountry-code\tSapphire Networks\n.gift\tgeneric\tUniregistry, Corp.\n.gifts\tgeneric\tBinky Moon, LLC\n.gives\tgeneric\tPublic Interest Registry (PIR)\n.giving\tgeneric\tPublic Interest Registry (PIR)\n.gl\tcountry-code\tTELE Greenland A/S\n.glade\tgeneric\tNot assigned\n.glass\tgeneric\tBinky Moon, LLC\n.gle\tgeneric\tCharleston Road Registry Inc.\n.global\tgeneric\tIdentity Digital Limited\n.globo\tgeneric\tGlobo Comunicação e Participações S.A\n.gm\tcountry-code\tGM-NIC\n.gmail\tgeneric\tCharleston Road Registry Inc.\n.gmbh\tgeneric\tBinky Moon, LLC\n.gmo\tgeneric\tGMO Internet, Inc.\n.gmx\tgeneric\t1&1 Mail & Media GmbH\n.gn\tcountry-code\tCentre National des Sciences Halieutiques de Boussoura\n.godaddy\tgeneric\tGo Daddy East, LLC\n.gold\tgeneric\tBinky Moon, LLC\n.goldpoint\tgeneric\tYODOBASHI CAMERA CO.,LTD.\n.golf\tgeneric\tBinky Moon, LLC\n.goo\tgeneric\tNTT Resonant Inc.\n.goodhands\tgeneric\tNot assigned\n.goodyear\tgeneric\tThe Goodyear Tire & Rubber Company\n.goog\tgeneric\tCharleston Road Registry Inc.\n.google\tgeneric\tCharleston Road Registry Inc.\n.gop\tgeneric\tRepublican State Leadership Committee, Inc.\n.got\tgeneric\tAmazon Registry Services, 
Inc.\n.gov\tsponsored\tCybersecurity and Infrastructure Security Agency\n.gp\tcountry-code\tNetworking Technologies Group\n.gq\tcountry-code\tGETESA\n.gr\tcountry-code\tICS-FORTH GR\n.grainger\tgeneric\tGrainger Registry Services, LLC\n.graphics\tgeneric\tBinky Moon, LLC\n.gratis\tgeneric\tBinky Moon, LLC\n.green\tgeneric\tIdentity Digital Limited\n.gripe\tgeneric\tBinky Moon, LLC\n.grocery\tgeneric\tWal-Mart Stores, Inc.\n.group\tgeneric\tBinky Moon, LLC\n.gs\tcountry-code\tGovernment of South Georgia and South Sandwich Islands (GSGSSI)\n.gt\tcountry-code\tUniversidad del Valle de Guatemala\n.gu\tcountry-code\tUniversity of Guam\n.guardian\tgeneric\tNot assigned\n.gucci\tgeneric\tGuccio Gucci S.p.a.\n.guge\tgeneric\tCharleston Road Registry Inc.\n.guide\tgeneric\tBinky Moon, LLC\n.guitars\tgeneric\tXYZ.COM LLC\n.guru\tgeneric\tBinky Moon, LLC\n.gw\tcountry-code\tAutoridade Reguladora Nacional - Tecnologias de Informação e Comunicação da Guiné-Bissau\n.gy\tcountry-code\tUniversity of Guyana\n.hair\tgeneric\tXYZ.COM LLC\n.hamburg\tgeneric\tHamburg Top-Level-Domain GmbH\n.hangout\tgeneric\tCharleston Road Registry Inc.\n.haus\tgeneric\tDog Beach, LLC\n.hbo\tgeneric\tHBO Registry Services, Inc.\n.hdfc\tgeneric\tHOUSING DEVELOPMENT FINANCE CORPORATION LIMITED\n.hdfcbank\tgeneric\tHDFC Bank Limited\n.health\tgeneric\tRegistry Services, LLC\n.healthcare\tgeneric\tBinky Moon, LLC\n.help\tgeneric\tInnovation Service Ltd\n.helsinki\tgeneric\tCity of Helsinki\n.here\tgeneric\tCharleston Road Registry Inc.\n.hermes\tgeneric\tHermes International\n.hgtv\tgeneric\tNot assigned\n.hiphop\tgeneric\tDot Hip Hop, LLC\n.hisamitsu\tgeneric\tHisamitsu Pharmaceutical Co.,Inc.\n.hitachi\tgeneric\tHitachi, Ltd.\n.hiv\tgeneric\tInternet Naming Co.\n.hk\tcountry-code\tHong Kong Internet Registration Corporation Ltd.\n.hkt\tgeneric\tPCCW-HKT DataCom Services Limited\n.hm\tcountry-code\tHM Domain Registry\n.hn\tcountry-code\tRed de Desarrollo Sostenible Honduras\n.hockey\tgeneric\tBinky Moon, 
LLC\n.holdings\tgeneric\tBinky Moon, LLC\n.holiday\tgeneric\tBinky Moon, LLC\n.homedepot\tgeneric\tHome Depot Product Authority, LLC\n.homegoods\tgeneric\tThe TJX Companies, Inc.\n.homes\tgeneric\tXYZ.COM LLC\n.homesense\tgeneric\tThe TJX Companies, Inc.\n.honda\tgeneric\tHonda Motor Co., Ltd.\n.honeywell\tgeneric\tNot assigned\n.horse\tgeneric\tRegistry Services, LLC\n.hospital\tgeneric\tBinky Moon, LLC\n.host\tgeneric\tRadix Technologies Inc.\n.hosting\tgeneric\tXYZ.COM LLC\n.hot\tgeneric\tAmazon Registry Services, Inc.\n.hoteles\tgeneric\tNot assigned\n.hotels\tgeneric\tBooking.com B.V.\n.hotmail\tgeneric\tMicrosoft Corporation\n.house\tgeneric\tBinky Moon, LLC\n.how\tgeneric\tCharleston Road Registry Inc.\n.hr\tcountry-code\tCARNet - Croatian Academic and Research Network\n.hsbc\tgeneric\tHSBC Global Services (UK) Limited\n.ht\tcountry-code\tConsortium FDS/RDDH\n.htc\tgeneric\tNot assigned\n.hu\tcountry-code\tCouncil of Hungarian Internet Providers (CHIP)\n.hughes\tgeneric\tHughes Satellite Systems Corporation\n.hyatt\tgeneric\tHyatt GTLD, L.L.C.\n.hyundai\tgeneric\tHyundai Motor Company\n.ibm\tgeneric\tInternational Business Machines Corporation\n.icbc\tgeneric\tIndustrial and Commercial Bank of China Limited\n.ice\tgeneric\tIntercontinentalExchange, Inc.\n.icu\tgeneric\tShortdot SA\n.id\tcountry-code\tPerkumpulan Pengelola Nama Domain Internet Indonesia (PANDI)\n.ie\tcountry-code\tUniversity College Dublin, Computing Services, Computer Centre\n.ieee\tgeneric\tIEEE Global LLC\n.ifm\tgeneric\tifm electronic gmbh\n.iinet\tgeneric\tNot assigned\n.ikano\tgeneric\tIkano S.A.\n.il\tcountry-code\tThe Israel Internet Association (RA)\n.im\tcountry-code\tIsle of Man Government\n.imamat\tgeneric\tFondation Aga Khan (Aga Khan Foundation)\n.imdb\tgeneric\tAmazon Registry Services, Inc.\n.immo\tgeneric\tBinky Moon, LLC\n.immobilien\tgeneric\tDog Beach, LLC\n.in\tcountry-code\tNational Internet Exchange of India\n.inc\tgeneric\tIntercap Registry 
Inc.\n.industries\tgeneric\tBinky Moon, LLC\n.infiniti\tgeneric\tNISSAN MOTOR CO., LTD.\n.info\tgeneric\tIdentity Digital Limited\n.ing\tgeneric\tCharleston Road Registry Inc.\n.ink\tgeneric\tRegistry Services, LLC\n.institute\tgeneric\tBinky Moon, LLC\n.insurance\tgeneric\tfTLD Registry Services LLC\n.insure\tgeneric\tBinky Moon, LLC\n.int\tsponsored\tInternet Assigned Numbers Authority\n.intel\tgeneric\tNot assigned\n.international\tgeneric\tBinky Moon, LLC\n.intuit\tgeneric\tIntuit Administrative Services, Inc.\n.investments\tgeneric\tBinky Moon, LLC\n.io\tcountry-code\tInternet Computer Bureau Limited\n.ipiranga\tgeneric\tIpiranga Produtos de Petroleo S.A.\n.iq\tcountry-code\tCommunications and Media Commission (CMC)\n.ir\tcountry-code\tInstitute for Research in Fundamental Sciences\n.irish\tgeneric\tBinky Moon, LLC\n.is\tcountry-code\tISNIC - Internet á Íslandi hf.\n.iselect\tgeneric\tNot assigned\n.ismaili\tgeneric\tFondation Aga Khan (Aga Khan Foundation)\n.ist\tgeneric\tIstanbul Metropolitan Municipality\n.istanbul\tgeneric\tIstanbul Metropolitan Municipality\n.it\tcountry-code\tIIT - CNR\n.itau\tgeneric\tItau Unibanco Holding S.A.\n.itv\tgeneric\tITV Services Limited\n.iveco\tgeneric\tNot assigned\n.iwc\tgeneric\tNot assigned\n.jaguar\tgeneric\tJaguar Land Rover Ltd\n.java\tgeneric\tOracle Corporation\n.jcb\tgeneric\tJCB Co., Ltd.\n.jcp\tgeneric\tNot assigned\n.je\tcountry-code\tIsland Networks (Jersey) Ltd.\n.jeep\tgeneric\tFCA US LLC.\n.jetzt\tgeneric\tBinky Moon, LLC\n.jewelry\tgeneric\tBinky Moon, LLC\n.jio\tgeneric\tReliance Industries Limited\n.jlc\tgeneric\tNot assigned\n.jll\tgeneric\tJones Lang LaSalle Incorporated\n.jm\tcountry-code\tUniversity of West Indies\n.jmp\tgeneric\tMatrix IP LLC\n.jnj\tgeneric\tJohnson & Johnson Services, Inc.\n.jo\tcountry-code\tMinistry of Digital Economy and Entrepreneurship (MoDEE)\n.jobs\tsponsored\tEmploy Media LLC\n.joburg\tgeneric\tZA Central Registry NPC trading as ZA Central Registry\n.jot\tgeneric\tAmazon 
Registry Services, Inc.\n.joy\tgeneric\tAmazon Registry Services, Inc.\n.jp\tcountry-code\tJapan Registry Services Co., Ltd.\n.jpmorgan\tgeneric\tJPMorgan Chase Bank, National Association\n.jprs\tgeneric\tJapan Registry Services Co., Ltd.\n.juegos\tgeneric\tDog Beach, LLC\n.juniper\tgeneric\tJUNIPER NETWORKS, INC.\n.kaufen\tgeneric\tDog Beach, LLC\n.kddi\tgeneric\tKDDI CORPORATION\n.ke\tcountry-code\tKenya Network Information Center (KeNIC)\n.kerryhotels\tgeneric\tKerry Trading Co. Limited\n.kerrylogistics\tgeneric\tNot assigned\n.kerryproperties\tgeneric\tKerry Trading Co. Limited\n.kfh\tgeneric\tKuwait Finance House\n.kg\tcountry-code\tAsiaInfo Telecommunication Enterprise\n.kh\tcountry-code\tTelecommunication Regulator of Cambodia (TRC)\n.ki\tcountry-code\tMinistry of Information, Communications and Transport (MICT)\n.kia\tgeneric\tKIA MOTORS CORPORATION\n.kids\tgeneric\tDotKids Foundation Limited\n.kim\tgeneric\tIdentity Digital Limited\n.kinder\tgeneric\tNot assigned\n.kindle\tgeneric\tAmazon Registry Services, Inc.\n.kitchen\tgeneric\tBinky Moon, LLC\n.kiwi\tgeneric\tDOT KIWI LIMITED\n.km\tcountry-code\tComores Telecom\n.kn\tcountry-code\tMinistry of Finance, Sustainable Development Information & Technology\n.koeln\tgeneric\tdotKoeln GmbH\n.komatsu\tgeneric\tKomatsu Ltd.\n.kosher\tgeneric\tKosher Marketing Assets LLC\n.kp\tcountry-code\tStar Joint Venture Company\n.kpmg\tgeneric\tKPMG International Cooperative (KPMG International Genossenschaft)\n.kpn\tgeneric\tKoninklijke KPN N.V.\n.kr\tcountry-code\tKorea Internet & Security Agency (KISA)\n.krd\tgeneric\tKRG Department of Information Technology\n.kred\tgeneric\tKredTLD Pty Ltd\n.kuokgroup\tgeneric\tKerry Trading Co. 
Limited\n.kw\tcountry-code\tCommunications and Information Technology Regulatory Authority\n.ky\tcountry-code\tUtility Regulation and Competition Office (OfReg)\n.kyoto\tgeneric\tAcademic Institution: Kyoto Jyoho Gakuen\n.kz\tcountry-code\tAssociation of IT Companies of Kazakhstan\n.la\tcountry-code\tLao National Internet Center (LANIC), Ministry of Technology and Communications\n.lacaixa\tgeneric\tFundación Bancaria Caixa d'Estalvis i Pensions de Barcelona, \"la Caixa\"\n.ladbrokes\tgeneric\tNot assigned\n.lamborghini\tgeneric\tAutomobili Lamborghini S.p.A.\n.lamer\tgeneric\tThe Estée Lauder Companies Inc.\n.lancaster\tgeneric\tNot assigned\n.lancia\tgeneric\tNot assigned\n.lancome\tgeneric\tNot assigned\n.land\tgeneric\tBinky Moon, LLC\n.landrover\tgeneric\tJaguar Land Rover Ltd\n.lanxess\tgeneric\tLANXESS Corporation\n.lasalle\tgeneric\tJones Lang LaSalle Incorporated\n.lat\tgeneric\tXYZ.COM LLC\n.latino\tgeneric\tDish DBS Corporation\n.latrobe\tgeneric\tLa Trobe University\n.law\tgeneric\tRegistry Services, LLC\n.lawyer\tgeneric\tDog Beach, LLC\n.lb\tcountry-code\tInternet Society Lebanon\n.lc\tcountry-code\tUniversity of Puerto Rico\n.lds\tgeneric\tIRI Domain Management, LLC\n.lease\tgeneric\tBinky Moon, LLC\n.leclerc\tgeneric\tA.C.D. LEC Association des Centres Distributeurs Edouard Leclerc\n.lefrak\tgeneric\tLeFrak Organization, Inc.\n.legal\tgeneric\tBinky Moon, LLC\n.lego\tgeneric\tLEGO Juris A/S\n.lexus\tgeneric\tTOYOTA MOTOR CORPORATION\n.lgbt\tgeneric\tIdentity Digital Limited\n.li\tcountry-code\tSWITCH The Swiss Education & Research Network\n.liaison\tgeneric\tNot assigned\n.lidl\tgeneric\tSchwarz Domains und Services GmbH & Co. 
KG\n.life\tgeneric\tBinky Moon, LLC\n.lifeinsurance\tgeneric\tAmerican Council of Life Insurers\n.lifestyle\tgeneric\tInternet Naming Co.\n.lighting\tgeneric\tBinky Moon, LLC\n.like\tgeneric\tAmazon Registry Services, Inc.\n.lilly\tgeneric\tEli Lilly and Company\n.limited\tgeneric\tBinky Moon, LLC\n.limo\tgeneric\tBinky Moon, LLC\n.lincoln\tgeneric\tFord Motor Company\n.linde\tgeneric\tNot assigned\n.link\tgeneric\tNova Registry Ltd.\n.lipsy\tgeneric\tNot assigned\n.live\tgeneric\tDog Beach, LLC\n.living\tgeneric\tInternet Naming Co.\n.lixil\tgeneric\tNot assigned\n.lk\tcountry-code\tCouncil for Information Technology LK Domain Registrar\n.llc\tgeneric\tIdentity Digital Limited\n.llp\tgeneric\tIntercap Registry Inc.\n.loan\tgeneric\tdot Loan Limited\n.loans\tgeneric\tBinky Moon, LLC\n.locker\tgeneric\tOrange Domains LLC\n.locus\tgeneric\tLocus Analytics LLC\n.loft\tgeneric\tNot assigned\n.lol\tgeneric\tXYZ.COM LLC\n.london\tgeneric\tDot London Domains Limited\n.lotte\tgeneric\tLotte Holdings Co., Ltd.\n.lotto\tgeneric\tIdentity Digital Limited\n.love\tgeneric\tWaterford Limited\n.lpl\tgeneric\tLPL Holdings, Inc.\n.lplfinancial\tgeneric\tLPL Holdings, Inc.\n.lr\tcountry-code\tData Technology Solutions, Inc.\n.ls\tcountry-code\tLesotho Network Information Centre Proprietary (LSNIC)\n.lt\tcountry-code\tKaunas University of Technology\n.ltd\tgeneric\tBinky Moon, LLC\n.ltda\tgeneric\tInterNetX Corp.\n.lu\tcountry-code\tRESTENA\n.lundbeck\tgeneric\tH. 
Lundbeck A/S\n.lupin\tgeneric\tNot assigned\n.luxe\tgeneric\tRegistry Services, LLC\n.luxury\tgeneric\tLuxury Partners LLC\n.lv\tcountry-code\tUniversity of Latvia, Institute of Mathematics and Computer Science, Department of Network Solutions (DNS)\n.ly\tcountry-code\tGeneral Post and Telecommunication Company\n.ma\tcountry-code\tAgence Nationale de Réglementation des Télécommunications (ANRT)\n.macys\tgeneric\tNot assigned\n.madrid\tgeneric\tComunidad de Madrid\n.maif\tgeneric\tMutuelle Assurance Instituteur France (MAIF)\n.maison\tgeneric\tBinky Moon, LLC\n.makeup\tgeneric\tXYZ.COM LLC\n.man\tgeneric\tMAN Truck & Bus SE\n.management\tgeneric\tBinky Moon, LLC\n.mango\tgeneric\tPUNTO FA S.L.\n.map\tgeneric\tCharleston Road Registry Inc.\n.market\tgeneric\tDog Beach, LLC\n.marketing\tgeneric\tBinky Moon, LLC\n.markets\tgeneric\tDog Beach, LLC\n.marriott\tgeneric\tMarriott Worldwide Corporation\n.marshalls\tgeneric\tThe TJX Companies, Inc.\n.maserati\tgeneric\tNot assigned\n.mattel\tgeneric\tMattel IT Services, Inc.\n.mba\tgeneric\tBinky Moon, LLC\n.mc\tcountry-code\tDirection des Plateformes et des Ressources Numériques\n.mcd\tgeneric\tNot assigned\n.mcdonalds\tgeneric\tNot assigned\n.mckinsey\tgeneric\tMcKinsey Holdings, Inc.\n.md\tcountry-code\tIP Serviciul Tehnologia Informatiei si Securitate Cibernetica\n.me\tcountry-code\tGovernment of Montenegro\n.med\tgeneric\tMedistry LLC\n.media\tgeneric\tBinky Moon, LLC\n.meet\tgeneric\tCharleston Road Registry Inc.\n.melbourne\tgeneric\tThe Crown in right of the State of Victoria, represented by its Department of State Development, Business and Innovation\n.meme\tgeneric\tCharleston Road Registry Inc.\n.memorial\tgeneric\tDog Beach, LLC\n.men\tgeneric\tExclusive Registry Limited\n.menu\tgeneric\tDot Menu Registry LLC\n.meo\tgeneric\tNot assigned\n.merckmsd\tgeneric\tMSD Registry Holdings, Inc.\n.metlife\tgeneric\tNot assigned\n.mf\tcountry-code\tNot assigned\n.mg\tcountry-code\tNIC-MG (Network Information Center 
Madagascar)\n.mh\tcountry-code\tOffice of the Cabinet\n.miami\tgeneric\tRegistry Services, LLC\n.microsoft\tgeneric\tMicrosoft Corporation\n.mil\tsponsored\tDoD Network Information Center\n.mini\tgeneric\tBayerische Motoren Werke Aktiengesellschaft\n.mint\tgeneric\tIntuit Administrative Services, Inc.\n.mit\tgeneric\tMassachusetts Institute of Technology\n.mitsubishi\tgeneric\tMitsubishi Corporation\n.mk\tcountry-code\tMacedonian Academic Research Network Skopje\n.ml\tcountry-code\tAgence des Technologies de l’Information et de la Communication\n.mlb\tgeneric\tMLB Advanced Media DH, LLC\n.mls\tgeneric\tThe Canadian Real Estate Association\n.mm\tcountry-code\tMinistry of Transport and Communications\n.mma\tgeneric\tMMA IARD\n.mn\tcountry-code\tDatacom Co., Ltd.\n.mo\tcountry-code\tMacao Post and Telecommunications Bureau (CTT)\n.mobi\tgeneric\tIdentity Digital Limited\n.mobile\tgeneric\tDish DBS Corporation\n.mobily\tgeneric\tNot assigned\n.moda\tgeneric\tDog Beach, LLC\n.moe\tgeneric\tInterlink Systems Innovation Institute K.K.\n.moi\tgeneric\tAmazon Registry Services, Inc.\n.mom\tgeneric\tXYZ.COM LLC\n.monash\tgeneric\tMonash University\n.money\tgeneric\tBinky Moon, LLC\n.monster\tgeneric\tXYZ.COM LLC\n.montblanc\tgeneric\tNot assigned\n.mopar\tgeneric\tNot assigned\n.mormon\tgeneric\tIRI Domain Management, LLC (\"Applicant\")\n.mortgage\tgeneric\tDog Beach, LLC\n.moscow\tgeneric\tFoundation for Assistance for Internet Technologies and Infrastructure Development (FAITID)\n.moto\tgeneric\tMotorola Trademark Holdings, LLC\n.motorcycles\tgeneric\tXYZ.COM LLC\n.mov\tgeneric\tCharleston Road Registry Inc.\n.movie\tgeneric\tBinky Moon, LLC\n.movistar\tgeneric\tNot assigned\n.mp\tcountry-code\tSaipan Datacom, Inc.\n.mq\tcountry-code\tCANAL+ TELECOM\n.mr\tcountry-code\tUniversité de Nouakchott Al Aasriya\n.ms\tcountry-code\tMNI Networks Ltd.\n.msd\tgeneric\tMSD Registry Holdings, Inc.\n.mt\tcountry-code\tNIC (Malta)\n.mtn\tgeneric\tMTN Dubai Limited\n.mtpc\tgeneric\tNot 
assigned\n.mtr\tgeneric\tMTR Corporation Limited\n.mu\tcountry-code\tInternet Direct Ltd\n.museum\tsponsored\tMuseum Domain Management Association\n.music\tgeneric\tDotMusic Limited\n.mutual\tgeneric\tNot assigned\n.mutuelle\tgeneric\tNot assigned\n.mv\tcountry-code\tDhivehi Raajjeyge Gulhun PLC\n.mw\tcountry-code\tMalawi Sustainable Development Network Programme (Malawi SDNP)\n.mx\tcountry-code\tNIC-Mexico ITESM - Campus Monterrey\n.my\tcountry-code\tMYNIC Berhad\n.mz\tcountry-code\tCentro de Informatica de Universidade Eduardo Mondlane\n.na\tcountry-code\tNamibian Network Information Center\n.nab\tgeneric\tNational Australia Bank Limited\n.nadex\tgeneric\tNot assigned\n.nagoya\tgeneric\tGMO Registry, Inc.\n.name\tgeneric-restricted\tVeriSign Information Services, Inc.\n.nationwide\tgeneric\tNot assigned\n.natura\tgeneric\tNot assigned\n.navy\tgeneric\tDog Beach, LLC\n.nba\tgeneric\tNBA REGISTRY, LLC\n.nc\tcountry-code\tOffice des Postes et Telecommunications\n.ne\tcountry-code\tSONITEL\n.nec\tgeneric\tNEC Corporation\n.net\tgeneric\tVeriSign Global Registry Services\n.netbank\tgeneric\tCOMMONWEALTH BANK OF AUSTRALIA\n.netflix\tgeneric\tNetflix, Inc.\n.network\tgeneric\tBinky Moon, LLC\n.neustar\tgeneric\tNeuStar, Inc.\n.new\tgeneric\tCharleston Road Registry Inc.\n.newholland\tgeneric\tNot assigned\n.news\tgeneric\tDog Beach, LLC\n.next\tgeneric\tNext plc\n.nextdirect\tgeneric\tNext plc\n.nexus\tgeneric\tCharleston Road Registry Inc.\n.nf\tcountry-code\tNorfolk Island Data Services\n.nfl\tgeneric\tNFL Reg Ops LLC\n.ng\tcountry-code\tNigeria Internet Registration Association\n.ngo\tgeneric\tPublic Interest Registry\n.nhk\tgeneric\tJapan Broadcasting Corporation (NHK)\n.ni\tcountry-code\tUniversidad Nacional del Ingernieria. 
Division de Tecnologias de la Informacion.\n.nico\tgeneric\tDWANGO Co., Ltd.\n.nike\tgeneric\tNIKE, Inc.\n.nikon\tgeneric\tNIKON CORPORATION\n.ninja\tgeneric\tDog Beach, LLC\n.nissan\tgeneric\tNISSAN MOTOR CO., LTD.\n.nissay\tgeneric\tNippon Life Insurance Company\n.nl\tcountry-code\tSIDN (Stichting Internet Domeinregistratie Nederland)\n.no\tcountry-code\tNorid A/S\n.nokia\tgeneric\tNokia Corporation\n.northwesternmutual\tgeneric\tNot assigned\n.norton\tgeneric\tGen Digital Inc.\n.now\tgeneric\tAmazon Registry Services, Inc.\n.nowruz\tgeneric\tEmergency Back-End Registry Operator Program - ICANN\n.nowtv\tgeneric\tStarbucks (HK) Limited\n.np\tcountry-code\tMercantile Communications Pvt. Ltd.\n.nr\tcountry-code\tCENPAC NET\n.nra\tgeneric\tNational Rifle Association of America\n.nrw\tgeneric\tMinds + Machines GmbH\n.ntt\tgeneric\tNIPPON TELEGRAPH AND TELEPHONE CORPORATION\n.nu\tcountry-code\tThe IUSN Foundation\n.nyc\tgeneric\tThe City of New York by and through the New York City Department of Information Technology & Telecommunications\n.nz\tcountry-code\tInternetNZ\n.obi\tgeneric\tOBI Group Holding SE & Co. KGaA\n.observer\tgeneric\tFegistry, LLC\n.off\tgeneric\tNot assigned\n.office\tgeneric\tMicrosoft Corporation\n.okinawa\tgeneric\tBRregistry, Inc.\n.olayan\tgeneric\tCompetrol (Luxembourg) Sarl\n.olayangroup\tgeneric\tCompetrol (Luxembourg) Sarl\n.oldnavy\tgeneric\tNot assigned\n.ollo\tgeneric\tDish DBS Corporation\n.om\tcountry-code\tTelecommunications Regulatory Authority (TRA)\n.omega\tgeneric\tThe Swatch Group Ltd\n.one\tgeneric\tOne.com A/S\n.ong\tgeneric\tPublic Interest Registry\n.onl\tgeneric\tiRegistry GmbH\n.online\tgeneric\tRadix Technologies Inc. 
SEZC\n.onyourside\tgeneric\tNot assigned\n.ooo\tgeneric\tINFIBEAM AVENUES LIMITED\n.open\tgeneric\tAmerican Express Travel Related Services Company, Inc.\n.oracle\tgeneric\tOracle Corporation\n.orange\tgeneric\tOrange Brand Services Limited\n.org\tgeneric\tPublic Interest Registry (PIR)\n.organic\tgeneric\tIdentity Digital Limited\n.orientexpress\tgeneric\tNot assigned\n.origins\tgeneric\tThe Estée Lauder Companies Inc.\n.osaka\tgeneric\tOsaka Registry Co., Ltd.\n.otsuka\tgeneric\tOtsuka Holdings Co., Ltd.\n.ott\tgeneric\tDish DBS Corporation\n.ovh\tgeneric\tOVH SAS\n.pa\tcountry-code\tUniversidad Tecnologica de Panama\n.page\tgeneric\tCharleston Road Registry Inc.\n.pamperedchef\tgeneric\tNot assigned\n.panasonic\tgeneric\tPanasonic Corporation\n.panerai\tgeneric\tNot assigned\n.paris\tgeneric\tCity of Paris\n.pars\tgeneric\tEmergency Back-End Registry Operator Program - ICANN\n.partners\tgeneric\tBinky Moon, LLC\n.parts\tgeneric\tBinky Moon, LLC\n.party\tgeneric\tBlue Sky Registry Limited\n.passagens\tgeneric\tNot assigned\n.pay\tgeneric\tAmazon Registry Services, Inc.\n.pccw\tgeneric\tPCCW Enterprises Limited\n.pe\tcountry-code\tRed Cientifica Peruana\n.pet\tgeneric\tIdentity Digital Limited\n.pf\tcountry-code\tGouvernement de la Polynésie française\n.pfizer\tgeneric\tPfizer Inc.\n.pg\tcountry-code\tPNG DNS Administration, Vice Chancellors Office, The Papua New Guinea University of Technology\n.ph\tcountry-code\tPH Domain Foundation\n.pharmacy\tgeneric\tNational Association of Boards of Pharmacy\n.phd\tgeneric\tCharleston Road Registry Inc.\n.philips\tgeneric\tKoninklijke Philips N.V.\n.phone\tgeneric\tDish DBS Corporation\n.photo\tgeneric\tRegistry Services, LLC\n.photography\tgeneric\tBinky Moon, LLC\n.photos\tgeneric\tBinky Moon, LLC\n.physio\tgeneric\tPhysBiz Pty Ltd\n.piaget\tgeneric\tNot assigned\n.pics\tgeneric\tXYZ.COM LLC\n.pictet\tgeneric\tBanque Pictet & Cie SA\n.pictures\tgeneric\tBinky Moon, LLC\n.pid\tgeneric\tTop Level Spectrum, 
Inc.\n.pin\tgeneric\tAmazon Registry Services, Inc.\n.ping\tgeneric\tPing Registry Provider, Inc.\n.pink\tgeneric\tIdentity Digital Limited\n.pioneer\tgeneric\tPioneer Corporation\n.pizza\tgeneric\tBinky Moon, LLC\n.pk\tcountry-code\tPKNIC\n.pl\tcountry-code\tResearch and Academic Computer Network\n.place\tgeneric\tBinky Moon, LLC\n.play\tgeneric\tCharleston Road Registry Inc.\n.playstation\tgeneric\tSony Computer Entertainment Inc.\n.plumbing\tgeneric\tBinky Moon, LLC\n.plus\tgeneric\tBinky Moon, LLC\n.pm\tcountry-code\tAssociation Française pour le Nommage Internet en Coopération (A.F.N.I.C.)\n.pn\tcountry-code\tPitcairn Island Administration\n.pnc\tgeneric\tPNC Domain Co., LLC\n.pohl\tgeneric\tDeutsche Vermögensberatung Aktiengesellschaft DVAG\n.poker\tgeneric\tIdentity Digital Limited\n.politie\tgeneric\tPolitie Nederland\n.porn\tgeneric\tICM Registry PN LLC\n.post\tsponsored\tUniversal Postal Union\n.pr\tcountry-code\tGauss Research Laboratory Inc.\n.pramerica\tgeneric\tNot assigned\n.praxi\tgeneric\tPraxi S.p.A.\n.press\tgeneric\tRadix Technologies Inc.\n.prime\tgeneric\tAmazon Registry Services, Inc.\n.pro\tgeneric-restricted\tIdentity Digital Limited\n.prod\tgeneric\tCharleston Road Registry Inc.\n.productions\tgeneric\tBinky Moon, LLC\n.prof\tgeneric\tCharleston Road Registry Inc.\n.progressive\tgeneric\tProgressive Casualty Insurance Company\n.promo\tgeneric\tIdentity Digital Limited\n.properties\tgeneric\tBinky Moon, LLC\n.property\tgeneric\tDigital Property Infrastructure Limited\n.protection\tgeneric\tXYZ.COM LLC\n.pru\tgeneric\tPrudential Financial, Inc.\n.prudential\tgeneric\tPrudential Financial, Inc.\n.ps\tcountry-code\tMinistry of Telecommunications & Information Technology, Government Computer Center\n.pt\tcountry-code\tAssociação DNS.PT\n.pub\tgeneric\tDog Beach, LLC\n.pw\tcountry-code\tMicronesia Investment and Development Corporation\n.pwc\tgeneric\tPricewaterhouseCoopers LLP\n.py\tcountry-code\tNIC-PY\n.qa\tcountry-code\tCommunications 
Regulatory Authority\n.qpon\tgeneric\tDOTQPON LLC.\n.quebec\tgeneric\tPointQuébec Inc\n.quest\tgeneric\tXYZ.COM LLC\n.qvc\tgeneric\tNot assigned\n.racing\tgeneric\tPremier Registry Limited\n.radio\tgeneric\tEuropean Broadcasting Union (EBU)\n.raid\tgeneric\tNot assigned\n.re\tcountry-code\tAssociation Française pour le Nommage Internet en Coopération (A.F.N.I.C.)\n.read\tgeneric\tAmazon Registry Services, Inc.\n.realestate\tgeneric\tdotRealEstate LLC\n.realtor\tgeneric\tReal Estate Domains LLC\n.realty\tgeneric\tInternet Naming Co.\n.recipes\tgeneric\tBinky Moon, LLC\n.red\tgeneric\tIdentity Digital Limited\n.redstone\tgeneric\tNot assigned\n.redumbrella\tgeneric\tTravelers TLD, LLC\n.rehab\tgeneric\tDog Beach, LLC\n.reise\tgeneric\tBinky Moon, LLC\n.reisen\tgeneric\tBinky Moon, LLC\n.reit\tgeneric\tNational Association of Real Estate Investment Trusts, Inc.\n.reliance\tgeneric\tReliance Industries Limited\n.ren\tgeneric\tZDNS International Limited\n.rent\tgeneric\tXYZ.COM LLC\n.rentals\tgeneric\tBinky Moon, LLC\n.repair\tgeneric\tBinky Moon, LLC\n.report\tgeneric\tBinky Moon, LLC\n.republican\tgeneric\tDog Beach, LLC\n.rest\tgeneric\tPunto 2012 Sociedad Anonima Promotora de Inversion de Capital Variable\n.restaurant\tgeneric\tBinky Moon, LLC\n.review\tgeneric\tdot Review Limited\n.reviews\tgeneric\tDog Beach, LLC\n.rexroth\tgeneric\tRobert Bosch GMBH\n.rich\tgeneric\tiRegistry GmbH\n.richardli\tgeneric\tPacific Century Asset Management (HK) Limited\n.ricoh\tgeneric\tRicoh Company, Ltd.\n.rightathome\tgeneric\tNot assigned\n.ril\tgeneric\tReliance Industries Limited\n.rio\tgeneric\tEmpresa Municipal de Informática SA - IPLANRIO\n.rip\tgeneric\tDog Beach, LLC\n.rmit\tgeneric\tNot assigned\n.ro\tcountry-code\tNational Institute for R&D in Informatics\n.rocher\tgeneric\tNot assigned\n.rocks\tgeneric\tDog Beach, LLC\n.rodeo\tgeneric\tRegistry Services, LLC\n.rogers\tgeneric\tRogers Communications Canada Inc.\n.room\tgeneric\tAmazon Registry Services, 
Inc.\n.rs\tcountry-code\tSerbian National Internet Domain Registry (RNIDS)\n.rsvp\tgeneric\tCharleston Road Registry Inc.\n.ru\tcountry-code\tCoordination Center for TLD RU\n.rugby\tgeneric\tWorld Rugby Strategic Developments Limited\n.ruhr\tgeneric\tdotSaarland GmbH\n.run\tgeneric\tBinky Moon, LLC\n.rw\tcountry-code\tRwanda Internet Community and Technology Alliance (RICTA) Ltd\n.rwe\tgeneric\tRWE AG\n.ryukyu\tgeneric\tBRregistry, Inc.\n.sa\tcountry-code\tCommunications, Space and Technology Commission\n.saarland\tgeneric\tdotSaarland GmbH\n.safe\tgeneric\tAmazon Registry Services, Inc.\n.safety\tgeneric\tSafety Registry Services, LLC.\n.sakura\tgeneric\tSAKURA internet Inc.\n.sale\tgeneric\tDog Beach, LLC\n.salon\tgeneric\tBinky Moon, LLC\n.samsclub\tgeneric\tWal-Mart Stores, Inc.\n.samsung\tgeneric\tSAMSUNG SDS CO., LTD\n.sandvik\tgeneric\tSandvik AB\n.sandvikcoromant\tgeneric\tSandvik AB\n.sanofi\tgeneric\tSanofi\n.sap\tgeneric\tSAP AG\n.sapo\tgeneric\tNot assigned\n.sarl\tgeneric\tBinky Moon, LLC\n.sas\tgeneric\tResearch IP LLC\n.save\tgeneric\tAmazon Registry Services, Inc.\n.saxo\tgeneric\tSaxo Bank A/S\n.sb\tcountry-code\tSolomon Telekom Company Limited\n.sbi\tgeneric\tSTATE BANK OF INDIA\n.sbs\tgeneric\tShortdot SA\n.sc\tcountry-code\tVCS Pty Ltd\n.sca\tgeneric\tNot assigned\n.scb\tgeneric\tThe Siam Commercial Bank Public Company Limited (\"SCB\")\n.schaeffler\tgeneric\tSchaeffler Technologies AG & Co. KG\n.schmidt\tgeneric\tSCHMIDT GROUPE S.A.S.\n.scholarships\tgeneric\tScholarships.com, LLC\n.school\tgeneric\tBinky Moon, LLC\n.schule\tgeneric\tBinky Moon, LLC\n.schwarz\tgeneric\tSchwarz Domains und Services GmbH & Co. KG\n.science\tgeneric\tdot Science Limited\n.scjohnson\tgeneric\tNot assigned\n.scor\tgeneric\tNot assigned\n.scot\tgeneric\tDot Scot Registry Limited\n.sd\tcountry-code\tSudan Internet Society\n.se\tcountry-code\tThe Internet Infrastructure Foundation\n.search\tgeneric\tCharleston Road Registry Inc.\n.seat\tgeneric\tSEAT, S.A. 
(Sociedad Unipersonal)\n.secure\tgeneric\tAmazon Registry Services, Inc.\n.security\tgeneric\tXYZ.COM LLC\n.seek\tgeneric\tSeek Limited\n.select\tgeneric\tRegistry Services, LLC\n.sener\tgeneric\tSener Ingeniería y Sistemas, S.A.\n.services\tgeneric\tBinky Moon, LLC\n.ses\tgeneric\tNot assigned\n.seven\tgeneric\tSeven West Media Ltd\n.sew\tgeneric\tSEW-EURODRIVE GmbH & Co KG\n.sex\tgeneric\tICM Registry SX LLC\n.sexy\tgeneric\tInternet Naming Co.\n.sfr\tgeneric\tSociete Francaise du Radiotelephone - SFR\n.sg\tcountry-code\tSingapore Network Information Centre (SGNIC) Pte Ltd\n.sh\tcountry-code\tGovernment of St. Helena\n.shangrila\tgeneric\tShangri-La International Hotel Management Limited\n.sharp\tgeneric\tSharp Corporation\n.shaw\tgeneric\tNot assigned\n.shell\tgeneric\tShell Information Technology International Inc\n.shia\tgeneric\tEmergency Back-End Registry Operator Program - ICANN\n.shiksha\tgeneric\tIdentity Digital Limited\n.shoes\tgeneric\tBinky Moon, LLC\n.shop\tgeneric\tGMO Registry, Inc.\n.shopping\tgeneric\tBinky Moon, LLC\n.shouji\tgeneric\tQIHOO 360 TECHNOLOGY CO. LTD.\n.show\tgeneric\tBinky Moon, LLC\n.showtime\tgeneric\tNot assigned\n.shriram\tgeneric\tNot assigned\n.si\tcountry-code\tAcademic and Research Network of Slovenia (ARNES)\n.silk\tgeneric\tAmazon Registry Services, Inc.\n.sina\tgeneric\tSina Corporation\n.singles\tgeneric\tBinky Moon, LLC\n.site\tgeneric\tRadix Technologies Inc. SEZC\n.sj\tcountry-code\tNorid A/S\n.sk\tcountry-code\tSK-NIC, a.s.\n.ski\tgeneric\tIdentity Digital Limited\n.skin\tgeneric\tXYZ.COM LLC\n.sky\tgeneric\tSky UK Limited\n.skype\tgeneric\tMicrosoft Corporation\n.sl\tcountry-code\tSierratel\n.sling\tgeneric\tDISH Technologies L.L.C.\n.sm\tcountry-code\tTelecom Italia San Marino S.p.A.\n.smart\tgeneric\tSmart Communications, Inc. 
(SMART)\n.smile\tgeneric\tAmazon Registry Services, Inc.\n.sn\tcountry-code\tUniversite Cheikh Anta Diop\n.sncf\tgeneric\tSociété Nationale SNCF\n.so\tcountry-code\tMinistry of Post and Telecommunications\n.soccer\tgeneric\tBinky Moon, LLC\n.social\tgeneric\tDog Beach, LLC\n.softbank\tgeneric\tSoftBank Group Corp.\n.software\tgeneric\tDog Beach, LLC\n.sohu\tgeneric\tSohu.com Limited\n.solar\tgeneric\tBinky Moon, LLC\n.solutions\tgeneric\tBinky Moon, LLC\n.song\tgeneric\tAmazon Registry Services, Inc.\n.sony\tgeneric\tSony Corporation\n.soy\tgeneric\tCharleston Road Registry Inc.\n.spa\tgeneric\tAsia Spa and Wellness Promotion Council Limited\n.space\tgeneric\tRadix Technologies Inc.\n.spiegel\tgeneric\tNot assigned\n.sport\tgeneric\tSportAccord\n.spot\tgeneric\tAmazon Registry Services, Inc.\n.spreadbetting\tgeneric\tNot assigned\n.sr\tcountry-code\tTelesur\n.srl\tgeneric\tInterNetX Corp.\n.srt\tgeneric\tNot assigned\n.ss\tcountry-code\tNational Communication Authority (NCA)\n.st\tcountry-code\tTecnisys\n.stada\tgeneric\tSTADA Arzneimittel AG\n.staples\tgeneric\tStaples, Inc.\n.star\tgeneric\tStar India Private Limited\n.starhub\tgeneric\tNot assigned\n.statebank\tgeneric\tSTATE BANK OF INDIA\n.statefarm\tgeneric\tState Farm Mutual Automobile Insurance Company\n.statoil\tgeneric\tNot assigned\n.stc\tgeneric\tSaudi Telecom Company\n.stcgroup\tgeneric\tSaudi Telecom Company\n.stockholm\tgeneric\tStockholms kommun\n.storage\tgeneric\tXYZ.COM LLC\n.store\tgeneric\tRadix Technologies Inc.\n.stream\tgeneric\tdot Stream Limited\n.studio\tgeneric\tDog Beach, LLC\n.study\tgeneric\tRegistry Services, LLC\n.style\tgeneric\tBinky Moon, LLC\n.su\tcountry-code\tRussian Institute for Development of Public Networks (ROSNIIROS)\n.sucks\tgeneric\tVox Populi Registry Ltd.\n.supplies\tgeneric\tBinky Moon, LLC\n.supply\tgeneric\tBinky Moon, LLC\n.support\tgeneric\tBinky Moon, LLC\n.surf\tgeneric\tRegistry Services, LLC\n.surgery\tgeneric\tBinky Moon, LLC\n.suzuki\tgeneric\tSUZUKI MOTOR 
CORPORATION\n.sv\tcountry-code\tSVNet\n.swatch\tgeneric\tThe Swatch Group Ltd\n.swiftcover\tgeneric\tNot assigned\n.swiss\tgeneric\tSwiss Confederation\n.sx\tcountry-code\tSX Registry SA B.V.\n.sy\tcountry-code\tNational Agency for Network Services (NANS)\n.sydney\tgeneric\tState of New South Wales, Department of Premier and Cabinet\n.symantec\tgeneric\tNot assigned\n.systems\tgeneric\tBinky Moon, LLC\n.sz\tcountry-code\tUniversity of Swaziland Department of Computer Science\n.tab\tgeneric\tTabcorp Holdings Limited\n.taipei\tgeneric\tTaipei City Government\n.talk\tgeneric\tAmazon Registry Services, Inc.\n.taobao\tgeneric\tAlibaba Group Holding Limited\n.target\tgeneric\tTarget Domain Holdings, LLC\n.tatamotors\tgeneric\tTata Motors Ltd\n.tatar\tgeneric\tLimited Liability Company \"Coordination Center of Regional Domain of Tatarstan Republic\"\n.tattoo\tgeneric\tRegistry Services, LLC\n.tax\tgeneric\tBinky Moon, LLC\n.taxi\tgeneric\tBinky Moon, LLC\n.tc\tcountry-code\tMelrex TC\n.tci\tgeneric\tEmergency Back-End Registry Operator Program - ICANN\n.td\tcountry-code\tl'Agence de Développement des Technologies de l'Information et de la Communication (ADETIC)\n.tdk\tgeneric\tTDK Corporation\n.team\tgeneric\tBinky Moon, LLC\n.tech\tgeneric\tRadix Technologies Inc.\n.technology\tgeneric\tBinky Moon, LLC\n.tel\tsponsored\tTelnames Ltd.\n.telecity\tgeneric\tNot assigned\n.telefonica\tgeneric\tNot assigned\n.temasek\tgeneric\tTemasek Holdings (Private) Limited\n.tennis\tgeneric\tBinky Moon, LLC\n.teva\tgeneric\tTeva Pharmaceutical Industries Limited\n.tf\tcountry-code\tAssociation Française pour le Nommage Internet en Coopération (A.F.N.I.C.)\n.tg\tcountry-code\tAutorité de Régulation des Communications Electroniques et des Postes (ARCEP)\n.th\tcountry-code\tThai Network Information Center Foundation\n.thd\tgeneric\tHome Depot Product Authority, LLC\n.theater\tgeneric\tBinky Moon, LLC\n.theatre\tgeneric\tXYZ.COM LLC\n.tiaa\tgeneric\tTeachers Insurance and Annuity Association 
of America\n.tickets\tgeneric\tXYZ.COM LLC\n.tienda\tgeneric\tBinky Moon, LLC\n.tiffany\tgeneric\tNot assigned\n.tips\tgeneric\tBinky Moon, LLC\n.tires\tgeneric\tBinky Moon, LLC\n.tirol\tgeneric\tpunkt Tirol GmbH\n.tj\tcountry-code\tInformation Technology Center\n.tjmaxx\tgeneric\tThe TJX Companies, Inc.\n.tjx\tgeneric\tThe TJX Companies, Inc.\n.tk\tcountry-code\tTelecommunication Tokelau Corporation (Teletok)\n.tkmaxx\tgeneric\tThe TJX Companies, Inc.\n.tl\tcountry-code\tAutoridade Nacional de Comunicações\n.tm\tcountry-code\tTM Domain Registry Ltd\n.tmall\tgeneric\tAlibaba Group Holding Limited\n.tn\tcountry-code\tAgence Tunisienne d'Internet\n.to\tcountry-code\tGovernment of the Kingdom of Tonga, H.R.H. Crown Prince Tupouto'a, c/o Consulate of Tonga\n.today\tgeneric\tBinky Moon, LLC\n.tokyo\tgeneric\tGMO Registry, Inc.\n.tools\tgeneric\tBinky Moon, LLC\n.top\tgeneric\t.TOP Registry\n.toray\tgeneric\tToray Industries, Inc.\n.toshiba\tgeneric\tTOSHIBA Corporation\n.total\tgeneric\tTotalEnergies SE\n.tours\tgeneric\tBinky Moon, LLC\n.town\tgeneric\tBinky Moon, LLC\n.toyota\tgeneric\tTOYOTA MOTOR CORPORATION\n.toys\tgeneric\tBinky Moon, LLC\n.tp\tcountry-code\tNot assigned\n.tr\tcountry-code\tBilgi Teknolojileri ve İletişim Kurumu (BTK)\n.trade\tgeneric\tElite Registry Limited\n.trading\tgeneric\tDog Beach, LLC\n.training\tgeneric\tBinky Moon, LLC\n.travel\tsponsored\tDog Beach, LLC\n.travelchannel\tgeneric\tNot assigned\n.travelers\tgeneric\tTravelers TLD, LLC\n.travelersinsurance\tgeneric\tTravelers TLD, LLC\n.trust\tgeneric\tInternet Naming Co.\n.trv\tgeneric\tTravelers TLD, LLC\n.tt\tcountry-code\tUniversity of the West Indies, Faculty of Engineering\n.tube\tgeneric\tLatin American Telecom LLC\n.tui\tgeneric\tTUI AG\n.tunes\tgeneric\tAmazon Registry Services, Inc.\n.tushu\tgeneric\tAmazon Registry Services, Inc.\n.tv\tcountry-code\tMinistry of Transport, Energy, Communications and Innovations\n.tvs\tgeneric\tT V SUNDRAM IYENGAR & SONS PRIVATE 
LIMITED\n.tw\tcountry-code\tTaiwan Network Information Center (TWNIC)\n.tz\tcountry-code\tTanzania Communications Regulatory Authority\n.ua\tcountry-code\tHostmaster Ltd.\n.ubank\tgeneric\tNational Australia Bank Limited\n.ubs\tgeneric\tUBS AG\n.uconnect\tgeneric\tNot assigned\n.ug\tcountry-code\tUganda Online Ltd.\n.uk\tcountry-code\tNominet UK\n.um\tcountry-code\tNot assigned\n.unicom\tgeneric\tChina United Network Communications Corporation Limited\n.university\tgeneric\tBinky Moon, LLC\n.uno\tgeneric\tRadix Technologies Inc.\n.uol\tgeneric\tUBN INTERNET LTDA.\n.ups\tgeneric\tUPS Market Driver, Inc.\n.us\tcountry-code\tRegistry Services, LLC\n.uy\tcountry-code\tSeCIU - Universidad de la Republica\n.uz\tcountry-code\tSingle Integrator for Creation and Support of State Information Systems UZINFOCOM\n.va\tcountry-code\tHoly See - Vatican City State\n.vacations\tgeneric\tBinky Moon, LLC\n.vana\tgeneric\tD3 Registry LLC\n.vanguard\tgeneric\tThe Vanguard Group, Inc.\n.vc\tcountry-code\tMinistry of Telecommunications, Science, Technology and Industry\n.ve\tcountry-code\tComisión Nacional de Telecomunicaciones (CONATEL)\n.vegas\tgeneric\tDot Vegas, Inc.\n.ventures\tgeneric\tBinky Moon, LLC\n.verisign\tgeneric\tVeriSign, Inc.\n.versicherung\tgeneric\ttldbox GmbH\n.vet\tgeneric\tDog Beach, LLC\n.vg\tcountry-code\tTelecommunications Regulatory Commission of the Virgin Islands\n.vi\tcountry-code\tVirgin Islands Public Telecommunications System, Inc.\n.viajes\tgeneric\tBinky Moon, LLC\n.video\tgeneric\tDog Beach, LLC\n.vig\tgeneric\tVIENNA INSURANCE GROUP AG Wiener Versicherung Gruppe\n.viking\tgeneric\tViking River Cruises (Bermuda) Ltd.\n.villas\tgeneric\tBinky Moon, LLC\n.vin\tgeneric\tBinky Moon, LLC\n.vip\tgeneric\tRegistry Services, LLC\n.virgin\tgeneric\tVirgin Enterprises Limited\n.visa\tgeneric\tVisa Worldwide Pte. 
Limited\n.vision\tgeneric\tBinky Moon, LLC\n.vista\tgeneric\tNot assigned\n.vistaprint\tgeneric\tNot assigned\n.viva\tgeneric\tSaudi Telecom Company\n.vivo\tgeneric\tTelefonica Brasil S.A.\n.vlaanderen\tgeneric\tDNS.be vzw\n.vn\tcountry-code\tViet Nam Internet Network Information Center (VNNIC)\n.vodka\tgeneric\tRegistry Services, LLC\n.volkswagen\tgeneric\tNot assigned\n.volvo\tgeneric\tVolvo Holding Sverige Aktiebolag\n.vote\tgeneric\tMonolith Registry LLC\n.voting\tgeneric\tValuetainment Corp.\n.voto\tgeneric\tMonolith Registry LLC\n.voyage\tgeneric\tBinky Moon, LLC\n.vu\tcountry-code\tTelecommunications Radiocommunications and Broadcasting Regulator (TRBR)\n.vuelos\tgeneric\tNot assigned\n.wales\tgeneric\tNominet UK\n.walmart\tgeneric\tWal-Mart Stores, Inc.\n.walter\tgeneric\tSandvik AB\n.wang\tgeneric\tZodiac Wang Limited\n.wanggou\tgeneric\tAmazon Registry Services, Inc.\n.warman\tgeneric\tNot assigned\n.watch\tgeneric\tBinky Moon, LLC\n.watches\tgeneric\tIdentity Digital Limited\n.weather\tgeneric\tInternational Business Machines Corporation\n.weatherchannel\tgeneric\tInternational Business Machines Corporation\n.webcam\tgeneric\tdot Webcam Limited\n.weber\tgeneric\tSaint-Gobain Weber SA\n.website\tgeneric\tRadix Technologies Inc.\n.wed\tgeneric\tEmergency Back-End Registry Operator Program - ICANN\n.wedding\tgeneric\tRegistry Services, LLC\n.weibo\tgeneric\tSina Corporation\n.weir\tgeneric\tWeir Group IP Limited\n.wf\tcountry-code\tAssociation Française pour le Nommage Internet en Coopération (A.F.N.I.C.)\n.whoswho\tgeneric\tWho's Who Registry\n.wien\tgeneric\tpunkt.wien GmbH\n.wiki\tgeneric\tRegistry Services, LLC\n.williamhill\tgeneric\tWilliam Hill Organization Limited\n.win\tgeneric\tFirst Registry Limited\n.windows\tgeneric\tMicrosoft Corporation\n.wine\tgeneric\tBinky Moon, LLC\n.winners\tgeneric\tThe TJX Companies, Inc.\n.wme\tgeneric\tWilliam Morris Endeavor Entertainment, LLC\n.wolterskluwer\tgeneric\tWolters Kluwer 
N.V.\n.woodside\tgeneric\tWoodside Petroleum Limited\n.work\tgeneric\tRegistry Services, LLC\n.works\tgeneric\tBinky Moon, LLC\n.world\tgeneric\tBinky Moon, LLC\n.wow\tgeneric\tAmazon Registry Services, Inc.\n.ws\tcountry-code\tGovernment of Samoa Ministry of Foreign Affairs & Trade\n.wtc\tgeneric\tWorld Trade Centers Association, Inc.\n.wtf\tgeneric\tBinky Moon, LLC\n.xbox\tgeneric\tMicrosoft Corporation\n.xerox\tgeneric\tXerox DNHC LLC\n.xfinity\tgeneric\tNot assigned\n.xihuan\tgeneric\tQIHOO 360 TECHNOLOGY CO. LTD.\n.xin\tgeneric\tElegant Leader Limited\n.测试\ttest\tNot assigned\n.कॉम\tgeneric\tVeriSign Sarl\n.परीक्षा\ttest\tNot assigned\n.セール\tgeneric\tAmazon Registry Services, Inc.\n.佛山\tgeneric\tGuangzhou YU Wei Information Technology Co., Ltd.\n.ಭಾರತ\tcountry-code\tNational Internet eXchange of India\n.慈善\tgeneric\tExcellent First Limited\n.集团\tgeneric\tEagle Horizon Limited\n.在线\tgeneric\tBeijing Tld Registry Technology Limited\n.한국\tcountry-code\tKISA (Korea Internet & Security Agency)\n.ଭାରତ\tcountry-code\tNational Internet eXchange of India\n.大众汽车\tgeneric\tNot assigned\n.点看\tgeneric\tVeriSign Sarl\n.คอม\tgeneric\tVeriSign Sarl\n.ভাৰত\tcountry-code\tNational Internet eXchange of India\n.ভারত\tcountry-code\tNational Internet Exchange of India\n.八卦\tgeneric\tZodiac Gemini Ltd\n‏.ישראל‎\tcountry-code\tThe Israel Internet Association (RA)\n‏.موقع‎\tgeneric\tHelium TLDs Ltd\n.বাংলা\tcountry-code\tPosts and Telecommunications Division\n.公益\tgeneric\tChina Organizational Name Administration Center\n.公司\tgeneric\tChina Internet Network Information Center (CNNIC)\n.香格里拉\tgeneric\tShangri-La International Hotel Management Limited\n.网站\tgeneric\tGlobal Website TLD Asia Limited\n.移动\tgeneric\tIdentity Digital Limited\n.我爱你\tgeneric\tTycoon Treasure Limited\n.москва\tgeneric\tFoundation for Assistance for Internet Technologies and Infrastructure Development (FAITID)\n.испытание\ttest\tNot assigned\n.қаз\tcountry-code\tAssociation of IT Companies of 
Kazakhstan\n.католик\tgeneric\tPontificium Consilium de Comunicationibus Socialibus (PCCS) (Pontifical Council for Social Communication)\n.онлайн\tgeneric\tCORE Association\n.сайт\tgeneric\tCORE Association\n.联通\tgeneric\tChina United Network Communications Corporation Limited\n.срб\tcountry-code\tSerbian National Internet Domain Registry (RNIDS)\n.бг\tcountry-code\tImena.BG AD\n.бел\tcountry-code\tBelarusian Cloud Technologies LLC\n‏.קום‎\tgeneric\tVeriSign Sarl\n.时尚\tgeneric\tRISE VICTORY LIMITED\n.微博\tgeneric\tSina Corporation\n.테스트\ttest\tNot assigned\n.淡马锡\tgeneric\tTemasek Holdings (Private) Limited\n.ファッション\tgeneric\tAmazon Registry Services, Inc.\n.орг\tgeneric\tPublic Interest Registry\n.नेट\tgeneric\tVeriSign Sarl\n.ストア\tgeneric\tAmazon Registry Services, Inc.\n.アマゾン\tgeneric\tAmazon Registry Services, Inc.\n.삼성\tgeneric\tSAMSUNG SDS CO., LTD\n.சிங்கப்பூர்\tcountry-code\tSingapore Network Information Centre (SGNIC) Pte Ltd\n.商标\tgeneric\tInternet DotTrademark Organisation Limited\n.商店\tgeneric\tBinky Moon, LLC\n.商城\tgeneric\tZodiac Aquarius Limited\n.дети\tgeneric\tThe Foundation for Network Initiatives “The Smart Internet”\n.мкд\tcountry-code\tMacedonian Academic Research Network Skopje\n‏.טעסט‎\ttest\tNot assigned\n.ею\tcountry-code\tEURid vzw\n.ポイント\tgeneric\tAmazon Registry Services, Inc.\n.新闻\tgeneric\tGuangzhou YU Wei Information and Technology Co.,Ltd\n.工行\tgeneric\tNot assigned\n.家電\tgeneric\tAmazon Registry Services, Inc.\n‏.كوم‎\tgeneric\tVeriSign Sarl\n.中文网\tgeneric\tTLD REGISTRY LIMITED\n.中信\tgeneric\tCITIC Group Corporation\n.中国\tcountry-code\tChina Internet Network Information Center (CNNIC)\n.中國\tcountry-code\tChina Internet Network Information Center (CNNIC)\n.娱乐\tgeneric\tBinky Moon, LLC\n.谷歌\tgeneric\tCharleston Road Registry Inc.\n.భారత్\tcountry-code\tNational Internet Exchange of India\n.ලංකා\tcountry-code\tLK Domain Registry\n.電訊盈科\tgeneric\tPCCW Enterprises Limited\n.购物\tgeneric\tNawang Heli(Xiamen) Network Service Co., 
LTD.\n.測試\ttest\tNot assigned\n.クラウド\tgeneric\tAmazon Registry Services, Inc.\n.ભારત\tcountry-code\tNational Internet Exchange of India\n.通販\tgeneric\tAmazon Registry Services, Inc.\n.भारतम्\tcountry-code\tNational Internet eXchange of India\n.भारत\tcountry-code\tNational Internet Exchange of India\n.भारोत\tcountry-code\tNational Internet eXchange of India\n‏.آزمایشی‎\ttest\tNot assigned\n.பரிட்சை\ttest\tNot assigned\n.网店\tgeneric\tZodiac Taurus Ltd.\n.संगठन\tgeneric\tPublic Interest Registry\n.餐厅\tgeneric\tInternet DotTrademark Organisation Limited\n.网络\tgeneric\tChina Internet Network Information Center (CNNIC)\n.ком\tgeneric\tVeriSign Sarl\n.укр\tcountry-code\tUkrainian Network Information Centre (UANIC), Inc.\n.香港\tcountry-code\tHong Kong Internet Registration Corporation Ltd.\n.亚马逊\tgeneric\tAmazon Registry Services, Inc.\n.诺基亚\tgeneric\tNot assigned\n.食品\tgeneric\tAmazon Registry Services, Inc.\n.δοκιμή\ttest\tNot assigned\n.飞利浦\tgeneric\tKoninklijke Philips N.V.\n‏.إختبار‎\ttest\tNot assigned\n.台湾\tcountry-code\tTaiwan Network Information Center (TWNIC)\n.台灣\tcountry-code\tTaiwan Network Information Center (TWNIC)\n.手表\tgeneric\tNot assigned\n.手机\tgeneric\tBeijing RITT-Net Technology Development Co., Ltd\n.мон\tcountry-code\tDatacom Co.,Ltd\n‏.الجزائر‎\tcountry-code\tCERIST\n‏.عمان‎\tcountry-code\tTelecommunications Regulatory Authority (TRA)\n‏.ارامكو‎\tgeneric\tAramco Services Company\n‏.ایران‎\tcountry-code\tInstitute for Research in Fundamental Sciences (IPM)\n‏.العليان‎\tgeneric\tCompetrol (Luxembourg) Sarl\n‏.اتصالات‎\tgeneric\tNot assigned\n‏.امارات‎\tcountry-code\tTelecommunications and Digital Government Regulatory Authority (TDRA)\n‏.بازار‎\tgeneric\tCORE Association\n‏.موريتانيا‎\tcountry-code\tUniversité de Nouakchott Al Aasriya\n‏.پاکستان‎\tcountry-code\tNational Telecommunication Corporation\n‏.الاردن‎\tcountry-code\tMinistry of Digital Economy and Entrepreneurship (MoDEE)\n‏.موبايلي‎\tgeneric\tNot assigned\n‏.بارت‎\tcountry-code\tNational 
Internet eXchange of India\n‏.بھارت‎\tcountry-code\tNational Internet Exchange of India\n‏.المغرب‎\tcountry-code\tAgence Nationale de Réglementation des Télécommunications (ANRT)\n‏.ابوظبي‎\tgeneric\tAbu Dhabi Systems and Information Centre\n‏.البحرين‎\tcountry-code\tTelecommunications Regulatory Authority (TRA)\n‏.السعودية‎\tcountry-code\tCommunications, Space and Technology Commission\n‏.ڀارت‎\tcountry-code\tNational Internet eXchange of India\n‏.كاثوليك‎\tgeneric\tPontificium Consilium de Comunicationibus Socialibus (PCCS) (Pontifical Council for Social Communication)\n‏.سودان‎\tcountry-code\tSudan Internet Society\n‏.همراه‎\tgeneric\tEmergency Back-End Registry Operator Program - ICANN\n‏.عراق‎\tcountry-code\tCommunications and Media Commission (CMC)\n‏.مليسيا‎\tcountry-code\tMYNIC Berhad\n.澳門\tcountry-code\tMacao Post and Telecommunications Bureau (CTT)\n.닷컴\tgeneric\tVeriSign Sarl\n.政府\tgeneric\tNet-Chinese Co., Ltd.\n‏.شبكة‎\tgeneric\tInternational Domain Registry Pty. Ltd.\n‏.بيتك‎\tgeneric\tKuwait Finance House\n‏.عرب‎\tgeneric\tLeague of Arab States\n.გე\tcountry-code\tInformation Technologies Development Center (ITDC)\n.机构\tgeneric\tPublic Interest Registry\n.组织机构\tgeneric\tPublic Interest Registry\n.健康\tgeneric\tStable Tone Limited\n.ไทย\tcountry-code\tThai Network Information Center Foundation\n‏.سورية‎\tcountry-code\tNational Agency for Network Services (NANS)\n.招聘\tgeneric\tJiang Yu Liang Cai Technology Company Limited\n.рус\tgeneric\tRusnames Limited\n.рф\tcountry-code\tCoordination Center for TLD RU\n.珠宝\tgeneric\tNot assigned\n‏.تونس‎\tcountry-code\tAgence Tunisienne d'Internet\n.大拿\tgeneric\tVeriSign Sarl\n.ລາວ\tcountry-code\tLao National Internet Center (LANIC), Ministry of Technology and Communications\n.みんな\tgeneric\tCharleston Road Registry Inc.\n.グーグル\tgeneric\tCharleston Road Registry Inc.\n.ευ\tcountry-code\tEURid vzw\n.ελ\tcountry-code\tICS-FORTH GR\n.世界\tgeneric\tStable Tone Limited\n.書籍\tgeneric\tAmazon Registry Services, 
Inc.\n.ഭാരതം\tcountry-code\tNational Internet eXchange of India\n.ਭਾਰਤ\tcountry-code\tNational Internet Exchange of India\n.网址\tgeneric\tKNET Co., Ltd\n.닷넷\tgeneric\tVeriSign Sarl\n.コム\tgeneric\tVeriSign Sarl\n.天主教\tgeneric\tPontificium Consilium de Comunicationibus Socialibus (PCCS) (Pontifical Council for Social Communication)\n.游戏\tgeneric\tBinky Moon, LLC\n.vermögensberater\tgeneric\tDeutsche Vermögensberatung Aktiengesellschaft DVAG\n.vermögensberatung\tgeneric\tDeutsche Vermögensberatung Aktiengesellschaft DVAG\n.企业\tgeneric\tBinky Moon, LLC\n.信息\tgeneric\tBeijing Tele-info Technology Co., Ltd.\n.嘉里大酒店\tgeneric\tKerry Trading Co. Limited\n.嘉里\tgeneric\tKerry Trading Co. Limited\n‏.مصر‎\tcountry-code\tNational Telecommunication Regulatory Authority - NTRA\n‏.قطر‎\tcountry-code\tCommunications Regulatory Authority\n.广东\tgeneric\tGuangzhou YU Wei Information Technology Co., Ltd.\n.இலங்கை\tcountry-code\tLK Domain Registry\n.இந்தியா\tcountry-code\tNational Internet Exchange of India\n.հայ\tcountry-code\t\"Internet Society\" Non-governmental Organization\n.新加坡\tcountry-code\tSingapore Network Information Centre (SGNIC) Pte Ltd\n‏.فلسطين‎\tcountry-code\tMinistry of Telecom & Information Technology (MTIT)\n.テスト\ttest\tNot assigned\n.政务\tgeneric\tChina Organizational Name Administration Center\n.xperia\tgeneric\tNot assigned\n.xxx\tsponsored\tICM Registry LLC\n.xyz\tgeneric\tXYZ.COM LLC\n.yachts\tgeneric\tXYZ.COM LLC\n.yahoo\tgeneric\tYahoo Inc.\n.yamaxun\tgeneric\tAmazon Registry Services, Inc.\n.yandex\tgeneric\tYANDEX LLC\n.ye\tcountry-code\tTeleYemen\n.yodobashi\tgeneric\tYODOBASHI CAMERA CO.,LTD.\n.yoga\tgeneric\tRegistry Services, LLC\n.yokohama\tgeneric\tGMO Registry, Inc.\n.you\tgeneric\tAmazon Registry Services, Inc.\n.youtube\tgeneric\tCharleston Road Registry Inc.\n.yt\tcountry-code\tAssociation Française pour le Nommage Internet en Coopération (A.F.N.I.C.)\n.yun\tgeneric\tQIHOO 360 TECHNOLOGY CO. 
LTD.\n.za\tcountry-code\tZA Domain Name Authority\n.zappos\tgeneric\tAmazon Registry Services, Inc.\n.zara\tgeneric\tIndustria de Diseño Textil, S.A. (INDITEX, S.A.)\n.zero\tgeneric\tAmazon Registry Services, Inc.\n.zip\tgeneric\tCharleston Road Registry Inc.\n.zippo\tgeneric\tNot assigned\n.zm\tcountry-code\tZambia Information and Communications Technology Authority (ZICTA)\n.zone\tgeneric\tBinky Moon, LLC\n.zuerich\tgeneric\tKanton Zürich (Canton of Zurich)\n.zw\tcountry-code\tPostal and Telecommunications Regulatory Authority of Zimbabwe (POTRAZ)\n\n__ICCTLD__\n# https://en.wikipedia.org/wiki/Country_code_top-level_domain#Internationalized_ccTLDs\n# https://en.wikipedia.org/wiki/Internationalized_country_code_top-level_domain#List\n# https://www.icann.org/resources/pages/string-evaluation-completion-2014-02-19-en\n# (update 2025-09-26)\n# DNS name\tIDN ccTLD\tCountry/Region\tLanguage\tScript\tTransliteration\tComments\tOther ccTLD\tDNSSEC\nxn--lgbbat1ad8j\t.الجزائر\tAlgeria\tArabic\tArabic (Arabic)\tal-Jazā'ir\t\t.dz\tNo\nxn--y9a3aq\t.հայ\tArmenia\tArmenian\tArmenian\thay\t\t.am\tYes\nxn--mgbcpq6gpa1a\t.البحرين\tBahrain\tArabic\tArabic\tal-Baḥrain\tNot in use\t.bh\tYes\nxn--54b7fta0cc\t.বাংলা\tBangladesh\tBengali\tBengali\tBangla\t\t.bd\tNo\nxn--90ais\t.бел\tBelarus\tBelarusian\tCyrillic\tbel\t\t.by\tYes\nxn--90ae\t.бг[16]\tBulgaria\tBulgarian\tCyrillic\tbg\t\t.bg\tYes\nxn--fiqs8s\t.中国\tChina\tChinese\tChinese (Simplified)\tZhōngguó\t\t.cn\tYes\nxn--fiqz9s\t.中國\tChina\tChinese\tChinese (Traditional)\tZhōngguó\t\t.cn\tYes\nxn--wgbh1c\t.مصر\tEgypt\tArabic\tArabic (Arabic)\tMiṣr / Maṣr[17]\t\t.eg\tYes\nxn--e1a4c\t.ею\tEuropean Union\tBulgarian\tCyrillic\teyu\t\t.eu\tYes\nxn--qxa6a\t.ευ\tEuropean Union\tGreek\tGreek\tey\tIn use since 2022\t.eu\tYes\nxn--node\t.გე\tGeorgia\tGeorgian\tGeorgian (Mkhedruli)\tGE\t\t.ge\tNo\nxn--qxam\t.ελ[16]\tGreece\tGreek\tGreek\tel\tIn use since July 2018\t.gr\tYes\nxn--j6w193g\t.香港\tHong Kong\tChinese\tChinese (Simplified and 
Traditional)\tHoeng1 gong2 / Xiānggǎng\t\t.hk\tYes\nxn--h2brj9c\t.भारत\tIndia\tHindi\tDevanagari\tBhārat\tBecame available 27 August 2014[18]\t.in\tYes\nxn--mgbbh1a71e\t.بھارت\tIndia\tUrdu\tArabic (Urdu)\tBhārat\tBecame available 2017\t.in\tYes\nxn--fpcrj9c3d\t.భారత్\tIndia\tTelugu\tTelugu\tBhārat\tBecame available 2017\t.in\tYes\nxn--gecrj9c\t.ભારત\tIndia\tGujarati\tGujarati\tBhārat\tBecame available 2017\t.in\tYes\nxn--s9brj9c\t.ਭਾਰਤ\tIndia\tPunjabi\tGurmukhī\tBhārat\tBecame available 2017\t.in\tYes\nxn--xkc2dl3a5ee0h\t.இந்தியா\tIndia\tTamil\tTamil\tIntiyā\tBecame available 2015\t.in\tYes\nxn--45brj9c\t.ভারত\tIndia\tBengali\tBengali\tBharôt\tBecame available 2017\t.in\tYes\nxn--2scrj9c\t.ಭಾರತ\tIndia\tKannada\tKannada\tBhārata\tBecame available 2020\t.in\tYes\nxn--rvc1e0am3e\t.ഭാരതം\tIndia\tMalayalam\tMalayalam\tBhāratam\tBecame available 2020\t.in\tYes\nxn--45br5cyl\t.ভাৰত\tIndia\tAssamese\tBengali\tBharatam\tBecame available 2022\t.in\tYes\nxn--3hcrj9c\t.ଭାରତ\tIndia\tOriya\tOriya\tBhārat\tBecame available 2021\t.in\tYes\nxn--mgbbh1a\t.بارت\tIndia\tKashmiri\tArabic (Kashmiri)\tBārat\tBecame available 2022\t.in\tYes\nxn--h2breg3eve\t.भारतम्\tIndia\tSanskrit\tDevanagari\tBhāratam\tBecame available 2022\t.in\tYes\nxn--h2brj9c8c\t.भारोत\tIndia\tSantali\tDevanagari\tBharot\tBecame available 2022\t.in\tYes\nxn--mgbgu82a\t.ڀارت\tIndia\tSindhi\tArabic (Sindhi)\tBhārat\tBecame available 2022\t.in\tYes\nxn--mgba3a4f16a\t.ایران\tIran\tPersian\tArabic (Persian)\tĪrān\t\t.ir\tNo\nxn--mgbtx2b\t.عراق\tIraq\tArabic\tArabic (Arabic)\tʿIrāq\tNot in use\t.iq\tNo\nxn--4dbrk0ce\t.ישראל\tIsrael\tHebrew\tHebrew\tIsrael\tBecame available 2022\t.il\tYes\nxn--mgbayh7gpa\t.الاردن\tJordan\tArabic\tArabic (Arabic)\tal-Urdun\t\t.jo\tNo\nxn--80ao21a\t.қаз\tKazakhstan\tKazakh\tCyrillic (Kazakh)\tqaz\t\t.kz\tNo\nxn--q7ce6a\t.ລາວ\tLaos\tLao\tLao\tLao\tBecame available 2020\t.la\tYes\nxn--mgbb7fyab\t.ليبيا\tLibya\tArabic\tArabic (Arabic)\t\tNot 
delegated[15]\t.ly\tNo\nxn--mix082f\t.澳门\tMacao\tChinese\tChinese (Simplified)\tOu3 mun4 / Àomén\tNot in use\t.mo\tNo\nxn--mix891f\t.澳門\tMacao\tChinese\tChinese (Traditional)\tOu3 mun4 / Àomén\tBecame available 2020\t.mo\tNo\nxn--mgbx4cd0ab\t.مليسيا\tMalaysia\tMalay\tArabic (Jawi)\tMalaysīyā\t\t.my\tYes\nxn--mgbah1a3hjkrd\t.موريتانيا\tMauritania\tArabic\tArabic (Arabic)\tMūrītāniyā\t\t.mr\tYes\nxn--l1acc\t.мон\tMongolia\tMongolian\tCyrillic (Mongolian)\tmon\t\t.mn\tYes\nxn--mgbc0a9azcg\t.المغرب\tMorocco\tArabic\tArabic (Arabic)\tal-Maġrib\t\t.ma\tNo\nxn--d1alf\t.мкд\tNorth Macedonia\tMacedonian\tCyrillic (Macedonian)\tmkd\t\t.mk\tNo\nxn--mgb9awbf\t.عمان\tOman\tArabic\tArabic (Arabic)\tʿUmān\t\t.om\tNo\nxn--mgbai9azgqp6j\t.پاکستان\tPakistan\tUrdu\tArabic (Urdu)\tPākistān\t\t.pk\tYes\nxn--ygbi2ammx\t.فلسطين\tPalestinian Authority\tArabic\tArabic (Arabic)\tFilasṭīn\t\t.ps\tNo\nxn--wgbl6a\t.قطر\tQatar\tArabic\tArabic (Arabic)\tQaṭar\t\t.qa\tNo\nxn--p1ai\t.рф\tRussia\tRussian\tCyrillic (Russian)\trf\t\t.ru\tYes\nxn--mgberp4a5d4ar\t.السعودية\tSaudi Arabia\tArabic\tArabic (Arabic)\tas-Suʿūdīya\t\t.sa\tYes\nxn--90a3ac\t.срб\tSerbia\tSerbian\tCyrillic (Serbian)\tsrb\t\t.rs\tYes\nxn--yfro4i67o\t.新加坡\tSingapore\tChinese\tChinese (Simplified and Traditional)\tXīnjiāpō\t\t.sg\tYes\nxn--clchc0ea0b2g2a9gcd\t.சிங்கப்பூர்\tSingapore\tTamil\tTamil\tCinkappūr\t\t.sg\tYes\nxn--3e0b707e\t.한국\tSouth Korea\tKorean\tHangul\tHanguk\t\t.kr\tYes\nxn--fzc2c9e2c\t.ලංකා\tSri Lanka\tSinhala\tSinhala\tLanka\t\t.lk\tNo\nxn--xkc2al3hye2a\t.இலங்கை\tSri Lanka\tTamil\tTamil\tIlaṅkai\t\t.lk\tNo\nxn--mgbpl2fh\t.سودان\tSudan\tArabic\tArabic (Arabic)\tSūdān\t\t.sd\tNo\nxn--ogbpf8fl\t.سورية\tSyria\tArabic\tArabic (Arabic)\tSūriyya\t\t.sy\tNo\nxn--kprw13d\t.台湾\tTaiwan\tChinese\tChinese (Simplified)\tTáiwān\t\t.tw\tYes\nxn--kpry57d\t.台灣\tTaiwan\tChinese\tChinese (Traditional)\tTáiwān\t\t.tw\tYes\nxn--o3cw4h\t.ไทย\tThailand\tThai\tThai\tThai\t\t.th\tYes\nxn--pgbs0dh\t.تونس\tTunisia\tArabic\tArabic 
(Arabic)\tTūnis\t\t.tn\tYes\nxn--j1amh\t.укр\tUkraine\tUkrainian\tCyrillic (Ukrainian)\tukr\t\t.ua\tNo\nxn--mgbaam7a8h\t.امارات\tUnited Arab Emirates\tArabic\tArabic (Arabic)\tImārāt\t\t.ae\tNo\nxn--mgb2ddes\t.اليمن\tYemen\tArabic\tArabic (Arabic)\tal-Yaman\tNot delegated\t.ye\tNo\n__INTERNATIONALIZED_GEOGRAPHIC_TLD__\n# https://en.wikipedia.org/wiki/List_of_Internet_top-level_domains#Internationalized_geographic_top-level_domains\n# (update 2025-09-26)\n# DNS name\tDisplay name\tEntity\tLanguage\tScript\tTransliteration\tNotes\tOther TLD\tIDN\tDNSSEC\nxn--1qqw23a[24]\t.佛山\tFoshan, China\tChinese\tChinese (Simplified)\tfat6 saan1\t[85]\t\tYes\tYes\nxn--xhq521b[24]\t.广东\tGuangdong, China\tChinese\tChinese (Simplified)\tgwong2 dung1\t[14]\t\t\t\nxn--80adxhks[24]\t.москва [ru]\tMoscow, Russia\tRussian\tCyrillic (Russian)\tmoskva\t[86]\t.moscow\tRussian[15]\tYes\nxn--p1acf[24]\t.рус\tRussian language, post-Soviet states\tRussian\tCyrillic (Russian)\trus\t[14]\t.su\t\t\nxn--mgbca7dzdo[24]\t.ابوظبي\tAbu Dhabi\tArabic\tArabic\tAbū Ẓabī\t[14]\t.abudhabi\t\t\nxn--ngbrx[24]\t.عرب\tArab\tArabic\tArabic\t‘Arab\t[14]\t\t\t\n__INTERNATIONALIZED_BRAND_TLD__\n# Internationalized brand top-level domains\n# https://en.wikipedia.org/wiki/List_of_Internet_top-level_domains#Internationalized_brand_top-level_domains\n# (update 2025-09-26)\n# DNS name\tIDN TLD\tEntity\tScript\tTransliteration\tComments\tDNSSEC\nxn--jlq480n2rg\t.亚马逊\tAmazon\tChinese (Simplified)\tYàmǎxùn\t[161]\tYes\nxn--cckwcxetd\t.アマゾン\tAmazon\tKatakana\tamazon\t[162]\tYes\nxn--mgba3a3ejt\t.ارامكو\tAramco Services Company\tArabic\t\t[14]\t\nxn--mgbaakc7dvf\t.اتصالات\tEmirates Telecommunications Corporation (trading as Etisalat)\tArabic\t\t[14]\t\nxn--8y0a063a\t.联通\tChina United Network Communications Corporation Limited\tChinese (Simplified)\tLiántōng\t[14]\t\nxn--6frz82g\t.移动\tChina Mobile Communications Corporation\tChinese (Simplified)\tYídòng\t\t\nxn--fiq64b\t.中信\tCITIC 
Group\tChinese\tzhōngxìn\t[163]\tYes\nxn--5su34j936bgsg\t.香格里拉\tShangri‐La International Hotel Management Limited\tChinese\tXiānggélǐlā\t[14]\t\nxn--b4w605ferd\t.淡马锡\tTemasek Holdings (Private) Limited\tChinese (Simplified)\tDànmǎxī\t[14]\t\nxn--3oq18vl8pn36a\t.大众汽车\tVolkswagen (China) Investment Co., Ltd.\tChinese (Simplified)\tDàzhòngqìchē\t[14]\t\nxn--vermgensberater-ctb\t.vermögensberater\tDeutsche Vermögensberatung Aktiengesellschaft\tLatin\t\t[164]\tYes\nxn--vermgensberatung-pwb\t.vermögensberatung\tDeutsche Vermögensberatung Aktiengesellschaft\tLatin\t\t[165]\tYes\nxn--qcka1pmc\t.グーグル\tGoogle\tKatakana\tgūguru\t[166]\tYes\nxn--flw351e\t.谷歌\tGoogle\tChinese\tgǔgē\t[167]\tYes\nxn--estv75g\t.工行\tIndustrial and Commercial Bank of China Limited\tChinese\tGōngháng\t[14]\t\nxn--w4rs40l\t.嘉里\tKerry Trading Co. Limited\tChinese\tJiālǐ\t[14]\t\nxn--w4r85el8fhu5dnra\t.嘉里大酒店\tKerry Trading Co. Limited\tChinese\tJiālǐdàjiǔdiàn\t[14]\t\nxn--kcrx77d1x4a\t.飞利浦\tKoninklijke Philips N.V.\tChinese (Simplified)\tFēilìpǔ\t[14]\t\nxn--jlq61u9w7b\t.诺基亚\tNokia Corporation\tChinese (Simplified)\tNuòjīyà\t[14][168]\t\nxn--fzys8d69uvgm\t.電訊盈科\tPCCW Enterprises Limited\tChinese (Traditional)\tdin6 soen3 jing4 fo1\t[14]\t\nxn--cg4bki\t.삼성\tSamsung\tHangul\tsamseong\t[169]\tYes\n__INTERNATIONALIZED_TEST_TLD__\n# https://en.wikipedia.org/wiki/List_of_Internet_top-level_domains#Test_TLDs\nxn--kgbechtv\tإختبار.\tik͡htibār\tArabic\tArabic\thttp://مثال.إختبار\nxn--hgbk6aj7f53bba\tآزمایشی.\tậzmạy̰sẖy\tPersian\tPerso-Arabic\thttp://مثال.آزمایشی\nxn--0zwm56d\t.测试\tcèshì\tChinese Simplified\tChinese\thttp://例子.测试\nxn--g6w251d\t.測試\tcèshì\tChinese 
Traditional\tChinese\thttp://例子.測試\nxn--80akhbyknj4f\t.испытание\tispytánije\tRussian\tCyrillic\thttp://пример.испытание\nxn--11b5bs3a9aj6g\t.परीक्षा\tparīkṣā\tHindi\tDevanagari\thttp://उदाहरण.परीक्षा\nxn--jxalpdlp\t.δοκιμή\tdokimé\tGreek\tGreek\thttp://παράδειγμα.δοκιμή\nxn--9t4b11yi5a\t.테스트\tteseuteu\tKorean\tHangul\thttp://실례.테스트\nxn--deba0ad\tטעסט.\ttest\tYiddish\tHebrew\thttp://בײַשפּיל.טעסט\nxn--zckzah\t.テスト\ttesuto\tJapanese\tKatakana[229]\thttp://例え.テスト\nxn--hlcj6aya9esc7a\t.பரிட்சை\tpariṭcai\tTamil\tTamil\thttp://உதாரணம்.பரிட்சை\n'''\n\n\nTopLevelDomain._read_data()\n\n\nif __name__ == '__main__':\n    for line in fileinput.input():\n        line = line.replace('\\n', '')\n        (cc, freq) = line.split('\\t')\n        tld = TopLevelDomain(cc)\n        # print(tld)\n        sub_type = \"\"\n        if tld.sub_type is not None:\n            sub_type = tld.sub_type\n        print('\\t'.join([cc, tld.tld_type, tld.first_level, sub_type, freq]))\n"
  }
]