From 5171d5f821d040063e82d416f27209ab2afd266f Mon Sep 17 00:00:00 2001 From: Quentin Lhoest Date: Thu, 17 Jun 2021 16:53:08 +0200 Subject: [PATCH 01/19] add c4 --- datasets/c4/README.md | 6 +- datasets/c4/c4.py | 322 ++++---------------------- datasets/c4/c4_utils.py | 488 ---------------------------------------- 3 files changed, 51 insertions(+), 765 deletions(-) delete mode 100644 datasets/c4/c4_utils.py diff --git a/datasets/c4/README.md b/datasets/c4/README.md index 821343585c5..4b24881da75 100644 --- a/datasets/c4/README.md +++ b/datasets/c4/README.md @@ -5,6 +5,7 @@ paperswithcode_id: c4 # Dataset Card for C4 ## Table of Contents + - [Dataset Card for [Dataset Name]](#dataset-card-for-dataset-name) - [Table of Contents](#table-of-contents) - [Dataset Description](#dataset-description) @@ -45,7 +46,6 @@ paperswithcode_id: c4 ### Dataset Summary A colossal, cleaned version of Common Crawl's web crawl corpus. Based on Common Crawl dataset: "https://commoncrawl.org" -Due to the overhead of cleaning the dataset, it is recommend you prepare it with a distributed service like Cloud Dataflow. More info at https://www.tensorflow.org/datasets/beam_datasets. ### Supported Tasks and Leaderboards @@ -138,6 +138,4 @@ Due to the overhead of cleaning the dataset, it is recommend you prepare it with ### Contributions -Thanks to [@github-username](https://github.com/) for adding this dataset. - -Thanks to @thomwolf, @Narsil, @patrickvonplaten, @lhoestq, @lewtun for adding this dataset. +Thanks to [@dirkgr](https://github.com/dirkgr)[@lhoestq](https://github.com/lhoestq) for adding this dataset. diff --git a/datasets/c4/c4.py b/datasets/c4/c4.py index 675a8e9611e..095671070cf 100644 --- a/datasets/c4/c4.py +++ b/datasets/c4/c4.py @@ -17,25 +17,11 @@ """C4 dataset based on Common Crawl.""" +import gzip import json -import os import datasets -from .c4_utils import ( - dedupe_urls, - filter_by_webtextlike, - get_clean_page_fn, - get_counter_inc_fn, - get_hashed_url_filter_fn, - is_language, - is_realnews_domain, - is_valid_length, - normalize_url, - remove_duplicate_text, - split_wet_file, -) - logger = datasets.logging.get_logger(__name__) @@ -43,11 +29,10 @@ _DESCRIPTION = """\ A colossal, cleaned version of Common Crawl's web crawl corpus. -Based on Common Crawl dataset: "https://commoncrawl.org" +Based on Common Crawl dataset: "https://commoncrawl.org". + +This is the processed version of Google's C4 dataset by AllenAI. -Due to the overhead of cleaning the dataset, it is recommend you prepare it with -a distributed service like Cloud Dataflow. More info at -https://www.tensorflow.org/datasets/beam_datasets. """ _CITATION = """ @article{2019t5, @@ -59,275 +44,66 @@ eprint = {1910.10683}, } """ -_VERSION = datasets.Version("2.3.0", "Deduplicate lines within a page.") +_URL = "https://github.com/allenai/allennlp/discussions/5056" -_DOWNLOAD_HOST = "https://commoncrawl.s3.amazonaws.com" -_WET_PATH_URL = "https://commoncrawl.s3.amazonaws.com/crawl-data/CC-MAIN-{cc_version}/wet.paths.gz" -_REALNEWS_DOMAINS_URL = "https://raw.githubusercontent.com/rowanz/grover/38f7184bd87237ae2d3bc330b99f1e2e246f6d51/realnews/domain_to_allowed_subdomains.json" -_BADWORDS_URL = "https://raw.githubusercontent.com/LDNOOBW/List-of-Dirty-Naughty-Obscene-and-Otherwise-Bad-Words/25e679f03d96baa721cde20db9944649e8d0a844/{lang}" -_CHECKSUMS_URL = "https://storage.googleapis.com/tfds-data/manual_checksums/c4.txt" -_OPENWEBTEXT_URLS_ZIP = "OpenWebText.zip" -_OPENWEBTEXT_URLS_URL = "https://mega.nz/#F!EZZD0YwJ!9_PlEQzdMVLaNdKv_ICNVQ" -_OPENWEBTEXT_URLS_FILE_PATTERN = "OpenWebText/Version 1/URLs/*.txt" - -_DEFAULT_CC_VERSIONS = ("2019-18",) # April 2019 -_DEFAULT_WEBTEXTLIKE_CC_VERSIONS = ( # August 2018 - July 2019 - "2018-34", - "2018-39", - "2018-43", - "2018-47", - "2018-51", - "2019-04", - "2019-09", - "2019-13", - "2019-18", - "2019-22", - "2019-26", - "2019-30", -) +_VARIANTS = ["en", "realnewslike", "en.noblocklist", "en.noclean"] +_N_SHARDS_PER_SPLIT = { + "en": {"train": 1024, "validation": 8}, + "realnewslike": {"train": 512, "validation": 1}, + "en.noblocklist": {"train": 1024, "validation": 8}, + "en.noclean": {"train": 7168, "validation": 64}, +} -class C4Config(datasets.BuilderConfig): - """BuilderConfig for C4 dataset.""" - - def __init__(self, language, cc_versions=None, clean=True, realnewslike=False, webtextlike=False, **kwargs): - """BuilderConfig for C4. - - Args: - language: string, the language code, or "all" to disable language - filtering. - cc_versions: tuple(string), a collection of versions of Common Crawl to - use as the raw source text. Set to None to use defaults. - clean: bool, whether to clean the dataset for badwords, duplications, etc. - realnewslike: bool, whether to limit to news domains as compiled by - RealNews. - webtextlike: bool, whether to limit to WebText-like URLs. - **kwargs: keyword arguments forwarded to super. - """ - name_parts = [language] - if cc_versions: - name_parts.append("_".join(cc_versions)) - if not clean: - name_parts.append("noclean") - if realnewslike: - name_parts.append("realnewslike") - if webtextlike: - name_parts.append("webtextlike") - name = ".".join(name_parts) - super(C4Config, self).__init__(name=name, version=_VERSION, **kwargs) - self.lang = language - self.cc_versions = cc_versions or (_DEFAULT_WEBTEXTLIKE_CC_VERSIONS if webtextlike else _DEFAULT_CC_VERSIONS) - self.clean = clean - self.realnewslike = realnewslike - self.webtextlike = webtextlike - +_DATA_URL = ( + "https://huggingface.co/datasets/allenai/c4/resolve/main/{name}/c4-{split}.{index:05d}-of-{n_shards:05d}.json.gz" +) -class C4(datasets.BeamBasedBuilder): - """C4 dataset based on Common Crawl.""" - BUILDER_CONFIGS = [ - C4Config(language="en", description="English C4 dataset."), - C4Config( - language="en", - clean=False, - description="Disables all cleaning (deduplication, removal based on bad words, " "etc.)", - ), - C4Config( - language="en", - realnewslike=True, - description="Filters from the default config to only include content from the " - "domains used in the 'RealNews' dataset (Zellers et al., 2019).", - ), - C4Config( - language="en", - webtextlike=True, - description="Filters from the default config to only include content from the " - "URLs in OpenWebText (https://github.com/jcpeterson/openwebtext).", - ), - ] +class C4(datasets.GeneratorBasedBuilder): + """C4, a colossal, cleaned version of Common Crawl's web crawl corpus.""" - @property - def manual_download_instructions(self): - return """\ - For the WebText-like config, you must manually download 'OpenWebText.zip' - (from https://mega.nz/#F!EZZD0YwJ!9_PlEQzdMVLaNdKv_ICNVQ) and the Common Crawl - WET files from August 2018 to July 2019 - (https://commoncrawl.org/the-data/get-started/) and place them in the - `data_dir`. - """ + BUILDER_CONFIGS = [datasets.BuilderConfig(name) for name in _VARIANTS] def _info(self): - features = { - "text": datasets.Value("string"), - "url": datasets.Value("string"), - "content-type": datasets.Value("string"), - "content-length": datasets.Value("string"), - "timestamp": datasets.Value("string"), - } return datasets.DatasetInfo( description=_DESCRIPTION, - features=datasets.Features(features), + features=datasets.Features( + { + "text": datasets.Value("string"), + "timestamp": datasets.Value("string"), + "url": datasets.Value("string"), + } + ), + supervised_keys=None, + homepage=_URL, citation=_CITATION, - homepage="https://github.com/google-research/text-to-text-transfer-transformer#datasets", ) - def _split_generators(self, dl_manager, pipeline): - import apache_beam as beam - - # We will automatically down the default CC version(s), but others need to - # be manually downloaded. - cc_versions = set(self.config.cc_versions) - auto_cc_versions = cc_versions & set(_DEFAULT_CC_VERSIONS) - manual_cc_versions = cc_versions - set(_DEFAULT_CC_VERSIONS) - - files_to_download = {} - files_to_download["wet_path_urls"] = [ - _WET_PATH_URL.format(cc_version=cc_version) for cc_version in auto_cc_versions - ] - if self.config.clean: - files_to_download["badwords"] = _BADWORDS_URL.format(lang=self.config.lang) - if self.config.realnewslike: - files_to_download["realnews_domains"] = _REALNEWS_DOMAINS_URL - file_paths = dl_manager.download_and_extract(files_to_download) - - if self.config.webtextlike: - owt_path = os.path.join(dl_manager.manual_dir, _OPENWEBTEXT_URLS_ZIP) - if not os.path.exists(owt_path): - raise FileNotFoundError( - "{} does not exist. Make sure you insert a manual dir via `datasets.load_dataset('c4', data_dir=...)` that includes a file name {}. Manual download instructions: {})".format( - owt_path, _OPENWEBTEXT_URLS_ZIP, self.manual_download_instructions - ) - ) - file_paths["openwebtext_urls_zip"] = dl_manager.extract(owt_path) - - wet_urls = [] - for wet_path_url in file_paths["wet_path_urls"]: - with open(wet_path_url, "r", encoding="utf-8") as f: - wet_urls.extend(["%s/%s" % (_DOWNLOAD_HOST, line.strip()) for line in f]) - file_paths["wet_urls"] = wet_urls - file_paths["wet_files"] = [] - - for cc_version in manual_cc_versions: - cc_dir = os.path.join(dl_manager.manual_dir, cc_version) - wet_files = beam.io.filesystems.FileSystems.match(os.path.join(cc_dir, "*.warc.wet.gz")) - if not os.path.exists(cc_dir): - raise FileNotFoundError( - "{} does not exist. Make sure you insert a manual dir via `datasets.load_dataset('c4', data_dir=...)` that includes the files {}. Manual download instructions: {})".format( - cc_dir, "*.warc.wet.gz", self.manual_download_instructions - ) - ) - logger.info("Adding %d WET files for manually downloaded version %s.", len(wet_files), cc_version) - file_paths["wet_files"].extend(wet_files) - - page_content_pcollection = self._get_page_content(pipeline, file_paths, dl_manager) + def _split_generators(self, dl_manager): + data_urls = {} + for split in ["train", "validation"]: + n_shards = _N_SHARDS_PER_SPLIT[self.config.name][split] + data_urls[split] = [ + _DATA_URL.format(name=self.config.name, split=split, index=index, n_shards=n_shards) + for index in range(n_shards) + ] + downloaded_files = dl_manager.download(data_urls) return [ + datasets.SplitGenerator(name=datasets.Split.TRAIN, gen_kwargs={"filepaths": downloaded_files["train"]}), datasets.SplitGenerator( - name=datasets.Split.TRAIN, - gen_kwargs=dict( - split="train", - page_content=page_content_pcollection, - hashed_url_predicate=lambda x: x % 1000 != 0, # 99.9% - ), - ), - datasets.SplitGenerator( - name=datasets.Split.VALIDATION, - gen_kwargs=dict( - split="validation", - page_content=page_content_pcollection, - hashed_url_predicate=lambda x: x % 1000 == 0, # 0.01% - ), + name=datasets.Split.VALIDATION, gen_kwargs={"filepaths": downloaded_files["validation"]} ), ] - def _get_page_content(self, pipeline, file_paths, dl_manager): - """Build PCollection of un-split page content.""" - import apache_beam as beam - - wet_file_paths = pipeline | "create_wet_files" >> beam.Create(file_paths["wet_files"]) - if "wet_urls" in file_paths: - - def download_url(url, downloader, pipeline): - path = downloader.download(url) - if not pipeline.is_local(): - path = downloader.ship_files_with_pipeline(path, pipeline) - return path - - dl_wet_file_paths = ( - pipeline - | "create_wet_urls" >> beam.Create(file_paths["wet_urls"]) - | beam.Map(download_url, downloader=dl_manager, pipeline=pipeline) - ) - wet_file_paths = (wet_file_paths, dl_wet_file_paths) | beam.Flatten() - - # Parse WET files and filter by length. - # Output: url, text - page_content = wet_file_paths | beam.FlatMap(split_wet_file) | beam.Filter(is_valid_length) - - # Optionally filter for RealNews domains. - # Output: url, text - if self.config.realnewslike: - with open(file_paths["realnews_domains"], "r", encoding="utf-8") as f: - realnews_domains = json.load(f) - page_content = page_content | beam.Filter(is_realnews_domain, realnews_domains) - - # Normalize and deduplicate by URL. - # Output: url, text - page_content = ( - page_content - | "normalize_url" >> beam.Map(normalize_url) - | "group_url" >> beam.GroupByKey() - | beam.Map(dedupe_urls) - ) - - # Optionally filter for WebText-like URLs. - # Output: url, text - if self.config.webtextlike: - webtextlike_urls = ( - pipeline - | "read_webtextlike_urls" - >> beam.io.ReadFromText( - os.path.join(file_paths["openwebtext_urls_zip"], _OPENWEBTEXT_URLS_FILE_PATTERN) - ) - | "add_dummy_page" >> beam.Map(lambda x: (x, "")) - | "normal_webtext_url" >> beam.Map(normalize_url) - ) - page_content = ( - {"text": page_content, "webtextlike_urls": webtextlike_urls} - | "group_webtextlike_urls" >> beam.CoGroupByKey() - | beam.FlatMap(filter_by_webtextlike) - ) - - # Optionally clean pages of badwords, boilerpolate text, and duplicate - # spans of sentences. - # Output: url, text - if self.config.clean: - with open(file_paths["badwords"], "r", encoding="utf-8") as f: - badwords = [line.strip() for line in f] - page_content = page_content | "clean_pages" >> beam.FlatMap(get_clean_page_fn(badwords)) - page_content = remove_duplicate_text(page_content) - - # Optionally filter out non-`language` pages. We do this after cleaning - # since it may change the predominate language. - if self.config.lang != "all": - page_content |= beam.Filter(is_language, language=self.config.lang) - - return page_content - - def _build_pcollection(self, unused_pipeline, split, page_content, hashed_url_predicate): - import apache_beam as beam - - def _emit_examples(el): - get_counter_inc_fn(split)("examples") - _, features = el - return ( - features["url"], - { - "url": features["url"], - "text": features["text"], - "content-type": features["content-type"], - "content-length": features["content-length"], - "timestamp": features["timestamp"], - }, - ) - - return page_content | beam.Filter(get_hashed_url_filter_fn(hashed_url_predicate)) | beam.Map(_emit_examples) + def _generate_examples(self, filepaths): + """This function returns the examples in the raw (text) form by iterating on all the files.""" + id_ = 0 + for filepath in filepaths: + logger.info("generating examples from = %s", filepath) + with gzip.open(open(filepath, "rb"), "rt", encoding="utf-8") as f: + for line in f: + if line: + example = json.loads(line) + yield id_, example + id_ += 1 diff --git a/datasets/c4/c4_utils.py b/datasets/c4/c4_utils.py deleted file mode 100644 index 94d8d38d69e..00000000000 --- a/datasets/c4/c4_utils.py +++ /dev/null @@ -1,488 +0,0 @@ -# coding=utf-8 -# Copyright 2020 The TensorFlow Datasets Authors and the HuggingFace Datasets Authors. -# -# Licensed under the Apache License, Version 2.0 (the "License"); -# you may not use this file except in compliance with the License. -# You may obtain a copy of the License at -# -# http://www.apache.org/licenses/LICENSE-2.0 -# -# Unless required by applicable law or agreed to in writing, software -# distributed under the License is distributed on an "AS IS" BASIS, -# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. -# See the License for the specific language governing permissions and -# limitations under the License. - -# Lint as: python3 -"""Utilities for generating the C4 dataset.""" - - -import functools -import gzip -import hashlib -import io -import re -import threading - - -# WET file constants -_PAGE_DELIMITER = "WARC/1.0" -_URL_KEY = "WARC-Target-URI:" -_URL_DATE = "WARC-Date:" -_CONTENT_TYPE = "Content-Type:" -_CONTENT_LEN = "Content-Length:" -_METADATA_PREFIXES = ("WARC", "CONTENT-", "Content-") - -# Filters -_MIN_WORDS_PER_LINE = 5 -_MIN_NUM_SENTENCES = 3 -_MAX_WORD_LENGTH = 1000 -_END_MARKS = (".", "?", "!", '"') -_ELLIPSIS = "..." -_POLICY_SUBSTRINGS = [ - "terms of use", - "privacy policy", - "cookie policy", - "uses cookies", - "use of cookies", - "use cookies", -] - -# Memoized sentence tokenizer. -_SENTENCE_TOKENIZER = None - - -def get_counter_inc_fn(namespace): - import apache_beam as beam - - def counter_inc_fn(counter, amt=1): - beam.metrics.Metrics.counter(namespace, counter).inc(amt) - - return counter_inc_fn - - -def get_hashed_url_filter_fn(predicate_fn): - import tensorflow.compat.v2 as tf - - def filter_fn(el): - url, _ = el - val = int(hashlib.md5(tf.compat.as_text(url).encode("utf-8")).hexdigest(), 16) - return predicate_fn(val) - - return filter_fn - - -def _load_sentence_tokenizer(): - """Returns a sentence tokenization function.""" - # Lock to avoid a race-condition in the creation of the download directory. - with threading.Lock(): - import nltk - - nltk.download("punkt") - return nltk.data.load("nltk:tokenizers/punkt/english.pickle") - - -def _get_sentences(text): - import tensorflow.compat.v2 as tf - - global _SENTENCE_TOKENIZER - if not _SENTENCE_TOKENIZER: - _SENTENCE_TOKENIZER = _load_sentence_tokenizer() - return list(_SENTENCE_TOKENIZER.tokenize(tf.compat.as_text(text))) - - -def _get_sentences_by_line(text, lower=False): - sentences = [] - for line in text.splitlines(): - sentences.append([s.lower() if lower else s for s in _get_sentences(line)]) - return sentences - - -def is_language(page, language, min_probability=0.99): - """Returns True iff text is in `language` with at least `min_probability`.""" - unused_url, features = page - text = features["text"] - - counter_inc_fn = get_counter_inc_fn("detected-lang") - - # Make langdetect predictions deterministic. - import langdetect - - langdetect.DetectorFactory.seed = 0 - try: - predictions = langdetect.detect_langs(text) - except langdetect.lang_detect_exception.LangDetectException: - counter_inc_fn("langdetect-exception") - return False - if not predictions: - counter_inc_fn("page-filtered-nolangpredictions") - return False - best_prediction = predictions[0] - if best_prediction.prob < min_probability: - counter_inc_fn("page-filtered-lowlangdetectconf") - return False - if best_prediction.lang != language: - counter_inc_fn("page-filtered-ignoredlang") - counter_inc_fn("page-filtered-ignoredlang-%s" % (best_prediction.lang)) - return False - counter_inc_fn("page-emited-%s" % best_prediction.lang) - return True - - -def get_clean_page_fn(badwords=None): - """Returns `clean_page` with pre-compiled badword and citation regexes.""" - # Used to filter citation from Wikipedia pages (among others). - citation_regex = re.compile(r"\[\d*\]|\[edit\]|\[citation needed\]") - if badwords: - badwords_regex = re.compile("[^a-z]({})[^a-z]".format("|".join(badwords or []))) - else: - badwords_regex = None - return functools.partial(clean_page, citation_regex=citation_regex, badwords_regex=badwords_regex) - - -def clean_page( - url_and_features, - citation_regex, - badwords_regex=None, - counter_inc_fn=None, - min_words_per_line=_MIN_WORDS_PER_LINE, - min_num_sentences=_MIN_NUM_SENTENCES, - max_word_length=_MAX_WORD_LENGTH, -): - """Cleans a CommonCrawl page, yielding nothing if it should be skipped. - - Cleaning removes lines with no end marks or with too few words. After line - filtering, pages are filtered out if they have too few sentences based on a - simple count of end marks. - - Args: - url_and_features: tuple(string, dict), the url and features of the page. - citation_regex: Regex to use for finding Wikipedia-like citations to filter. - badwords_regex: Regex to use for finding badwords. Default None, which means - don't apply badwords filtering. - counter_inc_fn: function, a function taking the name of a counter to be - incremented and the (optional) amount. Defaults to a beam Metric counter. - min_words_per_line: int, the minimum number of words a line needs to not be - removed. - min_num_sentences: int, the minimum number of sentences a page needs to not - be skipped. - max_word_length: int, the maximum number of characters allowed in a word. - Lines containing a word with too many characters are removed. - Yields: - The url and cleaned text for the page. - """ - url, features = url_and_features - text = features["text"] - - if not counter_inc_fn: - counter_inc_fn = get_counter_inc_fn("clean-page") - - lines = text.splitlines() - valid_lines = [] - num_sentences = 0 - - def line_has_too_long_word(line): - for word in line.split(): - if len(word) > max_word_length: - return True - return False - - for line in lines: - line = line.strip() - if line_has_too_long_word(line): - counter_inc_fn("lines-with-too-long-word") - continue - line = citation_regex.sub("", line) - if not line.endswith(_END_MARKS) or line.endswith(_ELLIPSIS): - counter_inc_fn("lines-no-endmark") - continue - if len(line.split()) < min_words_per_line: - counter_inc_fn("lines-too-short") - continue - line_lower = line.lower() - # Remove documents which contain lorem ipsum - if "lorem ipsum" in line_lower: - counter_inc_fn("filtered-page-loremipsum") - return - # Remove "javascript must be enabled" notices - if "javascript" in line_lower: - counter_inc_fn("lines-javascript") - continue - # Remove docs which probably contain javascript code - if "{" in line: - counter_inc_fn("filtered-page-squigglybracket") - return - # Remove policy lines - if any(p in line_lower for p in _POLICY_SUBSTRINGS): - counter_inc_fn("lines-policy") - continue - # If any badword appears on its own in the line, skip this doc - if badwords_regex: - badwords_found = badwords_regex.search(line_lower) - if badwords_found is not None: - counter_inc_fn("filtered-page-badword") - return - num_sentences += len(_get_sentences(line)) - valid_lines.append(line) - counter_inc_fn("lines-valid") - - if num_sentences < min_num_sentences: - counter_inc_fn("filtered-page-toofewsentences") - return - counter_inc_fn("emitted-clean-pages") - features["text"] = "\n".join(valid_lines).strip() - yield url, features - - -def _hash_line(line): - import tensorflow.compat.v2 as tf - - m = hashlib.md5() - m.update(tf.compat.as_text(line).encode("utf-8").strip().lower()) - return m.hexdigest() - - -def _emit_url_to_lines(page): - """Emits url to all (lower-cased, hashed) lines.""" - url, features = page - text = features["text"] - for line in text.split("\n"): - yield _hash_line(line), url - - -def _emit_line_to_urls(el, counter_inc_fn): - """Emits (hashed) line to all but one url.""" - import tensorflow.compat.v2 as tf - - line, urls = el - # Materialize urls as a list. - urls = list(urls) - # Hash urls and sort to have a consistent, but unbiased, selection when the - # same urls exist for multiple lines. - skip_url = min(urls, key=lambda x: hashlib.md5(tf.compat.as_text(x).encode("utf-8")).hexdigest()) - for url in urls: - if url != skip_url: - yield url, line - counter_inc_fn("emitted-line-duplicate", amt=len(urls) - 1) - - -def _remove_lines_from_text(el, counter_inc_fn, min_num_sentences=_MIN_NUM_SENTENCES): - """Removes matching lines from the page. - - Process the result of a join containing a single value for 'features' and zero - or more values for 'lines'. Each value in 'lines' is a lower-cased, hashed - line. - - If a line has fewer sentences than `max_window_size`, the full line is - compared for a match. - - Args: - el: `(string, {'features': features_dict, 'lines': [string]})`, - element containing the result of a join on key with both the page text - and lower-cased, hashed lines to remove. - counter_inc_fn: function, a function taking the name of a counter to be - incremented and the (optional) amount. - min_num_sentences: int, the minimum number of sentences a page needs to not - be skipped. - - Yields: - url: The URL of the page. - features: The page features with lines removed from text. - """ - url, join_values = el - features = join_values["features"] - - assert len(features) == 1, "Invalid page count (%d) for %s" % (len(features), url) - features = features[0] - text = features["text"] - lines_to_remove = set(join_values["lines"]) - new_lines = [] - hashed_lines = set() - for line in text.split("\n"): - hashed_line = _hash_line(line) - if hashed_line in lines_to_remove: - counter_inc_fn("filtered-lines-duplicate") - elif hashed_line not in hashed_lines: - new_lines.append(line) - hashed_lines.add(hashed_line) - new_text = "\n".join(new_lines) - if len(_get_sentences(new_text)) < min_num_sentences: - counter_inc_fn("filtered-doc-toofewsentences") - return - new_features = features.copy() - new_features["text"] = new_text - yield (url, new_features) - - -def remove_duplicate_text(pages): - """Utility to remove duplicate lines across text documents.""" - # Output: url, lines - import apache_beam as beam - - counter_inc_fn = get_counter_inc_fn("dedupe-lines") - lines_to_remove = ( - pages - | beam.FlatMap(_emit_url_to_lines) - | "group_sentences" >> beam.GroupByKey() - | beam.FlatMap(_emit_line_to_urls, counter_inc_fn=counter_inc_fn) - ) - - # Output: url, text - final_docs = ( - {"features": pages, "lines": lines_to_remove} - | "group_features_and_lines_by_url" >> beam.CoGroupByKey() - | beam.FlatMap(_remove_lines_from_text, counter_inc_fn=counter_inc_fn) - ) - - return final_docs - - -def split_wet_file(wet_file_path, counter_inc_fn=None): - """Split a WET file into separate pages.""" - from absl import logging - - logging.info("Splitting file: %s", wet_file_path) - if not counter_inc_fn: - counter_inc_fn = get_counter_inc_fn("split-wet-file") - counter_inc_fn("wet-file") - - import apache_beam as beam - - with beam.io.filesystems.FileSystems.open(wet_file_path) as f, gzip.GzipFile(fileobj=f) as g: - url = None - content = None - content_len = None - content_type = None - timestamp = None - - def _maybe_get_page(): - """Generate a (url, {features}) page.""" - if not url and url is not None: - counter_inc_fn("page-filtered-nourl") - if not content and content is not None: - counter_inc_fn("page-filtered-nocontent") - if not content_type and content_type is not None: - counter_inc_fn("page-nocontenttype") - if not content_len and content_len is not None: - counter_inc_fn("page-nocontentlen") - if not timestamp and timestamp is not None: - counter_inc_fn("page-notimestamp") - if content and url: - counter_inc_fn("page-emitted") - return ( - url, - { - "text": "\n".join(content), - "content-type": content_type, - "content-length": content_len, - "timestamp": timestamp, - "url": url, - }, - ) - return None - - for line in io.TextIOWrapper(g, encoding="utf-8"): - line = line.strip() - if not line: - continue - if line == _PAGE_DELIMITER: - page = _maybe_get_page() - if page: - yield page - url = "" - content = [] - content_len = "" - content_type = "" - timestamp = "" - - if line.startswith(_URL_KEY): - url = line[len(_URL_KEY) :].strip() - - if line.startswith(_URL_DATE): - timestamp = line[len(_URL_DATE) :].strip() - - if line.startswith(_CONTENT_TYPE): - content_type = line[len(_CONTENT_TYPE) :].strip() - - if line.startswith(_CONTENT_LEN): - content_len = line[len(_CONTENT_LEN) :].strip() - - if line.startswith(_METADATA_PREFIXES): - continue - - content.append(line) - - page = _maybe_get_page() - if page: - yield page - - -def dedupe_urls(el): - """Returns the first value for a given URL.""" - counter_inc_fn = get_counter_inc_fn("dedupe-urls") - url, vals = el - cnt = 0 - v = None - for v in vals: - cnt += 1 - counter_inc_fn("filtered-url-duplicate", cnt - 1) - counter_inc_fn("unique-url") - return url, v - - -def is_valid_length(el, max_length=1.9e5): - """Returns False iff page's text is too long.""" - counter_inc_fn = get_counter_inc_fn("is-valid-length") - _, page = el - if len(page["text"]) > max_length: - counter_inc_fn("filtered-page-contenttoolong") - return False - counter_inc_fn("valid-length") - return True - - -def is_realnews_domain(el, realnews_domains): - """Returns False iff page's (sub)domain is not allowed.""" - import tldextract - - counter_inc_fn = get_counter_inc_fn("is-realnews-domain") - url, _ = el - ext = tldextract.extract(url) - main_domain = ext.domain + "." + ext.suffix - if main_domain not in realnews_domains: - counter_inc_fn("filtered-url-invaliddomain") - return False - allowed_subdomains = realnews_domains[main_domain] - if isinstance(allowed_subdomains, list) and ext.subdomain not in allowed_subdomains: - counter_inc_fn("filtered-url-invalidsubdomain") - return False - counter_inc_fn("realnews-domain") - return True - - -def filter_by_webtextlike(el): - """Yields only pages with a matching WebText-like URL.""" - counter_inc_fn = get_counter_inc_fn("filter-by-webtextlike") - url, join_values = el - text = join_values["text"] - webtextlike = join_values["webtextlike_urls"] - if not webtextlike: - counter_inc_fn("filtered-url-notwebtextlike") - return - if not text: - counter_inc_fn("missing-webtextlike") - return - assert len(text) == 1 - counter_inc_fn("found-webtextlike") - yield url, text[0] - - -def normalize_url(el): - import tensorflow.compat.v2 as tf - - url, val = el - url = tf.compat.as_text(url) - url = re.sub(r"https?:\/\/(www\.)?", "", url) - url = re.sub(r"\?(utm_|ref|feed).*", "", url) - url = url.rstrip("/") - return url, val From f369c9f2a48b8a2291c7468669b8312b5c6ab6a8 Mon Sep 17 00:00:00 2001 From: Quentin Lhoest Date: Thu, 1 Jul 2021 11:44:26 +0200 Subject: [PATCH 02/19] add infos --- datasets/c4/c4.py | 26 ++++++-------------------- datasets/c4/datasets_infos.json | 1 + 2 files changed, 7 insertions(+), 20 deletions(-) create mode 100644 datasets/c4/datasets_infos.json diff --git a/datasets/c4/c4.py b/datasets/c4/c4.py index 095671070cf..f88959ea5a3 100644 --- a/datasets/c4/c4.py +++ b/datasets/c4/c4.py @@ -1,19 +1,3 @@ -# coding=utf-8 -# Copyright 2020 The TensorFlow Datasets Authors and the HuggingFace Datasets Authors. -# -# Licensed under the Apache License, Version 2.0 (the "License"); -# you may not use this file except in compliance with the License. -# You may obtain a copy of the License at -# -# http://www.apache.org/licenses/LICENSE-2.0 -# -# Unless required by applicable law or agreed to in writing, software -# distributed under the License is distributed on an "AS IS" BASIS, -# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. -# See the License for the specific language governing permissions and -# limitations under the License. - -# Lint as: python3 """C4 dataset based on Common Crawl.""" @@ -32,8 +16,8 @@ Based on Common Crawl dataset: "https://commoncrawl.org". This is the processed version of Google's C4 dataset by AllenAI. - """ + _CITATION = """ @article{2019t5, author = {Colin Raffel and Noam Shazeer and Adam Roberts and Katherine Lee and Sharan Narang and Michael Matena and Yanqi Zhou and Wei Li and Peter J. Liu}, @@ -44,6 +28,7 @@ eprint = {1910.10683}, } """ + _URL = "https://github.com/allenai/allennlp/discussions/5056" _VARIANTS = ["en", "realnewslike", "en.noblocklist", "en.noclean"] @@ -88,11 +73,12 @@ def _split_generators(self, dl_manager): _DATA_URL.format(name=self.config.name, split=split, index=index, n_shards=n_shards) for index in range(n_shards) ] - downloaded_files = dl_manager.download(data_urls) + train_downloaded_files = dl_manager.download(data_urls["train"]) + validation_downloaded_files = dl_manager.download(data_urls["train"]) return [ - datasets.SplitGenerator(name=datasets.Split.TRAIN, gen_kwargs={"filepaths": downloaded_files["train"]}), + datasets.SplitGenerator(name=datasets.Split.TRAIN, gen_kwargs={"filepaths": train_downloaded_files}), datasets.SplitGenerator( - name=datasets.Split.VALIDATION, gen_kwargs={"filepaths": downloaded_files["validation"]} + name=datasets.Split.VALIDATION, gen_kwargs={"filepaths": validation_downloaded_files} ), ] diff --git a/datasets/c4/datasets_infos.json b/datasets/c4/datasets_infos.json new file mode 100644 index 00000000000..dfb882a7201 --- /dev/null +++ b/datasets/c4/datasets_infos.json @@ -0,0 +1 @@ +{"en": {"description": "A colossal, cleaned version of Common Crawl's web crawl corpus.\n\nBased on Common Crawl dataset: \"https://commoncrawl.org\".\n\nThis is the processed version of Google's C4 dataset by AllenAI.\n\n", "citation": "\n@article{2019t5,\n author = {Colin Raffel and Noam Shazeer and Adam Roberts and Katherine Lee and Sharan Narang and Michael Matena and Yanqi Zhou and Wei Li and Peter J. Liu},\n title = {Exploring the Limits of Transfer Learning with a Unified Text-to-Text Transformer},\n journal = {arXiv e-prints},\n year = {2019},\n archivePrefix = {arXiv},\n eprint = {1910.10683},\n}\n", "homepage": "https://github.com/allenai/allennlp/discussions/5056", "license": "", "features": {"text": {"dtype": "string", "id": null, "_type": "Value"}, "timestamp": {"dtype": "string", "id": null, "_type": "Value"}, "url": {"dtype": "string", "id": null, "_type": "Value"}}, "post_processed": null, "supervised_keys": null, "task_templates": null, "builder_name": "c4", "config_name": "en", "version": {"version_str": "0.0.0", "description": null, "major": 0, "minor": 0, "patch": 0}, "splits": {"train": {"name": "train", "num_bytes": 828589180707, "num_examples": 364868892, "dataset_name": "c4"}, "validation": {"name": "validation", "num_bytes": 828589180707, "num_examples": 364868892, "dataset_name": "c4"}}, "download_checksums": {"https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00000-of-01024.json.gz": {"num_bytes": 319308785, "checksum": "8ef8d75b0e045dec4aa5123a671b4564466b0707086a7ed1ba8721626dfffbc9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00001-of-01024.json.gz": {"num_bytes": 318039285, "checksum": "b945059cd1a343cabe311881b7840a6f0363f570e745a0eff0e687e266f6b55d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00002-of-01024.json.gz": {"num_bytes": 319748667, "checksum": "2967dc7e587ced6ecb9ba617ad2d4c44901467969de5bf5b0f5a9e5b70555d75"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00003-of-01024.json.gz": {"num_bytes": 318564193, "checksum": "b79d9abef5741578929be0d59db9ca652a8276207ef18a944b7a5f11fef5beb6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00004-of-01024.json.gz": {"num_bytes": 318579884, "checksum": "cd9f98eac2bc6062f55d9a36bd744cc924a78ea2fd998830e0034e4456f5d014"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00005-of-01024.json.gz": {"num_bytes": 318003681, "checksum": "8ac5907a54dbc7ab9c14624448c7c3f6afed33af9d0a855f1eae955e62e255b9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00006-of-01024.json.gz": {"num_bytes": 318495137, "checksum": "8fd9b9a4b74c9414466b245ebda7db041e7bd8603971de51b5db782bd758aac7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00007-of-01024.json.gz": {"num_bytes": 318417273, "checksum": "41dd377a1ba6b72eab0260c39c626fe45ab6b649d42d57b311d3ba21a0337cd0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00008-of-01024.json.gz": {"num_bytes": 318131845, "checksum": "64da652c235f089a0b52f6db5883ef5f1e9c31edc4c950332b34dd12439c99a5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00009-of-01024.json.gz": {"num_bytes": 318185592, "checksum": "807a548efbb10153c9eff0df5733a97a1b51ab1743242530de1b02a8ea17ace7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00010-of-01024.json.gz": {"num_bytes": 319045292, "checksum": "3bd0f6f664069c3bd964ce48ceae60ba47b55b54745a4b00c207bdb3a1926b17"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00011-of-01024.json.gz": {"num_bytes": 319686980, "checksum": "5baa0c010083459ba58e34b4e93bb758caa878f7db6fba0528921329fa1a6cc5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00012-of-01024.json.gz": {"num_bytes": 320119088, "checksum": "fdee7442c06856e2c4b7665cc51978e9011b5e0a2112c30dd15bc9e53818842d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00013-of-01024.json.gz": {"num_bytes": 319474856, "checksum": "a4ab3b24087781c3577945492525696e182ffd7ca5265b958f49803a02867ecf"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00014-of-01024.json.gz": {"num_bytes": 319693210, "checksum": "62215b2451e71b117018ef73570c944aff890624b384c538950b64c37f184c49"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00015-of-01024.json.gz": {"num_bytes": 318427305, "checksum": "9893c9f413a1223e7b535527829bcd6df3219929fb1abf8f2a114dd8f6ea0919"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00016-of-01024.json.gz": {"num_bytes": 318785714, "checksum": "bd0ade8b8a57348952ca31c39efdab538f54c852941a225ccd13d0a7170724e3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00017-of-01024.json.gz": {"num_bytes": 320134331, "checksum": "4132cfff3f5126d9e783191a5ccc34e5d85938bebf0b8489657805277a227202"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00018-of-01024.json.gz": {"num_bytes": 318653930, "checksum": "4675ab1d77da3d676d9743dca15bfce8478498f7738f79816a25ed790d28fa46"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00019-of-01024.json.gz": {"num_bytes": 319468974, "checksum": "1d2f3a6aeb0f6c159295f283d302794cd3eb944cff3fe68691997bb2dc4c7780"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00020-of-01024.json.gz": {"num_bytes": 319109754, "checksum": "b5f26d832a0ec9b0489a27169d94496f5ea33c7fb046868c565c7b5a2407221b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00021-of-01024.json.gz": {"num_bytes": 318514423, "checksum": "428da5a8d4585de16f6b3f30865a5ca7a8d1ddcd3b6002dcc1283368b0c3d60a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00022-of-01024.json.gz": {"num_bytes": 318715623, "checksum": "9bc4812ba5e08c0b2d83cd3804129ba3d77cf84ba3d8828159788ee02e155a51"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00023-of-01024.json.gz": {"num_bytes": 319874293, "checksum": "38843ab4f5c60ed2b9ec0cdc65074eaca454014d5702edd809a266190689d2c3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00024-of-01024.json.gz": {"num_bytes": 318105764, "checksum": "4fa0c7ec94445ea57dcecda7864b1346275e711c9820c2c39dbb9fdb95c97674"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00025-of-01024.json.gz": {"num_bytes": 319122521, "checksum": "0758514fa2e2c133c995c00d5f4abfc14b66582a4eedd0e721bdd95c4632a755"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00026-of-01024.json.gz": {"num_bytes": 318116783, "checksum": "56a73b9a556d6794d9c706e1b1c7e729fa13b711ddc25dd403b110eb5ed857f1"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00027-of-01024.json.gz": {"num_bytes": 320171191, "checksum": "fea1eabb734cda33d72f3d959234a240080b4fd42cc70494814a8429b087f9e1"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00028-of-01024.json.gz": {"num_bytes": 319047090, "checksum": "47d1c385952d6c18c431a7294339a030c213b8832f970ac987965b621c8181a1"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00029-of-01024.json.gz": {"num_bytes": 318705639, "checksum": "3c744d3dd915ceef3a93fd18c3ff5b117fb5118d1ced2089979b6cafc81c4525"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00030-of-01024.json.gz": {"num_bytes": 318327902, "checksum": "7f6959020242fdc841adfc10c102bbe79e2ef8502a09dac8451e0cec6f2add16"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00031-of-01024.json.gz": {"num_bytes": 318990600, "checksum": "e56f29011594c765192c34298558e7227a829313196748f9a16ec34ecdb76d23"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00032-of-01024.json.gz": {"num_bytes": 320451482, "checksum": "9ea843dfd85e449439f3106d657762daff8f326730fefb342455c43cb48144e3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00033-of-01024.json.gz": {"num_bytes": 319878207, "checksum": "2633cdb7b058f126173608897f69add614659b0b21cf54ecc8a2f4a79bc16073"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00034-of-01024.json.gz": {"num_bytes": 318701510, "checksum": "853c4b9ff2d79621ed27a6be826dae198af609d9f9dbd1c2773b778241cf6137"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00035-of-01024.json.gz": {"num_bytes": 318529104, "checksum": "fb50dac3f35cb71472464f511e6b8aee72ded10b3b6896d0d1f74a18ded2b8d3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00036-of-01024.json.gz": {"num_bytes": 318849657, "checksum": "5cef5cfd50cfafd58feb452b85324a3d8198fca48789f0ce69227755e72d8e53"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00037-of-01024.json.gz": {"num_bytes": 319621215, "checksum": "f0b67abf30e2d58d291aa9bcc9c8a03668afe819549802e4e591a261c171d970"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00038-of-01024.json.gz": {"num_bytes": 318135467, "checksum": "991bad578a83294d34a1b11649af07339aa8cb26d49330afa9fcbca0b87942c6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00039-of-01024.json.gz": {"num_bytes": 320131759, "checksum": "abbbc21f81555e94484e6afe1975e13f67af19a820cd6f8d090c987a250bd4fd"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00040-of-01024.json.gz": {"num_bytes": 320214476, "checksum": "48020d2656709899abd2572b3424c0455df3c1089a69fe26b776aeb24f0da0ec"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00041-of-01024.json.gz": {"num_bytes": 319581259, "checksum": "db6fb8db7162ac87ea002c153ef0c54322f24c8f7ec263cfa290ac8c3683b194"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00042-of-01024.json.gz": {"num_bytes": 318100985, "checksum": "d499cba2383b16bb0f26b98416211eabf2599641ecd6708a5ef487692ca9e791"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00043-of-01024.json.gz": {"num_bytes": 317803029, "checksum": "dc6f1ccc3fcce79b16c5157f7125942e351d74744efc593f8372f8a408720340"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00044-of-01024.json.gz": {"num_bytes": 318837063, "checksum": "6170fced793461bd687640a658a085d02f971c2e609f6ff33b90df944fb56409"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00045-of-01024.json.gz": {"num_bytes": 319659188, "checksum": "b2f79e8600815578ec326cfc6c5242c2827cedbfac51772fdcf15ef5d027aa38"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00046-of-01024.json.gz": {"num_bytes": 318771753, "checksum": "e4b4a3e53ee66c280a5e7ee33602ea0e910903748db8c2adbbec4b48bab1580e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00047-of-01024.json.gz": {"num_bytes": 318088661, "checksum": "bf8597fc359d8e9c721fd1d98b8ff3db5c011afd0fec9640670f31c7a7dddb79"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00048-of-01024.json.gz": {"num_bytes": 317777133, "checksum": "369db8e9646b8229a23044a7257c2face97b8e05738f0413b581892876f268e1"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00049-of-01024.json.gz": {"num_bytes": 319329891, "checksum": "5cb2aa0432984b355b0ec6aad92f926b2fb75aea2a0e08b97f4c6a62838e6cc8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00050-of-01024.json.gz": {"num_bytes": 318172322, "checksum": "11a7cc48539ac97eaec87beacef9d9bbb71fc875a0bff0c9ff096044bff46a44"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00051-of-01024.json.gz": {"num_bytes": 318704544, "checksum": "ac2beee992c2b1ae8b1f162054e843e2b971bbd7cec45a0a7a7b7795fcdc7c26"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00052-of-01024.json.gz": {"num_bytes": 320806303, "checksum": "3a591fe9993c3d98a9e7949e98ca215ce164cd313fe53f3ce762c91b5fec7c53"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00053-of-01024.json.gz": {"num_bytes": 320565764, "checksum": "60e67c8e6f3bfdf8b490ecfe62c79a13c5d04d393fbac712a6cda49fd78e883b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00054-of-01024.json.gz": {"num_bytes": 320425170, "checksum": "d69305c853e9e516f5fd4e2a9afb1939d829925f71102d8aa09387ded5d000df"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00055-of-01024.json.gz": {"num_bytes": 318713224, "checksum": "e01737df8097a1526d6c31d37d7aeb1b92c0a7253b39f6964fcc897bf0eba9fd"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00056-of-01024.json.gz": {"num_bytes": 319441227, "checksum": "fe516c8c0a9e59f9f035ac5fdd13e973d25dd6635eee05d648740d3e8c1fc742"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00057-of-01024.json.gz": {"num_bytes": 319821142, "checksum": "7e058ed9072e968e9c8b92f9b50dab318515873cca6c617b544dacab5a2f018e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00058-of-01024.json.gz": {"num_bytes": 318643105, "checksum": "3479dc5a5b111b7f45f87e5a91c433907af97dbe15b9db1637bad666dcbdec40"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00059-of-01024.json.gz": {"num_bytes": 318053548, "checksum": "8208b0943f59b5914fa13d29108ede31a8d8d34bc6d603a2278ab8b80d28b1d0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00060-of-01024.json.gz": {"num_bytes": 317935826, "checksum": "71324b62706aabd6faee682205cdedcd10dad289579b534d0e53f8d9b92bf2c0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00061-of-01024.json.gz": {"num_bytes": 318870698, "checksum": "cdf0abc5804f0991871de48b249e30b666cb96f2254762a570c39904c5780f8e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00062-of-01024.json.gz": {"num_bytes": 318945246, "checksum": "5ac676e16108446bd2980f9601c787eb754811a68e92ab6403c333820a6b9622"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00063-of-01024.json.gz": {"num_bytes": 318827790, "checksum": "a26f7cfe123cfdf3db7687996d0163212e70ff7635872b0754c03cbd5c31213a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00064-of-01024.json.gz": {"num_bytes": 318914155, "checksum": "858a145617a5902ab02bc77e47ee2f036a6211384c4f2285767c7558eb93e245"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00065-of-01024.json.gz": {"num_bytes": 319794084, "checksum": "52742215df5aaca43bed5405a397571efe7c22107ee2caa8c05e3ed229796efa"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00066-of-01024.json.gz": {"num_bytes": 320294453, "checksum": "5b11cd54de0e95a75e53e4e32f72912cb01053d3fb609de6b7a45afafab414d0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00067-of-01024.json.gz": {"num_bytes": 319468309, "checksum": "4c6c69b3eba9bcd6786d7dce893340f2d7093012ead04f3539352beccd2794ef"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00068-of-01024.json.gz": {"num_bytes": 318800742, "checksum": "ce94afc3c612e9de423a412147505ad7757216100becba2677bf5eaf443c4b6f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00069-of-01024.json.gz": {"num_bytes": 319416585, "checksum": "ff3084a3e5a3960425a5c605274684c42fa638f99045527f77e74d165e52b6ea"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00070-of-01024.json.gz": {"num_bytes": 319165846, "checksum": "04c368b05f0ea42b3a51ed9bc0e817894f205c0ecd74084da015158d509ff2a3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00071-of-01024.json.gz": {"num_bytes": 318017381, "checksum": "e8320e9982fa377b07c5b3e8a4451ac143b05ab7a4a03f748034b37fb998bfb0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00072-of-01024.json.gz": {"num_bytes": 318874499, "checksum": "920f8d5ef2cae6bdbd52f724d0952e04146ff29f4aaec4dbf10bef7b66a98f40"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00073-of-01024.json.gz": {"num_bytes": 317890112, "checksum": "06a41bdb7bf0d52e2fe8e71f594de8d36d77880639ffdfb41e883237f76e8a0f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00074-of-01024.json.gz": {"num_bytes": 319201956, "checksum": "e0267d6782d30f1619a82c49c20be1c8b5424e653c093e4652a5c8ed117c6533"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00075-of-01024.json.gz": {"num_bytes": 320575937, "checksum": "42108758abc3c3197e7dca8293eed3800f3e79ceae80d3208d90c7a9fd205594"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00076-of-01024.json.gz": {"num_bytes": 320070510, "checksum": "c904b6e6041e23edeb1d88b7b69f07a339b7ff9835d0c22e0b6c354519369842"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00077-of-01024.json.gz": {"num_bytes": 319042024, "checksum": "1eb2b70ad4d12b7587eeb1ce86477817ad992c08fecafe5ccafc26af6b5657f7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00078-of-01024.json.gz": {"num_bytes": 319997520, "checksum": "070370654960e02f766c10321546b280e9933531b796c252a94999d645f360b2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00079-of-01024.json.gz": {"num_bytes": 320736487, "checksum": "3aa4f007660706563030b590cef9be992c18ba7ec1876210bc92665ec42c4be2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00080-of-01024.json.gz": {"num_bytes": 320082337, "checksum": "3b54eaf407bb593c2b16df99690446f26497530d21cf433a7d525e0eaebe9c3f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00081-of-01024.json.gz": {"num_bytes": 318008114, "checksum": "d01975cdbd4360331b1a0f55e9b7e731d7d9fc70c7cdd0f33f1c772eff7aa03b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00082-of-01024.json.gz": {"num_bytes": 317829809, "checksum": "2a65dd37027fae03819ea5a5f6c3b16d921706ad758442881dc1d15b08bc5048"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00083-of-01024.json.gz": {"num_bytes": 319265318, "checksum": "e14cf18c687f7eb304df6abef7235e263a5736c799d742524205dead2abfb043"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00084-of-01024.json.gz": {"num_bytes": 319166958, "checksum": "1dc3fa8702a4477e3a3128440b68d4cc17e6d2ce7f3c53da28d50a57b8332020"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00085-of-01024.json.gz": {"num_bytes": 320338078, "checksum": "0222db7b1ae14c9b10aacdb05d055d1432b6d035e3937df5640facd242c52aea"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00086-of-01024.json.gz": {"num_bytes": 318941314, "checksum": "55ddf7a27dc91bf8d932a5efec4aa458122ee337f2cb050e2c4b0ae8e770f3a9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00087-of-01024.json.gz": {"num_bytes": 319218368, "checksum": "c61552d76bedbfa750c599a674d6732fb224c8a1e6c6583fca7ccabb20532920"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00088-of-01024.json.gz": {"num_bytes": 318974308, "checksum": "693fae3d50068ec39ad27a14335372c3e1530138cc65931edac5268dd62b7e96"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00089-of-01024.json.gz": {"num_bytes": 318781044, "checksum": "2d90b9318432a2313dfaec542c8b91431505035cca7416a63e3197ab26ad6e75"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00090-of-01024.json.gz": {"num_bytes": 318569651, "checksum": "ee674beda8ed39395e69c899f666990c5190dfad5494867e51fa727e4d38d86a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00091-of-01024.json.gz": {"num_bytes": 319683433, "checksum": "add2489350310ce500dde6637518c747c156f95f079a34367842bf875a8fdf5b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00092-of-01024.json.gz": {"num_bytes": 318734793, "checksum": "5cfd4f25e9effaa2f7381bfcf49f9263e10619811aeaa32a77d3fdfc13517006"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00093-of-01024.json.gz": {"num_bytes": 319161014, "checksum": "bed8774909bba5ac656ebaad6e5cacca9e5ea12c80a41fd5689e6798c74f3c89"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00094-of-01024.json.gz": {"num_bytes": 320143246, "checksum": "96abe370925f6962b4e75da530b5234eec21fab820d6cb02ae59b6070ab63859"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00095-of-01024.json.gz": {"num_bytes": 319707377, "checksum": "37b68cd632e8f86f364fd61c9581f48ad7602122b7f33c55103ac5bd727f015d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00096-of-01024.json.gz": {"num_bytes": 320159279, "checksum": "fb93c7467f0361c1d4b186d5e25f4bce4f237adb33b4e0ef56f57831b4f97f81"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00097-of-01024.json.gz": {"num_bytes": 319841818, "checksum": "7f4d4a9536e37a0c2b9a1806fcb472784ff4d3840aa57e9603e74233b877fbac"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00098-of-01024.json.gz": {"num_bytes": 321001731, "checksum": "239b9fefebe3815c8d785bd48086013d1a6dcd76c142786502c674d2d874fb11"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00099-of-01024.json.gz": {"num_bytes": 319475885, "checksum": "0a610d25a547839b8b6dfc2fd964e3ca64b23f0edc52d311c89dcb5e8a44a2c5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00100-of-01024.json.gz": {"num_bytes": 319515329, "checksum": "f24d17cbd27296a15f51b9edc713c74a6997bbe82267403fdb6282404c2f4e6d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00101-of-01024.json.gz": {"num_bytes": 318803422, "checksum": "54b8b0c72ffa325abce3dd15bdcd0856b5594500c37f4bc6a6327721ba91e4bc"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00102-of-01024.json.gz": {"num_bytes": 320934688, "checksum": "24b99b4afa3b631a718a487d679026c91e2c936132df01df969e3173b49e091f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00103-of-01024.json.gz": {"num_bytes": 319835920, "checksum": "a2c68654ba81fa55bc24beb4319c8905f7b532fcb6793a6a311344d4f98a82b9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00104-of-01024.json.gz": {"num_bytes": 319402378, "checksum": "27764d82793e35b8a7be3a3fb0470d018243a89283b5501c0b76056de1879389"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00105-of-01024.json.gz": {"num_bytes": 320100928, "checksum": "3bb2499337ebe52b63a5f20ec6ca6283971937962439699bd5e483cf80fed02a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00106-of-01024.json.gz": {"num_bytes": 318707110, "checksum": "83510312aa188431a8dda8746903d70cfc7ffdf5437e44c1f74b7670b78bd52b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00107-of-01024.json.gz": {"num_bytes": 319904239, "checksum": "40d42c39dea8e4898efba1886aa3be67742501f7a51d5bc635b03a2c6c2bd63e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00108-of-01024.json.gz": {"num_bytes": 320050265, "checksum": "88ce3ddae88e8024e76614a1b701c157f66fe39c6f0852a4869c5063876f6e87"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00109-of-01024.json.gz": {"num_bytes": 318053254, "checksum": "865a124b663037f36a5738f25c82f8bea2ab54d4bbf8255ca0d1d00d76f8b250"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00110-of-01024.json.gz": {"num_bytes": 319794699, "checksum": "b17e210c8ceef98219ee12eba5dddd2001ded0d417c93955743c238360d96e76"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00111-of-01024.json.gz": {"num_bytes": 318761540, "checksum": "05be318a057bb33bf9d7faca58569cdb0880fe8eeb0fc3f57f5999d5f2af55fd"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00112-of-01024.json.gz": {"num_bytes": 319121509, "checksum": "858dce8e43b06a0c1e26ab3e4f109814b6cc50c6b0e4d146ec79fda001ad471d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00113-of-01024.json.gz": {"num_bytes": 317916736, "checksum": "2e3968e48cb15a3326457d5a6ad49838d20d38c8138c529eee51f94e6bf269e4"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00114-of-01024.json.gz": {"num_bytes": 319319540, "checksum": "b72dc8207d93848f4fcb265b3e618d0eb8649445f7b9187c5165f4adec3e0708"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00115-of-01024.json.gz": {"num_bytes": 318863372, "checksum": "85ef0bf3cb12bc2fede4158853ed2259dff5d25adf99b43e8c35d7e0b9d4fdd3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00116-of-01024.json.gz": {"num_bytes": 318898370, "checksum": "a0c82c8b48e086be7396338cdda0fed52e8c4753f04fd086b9472c1bedfb150c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00117-of-01024.json.gz": {"num_bytes": 318153138, "checksum": "531d5d03fd8099806d92fbff2a48a0d68dcf46325e732e698e9c142902d152f5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00118-of-01024.json.gz": {"num_bytes": 318966511, "checksum": "24b1c5ebbd07d50043be0d5d5c5427e042bdc53280825260226a2823e9b7546b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00119-of-01024.json.gz": {"num_bytes": 318733748, "checksum": "ce1fb1192b770e625430798aee94c93bd748ed474ff815a7f95cadebb826161a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00120-of-01024.json.gz": {"num_bytes": 319672996, "checksum": "4c2a6874921ac4a626a9c8ac4c6e91dae58f1f5b52e79124b3abf254b7433119"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00121-of-01024.json.gz": {"num_bytes": 318779046, "checksum": "029d3ab92f3e1724e3708790148e63b4c211d2ddfd04e3d194b24145e97c922a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00122-of-01024.json.gz": {"num_bytes": 320861175, "checksum": "4bb595140e5cf92147f99b58d236634ddfafbc0b160b4c88b337255482611ced"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00123-of-01024.json.gz": {"num_bytes": 318338141, "checksum": "d508261be287fa3d27e5f44524e22870269054213b61011ee8a6728a77910cc0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00124-of-01024.json.gz": {"num_bytes": 317655056, "checksum": "7612cb9fdd9f4b3a4f8958087ace120d4a73cf26bd16289bb20fc871f5744f2c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00125-of-01024.json.gz": {"num_bytes": 317524610, "checksum": "049ebe4971811bb1fdcfd10cc264b2074b3ace18536340644e718dcc3cf3affb"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00126-of-01024.json.gz": {"num_bytes": 317902192, "checksum": "d97bddf003b8f647c587fe9a9a9aed75ea604478e0b550d501ad7f07b6061b86"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00127-of-01024.json.gz": {"num_bytes": 319243191, "checksum": "6da4c882f88816a452af54ed217f84d6e4601c11a8e33bd47c49c0a1ea04f49a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00128-of-01024.json.gz": {"num_bytes": 318045852, "checksum": "ea43f63e6ef3bb5723ce75bb51f7183a525d8ccb00c93f49aaf2d9b560f7bdbb"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00129-of-01024.json.gz": {"num_bytes": 318436174, "checksum": "72ceb525367d6e8d1c0fca94d99d4fe5353ead08a5d52bf00e30e3b596fa90a2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00130-of-01024.json.gz": {"num_bytes": 319017217, "checksum": "92f1b2687bee78441eeb4e05bbec2a491469b23c3aad0d951fbbe35a3c27998a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00131-of-01024.json.gz": {"num_bytes": 319237739, "checksum": "0fd07585a82b7d71ddabbc315195c84e2fa78a8319de7dea971cfcc9b38707b7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00132-of-01024.json.gz": {"num_bytes": 318123742, "checksum": "c9f5604ca28ea2a9ae5267db50f6e3d1e576841abe840134b3817f370c057073"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00133-of-01024.json.gz": {"num_bytes": 319009751, "checksum": "7ec982de577e0eeff57dc60346ce35a7b35b3c4f037987316cfc071b0ed58a87"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00134-of-01024.json.gz": {"num_bytes": 319750057, "checksum": "2619d265d76d82f6b84e2686371e5b6d6c08058cbd5765dd2906af9f549af092"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00135-of-01024.json.gz": {"num_bytes": 319068231, "checksum": "5e1bf5b09f2cd132a7747116442d6f26ce0002eaeb9f56fb02bc00e3abee8716"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00136-of-01024.json.gz": {"num_bytes": 317800994, "checksum": "80ebbf64fbd91215da553e3a8d9442380cee6c3b09fbbf8353a0817993d15862"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00137-of-01024.json.gz": {"num_bytes": 318954070, "checksum": "3b5d2ccafe526a19c52ac0fee50109b6a95ac3c8f7f2272a9a0302c4219e82f7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00138-of-01024.json.gz": {"num_bytes": 318452853, "checksum": "2dd88569a62003383a3bf70d68143f16f234535469bdc8ab01a8764f6babb5fb"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00139-of-01024.json.gz": {"num_bytes": 320013821, "checksum": "f32ca62f6a9d2c8a72901e6f2c08880c2d1907f52beb4e8fdc30f4c02c7ad10b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00140-of-01024.json.gz": {"num_bytes": 319510423, "checksum": "7799838d8019d7cd71a505951f155bdfb862b4a3b3b77e182c706a624617169d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00141-of-01024.json.gz": {"num_bytes": 318339814, "checksum": "1601f6dbcbf4e7f1db119b232e862f3c9fe29e9abe5827177458079299ed511e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00142-of-01024.json.gz": {"num_bytes": 318438444, "checksum": "71d891be156e1b608733a3abe8f8dab7a6213c02931117b99889bc3fe8329d38"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00143-of-01024.json.gz": {"num_bytes": 319413540, "checksum": "88fb2e7c3d426a6bb5775041658c07005a469306af0d97df7d68f148b64cbfe8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00144-of-01024.json.gz": {"num_bytes": 319901095, "checksum": "2734ff57f4265653b0b1f292f513017ba791c3091cf8ac0bbf6d75d0074e3386"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00145-of-01024.json.gz": {"num_bytes": 318500183, "checksum": "da2e6747f7230af5941c6bee262a606b4f7792da359dbf7516d82d8301cdf90f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00146-of-01024.json.gz": {"num_bytes": 319315120, "checksum": "6daac97153d51addc8b1e43b686e3d641666df3a106270a141d734079db2ad35"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00147-of-01024.json.gz": {"num_bytes": 320621434, "checksum": "fb2584e0ce366ad30c8110591484b84798e9f06e8a27cd864e7800b8d5e2d225"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00148-of-01024.json.gz": {"num_bytes": 318269045, "checksum": "1c963c0ceb6cd776822352b186ae7e3d829ef334efcba0fbdd9182dde4deed05"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00149-of-01024.json.gz": {"num_bytes": 318576426, "checksum": "6a21397e0104c7fe0fcd9f1d43a8e546000596d896a95eb9b6c4ab92235e6a49"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00150-of-01024.json.gz": {"num_bytes": 318447048, "checksum": "075b113a73e6e21d7cac49391ee559ee8aaa2bb3338f709017077a4007a7bbb5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00151-of-01024.json.gz": {"num_bytes": 315388730, "checksum": "bd47e3ac0209676d8a32490eb20ca8c07ca3c45c2beb88dae18b5c8d925f349a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00152-of-01024.json.gz": {"num_bytes": 319701880, "checksum": "241d9cf003f49d95168ebdeccd8209230507d4dfd0d170fa1b57d2355240a95d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00153-of-01024.json.gz": {"num_bytes": 318370254, "checksum": "3aa86900a749224dfed8a67960c166e43c3b9ef3ac7b49d28129b496c7193e30"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00154-of-01024.json.gz": {"num_bytes": 320064875, "checksum": "3160c723cea6717fa9f5a9eb627d76107040d084a64106973099fa0e8de48758"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00155-of-01024.json.gz": {"num_bytes": 318089754, "checksum": "5b6e76a85bb1093eaba698864a54a938329b04494f9f72c3c3bbb155174da5e4"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00156-of-01024.json.gz": {"num_bytes": 320049467, "checksum": "cc013e8aa7c1cf7fc28ebecc64d893d03b092a09d725b5e626851de0b311c814"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00157-of-01024.json.gz": {"num_bytes": 319931950, "checksum": "2a27b4c29455bcd813a84aa3a54100d16cb6bfed25171aa3c552ea452ae569e2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00158-of-01024.json.gz": {"num_bytes": 319963615, "checksum": "e477f769ea1513cf607932a29d793fdf1722cdea757e00c814dad594329cfac7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00159-of-01024.json.gz": {"num_bytes": 319000491, "checksum": "ff5d09415753c2aa4b51196e8f4bd6c77ba100ab281314aede118f501565cea2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00160-of-01024.json.gz": {"num_bytes": 319069618, "checksum": "e08c35aef8a20dccad80f6bb1579d6d2ce80113c8bf8459730c69fb7048c3cc9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00161-of-01024.json.gz": {"num_bytes": 318750642, "checksum": "13eef84873b58e29894f9bf68a4de72a530c1bfc80a5654262fe71420292b8ad"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00162-of-01024.json.gz": {"num_bytes": 319847814, "checksum": "a8579c6bcc906fe018881a8474724576c3d0f7f1787f1568b79e5accbd9f962c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00163-of-01024.json.gz": {"num_bytes": 320370365, "checksum": "b97a74837ab9f659c13dcb4deb53c600584beb9e5ceed29e99974c4953f644c9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00164-of-01024.json.gz": {"num_bytes": 319894618, "checksum": "9b63afffa2b84c91b749991ddb384399f1d408bd7b6b643e7329e49531ce9a53"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00165-of-01024.json.gz": {"num_bytes": 320166197, "checksum": "5b2414477dc4e2b080b34f3b98672bfe3de6028e7ad83c323a7dd1ee08c05a0b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00166-of-01024.json.gz": {"num_bytes": 319612575, "checksum": "2cda682db53000c14fcb5d251bae4f50c8c4159348f8594c3ef020260f277a99"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00167-of-01024.json.gz": {"num_bytes": 319183884, "checksum": "5c406d7a8a404436039fde7c2019f0174ff8855caff319fa62bb7960d341b41a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00168-of-01024.json.gz": {"num_bytes": 319396348, "checksum": "df6a422d57a2e1443d10d61b13ab2c5227734195c82b43e1ead2db723cdea293"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00169-of-01024.json.gz": {"num_bytes": 319452933, "checksum": "81c81138e7163072e3779dd10ea8af7dff12b705fa008665298e08cfc2699f03"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00170-of-01024.json.gz": {"num_bytes": 317748609, "checksum": "6586ae8862b8ac925f424afb6ba779e95a147323fb83fc8c4bb0813877b17718"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00171-of-01024.json.gz": {"num_bytes": 319052376, "checksum": "8b3cd21d8ffbe963ce935ef9e0b6efc45f4d5abab703fdfed19a1309b700dca8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00172-of-01024.json.gz": {"num_bytes": 319068859, "checksum": "a42f5f5a10bfc84d51dd0855166959462faccd6a182af4c5d2115ff9995f5324"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00173-of-01024.json.gz": {"num_bytes": 319142377, "checksum": "e26514c5d6cea27c0cf7fcc1daadfa6f218ef9e62039c6d6fccfc31660c0c96f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00174-of-01024.json.gz": {"num_bytes": 319134484, "checksum": "75349aa8c734ed894965500eab2fdf59657a63e40e5a53e822ef1e5a12838a02"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00175-of-01024.json.gz": {"num_bytes": 318330467, "checksum": "a3d0d14b28a5a3cc559d6d89e2ec09e49e92aa189e44e68dbb4ea47978e1eca1"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00176-of-01024.json.gz": {"num_bytes": 318584643, "checksum": "dd68b42e5bfc656b71fe5701bacb929edae84055131f1dd65bbf3f3ad734e57d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00177-of-01024.json.gz": {"num_bytes": 319275087, "checksum": "05a8ff159006241cf938ef27b292f65906158ac25ac28919aa6761eaa634052f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00178-of-01024.json.gz": {"num_bytes": 318490550, "checksum": "a3aa38083c85baada29b207240bcca1a0d562a93971b420428d039092e58bd31"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00179-of-01024.json.gz": {"num_bytes": 319083249, "checksum": "12858fecd1dec728eba2c8c4311b17e4f2ac1fdb27c23e9adcd9258c5c4fc777"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00180-of-01024.json.gz": {"num_bytes": 319752094, "checksum": "67e968cb8d3ebec2f68eddfc539ea7402aa72c9274034494a43ea7d207b69a88"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00181-of-01024.json.gz": {"num_bytes": 320476195, "checksum": "c1bd59eb7ca799e31bf037dc7c087c1ad94e4f88a4f12427c454510d97e1c803"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00182-of-01024.json.gz": {"num_bytes": 318538551, "checksum": "dbe7205a1919dca9d6936158d5653a20d239f2e547ec73280956da4f8c609220"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00183-of-01024.json.gz": {"num_bytes": 319620265, "checksum": "46f9e603e04040b59df8da6ee01d1c30588aa7233a00526d6f0fd84c4172ba93"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00184-of-01024.json.gz": {"num_bytes": 318301621, "checksum": "880a02eabae231da388a5782a7194eef0d0211c2d1314db0c56d740647a114c9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00185-of-01024.json.gz": {"num_bytes": 320515340, "checksum": "f522147aed30ebb3ab352c92a9dd24cd2e8b93df1d4c4a6284d89ceaa2858509"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00186-of-01024.json.gz": {"num_bytes": 318374733, "checksum": "5005f1c42038769e225a626a88c10bd4f6af98dcc14deed475954b00c088bc53"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00187-of-01024.json.gz": {"num_bytes": 319116182, "checksum": "cbd7e0f486c6dac13090cd344337da1c336973e7ec75e32b0bd5b18b98f24bf8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00188-of-01024.json.gz": {"num_bytes": 318981305, "checksum": "064ce8c30b7a960b20720c133c3dd3281d27752a66def44d5133ff8f1b8279e9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00189-of-01024.json.gz": {"num_bytes": 317036462, "checksum": "acc052da4501691fdd28f269c633ed826840f2634be49b5e2c5e1273de0cb4a8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00190-of-01024.json.gz": {"num_bytes": 318061662, "checksum": "5a436e97c59b8636ca5081b71ca6fe8f8a3a99dd3f426c79edb2bf53345ee810"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00191-of-01024.json.gz": {"num_bytes": 318556228, "checksum": "2eebc89381ff78ae63f311c98b07853cefcc42fbcc210995095d568a6ff70ead"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00192-of-01024.json.gz": {"num_bytes": 317987733, "checksum": "99de46c4702c06a2303262b185b92fad82e12e189c923d5b76d9d8f96faabfa5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00193-of-01024.json.gz": {"num_bytes": 320294532, "checksum": "bccb7d8fc34d6cd6eb41e2a1c6234596b00a5517fdca7c47562fdee0e675377c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00194-of-01024.json.gz": {"num_bytes": 320852679, "checksum": "bb1e7768a57145fdbca7957ed964648d1deab5edc5dfad4722a81ad411c5e0f9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00195-of-01024.json.gz": {"num_bytes": 319016077, "checksum": "ac520468a5bd933dbac1aa5f7f21ba276bdce15abf99963ef9d73af294e81e70"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00196-of-01024.json.gz": {"num_bytes": 319289881, "checksum": "9eec5740115ab52ce98ac9efbed4fa1c5c06787fe93b4b28f6a1e4df06272870"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00197-of-01024.json.gz": {"num_bytes": 320180232, "checksum": "07a03763b84b4a86b4f71d725927d62c40925823ee454122a00fdb625ddb3a22"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00198-of-01024.json.gz": {"num_bytes": 320004709, "checksum": "a1b250b01289fdaf6dcd997ef31c59c580f81f961aa0fd88ae0d175bd07c02ab"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00199-of-01024.json.gz": {"num_bytes": 321006991, "checksum": "650e57c3dbbf4ed929da8c6c5d78f35fbac4644722a84d98f93342a8d33b2140"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00200-of-01024.json.gz": {"num_bytes": 317913111, "checksum": "42caf6dee42bd73d9e4bf0c7bb16383caa936b2e0a913489b9f0aef57b6004cb"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00201-of-01024.json.gz": {"num_bytes": 317897148, "checksum": "990974a82de2b1c27465f6d097d7a5718c5ff334271e722ab3736e7aa5b89d4b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00202-of-01024.json.gz": {"num_bytes": 319510250, "checksum": "8467066f2417af774363d4984a37968a0189adfe3a581723eab15004930e621a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00203-of-01024.json.gz": {"num_bytes": 319762388, "checksum": "4e7e20980dea2d5e77f380b24580f0df9319a0d1d73ec319e17d8cbe044e53de"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00204-of-01024.json.gz": {"num_bytes": 317418128, "checksum": "2c027c5225ea7ce3c31f5f32dda12b7c892c6fdc9c52da6d0af749171cdce738"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00205-of-01024.json.gz": {"num_bytes": 320157174, "checksum": "d953e79c60be0e2c3b072c2186a845a351392ef395fa95135f47e6b8491c6f88"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00206-of-01024.json.gz": {"num_bytes": 320459080, "checksum": "bc70c34931942ca143f7eb555e86458afcc36110aa9559151f31d781969d4458"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00207-of-01024.json.gz": {"num_bytes": 317361718, "checksum": "fad5ebd7a81bb737e12e9d4c803aea1a9e905d43a3fa87cace32a64eef01e8e3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00208-of-01024.json.gz": {"num_bytes": 319976693, "checksum": "21381c727d945d8d3b4a275e3622bce64b07ed87d7f2371ac28b5d2023359cae"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00209-of-01024.json.gz": {"num_bytes": 319550585, "checksum": "8b74e5f1780c4bf12936ac3a86be7a3d11287866522da8275aa4232c1e3d8898"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00210-of-01024.json.gz": {"num_bytes": 319574289, "checksum": "1594bd49cde9641b49a1ad9373a53e10d65440000363f7532a7d326d17c44236"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00211-of-01024.json.gz": {"num_bytes": 320615302, "checksum": "5b6f7eddfa3a9ffb0d6668d10f398b1d86482b64daa9817ca0af549433071244"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00212-of-01024.json.gz": {"num_bytes": 319395225, "checksum": "db58fa453269c794fedb595c6193dea5a85c72ff8b2d43e77c9bb371b8c86b78"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00213-of-01024.json.gz": {"num_bytes": 320131797, "checksum": "1d21d19b5e36820559590b339c049be29f27505ab4e88572edbdb84b649e0b66"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00214-of-01024.json.gz": {"num_bytes": 320153141, "checksum": "55c9b4ff1cd8cc88738196f867aba620dec3c8b27b9a485c7e75d3129d76e9c7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00215-of-01024.json.gz": {"num_bytes": 320525443, "checksum": "dfe9f44676c1abf0e2875924c094c0d788f8a0172d641d5f810258e948e37feb"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00216-of-01024.json.gz": {"num_bytes": 320100146, "checksum": "57f19f5437b0428d9f40799af14f8bfba8f6c82ebacaea8f6fc7531524a6d4af"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00217-of-01024.json.gz": {"num_bytes": 320688377, "checksum": "fad4f3143aa303c9c35165a15c6d90087c204c586fe20b0c0f45cf4238311b70"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00218-of-01024.json.gz": {"num_bytes": 318896471, "checksum": "aabd471960d6db1e93e1129410d9138d9d9efa3292af7491b3b6844c2bd3f543"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00219-of-01024.json.gz": {"num_bytes": 319298204, "checksum": "f676701589e39802779a0947585638347bb4fe55376a33c6d0afcdc40c5f8938"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00220-of-01024.json.gz": {"num_bytes": 317757045, "checksum": "f3d0994379d244054c5e2db366a081caee28d301aa6b0d9431e7d9eb1cb38c30"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00221-of-01024.json.gz": {"num_bytes": 318568870, "checksum": "8026854c8a8cc1d16b52a898b9dd8a8df7901dd8cdf285f5d937c4d5d45919f3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00222-of-01024.json.gz": {"num_bytes": 319096912, "checksum": "71f76f898864de3ae60f7c0cdbc68d53cbfa04b2f8493c40d55e1cb56727b275"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00223-of-01024.json.gz": {"num_bytes": 319350414, "checksum": "ba01faf3fe41a738c255b5da83daf53a5858144557af6c6f8d6208a049e4245f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00224-of-01024.json.gz": {"num_bytes": 319007151, "checksum": "94200d12c61f7c73a9e3a2bb089a05b017a215348d52018a34e3224578c0da06"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00225-of-01024.json.gz": {"num_bytes": 319502985, "checksum": "0b7ce650e555baa546bb329d7f0567a3dc0a7ec9d49149792032a86321a73d6e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00226-of-01024.json.gz": {"num_bytes": 317983607, "checksum": "40cf6d4b3deb05cd97ebed01405d08ae67be6e896736e4f371d15e5404567599"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00227-of-01024.json.gz": {"num_bytes": 320199564, "checksum": "e65ee475e3b6682b57bfa3f7b9c1cdabf36a7282fc793865df63dbe6a6a3d1fe"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00228-of-01024.json.gz": {"num_bytes": 318852183, "checksum": "8b27f2fbb0233802229fc776cfcb0b6b43af3149d217d0ab00cca0f1286482e4"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00229-of-01024.json.gz": {"num_bytes": 319407418, "checksum": "f2d5199a0022134ae127c88f0ac20d1b2b8a88014a774b5432b41085c83ecb5b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00230-of-01024.json.gz": {"num_bytes": 320787790, "checksum": "e1b040895ac6068dd1aa892ec93d733096afc4adda698379006ef89926491255"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00231-of-01024.json.gz": {"num_bytes": 318220053, "checksum": "648a6349206c50c17d4e3562fd6fcb0a723b4cb40005890173d5de0c7ecc2ade"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00232-of-01024.json.gz": {"num_bytes": 319702777, "checksum": "0a44b7cb4f354e1eede683a697aba4051c1542fd030dd59767065f5f0204554e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00233-of-01024.json.gz": {"num_bytes": 319154465, "checksum": "4070448b7844776db6754bd33791900bf9ac8dbd81e4cd774a3055ada67f6fac"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00234-of-01024.json.gz": {"num_bytes": 319846160, "checksum": "b1e8c73078c347fa062ed408e81bbdcb2f714675bab2c082016e822e91ef63a9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00235-of-01024.json.gz": {"num_bytes": 317722912, "checksum": "d8aa694e870157b2b5411f496db46dc71dfeed01a42973a65499596921198abf"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00236-of-01024.json.gz": {"num_bytes": 318593592, "checksum": "e0c4ff6c8a12128da88777074d0b097664cf2f2395913c4d82b0eecd501946f1"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00237-of-01024.json.gz": {"num_bytes": 318902831, "checksum": "adce772ed699d7e908ae1fe1ddf1d9875305c7875c93cedf1b3ea0bbc21ff922"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00238-of-01024.json.gz": {"num_bytes": 318696723, "checksum": "926f9fc42cd248077afec1f4b88603c646fc5ae47c4ee3e9b8a5f6b8b6ff7f46"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00239-of-01024.json.gz": {"num_bytes": 318321822, "checksum": "439d756b0ffc97ebecc6c48a7dc90da77de7ada05a6eae929db98057ea15bef1"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00240-of-01024.json.gz": {"num_bytes": 318992553, "checksum": "1f57af6ff9477263806c0827c0dd8e494e103b6f54eec2cd5f8f8327b01ee39b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00241-of-01024.json.gz": {"num_bytes": 319345185, "checksum": "493932a44e09f4b311ac5bdb519111fad0982708d4b467688f2b1105316544eb"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00242-of-01024.json.gz": {"num_bytes": 320108156, "checksum": "de5603f1b276f1373011c8884f06af017c71b03c5de3b3bb89cd6d550a0d5902"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00243-of-01024.json.gz": {"num_bytes": 319855563, "checksum": "7c1b74de8ae3699c567edaa6e2d1a1f1ae82f4810e769c710a23cd2dfc536c60"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00244-of-01024.json.gz": {"num_bytes": 318966332, "checksum": "d3ada80bad9fa776374878bc7504138e14c161bc9798ea8114b0d187d4c815f9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00245-of-01024.json.gz": {"num_bytes": 319541864, "checksum": "3fe5f26e32795c49743d1b2497c333be57248c9db2ce12fb93e103d1a9595347"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00246-of-01024.json.gz": {"num_bytes": 318530369, "checksum": "a0bdeb2dcb5dfb46f843c4086230ba918f2d3ec125654cb924ea11e7c75cafbd"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00247-of-01024.json.gz": {"num_bytes": 319496627, "checksum": "0c4099f832ada6b24ef6c1d15267cd3c179f5b3d79e3d813d944e3ebea908c99"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00248-of-01024.json.gz": {"num_bytes": 319132981, "checksum": "608b1cd27ad345f6511fb677c00d56b6e827f288877d68aea1bcad3b02dd040e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00249-of-01024.json.gz": {"num_bytes": 318529093, "checksum": "8fd580be09f913cc3809e3b0e467e2faf657a5db6f71b75aa931043267b9b0f3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00250-of-01024.json.gz": {"num_bytes": 318248903, "checksum": "faeac675c3634b0834939046e60cdfad6a13558d7a6799c5bde25567898d86a0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00251-of-01024.json.gz": {"num_bytes": 319184870, "checksum": "038972e03db75417fc4cb25e54c3aee01e4f022eb0fab202142f539e4d866e28"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00252-of-01024.json.gz": {"num_bytes": 319631399, "checksum": "2fda0c2cec4624c6068556e16630c3551ef3110759bed59628913a9debd547a3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00253-of-01024.json.gz": {"num_bytes": 318275716, "checksum": "b5da4bfa564fcc6c49a573b90e679d60c4e222249858f4e58fdb3727a5f279ec"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00254-of-01024.json.gz": {"num_bytes": 318638865, "checksum": "279eb2978fe94e1570318a247b82487c04d7494ceed74dccb1d7a5734ea84e5c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00255-of-01024.json.gz": {"num_bytes": 319640339, "checksum": "aa0a1ef845d0df7d81d2588d53f29205a4e3858a0888c1b7d9c83eb2fe1d32a7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00256-of-01024.json.gz": {"num_bytes": 320353593, "checksum": "407133ea3b32a9e004b992a1bccade0440a39d0bfbd12993ea78c6526c0864a8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00257-of-01024.json.gz": {"num_bytes": 318165587, "checksum": "72b7a72b8402b22cb51db44c9e7859460366c7c9d33e16a4c038ad07f7ad8f3f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00258-of-01024.json.gz": {"num_bytes": 318003534, "checksum": "e5f9f2f74b7f9958dc9535f04a8965749ca4bd68005a6efa36f480fb487ca930"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00259-of-01024.json.gz": {"num_bytes": 318990454, "checksum": "7cb3c284613537fc6b1a85d7187dfca30b37a7a1a5708094f17486e3184e2d62"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00260-of-01024.json.gz": {"num_bytes": 319514850, "checksum": "0067e36b7156196e2451cdf78dc8832352f2481a4740afbef9046104b6810bdc"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00261-of-01024.json.gz": {"num_bytes": 318747661, "checksum": "b1e4597420035c355abe15efc576751169e2b5e4c38e073c178346a7202d5ab2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00262-of-01024.json.gz": {"num_bytes": 319868329, "checksum": "374f4b951e545968da45b5055af2aa0b128c1d65d6c854f5b8f7e02d22c352e2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00263-of-01024.json.gz": {"num_bytes": 319268788, "checksum": "7168e635a32859a85a152b29bcd1f699257ee4e340517e218ea9b8dac3922210"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00264-of-01024.json.gz": {"num_bytes": 319270640, "checksum": "1da08b65c83e79a0f5b7215e5a4ee58f21383b69f09dd9a3ba95381ba3d56d25"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00265-of-01024.json.gz": {"num_bytes": 318744354, "checksum": "0c908e81d59b2099eda038731b387a0ad86fa3d168eb2955413dde9cf29d947b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00266-of-01024.json.gz": {"num_bytes": 318518406, "checksum": "115e375464931638de4af669b7301b6112d18b23835f2db2b092f47545b1a855"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00267-of-01024.json.gz": {"num_bytes": 318921711, "checksum": "6d66c715137885a46f2472489b21751284ec8ecfde6dca6be3ec1ee75f6cd5af"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00268-of-01024.json.gz": {"num_bytes": 317786222, "checksum": "588865d8f9d3da5a70c958997060ce4792e175c8fc5323f1887787070c8c160f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00269-of-01024.json.gz": {"num_bytes": 319004956, "checksum": "163ec7497602931de2eaffad320704e508e491937a2965e39907a086f640d975"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00270-of-01024.json.gz": {"num_bytes": 319175186, "checksum": "794e0e7ceccf28457a8ed5b0724337545661da16feafd0a53e4823b2cb1c92ae"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00271-of-01024.json.gz": {"num_bytes": 319785821, "checksum": "9c9ec0348f7d4ffc61e5f19f1f60c8382b33ca2fe4b852567cbc3c16024a4627"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00272-of-01024.json.gz": {"num_bytes": 318933435, "checksum": "883d85985237948018b13c20f4d4ee567c6ee36a135b326e8117d73dad4fe37a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00273-of-01024.json.gz": {"num_bytes": 318456664, "checksum": "fdca13067e8e118e538b8de538e164fb5397724045a5b1b02764510c8de90969"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00274-of-01024.json.gz": {"num_bytes": 318418161, "checksum": "27556558fe8a91a4aea4800ba9b7e844336a7638c5b96e652fcdb359f631b04f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00275-of-01024.json.gz": {"num_bytes": 318437784, "checksum": "6ad4e6a3e1cee04aee3051a66531e3f4aa97f7bbb7602c6aa5f46a727b319f2b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00276-of-01024.json.gz": {"num_bytes": 318470946, "checksum": "145a4d85ddf1e72fcdb8477dcd2f70a5554d9cd9349e02e058d3e7837204b6ff"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00277-of-01024.json.gz": {"num_bytes": 319580624, "checksum": "7116de0dbc5c7f6621f7c107dded9d85788937a87f2d56efca32ae9f25fc6865"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00278-of-01024.json.gz": {"num_bytes": 319619699, "checksum": "8dabdf2d26035d30c22204e6f46f292c58f4a4c3b0b77a1826a43341d4282df9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00279-of-01024.json.gz": {"num_bytes": 319344020, "checksum": "c2b7d5bf62be1772c6bb80f597b28d948cf3cdefb10b6df6f777f0ab7d8fb015"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00280-of-01024.json.gz": {"num_bytes": 318997864, "checksum": "025457720b0045e7bf01f9b4b847f28ef94af9ca250675efeee73eeb340a3f36"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00281-of-01024.json.gz": {"num_bytes": 318718146, "checksum": "2979c0ac06570a9ee437521778c514bd8755193b9f1ae6a5a671ef885243f019"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00282-of-01024.json.gz": {"num_bytes": 318434530, "checksum": "a17bca50ec20c364adb899a9073bbe3a1505f81803a58190efc5d4f3f78b58be"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00283-of-01024.json.gz": {"num_bytes": 319317663, "checksum": "9034f524fc5c2e246b22e2dee00b47e0c4da0316bc60d0a11d966c28db917f9b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00284-of-01024.json.gz": {"num_bytes": 318957832, "checksum": "f08b96047e711831dfb8a44d90cb712d3e78c98dd28ec6b937ee83949bbef5b0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00285-of-01024.json.gz": {"num_bytes": 318643283, "checksum": "c5df1f2e2dad46d71f8aadf856a5139020da8afc2ee010d53c0372ea09b2362d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00286-of-01024.json.gz": {"num_bytes": 318064839, "checksum": "16f7fd6abcbc69750b8131bca3e38ddc40bd7c86c48122ad2a9a77cb9cfd552e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00287-of-01024.json.gz": {"num_bytes": 320328448, "checksum": "41e82bd357b47a28f28a4a203d5b54263aadb3c9a08899f78302c727c56d8b38"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00288-of-01024.json.gz": {"num_bytes": 319559271, "checksum": "970b9df224b58ca50b3023d92f6be0c37dbda479155c29c535e457ef6f2bca0e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00289-of-01024.json.gz": {"num_bytes": 318786822, "checksum": "36a6515e7f516335d3fe057bb6ed9890a2aea033e08edd8588b3168b3445b2f1"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00290-of-01024.json.gz": {"num_bytes": 320634782, "checksum": "7d19fc82b9a5aa0e0046cd17cd2c46f356f8a4a7d203d5e03e1f319156f05cb8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00291-of-01024.json.gz": {"num_bytes": 318746713, "checksum": "86d610d4590bca69281348dbfaaec9e704fd6194141c50c71e84aad51ce26b91"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00292-of-01024.json.gz": {"num_bytes": 320049630, "checksum": "d045df646213e29d4e7de4ec8915eb3b65bb962f35b0d74abf00889bd5aae8ab"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00293-of-01024.json.gz": {"num_bytes": 319966146, "checksum": "c66fff1a64b495211bfdcea650ff76115f8c857b9154c1b869062e702714b9ec"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00294-of-01024.json.gz": {"num_bytes": 318805332, "checksum": "ef3d9204ec85a1e65ae48af7924f614403d297a15f232ba41eb0e4fe223e507f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00295-of-01024.json.gz": {"num_bytes": 318898465, "checksum": "2a071fc28b1216f2dc0579528d9b04e597b5cdac9fd14719e312092242da190a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00296-of-01024.json.gz": {"num_bytes": 319406630, "checksum": "ea71e9fd444860d70d3728f7e2213a4bccf3aa31a164c9acfa8df7a0b6619786"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00297-of-01024.json.gz": {"num_bytes": 320312971, "checksum": "ddaeba8aad38b7e9727c579cc44f15b3c82d292e2901b47b785e9c8d3d5cdb9d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00298-of-01024.json.gz": {"num_bytes": 320660744, "checksum": "814460ccfda29b45edaee5f44e3c980889aee2ee52e4e5323931ea489fbe938e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00299-of-01024.json.gz": {"num_bytes": 319848186, "checksum": "3b91fe32d3a731a5be3bf778eedfe13e8a7e26ba9eda51c278c5212aa7925681"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00300-of-01024.json.gz": {"num_bytes": 319647278, "checksum": "1e0424631f7f354bc63b3e71c5c6516c85343dafd3896acb9560eaf93b672799"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00301-of-01024.json.gz": {"num_bytes": 319080252, "checksum": "46c21af013f611729cc06ec033dbae80151987f9098e57fb98e2631f6fe76c8f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00302-of-01024.json.gz": {"num_bytes": 320028246, "checksum": "d1ca8ad6e5bd6cb18db1f1be9154dbc8ba9df7ca02db4c1f8a7df9d40820d8ff"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00303-of-01024.json.gz": {"num_bytes": 319388787, "checksum": "bce87161f77464adfb1fc04fc2993211bcec502d7172b86f726daf7096b04f82"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00304-of-01024.json.gz": {"num_bytes": 318627831, "checksum": "235b8085cbeb7b13f8e1a5f6d2225a9461b7bcd76e21466a189c2411ff4c4107"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00305-of-01024.json.gz": {"num_bytes": 318148428, "checksum": "f13f124e0ea150da13ebeb3390c311b3db54018de0d640579307bbcf2c46068d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00306-of-01024.json.gz": {"num_bytes": 319451712, "checksum": "de5c3fa2cd6a47551ab43268484d017602e2c3e1f66f43f1a1d8f95bac52cad5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00307-of-01024.json.gz": {"num_bytes": 319026244, "checksum": "88769fbf393671db352227a64cb8ba6b4ba60c5bddb4a14294b1ad9a65a750cd"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00308-of-01024.json.gz": {"num_bytes": 318447454, "checksum": "555bcfc0ba4db0551ce5ffb18057027ee695af166856125aeb79f7ce013851cc"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00309-of-01024.json.gz": {"num_bytes": 318147676, "checksum": "bf28e60a7970c548190cf0f4fe56f27ea55a1ad8313fa353a8013f0a0e7919f1"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00310-of-01024.json.gz": {"num_bytes": 318930650, "checksum": "45a68c0ef70ecd10838d604d51fecd26e5199f5372022b9c2af461a71c24c6ef"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00311-of-01024.json.gz": {"num_bytes": 319955339, "checksum": "fb3c4e93166f1cb2ccc8a7b68da0246f0827d3a81bb5614c8c84f1c01c6d53c7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00312-of-01024.json.gz": {"num_bytes": 318554567, "checksum": "0dce2ac88ba7ac5340d551add9fe7b1a30772a6cc082347c536427b48daca598"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00313-of-01024.json.gz": {"num_bytes": 318978931, "checksum": "c5f99dab085fb705769a514626c9af8a26cf846fdaee4b403a3d6f84c892cb66"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00314-of-01024.json.gz": {"num_bytes": 318158197, "checksum": "79de4fa2aed5e3efa71e75d13f08d7c1869aa59f42a819f4429430b3db6c1b27"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00315-of-01024.json.gz": {"num_bytes": 319744521, "checksum": "5a47a89a1537662a91853bbe2a5b3e243f5de74489f820621192cacef192593f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00316-of-01024.json.gz": {"num_bytes": 319861527, "checksum": "1cd34f17f3ae3c8bf8e1636714a9ff600a26799d5ec02ba42abefa5db9d00e5e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00317-of-01024.json.gz": {"num_bytes": 319286030, "checksum": "a3e34af81264a72b523b63fdc0268f450675f7993fa0885eb2b4c747b0d6703c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00318-of-01024.json.gz": {"num_bytes": 319054871, "checksum": "02fa8cf278578108083bc9a3c5cf07b0a9d243f2162397091ede6c85a1df31e7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00319-of-01024.json.gz": {"num_bytes": 319943810, "checksum": "93ef0d7f1610043a6f7634af73e89ee9f3d7e87828ad34558a4d688e6fa6b6dc"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00320-of-01024.json.gz": {"num_bytes": 320037211, "checksum": "06fbd99a3d64df293db2655f321117f1afcf1cda51e421edef9335a25cb1a902"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00321-of-01024.json.gz": {"num_bytes": 318584237, "checksum": "a224e4d902f7368f91d6a72fc9f5730996dc37de576bc2211eb632e3690f1b38"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00322-of-01024.json.gz": {"num_bytes": 319686632, "checksum": "57fba28c7104ff659f8a0f330ae89c68d3a392dd14a78247fa357a3bcc8b94dc"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00323-of-01024.json.gz": {"num_bytes": 319834993, "checksum": "e61c760cd3c42f71a1a7bb6adc4e0bc970bbf864b69e2a4a5d56bf0a14d4e0be"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00324-of-01024.json.gz": {"num_bytes": 319243057, "checksum": "61d21ab1e7729f172ade5ab6c0dcaf07eaeaee6e047ca1c24722c06ddd919678"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00325-of-01024.json.gz": {"num_bytes": 318569583, "checksum": "2192a891ecc2a6aa9f6ea64f1d76ce763e0a3963ae03c95275ccd626171835ce"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00326-of-01024.json.gz": {"num_bytes": 319175980, "checksum": "d35e4d5f8e924ad97520db51a2c361bbc02097721195932b6768e7460df092a6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00327-of-01024.json.gz": {"num_bytes": 319892298, "checksum": "ce967065d3915d466982b5258e07ad2c46b02d7637057e0547586657ea0f53a4"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00328-of-01024.json.gz": {"num_bytes": 318004026, "checksum": "0676d556f46b1f057669d3378c6fc335db6e3ac67a02e11dce3823658730f4c5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00329-of-01024.json.gz": {"num_bytes": 319066225, "checksum": "b00bb4bda957e1287b98c432165448b3899f9155363f7b61bfd0f0181181acfc"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00330-of-01024.json.gz": {"num_bytes": 319268288, "checksum": "d14d1883941966ef3b35203d06e6fa1bb485dd77118bd7b6c811b0d06fa72fae"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00331-of-01024.json.gz": {"num_bytes": 319131311, "checksum": "4d5d41c2b2242b299fb67fa8c9327db8b4f612bdf4ee9af4d4e45aba8cd1e409"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00332-of-01024.json.gz": {"num_bytes": 318827508, "checksum": "68cea08d4805b392bf4c2894a4501ee3fbbe9aac4b1b6533e686ea749ced2dcd"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00333-of-01024.json.gz": {"num_bytes": 320572240, "checksum": "06f211ae2fe1c4eef5e41caceda8ebbc289261057911fcf2583a59c730b7951a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00334-of-01024.json.gz": {"num_bytes": 318121862, "checksum": "46c62769e04ce8acde4562ba24d72e245babacdfb50600da4e6217948ad71d24"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00335-of-01024.json.gz": {"num_bytes": 318692168, "checksum": "dca69a6976e7387a12c8da16b696ed4f604254693a3280be0f90fa694700b595"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00336-of-01024.json.gz": {"num_bytes": 319479902, "checksum": "c52969fad97f1dc0e1e115428e7dad1ac6cb6d804db0cd34f0fc7846b1b50c7f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00337-of-01024.json.gz": {"num_bytes": 319987407, "checksum": "2c570f02aa6a6bac96be1e02663996c87f9a94c160f22101ce8ae1d549ae1de2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00338-of-01024.json.gz": {"num_bytes": 319051086, "checksum": "77132df95b147c471ead74bef16ed4fa11e15209f518dd460110132358816834"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00339-of-01024.json.gz": {"num_bytes": 319473192, "checksum": "7f3ac20a72d395c02ed3cb50052821521dc2d8d97303d00e0d0982e2c29e7659"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00340-of-01024.json.gz": {"num_bytes": 318423485, "checksum": "d1127da89e960d939cfc06cf1985df415b60d4bf02b12b7fab02b796100feaee"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00341-of-01024.json.gz": {"num_bytes": 320087690, "checksum": "f753423f82157e95506566d3653d32af6a181e69ea0e10b4d4eb24b626d3ca49"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00342-of-01024.json.gz": {"num_bytes": 319767100, "checksum": "db7410e6a6ca74163098681038f497faa373e1d81434b45c1a2f273d467c0a2d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00343-of-01024.json.gz": {"num_bytes": 318389429, "checksum": "7ea1e432a1ffbed8f4ad6cb985c5cf1b2584d8eb7d2fa091a2db3f104a3f7210"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00344-of-01024.json.gz": {"num_bytes": 319117212, "checksum": "c7317a81a6224dec9be07b41134ac7a7db4039b7c98b2061b20bb59b82ed0a1e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00345-of-01024.json.gz": {"num_bytes": 318504232, "checksum": "1498efe8280609d9d66c324e332c9433c6351bb7b99c5891a8f27d6841410407"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00346-of-01024.json.gz": {"num_bytes": 316721169, "checksum": "0cbc6b494d653878c9d52a37572064b88356058ed291aa773e5f47259fbfc722"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00347-of-01024.json.gz": {"num_bytes": 319007736, "checksum": "6265505e19a42a01a159297d33b1a91cd0e042a31ba6a1a867404a143ae565a4"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00348-of-01024.json.gz": {"num_bytes": 320167918, "checksum": "cc8b29deb44c8348aa4d05836f89cbae995c946f38d9cb8e7fedbd4762168ba0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00349-of-01024.json.gz": {"num_bytes": 319901226, "checksum": "2a0f2188b43ffedc8b95a8276c7647147587c5e544c9e6475e790f4b5e362992"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00350-of-01024.json.gz": {"num_bytes": 318999223, "checksum": "1fde48c503998872aa71fc524c7408dc84cbc1faa0d885895d5c57708a15fced"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00351-of-01024.json.gz": {"num_bytes": 318935410, "checksum": "72d577eabcd814a7ff61b894b3fe9089f483a793e692d3ab20ce4ee59921f975"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00352-of-01024.json.gz": {"num_bytes": 318655907, "checksum": "8686dc0e4ff7b35cbc4fa6f3abce50c06f8b95378031c132a117e1d458cb4616"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00353-of-01024.json.gz": {"num_bytes": 320619683, "checksum": "cd5816469ef54bfeb0db6b55a78e0d34eb2e1f82448a41f67dfb70061c3ea91e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00354-of-01024.json.gz": {"num_bytes": 319352400, "checksum": "bf082c093423d562da4984b1f0428225d853a05b5f8fb3696273f36ebb5a235d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00355-of-01024.json.gz": {"num_bytes": 318868462, "checksum": "3b8baeca48e55a2cd268d6aef75f7eed96ef10fceca593a5179d52a2b0121f8b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00356-of-01024.json.gz": {"num_bytes": 318903295, "checksum": "4c9a9926a4bad6721807d99cc02a9b6bd28bb0a6254aa1c15527b745c56a06a2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00357-of-01024.json.gz": {"num_bytes": 318881446, "checksum": "84b4c2e05bc162fef4824e97ba7a03b1cecb41eda08a3e0aedd264b66e859a30"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00358-of-01024.json.gz": {"num_bytes": 318521100, "checksum": "aee99528ffd0323fe81e4ed26ed1b9295baa2a3910771dd2a42f4f378fd82569"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00359-of-01024.json.gz": {"num_bytes": 317796778, "checksum": "7b01f2d5ae54f60c2aeb7b96bd366d21e558e2dac48c83a78df9850f37e02f1e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00360-of-01024.json.gz": {"num_bytes": 319502919, "checksum": "5b54f9a050e6f9008a1806101ea553d90eead56c949a5f3f46c8ccb88812081b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00361-of-01024.json.gz": {"num_bytes": 318595505, "checksum": "49f4164d66187d46adff7f9bbac97b232ab7906d812e571c2e0bf028895e7f47"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00362-of-01024.json.gz": {"num_bytes": 318851572, "checksum": "17accad3c0706c54530f128260cacbf986cbbb20427d4ba8d3444a3702a22c55"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00363-of-01024.json.gz": {"num_bytes": 318555337, "checksum": "2327866e541aa6aa73f7289c3ad82a19ff154d39657d98cb78a2f481a8765920"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00364-of-01024.json.gz": {"num_bytes": 318641145, "checksum": "6f52354d804e8d4a1af1f6c2c6b759ae115c4f23a63f1206a73e7e25acfbdd02"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00365-of-01024.json.gz": {"num_bytes": 319212614, "checksum": "8f1834eeacc9bbdee95b1f0a4078eb9488bd1a7c5693489bff7943869674cad3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00366-of-01024.json.gz": {"num_bytes": 319336585, "checksum": "a9cf01b76104eebb4ef8462a924f61c262fa197a7c68a50e48d925cb81586e3f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00367-of-01024.json.gz": {"num_bytes": 319161263, "checksum": "5ac822027d50c3196026fbaffc7d968e1ca702b947688a6f4d268b942b5067b5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00368-of-01024.json.gz": {"num_bytes": 317911640, "checksum": "f9acffbe3c6617e85911ff9dcecec2378b3469ab4546a6973cceb460f9003cea"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00369-of-01024.json.gz": {"num_bytes": 319585031, "checksum": "9234553649cfa5265c5a9ccc88486402f88eb81275067c51d9deef16bbe7211f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00370-of-01024.json.gz": {"num_bytes": 318345879, "checksum": "2fbb410346d31a33e8532602f4e3340fcc75c96be803250e9f0f1a6894ca0052"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00371-of-01024.json.gz": {"num_bytes": 318996184, "checksum": "b069b0c8a830ea841e82077548706f286308ef0420e163ff6d8312c8853af172"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00372-of-01024.json.gz": {"num_bytes": 317989343, "checksum": "bfd62e448d4d9f89353abaa384007b0b72bd860402ade3a9d938051a6446530b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00373-of-01024.json.gz": {"num_bytes": 319770759, "checksum": "e4e176250aceb7362ce38d496556a46409e9872e69f45166afe71aa750de8fcb"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00374-of-01024.json.gz": {"num_bytes": 319212902, "checksum": "28aa4510c3ddb9ee0ac56aab3792bfe5e899531919ccc0214a4b68bbf2ba18a9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00375-of-01024.json.gz": {"num_bytes": 318968029, "checksum": "35326b1f2280e07dd754e89dfa29989d0dfa5c78995d393b36a752d8364bfcd7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00376-of-01024.json.gz": {"num_bytes": 318685188, "checksum": "0060dbaccf7f2f956fb8b57891cb176914ddac1bc485dd86c2fd110c46d174b9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00377-of-01024.json.gz": {"num_bytes": 319291982, "checksum": "99fc38654197e506868e099c15b2cb15b93238dafd33f81a7d069b3e01c3b085"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00378-of-01024.json.gz": {"num_bytes": 319259094, "checksum": "9b8d97f9d57dd97373c4f57eae2b9c01a58e49017ee41d3969e94fb4dbabc260"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00379-of-01024.json.gz": {"num_bytes": 320228224, "checksum": "82913f2d182d2a57f6c93e9b229862cb72feaa6331d04cd4419113e1eb9d52cb"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00380-of-01024.json.gz": {"num_bytes": 319738339, "checksum": "e0de43f754ab97d103a02c708d1cd7e771ba079bd9e1f7c532a80a30bd5182ea"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00381-of-01024.json.gz": {"num_bytes": 319210620, "checksum": "df74823f78564b544677410508e675e2811905c56afe2a60d19d3e049dd65394"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00382-of-01024.json.gz": {"num_bytes": 319810275, "checksum": "f5d5291a695fe2cd228213fa2bf090bf6513c49c6911826aa43ecaefec0622ad"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00383-of-01024.json.gz": {"num_bytes": 319190426, "checksum": "a861ae79a66b72d6cd5e0a030daae52cffb85ba1272c36ae2be04a9b7c0287c4"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00384-of-01024.json.gz": {"num_bytes": 318501845, "checksum": "b8d0f5078ae82980f0f64120530bbeb20f627be0a8629d68885acb867091417f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00385-of-01024.json.gz": {"num_bytes": 319530458, "checksum": "7da119f3f63e25ff63cacd8ba0d77987b2d576be1f4b86e7e45aa3f2d194624b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00386-of-01024.json.gz": {"num_bytes": 318938980, "checksum": "c21f3de56fab26d7fb60bdb47c216b22793f67b8fa6d382520c79b88d1896f05"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00387-of-01024.json.gz": {"num_bytes": 319207426, "checksum": "e28b0884092f75836eed4d73ed24b7403d7b0530fc389386a68887420b0c2603"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00388-of-01024.json.gz": {"num_bytes": 319835376, "checksum": "b4f0db632cc9af66e8aea109c80d73a6281207e29ece131d5bf8b57ff8f81262"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00389-of-01024.json.gz": {"num_bytes": 319346837, "checksum": "413a8d8df1f6cf3094839b57231da5323f33f7115768c65d83f0af1574f71b6c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00390-of-01024.json.gz": {"num_bytes": 318632301, "checksum": "a3e8664fbb3ec2af5a217225dbb7fcf3e93b427e5da1a88e35c04c319d61e4c3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00391-of-01024.json.gz": {"num_bytes": 319066082, "checksum": "e22eed3415c90510e97768be5a685e0a8035e2635ef773c56e9ce2718c278658"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00392-of-01024.json.gz": {"num_bytes": 318356286, "checksum": "ddbf325390648d9d86f1e7901b75c99fe8db538d203de8dfb4c304282f82cd74"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00393-of-01024.json.gz": {"num_bytes": 318048288, "checksum": "974fd05f356c86be2f9109b0272eee69c5b2eaf0b16104cc573846c925d13b4b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00394-of-01024.json.gz": {"num_bytes": 319444683, "checksum": "0d27d6f8c3b935cef23ea60abfa82bd6a4f5e2e061080419dc9c6bc455b9f868"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00395-of-01024.json.gz": {"num_bytes": 318353166, "checksum": "24d9956bd857484ffbabb3ba6f6ac688f48a94b50228238c7c9153a5c6878a7c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00396-of-01024.json.gz": {"num_bytes": 319960396, "checksum": "9425f4f18e1690ded866c4b5313cbac8a6210092dc42f720200b7143b69eabe5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00397-of-01024.json.gz": {"num_bytes": 319030577, "checksum": "dee166674b835b9849d281a87238aa136e14d26edaa72d0ecb6b7e82d556a72e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00398-of-01024.json.gz": {"num_bytes": 317664320, "checksum": "f85e08272f73ce4aa602719d59205db54d230a6b7247830d78f91eac63d753be"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00399-of-01024.json.gz": {"num_bytes": 319623875, "checksum": "85dea0672a0362a08503b70623907c8c92bd105f788fbd7f3816212a9181e7c5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00400-of-01024.json.gz": {"num_bytes": 318840274, "checksum": "a104345698500611cd1a71a6647555300d315490918740a8c6e3b8dcff315407"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00401-of-01024.json.gz": {"num_bytes": 318336377, "checksum": "808327d156e183e102fd75cfbdb7b5a1fbde3740168f59b767ea380608305b67"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00402-of-01024.json.gz": {"num_bytes": 319270185, "checksum": "b6a5f7c1ade628091fe86744a6011147ec32795ad694ccbc82929791b93aa307"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00403-of-01024.json.gz": {"num_bytes": 318038520, "checksum": "108904ab05b3ad23318f8aa0f7ddd00d97aae1872fb157eea73273e011cbec04"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00404-of-01024.json.gz": {"num_bytes": 320933185, "checksum": "cd0c068c0831218849149eaab8f8a98748823911c745ca0ea33ae839bd625e04"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00405-of-01024.json.gz": {"num_bytes": 317694827, "checksum": "d99909ccd59e2ec183b41a7c6d1bd5677798bd7fd784ab681546a7bf8292f353"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00406-of-01024.json.gz": {"num_bytes": 317937468, "checksum": "c7f2bd7a366b8c389e41fdfad4891068c86039e1a5fc3b8a0b993253badf33d2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00407-of-01024.json.gz": {"num_bytes": 320226074, "checksum": "765db6f9f0c8c3d9bbb0499f0010928fe4f90d5915dfdd3b6d09d3dc78ad07a9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00408-of-01024.json.gz": {"num_bytes": 318613788, "checksum": "165e78c858dfaf010307392474d4917846c9d21658558912e5ffc915803bd2fb"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00409-of-01024.json.gz": {"num_bytes": 319212414, "checksum": "5f7d5952aad1ae31413962983971b2b422d77c262ededd2ce1c1e186aeb6d87d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00410-of-01024.json.gz": {"num_bytes": 319023647, "checksum": "24588d41f40e3fe389575b97d41ef761be46bc9a9b3965c5e3f994760f7a4070"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00411-of-01024.json.gz": {"num_bytes": 318408922, "checksum": "b35d4ada5a000f51169557b00e508706d51a7becd33370014ff07c8b8dac1af5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00412-of-01024.json.gz": {"num_bytes": 317166932, "checksum": "d3ed1cae269ebefe4716843bd7954bf7e44ee889f72066afbdcd95f4e1f06703"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00413-of-01024.json.gz": {"num_bytes": 318519121, "checksum": "07fc61a7e164301113201e78c99d40289d88e0b463048e14aa5fe69c7490ccac"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00414-of-01024.json.gz": {"num_bytes": 317417235, "checksum": "c5a7222b2eb8e8fe690f29a0fff7e214ba94e4d9dae62f67281fe25dd385b721"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00415-of-01024.json.gz": {"num_bytes": 319690993, "checksum": "37052fff729bdff124577d5ba041906b2ea7420c5cb28195e6cfca0e41d560c8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00416-of-01024.json.gz": {"num_bytes": 319466518, "checksum": "6e8ce2b9e6e8208ad7e43ce709454cb0b96572d793e0b11c15892f5df18f6137"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00417-of-01024.json.gz": {"num_bytes": 319694381, "checksum": "20892d7a33c31d7967ae0cf595a2108de96a61c0bbd773aebc5d3d083f6ed93b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00418-of-01024.json.gz": {"num_bytes": 319048918, "checksum": "fd795ae8d53e632bb3e89a2becc5b801e10db781b14f2c0ed50b12def5376c8e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00419-of-01024.json.gz": {"num_bytes": 319791424, "checksum": "5a8e56faaa0892249e5694ae01e2e4dcd22d9750a9aeea5ca390117c77b8de2d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00420-of-01024.json.gz": {"num_bytes": 318060925, "checksum": "795ee64f4c9e2e35d9dc0c91ea593c9e41a3924162901fbf782dc7112f8094a8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00421-of-01024.json.gz": {"num_bytes": 319328927, "checksum": "2670b7b6b53e9082c90e4a4e915f72673831ff15e9f55918a1244e0c19c8f963"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00422-of-01024.json.gz": {"num_bytes": 320065363, "checksum": "34df2d1afac2ae4699524492d6b93e4a2a1e551cb4a4ae35fc19353930afab8b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00423-of-01024.json.gz": {"num_bytes": 319349887, "checksum": "a2b19afafb45cf30493ac2a3eb013e136e7213f63bd633374ca0d9fe2780efe9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00424-of-01024.json.gz": {"num_bytes": 317515288, "checksum": "ec2a84fb16dd16f9547f0c3314a91968324f2c537118ca36e982b235e23527ee"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00425-of-01024.json.gz": {"num_bytes": 319092219, "checksum": "1ac0b93c0faae7d446add3af3173637a4b0d638dbd5285b0f4e1bf3abd0d1542"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00426-of-01024.json.gz": {"num_bytes": 318421245, "checksum": "bade501dc71c0b4968a9a7c833751cee5d8f7067a45dabd53aa03534df48886e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00427-of-01024.json.gz": {"num_bytes": 317847935, "checksum": "7aef554aa2b120c4d787395e28aceba743e309f2540fab283e077a1429a2f7ef"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00428-of-01024.json.gz": {"num_bytes": 318822008, "checksum": "cd94547fe1953a1cc074d97558a70d1e55834606379a8f5e6e60e1b15b56fd35"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00429-of-01024.json.gz": {"num_bytes": 318507684, "checksum": "4d3c9245565a808058293558603c657d6e9a0c87b6d2d4b871b856cea2eb3a19"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00430-of-01024.json.gz": {"num_bytes": 319042136, "checksum": "9c5a4fe50db5d0822923fe29a5aa8ca6cb09e3629472b1bf61f670388b6c2076"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00431-of-01024.json.gz": {"num_bytes": 318925124, "checksum": "8f18b35bb952da090ade742753e30861ba39c6c54c8ff2d76b358ca7be475ed6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00432-of-01024.json.gz": {"num_bytes": 318680251, "checksum": "7968c370d0efa4601ab8b5ee68e480b211fb969593608bf7e00a0153f00f99b3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00433-of-01024.json.gz": {"num_bytes": 317822797, "checksum": "f62d7e74434d52c36b22f6a8cd56ed3937ed6aa03f140d0fbdf5e360632d51fe"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00434-of-01024.json.gz": {"num_bytes": 320094364, "checksum": "55d7678c7e197e165b4e09bf3f8ac159853120acbe5801ed6ab3ab0f801c11bb"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00435-of-01024.json.gz": {"num_bytes": 319008936, "checksum": "09b451c8ee06bc06507b3e75a60c544a6b70f27e3d07daa29c59803f785faaf5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00436-of-01024.json.gz": {"num_bytes": 319023456, "checksum": "6fbcb93f9dfe65e12b7efeecc8af7823471787438b1ce90e5f48b68b2dcb1d14"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00437-of-01024.json.gz": {"num_bytes": 319484997, "checksum": "9e70c8c1ccbfe93ec9296811ae496a518dcafbf38c81b7972f885e297da9e726"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00438-of-01024.json.gz": {"num_bytes": 320319141, "checksum": "eaab759d8c603e8a2ad3ebacd99e30338fb904ba307aeaba0d2e0e63679cfadc"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00439-of-01024.json.gz": {"num_bytes": 318410397, "checksum": "7a03a92bf97b6750941c1070f933c68f1b2a3e13fb68b3a21a4726676ea75d34"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00440-of-01024.json.gz": {"num_bytes": 319447470, "checksum": "bc899e436da7b3bf13c1bfa2fd2bbf9d90b42a0c00f2971259a14d858ca3e5ef"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00441-of-01024.json.gz": {"num_bytes": 317582955, "checksum": "4d777860c2750e43038ef709d77bdc403b3b3bcf0f08e3c4562952c9ac70b113"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00442-of-01024.json.gz": {"num_bytes": 319592118, "checksum": "d9e5dc244bb6f0b629b2a929aedf506dadaf5eacc80f0997816b95279552fe8d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00443-of-01024.json.gz": {"num_bytes": 318104403, "checksum": "56133bbd7cf96dbe87d48898b886a024af69ca405d7cea1799bbd30f185e9c1f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00444-of-01024.json.gz": {"num_bytes": 318547808, "checksum": "8be0270c3cc96dd7f7b3aad08bde81ea245feff4a09923277fb0d38a7c095604"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00445-of-01024.json.gz": {"num_bytes": 320463920, "checksum": "e02316fcd355914e4d08ecf37036d4727ae9ebe45bdc5c98279aa3437c2c1eb0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00446-of-01024.json.gz": {"num_bytes": 319583221, "checksum": "80c9b8c47665b2cef6c291b0eefdac5b14be1d7cd4a4c06c2e14cf48b42da92d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00447-of-01024.json.gz": {"num_bytes": 319546881, "checksum": "a18d5aaca1717ec33fb1822a633268003bf88093dd7b48db080503c3d01b6ffb"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00448-of-01024.json.gz": {"num_bytes": 320234711, "checksum": "c41595d2b9cbf0e23fd65df1cb51499ee262d345d79d2625388cf149c3c39f8c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00449-of-01024.json.gz": {"num_bytes": 320043698, "checksum": "3bef99334be9d39f41296f8f134c88f04fe66502da2d2639f0d6d2485338e607"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00450-of-01024.json.gz": {"num_bytes": 318033740, "checksum": "9cd05b1b70ffc3c004b4b4a2f21f91abee1395f3a485efd1aafda550193df9fc"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00451-of-01024.json.gz": {"num_bytes": 318549622, "checksum": "b2ef6cc4ac7c4c69fb1661d7ed9b2ce4da261c72f9e49dc3c934180501ef3a24"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00452-of-01024.json.gz": {"num_bytes": 319317230, "checksum": "89927f1fd79a5b1439988fd37e0377175176d9ed22d14611f67a81e185a336b3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00453-of-01024.json.gz": {"num_bytes": 318952561, "checksum": "427f55bbcfb6c1a0ef12f96cb122f362b975169770ce1d392b763c4b4408cb34"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00454-of-01024.json.gz": {"num_bytes": 317545286, "checksum": "2fc3b172ea721bc92b0f7614e8fea61b0781e6f4f3e6b7263cf0190beef3ec52"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00455-of-01024.json.gz": {"num_bytes": 318975631, "checksum": "c96f688ecb19bdb1592b0124021fb80d48965303442de76751d82fa03ab8f6d5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00456-of-01024.json.gz": {"num_bytes": 320016575, "checksum": "61d2be7a4b9e34cfb994ae2c120ed5a51a6669564046637445a46b9872812416"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00457-of-01024.json.gz": {"num_bytes": 318236935, "checksum": "a74dd51c3c490458ea0e61196d7e0085aff80d50cd149a673f54f661b364a671"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00458-of-01024.json.gz": {"num_bytes": 318495925, "checksum": "adf9cd717f2c79504dace22b5929d4c4064353e869457c20cc81a0b2db390c89"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00459-of-01024.json.gz": {"num_bytes": 318956821, "checksum": "d7be5bcb738a75586125e56a25aa234618528accda620eaac421beab6288b992"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00460-of-01024.json.gz": {"num_bytes": 318968681, "checksum": "6181280df5418fd9ebb52aa26a631100b6c3da0750dc5fbae152a6a44fccb942"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00461-of-01024.json.gz": {"num_bytes": 320810761, "checksum": "5e943c458674371dffb2466274b8f2a9df9902a370901ef97992bdf920cdae0a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00462-of-01024.json.gz": {"num_bytes": 320154899, "checksum": "76b3d1b120cbb7cd71d004440e0c6bd9f9c4395424c568e8362973038017a90c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00463-of-01024.json.gz": {"num_bytes": 319247449, "checksum": "9de2c86d85289113b24c2f7eb4771ec1391511930f5f26a12133d41faf0ce908"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00464-of-01024.json.gz": {"num_bytes": 318150152, "checksum": "85fce3104ef0b247798c1de8d9d616d3de754841fb6c49a01cca5b9da5efa94e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00465-of-01024.json.gz": {"num_bytes": 320342803, "checksum": "ddf312f0b8de8f53ed556483fd998ae308d4829d18195a48869db6bf1866c332"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00466-of-01024.json.gz": {"num_bytes": 318619029, "checksum": "01239a1ff6ffe9032da320c5a7d1a93125d0724851e3e10746821c9452070887"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00467-of-01024.json.gz": {"num_bytes": 317677227, "checksum": "41783d20189a4bcfc33f543597a5473900e692ea13fa522f2724e27e810b4e9c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00468-of-01024.json.gz": {"num_bytes": 320038217, "checksum": "7131b6f4dd423f2efe55c3f598893676300b31651cce7eed32ce633a015f8ca8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00469-of-01024.json.gz": {"num_bytes": 318359701, "checksum": "925bc76c045f25532414f29820adb0cf1a56c54b406333a6f348c29e5efda9fe"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00470-of-01024.json.gz": {"num_bytes": 319329235, "checksum": "9be740483aa7bbaf94dce550f2c20404c89326f6ec4ebe1b7070f85f93507038"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00471-of-01024.json.gz": {"num_bytes": 318792779, "checksum": "0e3d9492f15dc9867bb0dc803bdf45608fbe67255014b4488902d7bf2e2554cc"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00472-of-01024.json.gz": {"num_bytes": 319552622, "checksum": "00484bbc10bace3dfd93b57fc53d6f5fac26b7dd54fd5b5428d75eb9e6dbb0e2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00473-of-01024.json.gz": {"num_bytes": 319466828, "checksum": "5db5d585798e8ed8e4a3bc540871f1185f67125f397a12942d21b24e6b374519"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00474-of-01024.json.gz": {"num_bytes": 320014669, "checksum": "db07fd0e972c1a474806c1b4464ad4cefdd2e8fc15806ba0d259d4f9e594c3f1"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00475-of-01024.json.gz": {"num_bytes": 320379280, "checksum": "e6e36a9eed8be84c928980fffd8177b177182726c9e13b41a47343d431f76a7b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00476-of-01024.json.gz": {"num_bytes": 318820301, "checksum": "0543ed2d0b3aaba0b0fccbf0311836143bd19175c5eed9bf0f024ffb9ce3c50a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00477-of-01024.json.gz": {"num_bytes": 320577830, "checksum": "a62fd62ad771dbcfb7af73841e15a49e9d7239c53dbbbd84de2282131bca9c99"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00478-of-01024.json.gz": {"num_bytes": 319593908, "checksum": "beae9334a8e93e4b036c4a9b3c5b3a75fff17264177184d243d9e6da286dbe2b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00479-of-01024.json.gz": {"num_bytes": 319728825, "checksum": "ae5b475c7be35d98b77d6c4aed5d61cbd1c98544c9a6e73a53ef2911757ab7f0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00480-of-01024.json.gz": {"num_bytes": 319903674, "checksum": "51e0611378455d909e8b0f292eb62038848aa7afaa4f93c9c83061258b211a95"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00481-of-01024.json.gz": {"num_bytes": 319998409, "checksum": "68c640304ac952f544ea88c88d7c994c8d2955b95036f8352a67b57a836fa1bf"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00482-of-01024.json.gz": {"num_bytes": 319047238, "checksum": "74cefa57158d0008a06ae85b2a7a1c04d57a79b7ae3f7b4b3426dbe9918b36ca"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00483-of-01024.json.gz": {"num_bytes": 318775875, "checksum": "e99faa71222017521f1fc9999bbb0832df5c91f8b9f6e2ef501d3f827d3a1e85"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00484-of-01024.json.gz": {"num_bytes": 319190491, "checksum": "4518faae7c9d51a51f0b02cd895cf27e7c87a623b787346c844a8d9f0b52d6ce"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00485-of-01024.json.gz": {"num_bytes": 318974502, "checksum": "1bc8b207583b9f36169e0e9facd258de8eb73dee8bf831051dd1ab04b7726c6f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00486-of-01024.json.gz": {"num_bytes": 318599424, "checksum": "0b1d9900e1921483b85305491f914b6b78fabcd0686a20695e61b89b7380a894"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00487-of-01024.json.gz": {"num_bytes": 318958015, "checksum": "c0c789c5f3b34d170d2aeb72642c70d2fa5eca567e7850d0c89b3d170f3bbf64"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00488-of-01024.json.gz": {"num_bytes": 320205671, "checksum": "6eef7a1ea80be43e84cb0c974215a477c909844899ac694afe1af2e8f4ac171c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00489-of-01024.json.gz": {"num_bytes": 319193967, "checksum": "eccf5d7f682a76e11332f07e7d54a080f76c0be58a98a853a9fe90c815a22087"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00490-of-01024.json.gz": {"num_bytes": 319833603, "checksum": "afe99e32ba36134f23b59a2ee43965bf185432de947740fc19e26eef41027aef"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00491-of-01024.json.gz": {"num_bytes": 318912982, "checksum": "e981151b23b233bd3e5798f78658b5f52a73f69db39c30615f615069cf0c4984"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00492-of-01024.json.gz": {"num_bytes": 320057824, "checksum": "0cc5f7df318e0718fef93d24e7ff904b3e8e2728c4fc0b1d13893c81d8e6e2c7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00493-of-01024.json.gz": {"num_bytes": 317967559, "checksum": "93749543b04a5a7093177d2a03acfc0bf6f26d5b53864ae35839a9421fb48169"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00494-of-01024.json.gz": {"num_bytes": 320426917, "checksum": "e461f56b461a4d5ce353c60889dcb99e10818985d3788440c6119bb145876277"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00495-of-01024.json.gz": {"num_bytes": 319528392, "checksum": "e530f3030ddbf7191bc4082e8209f63eb48733d7085d79a8469ce3611ccb79b9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00496-of-01024.json.gz": {"num_bytes": 317570766, "checksum": "ddec34b528bd5314019d12089e600df27e781d78f43b6722b9c0202ccf385755"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00497-of-01024.json.gz": {"num_bytes": 319154838, "checksum": "e7438a08000fc7a158f887755cc496edcf51c8bdf2bc4a888ddd2c829bf8fa3b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00498-of-01024.json.gz": {"num_bytes": 317955368, "checksum": "ad133d808ca5b6181bae1921ab1261d79630c09bf9d6c904db036f22e6f32e6c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00499-of-01024.json.gz": {"num_bytes": 318286671, "checksum": "cb40879ea08db5a9eb6f2c23756574bda34deb9acf039b992f0ab90fdbb01594"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00500-of-01024.json.gz": {"num_bytes": 318510936, "checksum": "21e5f7468a907f38c3dc0a5c19f09921476f9186beff967e829329f191dad6b0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00501-of-01024.json.gz": {"num_bytes": 319611074, "checksum": "38829434c8539bb9fa9ea32bfba3c6732c5021ffb60c16fc502fe61de83906ce"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00502-of-01024.json.gz": {"num_bytes": 318630954, "checksum": "22d1ca1edae179d2587495fcdf1d3e515c6f547cebafc54996c93a121731fd8d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00503-of-01024.json.gz": {"num_bytes": 318253198, "checksum": "e95689993390086880e630ec4540e0629551076c0cad2c70f5aedd3aebfec181"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00504-of-01024.json.gz": {"num_bytes": 319497151, "checksum": "0cd7b986d247e010fd76fa2ab2b62d5f9eec292b28c1e7bd3e4c577042b598af"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00505-of-01024.json.gz": {"num_bytes": 317498965, "checksum": "f1504912fc53cc3690e26ec3babf736ddbeb8f7d9196dac83f757699310b30ad"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00506-of-01024.json.gz": {"num_bytes": 319684193, "checksum": "9f6defbac132e097cbf7cb7d181cb154bace6af48964fe09d111bc610fdcd2bc"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00507-of-01024.json.gz": {"num_bytes": 318394726, "checksum": "a58f39d0bef19abefc089342d8bb6d75dbb2c663f67127673ec395404bcf15ae"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00508-of-01024.json.gz": {"num_bytes": 319013108, "checksum": "176443b39840826bfb1db2cef2541449a6fd0c465ff9bbf0cb2479f07fb8baa8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00509-of-01024.json.gz": {"num_bytes": 319832758, "checksum": "cce5a142cd7a121eba8c182d499442f4b0a397ea1484c33ccd79b1acbae832fb"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00510-of-01024.json.gz": {"num_bytes": 318762241, "checksum": "bfc910625f0fd6074955906bb86e789b0d0adcd1f8956cb8da276933dceac256"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00511-of-01024.json.gz": {"num_bytes": 319240643, "checksum": "ce53021b90d1c86e2d46293e7053aa174387d7408bf0cf907898be69b1a7befc"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00512-of-01024.json.gz": {"num_bytes": 318353376, "checksum": "e9333c6f73c30c9cb7f31794025eb9129455fac2edd64f8b3f22f879124c6a85"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00513-of-01024.json.gz": {"num_bytes": 317653011, "checksum": "d9450c6f541e82922b37d3b7cc25611707b44884f27825db4dbd65466b59e8b5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00514-of-01024.json.gz": {"num_bytes": 319391160, "checksum": "20b77f5fc2a939fc291f901e8774acfbf04ffaacb08192b724673eadc9f83c12"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00515-of-01024.json.gz": {"num_bytes": 317994258, "checksum": "32ca1f60d0deb395538a93ce5044a48fde05864f2c26af42dc53405b6dc05031"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00516-of-01024.json.gz": {"num_bytes": 318786801, "checksum": "eba4f34749eef4da2b0729abbdfa2ada77bd65383c01213d4f86625670430a65"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00517-of-01024.json.gz": {"num_bytes": 320010732, "checksum": "617765f971b879182db7debf879025f8dad4fd8846b11728ee1230767c031c04"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00518-of-01024.json.gz": {"num_bytes": 318681019, "checksum": "6987893764c56b84fca014532824a05d4187db5c313be4f7bdcb363b7e8cc8db"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00519-of-01024.json.gz": {"num_bytes": 319951543, "checksum": "ba151c4734db52e7c220dbefe380825ac6d66a9c6abb901b8096a87d97a2deb5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00520-of-01024.json.gz": {"num_bytes": 317948056, "checksum": "7e53ed26c3c068b0dedd026219b7cdab79775545ebbf31b5dadadb45364c9985"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00521-of-01024.json.gz": {"num_bytes": 317993802, "checksum": "4d1d4a5583430e373bd2cfd191e59cd8911953fbd73fa924e0c15be76499b54b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00522-of-01024.json.gz": {"num_bytes": 320189449, "checksum": "71d851498785e312acf93861a43169794d4d576f5fe8b960303419316c8c898a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00523-of-01024.json.gz": {"num_bytes": 320443871, "checksum": "587867d619115c2accb69322b197239b79f12de41ae80427fd369813ad8d81af"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00524-of-01024.json.gz": {"num_bytes": 318192840, "checksum": "7324c02db00b06d0f41d6e5ebfa4e4dd6554f5f4849d6de187ebb84162d0446d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00525-of-01024.json.gz": {"num_bytes": 319294602, "checksum": "24ae3495e5b59883967c62b8fb3a4fa7525d33c40957fd5fa3be413d66c24eb5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00526-of-01024.json.gz": {"num_bytes": 319783465, "checksum": "27cd95e7bc6a3f156f1f8f26dc5e490818fc4810562e3964a19fad401cceacd2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00527-of-01024.json.gz": {"num_bytes": 317240081, "checksum": "6b84920fe7e28c01a03800512915c7a9e47816267ac652f9ee0314e3428bca72"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00528-of-01024.json.gz": {"num_bytes": 318320694, "checksum": "fec06589f714ffe1343cb6781898e29e5d0cb789deba3aa4a4ccf86514d3f690"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00529-of-01024.json.gz": {"num_bytes": 318391515, "checksum": "a98c34c04c1b6f0ca3acc9e10fdf4bd0ead2ea7271832ce4972df8677590918b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00530-of-01024.json.gz": {"num_bytes": 318473966, "checksum": "1677d541c7bc10971c711f1eb030faa2e85e0967112ba57d7f04712908e4f040"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00531-of-01024.json.gz": {"num_bytes": 319463272, "checksum": "92b5d82a058554d3396a2b54504f45fa88581cb2951140c0f0bde67ed11bed0c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00532-of-01024.json.gz": {"num_bytes": 318228175, "checksum": "291bb3d7613f7f00b6910a0de78dbab0d87602243c9c83014de341c131200853"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00533-of-01024.json.gz": {"num_bytes": 318966937, "checksum": "a0ce39eac6d6ecad3478373c264e88b2ea20b77fb2049537c229ad3da2769c85"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00534-of-01024.json.gz": {"num_bytes": 318968162, "checksum": "387db79d4aacf8fa4c512fb78023ff94a43d5d597d5a8c2ec6198e62e4b8c98b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00535-of-01024.json.gz": {"num_bytes": 319253588, "checksum": "3ff8f4a926fdfb6201a94d75c17ec5afe662a339a65019eb5e1193c1238bd388"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00536-of-01024.json.gz": {"num_bytes": 319662526, "checksum": "0c805e83d8cfd979701df5714713d062e14853d7e2b0f77c0b414a626686cd33"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00537-of-01024.json.gz": {"num_bytes": 319177095, "checksum": "f9a0ac216e316075e5c2219449a954f989eb160ead2ca07ac9f3813274e18f2e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00538-of-01024.json.gz": {"num_bytes": 320109104, "checksum": "a425ef4dddefb40bac5a8cd3191161a41737aea5088a614410d10d83bbab5e37"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00539-of-01024.json.gz": {"num_bytes": 320600564, "checksum": "3580ea8da9c4aff1296e89136c5d7f1a37d021e0b10f3ebd1e05612c092faebb"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00540-of-01024.json.gz": {"num_bytes": 319993281, "checksum": "ad8dc83bfbe7c8976f08708c5f0229cd4e1a2d80e272b225a8d208133b129dfc"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00541-of-01024.json.gz": {"num_bytes": 318256020, "checksum": "c7452669237323fdd09ce97624791a0261f3ec07d8a5f98e71a4b1252a2805e1"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00542-of-01024.json.gz": {"num_bytes": 318843744, "checksum": "1e5a11c25f82ce717302dbcd9acc1f8b916d83eca88d345d8434b1f88768137b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00543-of-01024.json.gz": {"num_bytes": 320482002, "checksum": "bbf96edf50c913d5162ee154423242e7c8faf490ba229f325bac98a5e3eb9477"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00544-of-01024.json.gz": {"num_bytes": 319059260, "checksum": "22c04506b5744df8c71727fc6527fa2bc495a10a237c71762c66d09625d34097"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00545-of-01024.json.gz": {"num_bytes": 317874034, "checksum": "84a78bb62eb6f72de7a75325870d9ecd419f77c4f6728d29609b2f7ab1b8bcf7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00546-of-01024.json.gz": {"num_bytes": 319891407, "checksum": "28631c527dc398c9626fc60b39ad94ed880b41c71f55b9c7c670f6a1837f98d8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00547-of-01024.json.gz": {"num_bytes": 319361268, "checksum": "273b8598405def0165ceaf9723d1425c9b74368fc22a414616c7ac9327930225"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00548-of-01024.json.gz": {"num_bytes": 318360761, "checksum": "59990568c0ea055fab27f2b9cd028e1c7177df0479712d1e2d8372e9b017ccad"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00549-of-01024.json.gz": {"num_bytes": 317320452, "checksum": "fd1e361f28cf099df6088e26d06d79f7f62bd8bd89b4524b9baa80ea49a1a4a6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00550-of-01024.json.gz": {"num_bytes": 319017444, "checksum": "4424833afcb143f6fdbfc2f5fa2508d6226a4a1df391969b2a751d2d0070158d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00551-of-01024.json.gz": {"num_bytes": 319118159, "checksum": "77b78f94a8bc8f905cf8b1997df1fc3b8c6d77ce65fc28bef68c6083275a832b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00552-of-01024.json.gz": {"num_bytes": 320058125, "checksum": "e7b71167c4ad947232b6acba26e4d3cc9214c25b50b853b5745333bba942f50f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00553-of-01024.json.gz": {"num_bytes": 319220671, "checksum": "ce7891f3820ce065e3bd7afa006e90889428c80bd8e771d66fbbf023bb2a9eba"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00554-of-01024.json.gz": {"num_bytes": 318858928, "checksum": "015a707235f46f179a08d3f6674b6d368dc9612841e2bf39f700f11fef8e64c7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00555-of-01024.json.gz": {"num_bytes": 320490725, "checksum": "041dd2e902ed04dfa143476da03d5fd00c30ce1259c0658150af5b77a5a092c0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00556-of-01024.json.gz": {"num_bytes": 319863694, "checksum": "22e3d9e4dbdf2b1b822a7bc8c889f4747aa16c71f4c91436d028a228bffe4b87"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00557-of-01024.json.gz": {"num_bytes": 318940362, "checksum": "4cb8b113ad9687b7dee590242c5f50fb3ea3a8775c67492a8ce0cb5c15fc26d7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00558-of-01024.json.gz": {"num_bytes": 319797786, "checksum": "ad157a34c6a8d496859f55b00c79fcedf7305d8502ca86a511026f39cdcaca59"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00559-of-01024.json.gz": {"num_bytes": 320156705, "checksum": "816d84753b71fae446428587f41de5b3490e88321f1fa0cfa2ef1fd5eef851e5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00560-of-01024.json.gz": {"num_bytes": 318346216, "checksum": "0b1b3d26316f2c0e973ff19820793bcfffa957c3869f74f62fb40cb6839227e4"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00561-of-01024.json.gz": {"num_bytes": 319571572, "checksum": "4f92594382c897bf94211f1446dbb38c2cc1fff3647acba731dfe0ad89ba4061"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00562-of-01024.json.gz": {"num_bytes": 319453711, "checksum": "2a6ba0c64806add776081f417c8d1afdb324dd8b9aebb603372afd7fc2c4cd6e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00563-of-01024.json.gz": {"num_bytes": 318990092, "checksum": "e3032365b9b86883c24bfe387d810c2d9fd1d0a55ff88acd1f5b5357246b13ba"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00564-of-01024.json.gz": {"num_bytes": 319491917, "checksum": "da6196ab8650fc9f8fa391b821ff070070946412277bd423c40d9fa1de325f93"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00565-of-01024.json.gz": {"num_bytes": 318756269, "checksum": "edeb5b13aa0d65354d78a5ca5d1698732e95f1fcba249c42825a0351d4a34f79"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00566-of-01024.json.gz": {"num_bytes": 318461036, "checksum": "f179addbca50d8612612b0e09138d7ecc89ba7ef2d6e857d7ef0b10223dc71d4"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00567-of-01024.json.gz": {"num_bytes": 319625728, "checksum": "eaa1d0ee28eb17c6ebe3d85c8af8b7adac28a720b2975f86ac83f3f4d2bffbcd"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00568-of-01024.json.gz": {"num_bytes": 318428567, "checksum": "3677e88545f2d76b601995cc3e2b6b12fcf65e350ed7eb4137ab4beef3d475c4"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00569-of-01024.json.gz": {"num_bytes": 320114923, "checksum": "2d8810d8bcfc0fc19d82313be6516b2fef4cf68f56b0448af48b512c98e1ae8c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00570-of-01024.json.gz": {"num_bytes": 319148416, "checksum": "8e5356dc0fa2b4e5fa16b36a1586f16920306af1227c765e5d2f0818e74d30d2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00571-of-01024.json.gz": {"num_bytes": 318223973, "checksum": "c87cf8b88e8e4fc0a664f4b3a381b78b317680253a83a672cb86e02adb43f2aa"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00572-of-01024.json.gz": {"num_bytes": 318322508, "checksum": "2bdc857dfeab99c8f83f0267ed5ed7529bca8ee086fce268534bc0264ff738f6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00573-of-01024.json.gz": {"num_bytes": 319203246, "checksum": "564fc77dec25ce0d47f4e3d8d04bf114dc06119b28b3ab00d6092a799d496e51"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00574-of-01024.json.gz": {"num_bytes": 318397937, "checksum": "dc3f206e1b5da963184da72e47959844bb164335c76e3261f3a189a4b7b022cb"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00575-of-01024.json.gz": {"num_bytes": 319183651, "checksum": "7f0c46955e37d5d52b305f71b4ce4fca5368d72e8698e8b832ac0177f868e145"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00576-of-01024.json.gz": {"num_bytes": 318690625, "checksum": "b37d0fbd439bdc05021a71c192ce5e61ebce27448a17819bb53156d9d5f27e17"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00577-of-01024.json.gz": {"num_bytes": 317926085, "checksum": "3092d1ad70fb2d262ecb33f3fb6ea554af3ddd26498ba42b644c383f6d4bd1a4"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00578-of-01024.json.gz": {"num_bytes": 319190472, "checksum": "d9833fd591a618a167b31b7aaca420f3e719ded98987dbc0f46fd4bfd12564c5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00579-of-01024.json.gz": {"num_bytes": 318958744, "checksum": "a11217af10c85ad828de38847eeddcde6af6899563585d581c20adaed3c9e7dd"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00580-of-01024.json.gz": {"num_bytes": 319893900, "checksum": "71e8be705bfa8563e33392d1c14decd84f52d6a0139b98344f1a0ed9bdc94198"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00581-of-01024.json.gz": {"num_bytes": 320109861, "checksum": "c5f13ba973803ef069762d22bc37ee02a4348af379c75848d93b2685fc4280cf"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00582-of-01024.json.gz": {"num_bytes": 319238177, "checksum": "da815527ca68b5c2ed604d00ccbcc7c631c60f33e3132f79212634a82c266844"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00583-of-01024.json.gz": {"num_bytes": 319375634, "checksum": "a332b791df0801f0b7227117f0ea3971563e8e420ae24dd94b38d532c1ab0573"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00584-of-01024.json.gz": {"num_bytes": 318596018, "checksum": "e6496d31f42921eaf9f85047e7c2eeb5fef46e01e99760fa676da96481d7d5bd"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00585-of-01024.json.gz": {"num_bytes": 320156294, "checksum": "08b978ec05d65edd22c301ddc6ab44174eeb7bef5c5997a84342b6faaa47a79b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00586-of-01024.json.gz": {"num_bytes": 318716838, "checksum": "567ce600ad99e543507fdf27b9009fe1782bc867f44f3dabbeb93fab1208f337"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00587-of-01024.json.gz": {"num_bytes": 320247814, "checksum": "8f5c82f5eaac4a315d8615c9700cd81f3b9c2e1a17376d3b2482f8694dfe2492"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00588-of-01024.json.gz": {"num_bytes": 319546079, "checksum": "bae91422f87091b3974ca92781a14fae8f10c5c41de9c9132f745b3dcb8bc468"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00589-of-01024.json.gz": {"num_bytes": 319771959, "checksum": "babb615d77f80e5ef99aeed3889a26cef5c9918a7fe68b70a503815e69b0b189"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00590-of-01024.json.gz": {"num_bytes": 318926571, "checksum": "61f2ed732f3b2b5e24882f47b4eb84fea28bf89d112f6f173cbb50523a43c4b8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00591-of-01024.json.gz": {"num_bytes": 319669791, "checksum": "3aa2e792ec775a52ee78447b81204867e58b0a46727bab4b7974977aaec2889d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00592-of-01024.json.gz": {"num_bytes": 320393142, "checksum": "1419c263fb74409cb0e39ebd87b1c020ee6863a3a6f2f427be27d3c76b84043a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00593-of-01024.json.gz": {"num_bytes": 320977171, "checksum": "4f16f33217c35a2b155d5b6fe8014c2e52014e63c419e7d3aaf71a35246c1323"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00594-of-01024.json.gz": {"num_bytes": 318211092, "checksum": "c9301ddcafea22d085ae48f551f486e73089a76c7990871f787064c61e4e60b4"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00595-of-01024.json.gz": {"num_bytes": 318978629, "checksum": "349e104763320eaae96ac3bc53c5fa7a73e7dec93b8cc3afaad108a97e7c170d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00596-of-01024.json.gz": {"num_bytes": 318573003, "checksum": "0eb6c25cf57764ec3aa7f74d6d967c52003f872f2f3b140fe6d5ac6360241a8a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00597-of-01024.json.gz": {"num_bytes": 318931514, "checksum": "b42b7b984aad729185ca9b3a6ffa856b2a79165ce2feebe519b10f8ff42c4ab9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00598-of-01024.json.gz": {"num_bytes": 319002677, "checksum": "8306c5971408767b3735288fd0ee7ee7d01d9af4ef4cbec2e57c97b1f78e6d63"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00599-of-01024.json.gz": {"num_bytes": 319637870, "checksum": "844df34f2a263011f9d1d85eaad5a1d95243769e9cec5a104807dd55e1fe431c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00600-of-01024.json.gz": {"num_bytes": 318099852, "checksum": "b05e66568a4472feee31f20918e9813aeae2d881f47b5281ff29fbcfedf4d5b2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00601-of-01024.json.gz": {"num_bytes": 319136069, "checksum": "8dff2d56c9915d73e6154533e5de0ca9d867c5fdedcfeceb3e0ab22f3ba509cb"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00602-of-01024.json.gz": {"num_bytes": 319369121, "checksum": "45b2c1757260395afeb168b545892b315fa0bf14b3d144bfcab1fdaa6d79086f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00603-of-01024.json.gz": {"num_bytes": 319499076, "checksum": "46edc9f556ccae692900b222b8e4843360dd5dbe0798a8ad9cb51c07a451dbb2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00604-of-01024.json.gz": {"num_bytes": 319132921, "checksum": "0cba8c8738ea7ff9a08bd1bab215010b03c6c83fe35206d83344d78005bdee6b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00605-of-01024.json.gz": {"num_bytes": 319315562, "checksum": "0dc0d37658fd672c8d72775bd8855dce9037cf9715feda35a76afb1f0e87bebb"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00606-of-01024.json.gz": {"num_bytes": 319223528, "checksum": "f679e437a3acda1a81013dc0f3fa93fde6c3309905e8142f8699a76bc04b7114"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00607-of-01024.json.gz": {"num_bytes": 319326218, "checksum": "7fe91f86f751b9aa3abf1c5ed0fdab89a76c7fa4eb7ab8b809ef29b0cf4a78d9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00608-of-01024.json.gz": {"num_bytes": 319393715, "checksum": "a5daf706100eb797b5b0770fe0c790856637b22dc849aeda5b445ae5fa63cb3b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00609-of-01024.json.gz": {"num_bytes": 319554192, "checksum": "4434338fe97d398d9565ae940c62539e868fa261be361ede1b5b0feb004160f8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00610-of-01024.json.gz": {"num_bytes": 319786301, "checksum": "6b0d0e0457a721af6c67a31f5016432011e717302cfdc7ee39feb253fbae4754"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00611-of-01024.json.gz": {"num_bytes": 319356910, "checksum": "bfe201b1775270afef3a09fcfc074920cbb01093eef90d46f26b6b813d603994"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00612-of-01024.json.gz": {"num_bytes": 318780229, "checksum": "29248c4732fdfda2ba97ed38192ab391457e20fd70f713ef4a7cf084f9865846"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00613-of-01024.json.gz": {"num_bytes": 320190496, "checksum": "f5cb9be2442797d967b9041e48771196a6c0595933ef2102840b704e355f4d62"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00614-of-01024.json.gz": {"num_bytes": 320245862, "checksum": "89b74d0daea02fb69289ad259bbd0ddb1a64c5d6380848f7d51669be952f8a0b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00615-of-01024.json.gz": {"num_bytes": 316874605, "checksum": "78600c8703d5ebf80c99c089bb7a7c1cde843a66d706fd219eeac304f80e8525"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00616-of-01024.json.gz": {"num_bytes": 320237707, "checksum": "630ee29d4dc4cd5062eeca7877e5c1b204b36eb0b3aeacadf036cdb75c1ce840"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00617-of-01024.json.gz": {"num_bytes": 319739365, "checksum": "d418fd284d06b1d2d9daebea3047ed06286640ac75d23893f1effc2ee9d7aa14"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00618-of-01024.json.gz": {"num_bytes": 318634299, "checksum": "f5d75d129ab6c0f052028cf0139c3cf20eed3a9c5cdb151cd88ae42d5d1a32d2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00619-of-01024.json.gz": {"num_bytes": 319086471, "checksum": "c558908f6e08b0d02f377c9aed1655d80106f4cfe26e955774bb420d19b2f74f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00620-of-01024.json.gz": {"num_bytes": 320665446, "checksum": "977f959e5b5eaa24081ce025d137647fffd65f1a54d2c45db9805a232e0c0364"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00621-of-01024.json.gz": {"num_bytes": 318576410, "checksum": "d07f3c31d7ec1c71b5ab9539a2ed49f6d5f46b48ee2e51800b9e28cee588a163"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00622-of-01024.json.gz": {"num_bytes": 320053075, "checksum": "58b897603eb83f789a1cfc6bf40a091093cbd8a0c20702018c411adc7b07a437"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00623-of-01024.json.gz": {"num_bytes": 320045187, "checksum": "3665d7579b3c57eb21ec9e55850e39307cc6f4ef8aa8b9937076ad6f142063a3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00624-of-01024.json.gz": {"num_bytes": 320136842, "checksum": "35db069ae090e95c5a4d3db44eae73bcb29463c120584d7f6ccbe235983c5fef"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00625-of-01024.json.gz": {"num_bytes": 317314201, "checksum": "7f6ddbbc8815e8bd10c99361fd8113cbbd84ebd92799eb6958cf98af825d2aa3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00626-of-01024.json.gz": {"num_bytes": 320219970, "checksum": "4e2c46d1e3a94957717bbbf1e1e4300bd27ac17e588d426e0ba688983e83f4e6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00627-of-01024.json.gz": {"num_bytes": 320083102, "checksum": "851ce6dfa6a4d1a4e3b8bf439e36db9ceb59eefc60558d429e2fec80655e1775"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00628-of-01024.json.gz": {"num_bytes": 320386844, "checksum": "86d8927f16d0790a07d6c68e745501188d13887df4a137e937ae00497d07c055"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00629-of-01024.json.gz": {"num_bytes": 319476643, "checksum": "c48cff721137b641fe9d5bcf30462c7e4e3a3ae631b7b4e39979c8c77f0890ae"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00630-of-01024.json.gz": {"num_bytes": 317961579, "checksum": "cde626b34c6c8455227fbb18a577877b518f529b6c8e16881cfdf334f2875cd9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00631-of-01024.json.gz": {"num_bytes": 318952266, "checksum": "0401582821f7b15f0b406f7ce00c56351b8e86a3c3282bdf4dd45b2f6146ea22"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00632-of-01024.json.gz": {"num_bytes": 318261820, "checksum": "be48396ef18ce0f3650eca86eb36039f90b51737f9848086494f34fa28d60e70"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00633-of-01024.json.gz": {"num_bytes": 319748854, "checksum": "9d5c342d82fcace21de2900202c3f2af47229aeae9d487a8b77b7f5b86c05f74"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00634-of-01024.json.gz": {"num_bytes": 317806530, "checksum": "00a70705afb91f6570d17257057c15b45386597b917061686f131bd41ddce421"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00635-of-01024.json.gz": {"num_bytes": 320313573, "checksum": "22a1286582d65975ed94f0ba25bf87e94d52a55214d0a51979a3e0fd9f95e3cb"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00636-of-01024.json.gz": {"num_bytes": 318151690, "checksum": "026c699ac6fa30f9e156a957026d8fa8df72daee3407c8fdc5e0bd7d6a3b50fe"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00637-of-01024.json.gz": {"num_bytes": 318665365, "checksum": "9bd931dfc074bc99df31d7fd31a5ac1dc8c8bc75f8e87b763545cd824edcdcbe"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00638-of-01024.json.gz": {"num_bytes": 318521250, "checksum": "4b30ad531f7502ef7bc6398ab286e5c6c63d340c22792da9258ea95b496d1c0d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00639-of-01024.json.gz": {"num_bytes": 319997068, "checksum": "2bfdf36396e49ff625138d29925f54eb12b18d35f6d0bf5ca9e79194977cfb43"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00640-of-01024.json.gz": {"num_bytes": 319355927, "checksum": "d0d0ed7304b5d79318b5230a1ab48d3ed03183f1eb11d96070604a7008cd7b30"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00641-of-01024.json.gz": {"num_bytes": 319002081, "checksum": "1461ecb6b92819bfdc12808a5442d70f94538931f856c91dea602a23ba86ab98"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00642-of-01024.json.gz": {"num_bytes": 317689465, "checksum": "aa0af0169cf13db1f8133e8d76afeeae5f71d63d179794377a55b6c2eb938dc8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00643-of-01024.json.gz": {"num_bytes": 317523344, "checksum": "5c060166e776f8efda48882c118dc0fd5e058d9ef40be578bad31e477114a16e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00644-of-01024.json.gz": {"num_bytes": 318876813, "checksum": "ad98ee119742cb8a6efa1be46e9670969397c7bde10049886d7d6fceb82387ca"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00645-of-01024.json.gz": {"num_bytes": 319981258, "checksum": "8930ae8e14c124218793d2fd1bbfb1b624e918cb092b21c6ca74347abd9dea4c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00646-of-01024.json.gz": {"num_bytes": 319624889, "checksum": "a40705c4f9a4db4d2d698cf96e43b99fa0790b886506300eb4986a26de7063e2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00647-of-01024.json.gz": {"num_bytes": 319240920, "checksum": "7129182faeac82b47127458e92903a209acf8272166024e8313c167d6f358456"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00648-of-01024.json.gz": {"num_bytes": 317305623, "checksum": "3124091a6c438fecbfc948b1a35ffb1462287ae06866b02a6dbb1a6651ccf1e4"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00649-of-01024.json.gz": {"num_bytes": 318998755, "checksum": "fdb286cfe9e9091a57b31be61a56a425fae07d6b44f0b45f8743d7aab0e980dc"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00650-of-01024.json.gz": {"num_bytes": 319612451, "checksum": "ff88c4310f049344b8a3f701bce12d08ef5f9b037e82fef7f1f670b3d51e59c2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00651-of-01024.json.gz": {"num_bytes": 319098081, "checksum": "9c3b1843082aae39b057bbc7364e69cbc39bbdf91d5bff4f52b12cf1a264adf2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00652-of-01024.json.gz": {"num_bytes": 317107981, "checksum": "e6199d12a893ae5d05c5388ae7a679df419ef6a050c8e3ce3c15fe534943a774"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00653-of-01024.json.gz": {"num_bytes": 319623884, "checksum": "333ac93cf1f1f4da0f72c5e57b675052453b42dffe1e4d45ec680f4e3e075d97"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00654-of-01024.json.gz": {"num_bytes": 319055728, "checksum": "1efe352f2f2eba826231a5bff6c79390630b44039b226a5041a087e116b60f5e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00655-of-01024.json.gz": {"num_bytes": 318539829, "checksum": "613c741cfb738017b3fa233512296d9127d661738721d3fccd806aad54d19d84"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00656-of-01024.json.gz": {"num_bytes": 319970377, "checksum": "51fa9b217b6bcf664c472cc2b258813e1f1d7a0f501c29b822221bccafa4e201"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00657-of-01024.json.gz": {"num_bytes": 318548629, "checksum": "c542c6fd2f3284d64f8d53b71ab8308bbba59f7f13e9d9eb20bbbaf13ad4782b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00658-of-01024.json.gz": {"num_bytes": 319845984, "checksum": "b3d8fb6ed2258c463367108e2942742e88eac657c859cc8d128035110fc87e7e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00659-of-01024.json.gz": {"num_bytes": 318887872, "checksum": "02feb4e03020d767a4468251786d4857d5dc833969626bee616c7882bfda9ce5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00660-of-01024.json.gz": {"num_bytes": 319854892, "checksum": "a997d9187a185a29fb3bbeb1e696d32898efba8f5e9d6ed816493669f0c5ec02"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00661-of-01024.json.gz": {"num_bytes": 317599289, "checksum": "86d9189ebc534c99da5a4407624a623561b159f758fb04373a270887d0b45709"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00662-of-01024.json.gz": {"num_bytes": 318138720, "checksum": "9c626f7aebcc4fc9afd533b6c8a372d884d01f508ce49c01ddd830e4e9e8b2d0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00663-of-01024.json.gz": {"num_bytes": 318110835, "checksum": "441d4dd0d5d2ea7b6098a3fe006b9d7afd526188824a3325d44538fc5655942c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00664-of-01024.json.gz": {"num_bytes": 318996945, "checksum": "08ab0739c3565643b6a83d7091936f5d75a4d8418c956146114aa0315f205dd0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00665-of-01024.json.gz": {"num_bytes": 320612903, "checksum": "1ab7bc2d0f7c6704c97848a9325015f06228339bc52cc1fb593d9c56145e7c48"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00666-of-01024.json.gz": {"num_bytes": 319241006, "checksum": "8b1213325ceb2a2c89dffb891a31317e903d08fff911e4ba1ae66fc3bcce9973"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00667-of-01024.json.gz": {"num_bytes": 319650665, "checksum": "14676f97937eb3d0734e5f121c5f63002ba2d2c62b6c41b4b46d2fcab9ea9614"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00668-of-01024.json.gz": {"num_bytes": 319198651, "checksum": "a406fceed5b7d17ff6d5773679c3df50e747215e39926228ddc9a60c6bf9d152"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00669-of-01024.json.gz": {"num_bytes": 319363200, "checksum": "1d3267d77f43d3d720dcd79c40bc3e8c0cd777d421b1b7d0e69e140199e34552"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00670-of-01024.json.gz": {"num_bytes": 320079826, "checksum": "85111c229b8fcc8428b3c13676bde8268f027fe06e1f576a3adcd82bce1603bb"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00671-of-01024.json.gz": {"num_bytes": 319494773, "checksum": "eeeed8d9f63a5c16ab9d62454fae5bef1896973cfa69cedfcfaac4565a793b27"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00672-of-01024.json.gz": {"num_bytes": 318304853, "checksum": "6793ec3ffbc147c36e471e1c06a664ac2143408c9ee46305694708eee0fb38cb"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00673-of-01024.json.gz": {"num_bytes": 319031236, "checksum": "3c886ff71973805a59312d8d43ee9e616bcfafd76c03a64d53ab548036b1fa90"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00674-of-01024.json.gz": {"num_bytes": 318647345, "checksum": "fd7f4efc0c8af611e7e137680342843d0471ca072421ab3c172a169ba2f5d217"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00675-of-01024.json.gz": {"num_bytes": 318313871, "checksum": "3b797b2ad717749a24866a97acb95aace0dd4e91ee7d51dcf1fdd46a9232b794"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00676-of-01024.json.gz": {"num_bytes": 318858652, "checksum": "2ccdf652fd413dc624643d35a76223e8a44e6241997841ec2d13ae11b56400fe"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00677-of-01024.json.gz": {"num_bytes": 319236091, "checksum": "bbf069c696f09e5467b17ba98479948a85101efa776094084e37581e72c01123"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00678-of-01024.json.gz": {"num_bytes": 318996096, "checksum": "3e3dd21861c713bd38d1803c32da1c0bc2496899648b4cffe1fa2e61b35ca056"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00679-of-01024.json.gz": {"num_bytes": 319915466, "checksum": "6ed56468a31564cb25668ceb5df325ff7138dd231afa85f676ac7af5e81e0642"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00680-of-01024.json.gz": {"num_bytes": 318537417, "checksum": "959ce407e7a892495c477b9e0071dff496fd20db9cfb04dd035ac59dd5b2f309"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00681-of-01024.json.gz": {"num_bytes": 320181225, "checksum": "0aa77d778f24bfdc8566b390a7a1ef1d7880a42b98b3e82e9b37ee3ed821a8e5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00682-of-01024.json.gz": {"num_bytes": 319087756, "checksum": "a4da802570ee7bc27e752069612b633edf226078f48d5f55280f73a6dc934127"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00683-of-01024.json.gz": {"num_bytes": 320019766, "checksum": "587497efb7bcd4ca85ec0559e372ea285c1b95e3889d406f142cfe454d8e0e2f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00684-of-01024.json.gz": {"num_bytes": 318814245, "checksum": "6e904f73976ca18aed3375d1c1b308d749b9a4405a333dd0a2cf85360822e205"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00685-of-01024.json.gz": {"num_bytes": 318586686, "checksum": "c51012772c5bae73821b67f72c035f22a40725d42bcf51e439bbdfcd84393ef2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00686-of-01024.json.gz": {"num_bytes": 319648436, "checksum": "890b7408abd0cc04a84be3a3992d05714dbd30a9d33a8a9b05316a980fe51313"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00687-of-01024.json.gz": {"num_bytes": 318909835, "checksum": "b54b20c21ae9834b630a8aac057d47069cf137577d30b91fd1475f5824b61561"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00688-of-01024.json.gz": {"num_bytes": 319381735, "checksum": "422091d5ba0d44c64bb0c84ab4757318414bc01455a97f53190eddda89c2f3f4"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00689-of-01024.json.gz": {"num_bytes": 318995026, "checksum": "ad5080fbddc914c649027d5e2214f1d75e0cf0617eb3ca0b1fdb8ed9129f99cb"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00690-of-01024.json.gz": {"num_bytes": 320745318, "checksum": "d45492346bb4bf519e657356ecf1805b6b592683b98c20c93da2f07c50b06092"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00691-of-01024.json.gz": {"num_bytes": 318575084, "checksum": "43a07e8a98bc99f381558c938fc83acd4a37d565459c0f3f83aaadda816f66c8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00692-of-01024.json.gz": {"num_bytes": 320651368, "checksum": "21a790ef1dcc9c6ffa071d1a2e21e330d6afcb45368dde9cfae8933c6d029742"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00693-of-01024.json.gz": {"num_bytes": 318429145, "checksum": "85558018ee61e33c4f3e05acc2029e69447a5717be880e9a0aa8fa715dbd0c05"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00694-of-01024.json.gz": {"num_bytes": 319562061, "checksum": "894f4c906a33c644ea80c3a00155ced807a62e1bcd9f6e254cb6c88efeedd142"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00695-of-01024.json.gz": {"num_bytes": 318298964, "checksum": "06eb05f651f1d2fff495c48475894420334070df10c051c7253b7afb0bc38291"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00696-of-01024.json.gz": {"num_bytes": 317473664, "checksum": "59ea4f951335553945a644f7628403ba1a99a27e0d93fcfe5db18cbc3dd48ce9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00697-of-01024.json.gz": {"num_bytes": 318839008, "checksum": "f0203b0f2caa3287b8f7a64288af52bafbf033bcdf31dae54e501e4da47b9935"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00698-of-01024.json.gz": {"num_bytes": 318288032, "checksum": "fe2a581cd174429a81424e407aceb1d81b61d9796d74db4590327778fbd5016b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00699-of-01024.json.gz": {"num_bytes": 318696527, "checksum": "edf3aabcdb28fa2feb532b3bd55cd167c2200a6d8e19f05152be194e48acf87b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00700-of-01024.json.gz": {"num_bytes": 318900366, "checksum": "67d89417d1440afeeefd59a0993e4d12fb5731e917ec7f4e65d9319541b4b9e9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00701-of-01024.json.gz": {"num_bytes": 318901212, "checksum": "64d302459e6871325282fd890d2922cb1fb25b47d677ce793bc065acc8d1bd07"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00702-of-01024.json.gz": {"num_bytes": 318913325, "checksum": "f0bb360189166a0bd717bad85edf06943333b1854687839864aef3ee02814795"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00703-of-01024.json.gz": {"num_bytes": 318730274, "checksum": "c4e027079b9cf9b1adae3e285c5cc5dafeee5c74cf3621c424b6df9801d508f5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00704-of-01024.json.gz": {"num_bytes": 320112232, "checksum": "37540f6a00523cbf429764893aa15aae6a57e53c89cf51d82a815feef02b1210"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00705-of-01024.json.gz": {"num_bytes": 319643559, "checksum": "9dae018569fa4bf33674f67ba03732a2f85cfceb53ec2cbb9457eaea607b8dfa"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00706-of-01024.json.gz": {"num_bytes": 319941519, "checksum": "03926405dc629f0664a3d27c700a4fa2f606496f0b52a9bbf2fd2d75faae2f46"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00707-of-01024.json.gz": {"num_bytes": 317628508, "checksum": "fac92295e4c85f087d27e0a6f231d782be7b2448e99cfc42c09c0e1e20964c3f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00708-of-01024.json.gz": {"num_bytes": 318863059, "checksum": "39d4880d3e47e65ab6351e94b015810d66295a86a9f08534260ccbef41fdaf04"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00709-of-01024.json.gz": {"num_bytes": 318412651, "checksum": "044fc99a1307737bc8d6d8a9b67997010309fc695eda6e8dd42e5b6bab2256d1"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00710-of-01024.json.gz": {"num_bytes": 318631334, "checksum": "0b2c93cf298051864b8660e57182b38408ad738cf930afc09afdde26d952f819"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00711-of-01024.json.gz": {"num_bytes": 320587866, "checksum": "f1f6bb9770b76742d0131495879fa38ed8aebe8a0b38463e7834f0697f174ede"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00712-of-01024.json.gz": {"num_bytes": 318191204, "checksum": "b6873a7d375aa29ff39ca17c3bbc7e328292b1671b59a35e7b01c0e992da90f6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00713-of-01024.json.gz": {"num_bytes": 319472539, "checksum": "3bb12a0a806ecb8a5eeaa00188c655f399460609b8a19005a7141bbcb3a7a694"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00714-of-01024.json.gz": {"num_bytes": 320196397, "checksum": "ca6e1fa6f27c9dbadbbaa767fd21dddee7c84ca96bbb6735640ba2631668ad0e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00715-of-01024.json.gz": {"num_bytes": 320075706, "checksum": "1a773eec7d738c0e1e253bfd4533f0c43c0d133e564c3458159e0c47d767689c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00716-of-01024.json.gz": {"num_bytes": 318736413, "checksum": "c17a6b2115e56cc3d6bbbd94e8565fb14287057f80199528e6cba20adf557bf7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00717-of-01024.json.gz": {"num_bytes": 317351537, "checksum": "cdba391e16c3bcb5569d978a8d11518103e7687714710ef4eba4f7c0821d67d5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00718-of-01024.json.gz": {"num_bytes": 318017965, "checksum": "a25c494e4baead0af0afe6eabaa054bc15f80b6ca0ac8dadb1b354d72ffbe63b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00719-of-01024.json.gz": {"num_bytes": 318124432, "checksum": "94f5dfbec85a8c5b22ff1368a16ec2eb7fb4be25c0c8f004096156ae40bfa2bd"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00720-of-01024.json.gz": {"num_bytes": 318235852, "checksum": "c0248326e698599dcad01eca25d747c138881c61b5636ba765b21f9cd0df996a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00721-of-01024.json.gz": {"num_bytes": 318817834, "checksum": "c11df487a966e748cec522fae4ed76abf3e8cc9bcd28c301117fa52ddb83dc6d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00722-of-01024.json.gz": {"num_bytes": 318553851, "checksum": "63d3d0c3f5dcdff29a0a6ef41e3a9df3fb505c73c8554839e3032293a78bae2e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00723-of-01024.json.gz": {"num_bytes": 320174720, "checksum": "29c97bb8ff301080547255af29bb5019a2c1fbc74f0a2711e626461d5a5f0b54"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00724-of-01024.json.gz": {"num_bytes": 317805413, "checksum": "65f8932f3c77b0fee5f2224643a71ff95246720368fe66d45c22df25ea4b9c2d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00725-of-01024.json.gz": {"num_bytes": 319460597, "checksum": "dc785a8aa3a1f4ed77512d51a9139dfb24b356b5499ae67dd5b860101b1e0e4b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00726-of-01024.json.gz": {"num_bytes": 320934004, "checksum": "45d857536d3535d08cddb6cf50d08d89cc28138a5be082465c3a8c27c02ae2bd"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00727-of-01024.json.gz": {"num_bytes": 318393879, "checksum": "e4a02e43eeabbecb81b971f4201212104b6214078cafd9500d5b5f323595f060"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00728-of-01024.json.gz": {"num_bytes": 318826577, "checksum": "cfaa0d0c8dfb333899c73e0c2aa00dfdadd00e5b4a3d477e7518c4141899c8a7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00729-of-01024.json.gz": {"num_bytes": 320390067, "checksum": "528fe99b0c8dc917ac0f02a555603f9ae81e690b4ce1040f65ebbad3390c0426"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00730-of-01024.json.gz": {"num_bytes": 318156386, "checksum": "786e6913b4417a87cd4cb1882e181d8b2e1eb4b4db5b4b9ad2120b5efdf3e2ba"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00731-of-01024.json.gz": {"num_bytes": 320013543, "checksum": "f28fc2794c280fc1de263b9b2a81e42423f8dac3af7c4fbd3b3aff888821ca9f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00732-of-01024.json.gz": {"num_bytes": 318753697, "checksum": "69491eb25dbaef78235f769422e773de7a2578e678ecde29dcaa663f4ebfa78d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00733-of-01024.json.gz": {"num_bytes": 318640706, "checksum": "dfde8960d738b873bcb75abe1661fcaa096d70c76aef21846b173b8adf049bbc"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00734-of-01024.json.gz": {"num_bytes": 319447398, "checksum": "145add76dcd73916b548e7e3b161757c1bdc1f22a0f127019f24827afd6f85e2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00735-of-01024.json.gz": {"num_bytes": 319868149, "checksum": "dcd4ba95672630f89e75b70dc08cb918bbe896f5d32ffeba7d3e4921b27c1f4d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00736-of-01024.json.gz": {"num_bytes": 318404586, "checksum": "4710b1569342b7aa7ca610d8b8cbb2248a1c5fcd8c6ab3b7f875657dff4779cd"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00737-of-01024.json.gz": {"num_bytes": 319915151, "checksum": "7091dc758fd14c206514663eed0ae446178ff38e76c4cb7e711c63d419506e49"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00738-of-01024.json.gz": {"num_bytes": 319709793, "checksum": "afe1a96ced49662b14bc60b4ff8fc1f610bbc6f3c515bb73f2fade7a0ba67678"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00739-of-01024.json.gz": {"num_bytes": 319789716, "checksum": "9e2332cfc994483d4b913c6556ca9c1698b95e81033b7bbc5a4f5271e5cce708"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00740-of-01024.json.gz": {"num_bytes": 319102226, "checksum": "61ddcc3af919b753638dd46f18f790d7783cdc3090dfddbbeb40faa93bed340e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00741-of-01024.json.gz": {"num_bytes": 318717589, "checksum": "aa3038c23a37561f2ba92e95ffeaa3e3641c1a69f8688b724116edd128e9ba52"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00742-of-01024.json.gz": {"num_bytes": 319456536, "checksum": "ea9d23abfed6e3e8ab900291a3bc1faa27751ff94e35378f8c4eb07207036a9c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00743-of-01024.json.gz": {"num_bytes": 318641730, "checksum": "6efcec6cd087be4eaa98491e463d0fb9c1253aca275971de08c56a20be9aa579"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00744-of-01024.json.gz": {"num_bytes": 320264992, "checksum": "71653351253c8f7fa18673a3f956bddebd158978708c5a4c9e9b5318f598e1f4"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00745-of-01024.json.gz": {"num_bytes": 318665967, "checksum": "347dfd824d6f4afe58c6f418ab5d332909038c880f4dcda7f774d3d7a588c3f3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00746-of-01024.json.gz": {"num_bytes": 320005833, "checksum": "812bc3c082e3a65c8c77fc7767bb435f9be9a999961d84eadc9e0c602e5ce168"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00747-of-01024.json.gz": {"num_bytes": 318575441, "checksum": "a4414d376c69ae8dd5e60b206315cf920d5a797c6ef7c08fe0c4b4e28b4eb4ef"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00748-of-01024.json.gz": {"num_bytes": 319266882, "checksum": "f08aee694b85d5e7120652350bfafaa05495e609aa6d2fb0b913ed8a718d7dcf"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00749-of-01024.json.gz": {"num_bytes": 320205042, "checksum": "b3402b16a5cc817d89a19fd3456a50b5b6d5f3f555eea725167558cc85366d12"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00750-of-01024.json.gz": {"num_bytes": 319198252, "checksum": "6b95232f6d53cff8045bd5ebaa87d6e6c511a74dc646d2a960eb87e801ff4f2a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00751-of-01024.json.gz": {"num_bytes": 317855407, "checksum": "badc9d82efdbc8db5dc328e8aa5e80155c52f00b105b136d8c5c948fe237d61d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00752-of-01024.json.gz": {"num_bytes": 320283992, "checksum": "67c32eb497533d6fd20b206c38483d171275029ff525bba3da13b0c62e1ef073"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00753-of-01024.json.gz": {"num_bytes": 321030653, "checksum": "5e95b1cb54d7d7f12bec1559ababcab0c364a0af99e10a42a08357647ef5d3cc"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00754-of-01024.json.gz": {"num_bytes": 319059779, "checksum": "32cb59ad16dfda8a5b52615498fe2e6d85753fa44ab667af2f525a2467508da5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00755-of-01024.json.gz": {"num_bytes": 317737268, "checksum": "0ad2fef2fe37d59b163e29c2287938a768ee87acc34752394809295d0710c602"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00756-of-01024.json.gz": {"num_bytes": 317293218, "checksum": "db737ceace329fb1f8fe1aca38db048a1dedcb5226a4132485f26afecdc6c3c8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00757-of-01024.json.gz": {"num_bytes": 319529375, "checksum": "8b823e97964894189a13df393e1b3978342fb24bd81f07af6e54b7bfa2992796"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00758-of-01024.json.gz": {"num_bytes": 319297548, "checksum": "3f31d7ad99d88dde757a651b12db909a30cfcae5796fe3f85722598d92344ba5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00759-of-01024.json.gz": {"num_bytes": 318154496, "checksum": "a4b780127d6f22aed49d155e234e21a847a60626143a8e7dc6e31a5f204e79f8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00760-of-01024.json.gz": {"num_bytes": 319386997, "checksum": "020e68dc60004d0661de8a22fe2b9fa7f481fcecaef8fb06efa43093a2a9cc52"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00761-of-01024.json.gz": {"num_bytes": 320035555, "checksum": "8d7b5a97770a062276ca909a3bd20365cbaf3931fcbeb8b7e479f5ee03b47053"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00762-of-01024.json.gz": {"num_bytes": 318099583, "checksum": "b8fcbbf9b55cde2ff66ca046884870e1e5f2d2a729a8eedb253c16fe0d7658e0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00763-of-01024.json.gz": {"num_bytes": 318354409, "checksum": "ce2d9e44161b13f6226cfb9f93ad42fa0edd18eeaee923c8ab31c25aec1fc976"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00764-of-01024.json.gz": {"num_bytes": 319181291, "checksum": "53ed1ef77f24bdd7c189aae0905d63be97f48aa3233fda139e59af53baab242a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00765-of-01024.json.gz": {"num_bytes": 318147738, "checksum": "26b9b9ea2f94b322c03d1b83b25ab4e9a1a203fe9923728c5dd91f22d5f8fef5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00766-of-01024.json.gz": {"num_bytes": 317964368, "checksum": "e59fec52abde3fb4cea58a5a4e511f4cc61e21062bfdd1e3ffd60131a847e0ea"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00767-of-01024.json.gz": {"num_bytes": 318750919, "checksum": "0e5eff983e793a3d7cdd1ec85a45d58e5e6ecf7a12cf83a01888e148ab08acf9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00768-of-01024.json.gz": {"num_bytes": 318978892, "checksum": "171509b0bed8854b6de92fe146993be80ab31e0aa56953c7b0a66eeb738ff70a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00769-of-01024.json.gz": {"num_bytes": 319386097, "checksum": "704e7daa85c0e3ac974d51a6e2cf6df2ee053613fd2b77b5fe16d10b29a50a4c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00770-of-01024.json.gz": {"num_bytes": 319623528, "checksum": "e787064473427fe17ba95d9326d009e9723148fb314a7a9605dcb6698854dad5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00771-of-01024.json.gz": {"num_bytes": 318911381, "checksum": "c54aaffd8162b30280e974e81e9d0669357b74394e0da2d1ca2ce613f5715e4a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00772-of-01024.json.gz": {"num_bytes": 319386949, "checksum": "2f9c83681632482df6c65e4c70718c83f500305ee1d061626cdef35bd794a412"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00773-of-01024.json.gz": {"num_bytes": 319962599, "checksum": "f47c487ba09051c9a4bf320d69db9546e98948e3de68050ae2ba025c71e09146"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00774-of-01024.json.gz": {"num_bytes": 320370991, "checksum": "69a1eacfdb6f6fd49ea2b729a7ab291b96fd5bd42f993e2306d044871b069aa7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00775-of-01024.json.gz": {"num_bytes": 320433220, "checksum": "d35934fb537d1283d40897d05c1486f629776fe9e4ef127694ecfd0221f860c5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00776-of-01024.json.gz": {"num_bytes": 318809986, "checksum": "9079970aa1618b6be51caeab7a2cab26e61c30aa53af361a6184ef6249bf65a1"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00777-of-01024.json.gz": {"num_bytes": 319617796, "checksum": "5e200e354ece1713a32a3e1ebcea33412de814dd5843df3523afa1ec9a4d5275"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00778-of-01024.json.gz": {"num_bytes": 318039278, "checksum": "b79309eb335c0c860c85d2b724df52c3613f61b92ab6cd6276c2be8c25a7b01e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00779-of-01024.json.gz": {"num_bytes": 319078058, "checksum": "fc6053d53255e4d4a4c22c42049ce3eabc224320a51c94c1116f3201f87b377b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00780-of-01024.json.gz": {"num_bytes": 317637428, "checksum": "e38c933003910b02beef64af2d330f32af6e6f3b7346fa121e89045c136c13af"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00781-of-01024.json.gz": {"num_bytes": 318792407, "checksum": "b6795b4db199f7a7a92ef195aee3753e5e00df05fad2d8401b2b9feb56d71a76"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00782-of-01024.json.gz": {"num_bytes": 319081289, "checksum": "dc20640bded03596eeec689f1293be55e72d138cf0c576df9768c7631931ceb9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00783-of-01024.json.gz": {"num_bytes": 318663257, "checksum": "ac2b4ee9ab8f25ec010a17358d2f3f1fb9d8d50c9f4b73357429277710e6564f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00784-of-01024.json.gz": {"num_bytes": 319687102, "checksum": "fb93dee8a974f2ea204c240ed4c24e1b64f91ccb421070be305487e4e53ca083"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00785-of-01024.json.gz": {"num_bytes": 318909034, "checksum": "2f298b358cc619fa72097e3dbd9ac91e7dc3f7c5f9c4f2ff6881c988921d2a6c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00786-of-01024.json.gz": {"num_bytes": 319213094, "checksum": "60ebe35e0f23ccc61fc0eedc891ea9deb43001beb8205d31360a05b5d58e31f0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00787-of-01024.json.gz": {"num_bytes": 318335621, "checksum": "a7b0aa4dafdda2f3dc3c1832b71d4a92af08f99a70a315b4cf9f60c1768bf2c8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00788-of-01024.json.gz": {"num_bytes": 319444037, "checksum": "874dda510a01a2f78e51d917d309bcf1a0f21e7e1ca46661f93931a6200b3d01"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00789-of-01024.json.gz": {"num_bytes": 317955670, "checksum": "ec949a05ec7750dacfdf692c1ba118a33454097fdcaa56626fb042eb93933811"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00790-of-01024.json.gz": {"num_bytes": 319033823, "checksum": "0939164a602d7c7140c619130977b6814639122d0038aff7bb840093def5172d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00791-of-01024.json.gz": {"num_bytes": 319366402, "checksum": "fd6ea942b3402b5da4acb1a03bf59b17df402e90c47dbb66fb198ca2f4b5e1cc"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00792-of-01024.json.gz": {"num_bytes": 319218667, "checksum": "9e8af5aaa6d5ed915eae334c6101948fbcc7bcf6c8c6beaf80fd1adecd67b078"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00793-of-01024.json.gz": {"num_bytes": 318865241, "checksum": "675330d6736a677760d854dcdd9a174eb7c1d426f94e34836a048c2139befac0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00794-of-01024.json.gz": {"num_bytes": 319384084, "checksum": "fd4c2623d9cbaed3fefd6bb88c2d88b58fe8f08e9e8ef0cea6bb22cac68dabd2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00795-of-01024.json.gz": {"num_bytes": 317654308, "checksum": "157533ddb56290662e25cb60842327daec23e377e116496338c9313cbf6991b3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00796-of-01024.json.gz": {"num_bytes": 319298258, "checksum": "fd90f055499095efa9cb848dee62406d25820f929554b0e07674d4c95db574b3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00797-of-01024.json.gz": {"num_bytes": 320048871, "checksum": "e089a95e96a081dd76e38acf9506bfc7b86c682892d3a8774e9784019db39306"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00798-of-01024.json.gz": {"num_bytes": 319291246, "checksum": "e29133ab6f83c84a69752a451053dfe20887ea884e09cc373afd89bba7458664"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00799-of-01024.json.gz": {"num_bytes": 319175282, "checksum": "8f3f3a67946615bdf499d64341d200477280947e5be8538748e28db768115947"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00800-of-01024.json.gz": {"num_bytes": 316687275, "checksum": "c9a17dc92658ce5d062af25e5c8610a7fbae501627cfc7324ace7ca6a8d75d8d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00801-of-01024.json.gz": {"num_bytes": 318710698, "checksum": "4b7d1e130fd8ba536da073069221f68d567492b2bff27d8769fb4ef124cec3a1"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00802-of-01024.json.gz": {"num_bytes": 318914381, "checksum": "9f186b8d08f5d3090b7c9eb8a6954cf3202caec7cbf5c308221333cd115af561"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00803-of-01024.json.gz": {"num_bytes": 319111424, "checksum": "117b0590a976805001a879c49c42db55579e5bb9a5d4db9ce20e42746f59d574"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00804-of-01024.json.gz": {"num_bytes": 318186018, "checksum": "ea376d6cc1043dee9a00e1eca1c431aa59755d8966162701817f9cf274a758c2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00805-of-01024.json.gz": {"num_bytes": 320382848, "checksum": "1e69e7896202206f9f804b2497c4d99cca5c1d139efc782b8ede2cb88f68b48b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00806-of-01024.json.gz": {"num_bytes": 319508172, "checksum": "9da7e230c7abed9beaed9d6090efa8ae1029a418dbbf6d04bb4386aafde3dbce"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00807-of-01024.json.gz": {"num_bytes": 319995091, "checksum": "2e3ba0dbe85c004c6a23b4caf340282e0d0004ab574a14bedc9c83c67cc2c0c9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00808-of-01024.json.gz": {"num_bytes": 319880961, "checksum": "f53fd08fea0f874d727422357521176c6810a54abf4fcc7019357b50f1928daa"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00809-of-01024.json.gz": {"num_bytes": 317100774, "checksum": "dbeed220f330b489cc262fbd7cbe84f04ba8a5118ebbd8f48bc7a4f5f63ae7b8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00810-of-01024.json.gz": {"num_bytes": 319625750, "checksum": "fe5dced88ccd54b258c6740d8988e10b128a869ecf28e7096e689c59fa147d4b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00811-of-01024.json.gz": {"num_bytes": 318375975, "checksum": "e4bcc5571fdc4f51b733d975e78ff02939d3463264a02d7e651271ab91c81df8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00812-of-01024.json.gz": {"num_bytes": 319663092, "checksum": "b1e41c198bc69d026ab997fdeaa4e687f7a8ddfca751add9bc85f00481708a63"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00813-of-01024.json.gz": {"num_bytes": 319094357, "checksum": "c07287aedf6854f581aaf83b75c4939aa4b10181977d4c4be97c20989ab8f992"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00814-of-01024.json.gz": {"num_bytes": 319521327, "checksum": "c96203ba5461ef92a7a2b0d4e598efda943b5b3adf42a7268c26f1c224410c01"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00815-of-01024.json.gz": {"num_bytes": 319098749, "checksum": "72f2e65c5b482be0d9e3a3d8f5cdb703cec7a515e927bc4411e2f6ff5085ed5d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00816-of-01024.json.gz": {"num_bytes": 320377295, "checksum": "df95ac17a25cebb854088cca345f60c2634d07f088e45e251d7f9afdb334c0c7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00817-of-01024.json.gz": {"num_bytes": 319007451, "checksum": "bad1cc25de4f66ff36c69284e6b615f68bdc25e45f08e04e33ee463a0c6ef0b5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00818-of-01024.json.gz": {"num_bytes": 319609737, "checksum": "acf1b390f1c492d97bf027f06898f1dd5cf8cc6def41f4d43b38a0c99f4a85e7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00819-of-01024.json.gz": {"num_bytes": 319164157, "checksum": "3d973eb401876c57e9cd1420fc938da9dd7b08f97d4596c66a8c159e2b56b1b3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00820-of-01024.json.gz": {"num_bytes": 320181073, "checksum": "101d5f0079caa840b934c14800ba5cbb7fca22e9e6915b98b4dc5f37c57f5b4d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00821-of-01024.json.gz": {"num_bytes": 320949305, "checksum": "34ba423c93c4262234e6e2005aba0436daa99b05570cff0a58e9d27b65d76896"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00822-of-01024.json.gz": {"num_bytes": 318392521, "checksum": "4a586e220fe34f544dd068f4e1c310459cabd5dbea9a991c21c09f70079eb4c9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00823-of-01024.json.gz": {"num_bytes": 318526893, "checksum": "3b10a8e32a3a8f6541400d697516fcd3fffba3554e8d8a96451f01fc6b729d8b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00824-of-01024.json.gz": {"num_bytes": 318640792, "checksum": "c921270db8004d309f91e3209340c476191793d47b3cfa9d19fdc602d43dfe65"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00825-of-01024.json.gz": {"num_bytes": 319524026, "checksum": "a6eb347db464976ba5d1aaa4fa64e103ba36520dd1e9c103644caf187be471a5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00826-of-01024.json.gz": {"num_bytes": 318469810, "checksum": "dc5f88e6161ac06165f3cd4cb91a00cdff75d2f900e8f53d62bacfd833e352b0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00827-of-01024.json.gz": {"num_bytes": 319391185, "checksum": "66a240be851d6622adf7801d9634a456e83e9edfd135601c0dc1aab48902d7cf"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00828-of-01024.json.gz": {"num_bytes": 319625277, "checksum": "2e989beeeb2a63bfb87a5a401619a8e4155a961b44441cb5f627c29f25962dd4"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00829-of-01024.json.gz": {"num_bytes": 320001237, "checksum": "0653e4052fb7a4ef503bdfbbee332d650492e99c130a85c04250e18d91cfd30c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00830-of-01024.json.gz": {"num_bytes": 319240468, "checksum": "bd56e55e75a8237b5292fa65e5ecb0dfbabef6ef0dec6695b13522803210f40c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00831-of-01024.json.gz": {"num_bytes": 319174603, "checksum": "ca9d6c643127a390823655256a45462ee6e75aa2485141f6530a3bdf6ce4f572"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00832-of-01024.json.gz": {"num_bytes": 318909883, "checksum": "e91c35d94e183515e660cd8c874c12bbf22e1fd683312446f02287b0d032fb68"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00833-of-01024.json.gz": {"num_bytes": 319095835, "checksum": "971d9a4f8bfce564d42dc0a80009acfa7d2f47557ac19836ab426defe1877714"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00834-of-01024.json.gz": {"num_bytes": 318319786, "checksum": "159412a58fb8deb59e039fa0102bdb746065cbc6b4d1d3da892930fbf8b0f178"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00835-of-01024.json.gz": {"num_bytes": 319959334, "checksum": "814518d53b3023e3b8ac22dad9d65dd50d455a4c7db1490022f447f793f4d24f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00836-of-01024.json.gz": {"num_bytes": 317642779, "checksum": "19ad4fbaa3ff5c638b77980300b8c162c21a8237b87d054a30c46aee67d0ad94"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00837-of-01024.json.gz": {"num_bytes": 320687986, "checksum": "190de7948a4b163047ecdfc856e5f78bbff52ca883edfad26b32fbc0b57ffe36"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00838-of-01024.json.gz": {"num_bytes": 319802866, "checksum": "ccb4d342791a187f3bde225e008ff8cf70465f7fd3eacaa8bbce1ec4e52c2622"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00839-of-01024.json.gz": {"num_bytes": 318621894, "checksum": "3ff5cf5b33996a663df5783f3f41a5b5b2f6e08a2cf91e74cad3bf82291192fa"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00840-of-01024.json.gz": {"num_bytes": 319757379, "checksum": "8292e0854c01ca79ef03dcc1752ddc1f0df747ad67551b7c0fa5208b6aa3f822"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00841-of-01024.json.gz": {"num_bytes": 318779722, "checksum": "9eee9e089bd396adf5a276eddca9f6352e07f8c33877f85c1f65968aa0c06128"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00842-of-01024.json.gz": {"num_bytes": 318692591, "checksum": "caf3f40a144b43af08687e41a1eb7d08da1b78cd1600574566e11f29fde9cd34"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00843-of-01024.json.gz": {"num_bytes": 318944616, "checksum": "e74d624534091173546755ca236e5912cc8acf8cfef5f9c197b541ebe76f0818"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00844-of-01024.json.gz": {"num_bytes": 319392887, "checksum": "e47d3f44f996398b54f18729f4e81d88d04b19bc529847e86277a6a91ae74e6c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00845-of-01024.json.gz": {"num_bytes": 319215311, "checksum": "de7cffe64f422b02668137272943537946c15539954b564345d6722c4eb06345"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00846-of-01024.json.gz": {"num_bytes": 318129297, "checksum": "1d5ea0ab8fcb3975735aa421d646cea4544087f60a79ec209b63c93b6318523f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00847-of-01024.json.gz": {"num_bytes": 318134095, "checksum": "6fa4c50808df2aa8efebae3bbf832ba2b0be2f7113633fef720cffb3c50143a0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00848-of-01024.json.gz": {"num_bytes": 318521356, "checksum": "3aeb657aa448af82551c653802c669c985c00b7daa593de07f80733ae5dee84d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00849-of-01024.json.gz": {"num_bytes": 319541694, "checksum": "1cc016f58a4a2c54625214f028df05247ed319b8c1868c96c2efe8147a73d08a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00850-of-01024.json.gz": {"num_bytes": 318861613, "checksum": "eb5fbe6eeb4b0281604df264a5b04a3a0db96ff0d04f252375a788a0d3345c67"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00851-of-01024.json.gz": {"num_bytes": 319356648, "checksum": "ffe1397f1d412979cc66820555ef27345f3a2a48b8bcfe682d48301135e8c12a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00852-of-01024.json.gz": {"num_bytes": 319662372, "checksum": "fa78ed98d602276520e823e17adc7f796320d95e27e08d84d06e66e415b79161"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00853-of-01024.json.gz": {"num_bytes": 317625507, "checksum": "b10cff62fac5191b9cb5e2025227adb838088773e79bfec0937a34bb857e1b1f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00854-of-01024.json.gz": {"num_bytes": 319665550, "checksum": "15441b2a7c09a477389a8fbd7401c549dc8281f2bd44251b1546077301e24624"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00855-of-01024.json.gz": {"num_bytes": 319059897, "checksum": "f6127845b162181dd7157dd316021a4e6b5d41393c66d3e577491cdb74657f2e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00856-of-01024.json.gz": {"num_bytes": 319243991, "checksum": "ec9f0884c5ddf82550105f969222d3ee8b0d4907a0a2540ea6c8c67c2d2e9179"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00857-of-01024.json.gz": {"num_bytes": 318546680, "checksum": "840205fa73336ff51d75008ce8c530164ebcef3b50f1ad8deab879a67acf8d5e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00858-of-01024.json.gz": {"num_bytes": 318306547, "checksum": "e9b3819e9dc98d66a61f8f4e8f6ecb03099c79ae87a175fe1ae484174b173b44"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00859-of-01024.json.gz": {"num_bytes": 319088302, "checksum": "eced8de72f8755fa0dfb690c626cefcacf5fbbce97029d4589058913c31b9339"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00860-of-01024.json.gz": {"num_bytes": 319704792, "checksum": "90a169718609f16abe120c4b63a20adc0bbedba51de14b004d34dabe530339f0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00861-of-01024.json.gz": {"num_bytes": 318444445, "checksum": "d020840f09fa426ee15d19f05e5afd9cf674048e0dc4438dae0b6f02c7227d9f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00862-of-01024.json.gz": {"num_bytes": 318606300, "checksum": "e02bf9d3f1a398972f7d78b9b1aaff9a92146554a1358ea1b16ce7873a9f8fd8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00863-of-01024.json.gz": {"num_bytes": 319273730, "checksum": "c977f143cbb5e61160ce76f1cabf7bea6c158abb7e159ec3362aad1cc7af0ade"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00864-of-01024.json.gz": {"num_bytes": 318143165, "checksum": "bdf20dbde61f0663feb70be419c39c60acdc7ecbbe1430d47bf79ae2e114f168"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00865-of-01024.json.gz": {"num_bytes": 319041356, "checksum": "11c9c068ec5c1b612494c1473b7cace67a55ee66155559b19035df180ee260a1"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00866-of-01024.json.gz": {"num_bytes": 319758401, "checksum": "ab4436f283af0ef2d33b93cf026907cf68255beee9d9dc1d6c542dee9c3f48a3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00867-of-01024.json.gz": {"num_bytes": 318991336, "checksum": "56beb5edbca3b66981f5f8e65f2a13a0f6e99e68ff50cc263cc529a4d8ebf371"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00868-of-01024.json.gz": {"num_bytes": 319984390, "checksum": "b9368d2ae0eff869c70c1a1214126c1d084f56887102d3d46e450b2c934102be"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00869-of-01024.json.gz": {"num_bytes": 319462888, "checksum": "68ab404e0ca2247686eb264a0d7feeb9d2460162434f5babb2b1da82d865343e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00870-of-01024.json.gz": {"num_bytes": 318426018, "checksum": "2d60208a558f6ba92d6c6307e1ab626acd7ff3b7bc25963b09e87e464751c42b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00871-of-01024.json.gz": {"num_bytes": 320233396, "checksum": "ee2517922079c713605dafffe6bc0db0a947abf64ff92c409aa1015b92cdb099"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00872-of-01024.json.gz": {"num_bytes": 319570251, "checksum": "83ca4f125bd628cb28210fb874db717635009e36c60b42237bda48fcb611a53f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00873-of-01024.json.gz": {"num_bytes": 318755978, "checksum": "d94ce49fd17da5f70d1a89bc9e5323daa54f0b8417e1ee5d991467c80c068ec7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00874-of-01024.json.gz": {"num_bytes": 318986904, "checksum": "f634915d1b529d9d728fd96993bb151dc07016767cd44ceeedddec73eaf37074"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00875-of-01024.json.gz": {"num_bytes": 319116193, "checksum": "6367b1216e1c6ab18af66471d866f39caeb9a538209134a9e6bbbcb81bc51db7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00876-of-01024.json.gz": {"num_bytes": 320829257, "checksum": "c9ad4ab8c6e5995aaacd72ebc6654b43b4756804bf3cea808610f9b618f98fac"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00877-of-01024.json.gz": {"num_bytes": 320082625, "checksum": "835ae7d54732c309bc9aff231268474af66653b06ad6ca17b54dab6f4a7d30c5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00878-of-01024.json.gz": {"num_bytes": 318964554, "checksum": "49c761449d5052dd6c408268c77196bffc5125eb5189390f73ba0ce8550f0175"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00879-of-01024.json.gz": {"num_bytes": 318699617, "checksum": "521e1c5fa967a6f29641e7c4c2b210acda0736b32f318e24aef0e587895ed492"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00880-of-01024.json.gz": {"num_bytes": 318723630, "checksum": "dee1814b24f9bbc3aa3430cd80302b08b863eb1b92698158960b6be216845843"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00881-of-01024.json.gz": {"num_bytes": 319839271, "checksum": "9e57ea6a0e3d8a7798a0cb3e6344e1711e8fd879e2e396294718ff360fc7c4df"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00882-of-01024.json.gz": {"num_bytes": 317773196, "checksum": "2e5e5749618e53668222c7d310929e2177772dd7c14592e61dc86f163e353c8a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00883-of-01024.json.gz": {"num_bytes": 320262049, "checksum": "f80afaa4495a2d41ad4d7380b79040569179b24ef5c2df17f75ce8e135d786b1"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00884-of-01024.json.gz": {"num_bytes": 319146213, "checksum": "77338479b420dab9316a4737fc243de84b5e88392cbbb46fa0619045a42432cc"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00885-of-01024.json.gz": {"num_bytes": 319022605, "checksum": "3a67fee2fb77e64aa13fd595d7786b432203f36712ff723ec5999a341834b38c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00886-of-01024.json.gz": {"num_bytes": 318624429, "checksum": "2afe387f2500c57294acf1403a8c27f27f6c7c2d228dee0f1ed70a02c438f838"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00887-of-01024.json.gz": {"num_bytes": 318733911, "checksum": "3fe087b3441f74730ab137ba9486650cfedfe2d724573c3d166565d7d1e40938"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00888-of-01024.json.gz": {"num_bytes": 319926754, "checksum": "dd2df1977458cac34ef1e52059bbc28738e541761d7ad11c0ffc8ef3ca061190"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00889-of-01024.json.gz": {"num_bytes": 319085344, "checksum": "4172244cc3fc4a4e9e09f04f8097cbc678aebaedb9d1fb97b1daae16b0b8ef45"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00890-of-01024.json.gz": {"num_bytes": 319838671, "checksum": "8ffaf34eb8209e7ec250303298f9eebd2833fedcf80414c20331e8dbed42251c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00891-of-01024.json.gz": {"num_bytes": 318169092, "checksum": "daaf74ba5d12a7415da94be0f4454336aa3d86ad5cd300dbe30cef596835ac8e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00892-of-01024.json.gz": {"num_bytes": 319662776, "checksum": "6d99c0419a6c9633620fb0aa7b7610cc5d06696e839a1a52953fd7db7a18e053"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00893-of-01024.json.gz": {"num_bytes": 319541919, "checksum": "5f246aeacef0dc8d40a036bb1eeecf278f66d7215a134fb746d30f3420d18c18"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00894-of-01024.json.gz": {"num_bytes": 319528897, "checksum": "9975fd5d23d25938f00de3fc9240d77c27b4784c2f443b1914652a06d3b59fcf"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00895-of-01024.json.gz": {"num_bytes": 317548307, "checksum": "7af9e2abfaebd4afe05a0e28d3e6e3126800a8b9b7ad49de360e42f2eb2c8506"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00896-of-01024.json.gz": {"num_bytes": 320278601, "checksum": "1941689d6a0e449423faad6e41714f33d5b23cdb1bb73961a888a87678fc74b0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00897-of-01024.json.gz": {"num_bytes": 320161831, "checksum": "3d951cb1ae4a9b3c6ff70555139435febda83d24bb04ea27b229a05424b470c2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00898-of-01024.json.gz": {"num_bytes": 319341305, "checksum": "3227b97aa9ff57b62be2a26fd8131e9ea45f7731673acb43432e529ea4978a25"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00899-of-01024.json.gz": {"num_bytes": 319658969, "checksum": "c746f8bd5fffac933640ff39db0b9d7b022edb28d7a4b3237d8c69fd919b7b48"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00900-of-01024.json.gz": {"num_bytes": 317494627, "checksum": "0327f0c57a668b2b34e72f4c53d4cfaeed787d879843d0bba27b5be58d1ee5fe"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00901-of-01024.json.gz": {"num_bytes": 319683481, "checksum": "886449092779ee26fccd11e0c89c36e449346dc6b1f0a7cb15b6b53c897790a3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00902-of-01024.json.gz": {"num_bytes": 320228529, "checksum": "6960d8539df78e98858ba8cebb2e637b6c2ef20890b5f2af1cbf4621b52c364e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00903-of-01024.json.gz": {"num_bytes": 318961279, "checksum": "4ddb3c9e9276d220f1d4dfc32bb61a090e895e9e3c9f53c169db99a024e7cd95"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00904-of-01024.json.gz": {"num_bytes": 319926290, "checksum": "69a941cbbcb673efdb254c162854fcfff6fe1132182210235b91d1d21ed4d2ed"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00905-of-01024.json.gz": {"num_bytes": 317982280, "checksum": "1d9613f366b91102d018e57894df520aaf1910aa98e06cf369d9676e498610c5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00906-of-01024.json.gz": {"num_bytes": 319012210, "checksum": "4855989c814582f5cc0a5e9b8f9d1f642ae33de81625d4bbafaafb709c1cd260"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00907-of-01024.json.gz": {"num_bytes": 318515420, "checksum": "8f34dbaa454215922a29fea975357e4e705381a65e4dcaf8b0d8c200f9a277bd"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00908-of-01024.json.gz": {"num_bytes": 319286320, "checksum": "536bf0610a2c14d1d59aea0b52fdc29cec19cd7eaa4c3a5e5fec04dee103b29e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00909-of-01024.json.gz": {"num_bytes": 319938295, "checksum": "3bb3943183f579c15d0d30440f6c82d0c9c64d6ded398dfc7c67502d73868781"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00910-of-01024.json.gz": {"num_bytes": 318423425, "checksum": "adbdcf170531c725b54c1e5713676b789589b2fb77310f3e64a0cc30b83602ee"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00911-of-01024.json.gz": {"num_bytes": 319578185, "checksum": "a1342a95ce77013820c36e7d038ed47ca4d40cdf3584a66abc310132435b25fd"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00912-of-01024.json.gz": {"num_bytes": 319154715, "checksum": "4973afcb1d7b4816e3a3df1b9ce1e48a0eea4fe8ead5f83ea753e46a934e5ddc"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00913-of-01024.json.gz": {"num_bytes": 319011218, "checksum": "c9a158f69a123859569e1cdd475355afda32d7e5c48001591f0b6c20dc17d572"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00914-of-01024.json.gz": {"num_bytes": 320027387, "checksum": "61f6c0f839908e7d3105a6926c501bcacd293d1ba50c3b8639ee227c9a8270b1"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00915-of-01024.json.gz": {"num_bytes": 320280632, "checksum": "a74fb91d8f7d79b09017a7f996b6ca5d59e4ecad9fec354ac977c0076d53fc66"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00916-of-01024.json.gz": {"num_bytes": 319278877, "checksum": "cbbb8dc274fabb4435db5fef5da1d91671e1a4c7f3f652742324f9632b01c5dd"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00917-of-01024.json.gz": {"num_bytes": 319616831, "checksum": "31e62cbd6209fb7831078e4a262d1b25c0590f9425c62b2b208d4030ed5722d4"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00918-of-01024.json.gz": {"num_bytes": 318635363, "checksum": "95e5c2f51abc9ef4c0422e91b77f79ff83c8cc38e585df621fbc0dfef48a84c7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00919-of-01024.json.gz": {"num_bytes": 318885096, "checksum": "ea5960d4fbc7d5e7097edbf2c9c706e6b7c7e9d3e36633be9bd68c4038955f10"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00920-of-01024.json.gz": {"num_bytes": 319228627, "checksum": "73b721ae576dcfa83bd963e49530f73d76b788a669e3abc1c02189900c80cf02"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00921-of-01024.json.gz": {"num_bytes": 319557114, "checksum": "710c65cd504e87b5019c01f658e669d1e023473d879913a9522760d33546cf24"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00922-of-01024.json.gz": {"num_bytes": 319356053, "checksum": "f0b54b3c6b51a356debc9414df0438ee525ae5114cbb7c8176634b7493095022"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00923-of-01024.json.gz": {"num_bytes": 319766600, "checksum": "d5b80091c8113c283d91ff5826b46068b96c423c0dc74a646e2c8d1c5d815cea"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00924-of-01024.json.gz": {"num_bytes": 319733540, "checksum": "56a54c7d4114c21c1657df0d295839c2bd4904cd1b651104e2a155c2bf1b5aca"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00925-of-01024.json.gz": {"num_bytes": 318944357, "checksum": "4d396c29cd1d9ba16016fac37c333c0a872f6cb0e9faae7966e53f6e5c879d67"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00926-of-01024.json.gz": {"num_bytes": 320276135, "checksum": "39a64c261a76d5e13f187f12c886b22e2db08fba968bc9d0c1cb0d3c241abda7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00927-of-01024.json.gz": {"num_bytes": 319181837, "checksum": "86db529dd52fb67173588fcbc9f0e52c99ad6dd34e44865150bc6c962de5b3c1"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00928-of-01024.json.gz": {"num_bytes": 318966114, "checksum": "d232df8033ddaa7397dbcfa8ba4ded9421ee9bfc091c725b311fd963b29f13eb"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00929-of-01024.json.gz": {"num_bytes": 320087917, "checksum": "fca6bfe8fe17c867681c58df081f2186dcc6bf22e46ce3783f85b918644c0b6a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00930-of-01024.json.gz": {"num_bytes": 318921677, "checksum": "b8031359e758cd835c44e81303e04ef7b2137d2e1a9472d7e04552c353d883c7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00931-of-01024.json.gz": {"num_bytes": 318978028, "checksum": "bb5f2ea8a2e56c69813bdc08cb243c0763126e7b5f6c5cb57e7f4767d2126f89"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00932-of-01024.json.gz": {"num_bytes": 318627424, "checksum": "f6fd2065ce202d5347243a2b396707bb606be20c1829989bd7dff6d9fb7adec9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00933-of-01024.json.gz": {"num_bytes": 320226802, "checksum": "b303d2ece81c1f7b882703b915765212796518010aea6a108a441dd0a84a6128"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00934-of-01024.json.gz": {"num_bytes": 319908526, "checksum": "e5b05714922d132073122e83933853f52f0046c9f51f985cfbdbd310e8d677de"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00935-of-01024.json.gz": {"num_bytes": 318941663, "checksum": "4296055a31409a778c516afe25a8108f23dfffaf13cac33e5ed834a37c46b37c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00936-of-01024.json.gz": {"num_bytes": 318430860, "checksum": "4634630c012ed184b264ea01c97f7bb3f1af030f2466f1d99d20bb0472f74511"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00937-of-01024.json.gz": {"num_bytes": 318008229, "checksum": "131cc9a2fef4ebe81749f1844b7c4b194b97de7db4f5253ce59207e68d8b4df8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00938-of-01024.json.gz": {"num_bytes": 319099506, "checksum": "fff55e3b2ff8b53e56ab99def626a7334ce67d2414351b2e83d84298052dd9b6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00939-of-01024.json.gz": {"num_bytes": 320457851, "checksum": "8431e38c86516ed88d5c028f4a1dad32b02bcccdc03f9687d18f8312e493bcb7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00940-of-01024.json.gz": {"num_bytes": 320607829, "checksum": "a68c577555781adc777c09c68f623431469d67e9b66af7b0813f09a512b7d777"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00941-of-01024.json.gz": {"num_bytes": 318923471, "checksum": "807ffde4034b6b95a5eacb71f093686586ca11e417517894cca99dfe7b12563d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00942-of-01024.json.gz": {"num_bytes": 319880902, "checksum": "d03d04f619a8f3afbefa6d67986f50d5ee264c45de36c0ba67b069e343e002ad"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00943-of-01024.json.gz": {"num_bytes": 319079341, "checksum": "e482c4dee03a34a1a5756e6def26134c9a3f18ee386f5569d6cbf16d3875a429"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00944-of-01024.json.gz": {"num_bytes": 319436318, "checksum": "6241f9f35640598c05bc5cd00d8cc024dde59c0065c8935da229a8a583de32fd"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00945-of-01024.json.gz": {"num_bytes": 318998098, "checksum": "85f192c1ee9734da0f1dcad31c2b8111076977582e139ecc1ba959bf2df6b262"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00946-of-01024.json.gz": {"num_bytes": 321951470, "checksum": "44bccedf6a8db115bb6563d6775ff03c67511ce4e23a2de77e79edcb568c9fa1"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00947-of-01024.json.gz": {"num_bytes": 318689631, "checksum": "36f0bfa191ad7d51452d51249c724150f8c3774142df3720f176f2772f42f3fc"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00948-of-01024.json.gz": {"num_bytes": 320347661, "checksum": "f4a7afa90b6d81a4cdc99100b75b4d3174c4d5d670042766c3e0418b7a97ef80"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00949-of-01024.json.gz": {"num_bytes": 318054841, "checksum": "f39d0c9bfc0a562ede67b8cfc57e6974a8a999e2bbc1b6940f107169b4f06e4a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00950-of-01024.json.gz": {"num_bytes": 319722042, "checksum": "bf376260e5a838b3b901ceb22f922829619be710718446ee95c24400cbc73495"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00951-of-01024.json.gz": {"num_bytes": 318315382, "checksum": "987cd895f63bb74c9d4ce229ee853c7bce53c75c324366a0d06377c36030e39f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00952-of-01024.json.gz": {"num_bytes": 319247792, "checksum": "d218dda02748a22821c2ecccf1cbb136dc8772a25ddfacc7ab354fc089470e87"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00953-of-01024.json.gz": {"num_bytes": 318411551, "checksum": "698768f3d7959b33fa74a3827e995b0c184bb3b4c46eba667d7dc3365fdd07f3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00954-of-01024.json.gz": {"num_bytes": 318809810, "checksum": "651d9ff43d5a3f7f5945ccf26b9410018248bf64956f3485c50b0df9034fb2ee"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00955-of-01024.json.gz": {"num_bytes": 319761211, "checksum": "29fa5c68fb8d3719e5f5f17568ce888522de64499554b5f0f4dafafb4ee5b40b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00956-of-01024.json.gz": {"num_bytes": 319255736, "checksum": "333a90a9c13f71e41a7cdd4784684bc142c79ef99155b9d62d062db318798b93"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00957-of-01024.json.gz": {"num_bytes": 319504417, "checksum": "730c90615fca09c81d9644cfae40d325851bb9bbc1af696caaadd67d8282ab5b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00958-of-01024.json.gz": {"num_bytes": 319066016, "checksum": "bb565af6529720ba2a3e989769b33d978ef49cb2aae49c60f2ff98a981414280"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00959-of-01024.json.gz": {"num_bytes": 319887940, "checksum": "8992783693dd0ad5ce07427f6b5739c818f13952d90bb61312ec98f9c813f313"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00960-of-01024.json.gz": {"num_bytes": 318051437, "checksum": "4773edbc822ff8d51ec13af6c371214aea7545047d9babeeac0b29180d52fa0b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00961-of-01024.json.gz": {"num_bytes": 318373291, "checksum": "ff33854746566f7d3b4ba9eadd1329ece48c034345fda000d9af73cb26d197af"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00962-of-01024.json.gz": {"num_bytes": 318572513, "checksum": "a6d07f7caf55fda0df74a22b454d196fb2e29312d433bc5506b00448c22b579c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00963-of-01024.json.gz": {"num_bytes": 319488084, "checksum": "453f666c6578376508b1fe8bd3fb8ea5bf030aca5cfedf383cd23b27de15228f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00964-of-01024.json.gz": {"num_bytes": 318905670, "checksum": "74f64ed6583e6a4df4b3c3f8a76263a2d63905d51d5680d9683d86f5039d5b56"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00965-of-01024.json.gz": {"num_bytes": 319452844, "checksum": "88016c1a0663b89dc3d76689c827c82a6d128401ae05f7b70c8727d75302cd47"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00966-of-01024.json.gz": {"num_bytes": 319334588, "checksum": "dd9300bdc27513dd62578e1cf3c8302647b49c61185c282a684011d788c43d17"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00967-of-01024.json.gz": {"num_bytes": 317872396, "checksum": "90747ee63ac7d8176fde1f2afce8deb7e39bf19e682e17d0fcc1711d09d5f1d8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00968-of-01024.json.gz": {"num_bytes": 318988069, "checksum": "2cc785d650013d35d5d31b1e85c5530b197687c69117881362bf6b98f47c22fa"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00969-of-01024.json.gz": {"num_bytes": 318324244, "checksum": "83750d93c788ad32a256862b8173db3549eedf52ac131f09f662f1fe0f46bd13"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00970-of-01024.json.gz": {"num_bytes": 319494164, "checksum": "e0e46e185851ec569dc13a18519988ad926bdcd9bf448eff00aebf6df141f5cf"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00971-of-01024.json.gz": {"num_bytes": 318714665, "checksum": "941c9bf116353230417950d292c38b12b00935184162227eaec01870ab7f4510"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00972-of-01024.json.gz": {"num_bytes": 319518275, "checksum": "de30e19a155a6f4303afb0311416aa84cc3baf5a09cef55b8e2adc2a4f478f6e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00973-of-01024.json.gz": {"num_bytes": 318092574, "checksum": "f70bf6727f1f308d93684ca41e9c2c68dfbd737a90da6375b58f162e8470fdea"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00974-of-01024.json.gz": {"num_bytes": 318555677, "checksum": "109fe184ac9498ac571cd9c6cb38ae5ed566b0e98e8b7718984656a70cc6b224"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00975-of-01024.json.gz": {"num_bytes": 319045215, "checksum": "03c4257851857450f7397ac3d627a60ffc98708ad5aac6e1f73e6ce818fe7be8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00976-of-01024.json.gz": {"num_bytes": 319172031, "checksum": "7d98fa662aa9d0ff7ed50cc72195bdda2147212b34a3d22f0f757a4eb158d5b7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00977-of-01024.json.gz": {"num_bytes": 318650530, "checksum": "bb8ccc07ecc6fd39ae97136418efc543efe5541e85910a7f333ee5cebaa3b595"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00978-of-01024.json.gz": {"num_bytes": 318609909, "checksum": "40b49f3fbb2fce73bb1851304b290fc7fb400d13c2448ac7e5e559dccfda7ce5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00979-of-01024.json.gz": {"num_bytes": 318881197, "checksum": "b29f96cfba574428cb66f54b20c4a848bc83438256167afdaed576a3931117a0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00980-of-01024.json.gz": {"num_bytes": 318506081, "checksum": "a15996adaaf41e5615cb5c7fa2ef1b4e3003836542d0851d1c6907522f534fee"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00981-of-01024.json.gz": {"num_bytes": 320000305, "checksum": "38e282b433c4e3dcc9fc2b056f6ddbe4eb857c5137f7c51301d53ca259d6bdc2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00982-of-01024.json.gz": {"num_bytes": 319959158, "checksum": "97d5e58088a87a15b71db975d5e09b69daf497b7dff3ef809e1b8292caa27905"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00983-of-01024.json.gz": {"num_bytes": 318921242, "checksum": "f062e04f89132576ac1969fdaa43db761a0ff7e4269a6f173d87fa011a4c289b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00984-of-01024.json.gz": {"num_bytes": 319577980, "checksum": "e52a6c08d5243717f21120b4c3ebc8fcf77168928945adf68bc665392a6e8d11"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00985-of-01024.json.gz": {"num_bytes": 319812101, "checksum": "8b4f5645ae0e0b190af4ca5335c57735ae919d3c6402438af506c7907f1d1494"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00986-of-01024.json.gz": {"num_bytes": 319582409, "checksum": "3654109968d918aa4d8db17cb7057111c42894cfc7eee093df13036cfb3ac6fa"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00987-of-01024.json.gz": {"num_bytes": 319957581, "checksum": "4b9e6febb461940b993c50945a2ed06736c6786aa8f758565ff545814ebfddcd"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00988-of-01024.json.gz": {"num_bytes": 320346479, "checksum": "2891565dd75fd4354777b4f4f393983180584ee9c64b5d9b4557dbf26a3c4cfd"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00989-of-01024.json.gz": {"num_bytes": 318546717, "checksum": "929d0236c9fb77d638e0a18aa97b00004316bbb0ef3c4323e39f61aaf7c0af53"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00990-of-01024.json.gz": {"num_bytes": 319606761, "checksum": "6ebd2552ecdcce7b194d4f6d5b5e66ede9d65da4e4999ee8ec4705d847e473ac"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00991-of-01024.json.gz": {"num_bytes": 319117521, "checksum": "1b3496964d0a895b347529ddb7b712d211c9419317fb41cdd6e20bba43f39f05"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00992-of-01024.json.gz": {"num_bytes": 317781551, "checksum": "9f9cfb5f9152b9a60121b03c24d944129c1ee43e862112fe3896e2772fef99a2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00993-of-01024.json.gz": {"num_bytes": 319341839, "checksum": "fb329b7470ae127efe1be4adc960b06eec4f55bbcbe1f3f0f0b794d70a8aca14"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00994-of-01024.json.gz": {"num_bytes": 320357337, "checksum": "bbe9a60c3c2b3b5b11a5d531d1d85f0a90ebe3dbc79189b3825e169ae302932f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00995-of-01024.json.gz": {"num_bytes": 317824612, "checksum": "26643091ae3425b63036453ffca7ed82c85c24b6a24264197e6516b68a39a4c4"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00996-of-01024.json.gz": {"num_bytes": 320453890, "checksum": "db33809437e62bf1f086f40e4d66ad0133db7c7d406b2ce52ce5d9c9b0809961"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00997-of-01024.json.gz": {"num_bytes": 319469732, "checksum": "3447b74f09dc4d63dd04d6bbd4382147071504338e6ea428b37c3a5174877537"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00998-of-01024.json.gz": {"num_bytes": 319562604, "checksum": "270a1c19e6321541398836d3d982c2e396db99abf94317912714251d1f68e8ac"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00999-of-01024.json.gz": {"num_bytes": 318895764, "checksum": "d68f8f4d85d91679c20e972b2b1955d41a8f6601873bb311a2621f4b3f3152a2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.01000-of-01024.json.gz": {"num_bytes": 317697031, "checksum": "68b47464ca3e97e9d3f4075b656f804c1bab667f231701db9cce1f0b0a921088"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.01001-of-01024.json.gz": {"num_bytes": 318915840, "checksum": "582216879b058ccd4d0ca2edccaa2db49b64459371f8798a1d9c66c06a0cf908"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.01002-of-01024.json.gz": {"num_bytes": 317811256, "checksum": "6864299a7d0174f92abc696dc293524291623891b86cd69132348fdf78760a4e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.01003-of-01024.json.gz": {"num_bytes": 318605529, "checksum": "4ef35b7546266f99eae5f332cbe3e284801c5d7b39f840297d67e71c036edf62"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.01004-of-01024.json.gz": {"num_bytes": 319379897, "checksum": "040dfa80eaf8355370d8a50692bc3ad03a1d57272af340d70031a4398f37b9ee"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.01005-of-01024.json.gz": {"num_bytes": 319515177, "checksum": "012ac70ef2715181ec1fb578a2366d68e786d3a9ea41c59c08d7c494b89b429c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.01006-of-01024.json.gz": {"num_bytes": 320078217, "checksum": "46030d85d8333ae224320fa54e487f3770de7de280cd0001344136b0bd87c431"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.01007-of-01024.json.gz": {"num_bytes": 318526753, "checksum": "dd432d865ef3dba4b5af30e42b11ace96900bd7b97af053ea892292e75bd142c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.01008-of-01024.json.gz": {"num_bytes": 319407137, "checksum": "165cd3a688be6f9f5a4cedde198a9dda4f9d3dbc1d275d1e99411f3ee96a0d62"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.01009-of-01024.json.gz": {"num_bytes": 319763066, "checksum": "e44e86d497f8471e53531374b0e6ee61aac54996b6af64a4af0f5620673f9f7d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.01010-of-01024.json.gz": {"num_bytes": 318653930, "checksum": "61115f16e718d3a2b66574cc17841aa5d02739762138abe3c9a7f325cf9f2e31"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.01011-of-01024.json.gz": {"num_bytes": 320037079, "checksum": "65e18df845f1e6cce1bb92a45f71274dca94d3f0ece1d556116085b5c0e6338f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.01012-of-01024.json.gz": {"num_bytes": 319753418, "checksum": "cd5a8ee1bc7d9ad58e98aa6fe56d60501115592519a19efcf9fa370668c6327b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.01013-of-01024.json.gz": {"num_bytes": 318657671, "checksum": "986ead2c1b37f4094aa6f7a7882824ff013e6393323d5290d7f3e9215589d07b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.01014-of-01024.json.gz": {"num_bytes": 318028602, "checksum": "3c82c0611fb1fb0f635eaedd2bbe7cfc9d53d1ae967a9cbd0416def046e4b104"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.01015-of-01024.json.gz": {"num_bytes": 319164504, "checksum": "5eb5cf76022b12d8751a2fce5c4d4831066785a68edd7b3cd3dfc10017f91621"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.01016-of-01024.json.gz": {"num_bytes": 318474894, "checksum": "a99d827be814e27d948264d6ae55c6a032a664f3ff0ef6ae94bda90f7faf29bc"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.01017-of-01024.json.gz": {"num_bytes": 319516762, "checksum": "7eac25ebb9383a4592023634b852d88a128604c494972a8fd9e2b183fbb303a2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.01018-of-01024.json.gz": {"num_bytes": 319433935, "checksum": "35adb751748043a36f22b412d3ea0e01166037cd96216f516abc547e9d2609ea"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.01019-of-01024.json.gz": {"num_bytes": 320305440, "checksum": "54c4d52564221e48dc5354cb51d447658707ab8edaa3d6d8fec5ec379a29d462"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.01020-of-01024.json.gz": {"num_bytes": 317445661, "checksum": "edf1c6ab9900d75b91738fc7e9e3db8cdde3f9ef2234ff249833b5cdb04c65a2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.01021-of-01024.json.gz": {"num_bytes": 318134525, "checksum": "1c5e670ec9d815637e9bdbd75289c7ef7f3ecf384e32f403ae8a9fe2595cc983"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.01022-of-01024.json.gz": {"num_bytes": 319809162, "checksum": "9def881764ca614c88ceabb41032d3e145f06c843a7ceebd87dba6b93c974a6e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.01023-of-01024.json.gz": {"num_bytes": 318155801, "checksum": "552a6a2be423c0ecbb767611074200c5b85c1cf76c8640c79e3be5e967b293b5"}}, "download_size": 326778635540, "post_processing_size": null, "dataset_size": 1657178361414, "size_in_bytes": 1983956996954}, "en.noblocklist": {"description": "A colossal, cleaned version of Common Crawl's web crawl corpus.\n\nBased on Common Crawl dataset: \"https://commoncrawl.org\".\n\nThis is the processed version of Google's C4 dataset by AllenAI.\n\n", "citation": "\n@article{2019t5,\n author = {Colin Raffel and Noam Shazeer and Adam Roberts and Katherine Lee and Sharan Narang and Michael Matena and Yanqi Zhou and Wei Li and Peter J. Liu},\n title = {Exploring the Limits of Transfer Learning with a Unified Text-to-Text Transformer},\n journal = {arXiv e-prints},\n year = {2019},\n archivePrefix = {arXiv},\n eprint = {1910.10683},\n}\n", "homepage": "https://github.com/allenai/allennlp/discussions/5056", "license": "", "features": {"text": {"dtype": "string", "id": null, "_type": "Value"}, "timestamp": {"dtype": "string", "id": null, "_type": "Value"}, "url": {"dtype": "string", "id": null, "_type": "Value"}}, "post_processed": null, "supervised_keys": null, "task_templates": null, "builder_name": "c4", "config_name": "en.noblocklist", "version": {"version_str": "0.0.0", "description": null, "major": 0, "minor": 0, "patch": 0}, "splits": {"train": {"name": "train", "num_bytes": 1029628201361, "num_examples": 393391519, "dataset_name": "c4"}, "validation": {"name": "validation", "num_bytes": 1029628201361, "num_examples": 393391519, "dataset_name": "c4"}}, "download_checksums": {"https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00000-of-01024.json.gz": {"num_bytes": 396728190, "checksum": "06fcf4d9bf6ae45fac94245952f000c924d2a0b5cc8841c916b3ee949333410d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00001-of-01024.json.gz": {"num_bytes": 395686133, "checksum": "8a0b64c5efb1db1ebcc0a664c801221049f5812652dc1a727a0e9f8d0df0cd0e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00002-of-01024.json.gz": {"num_bytes": 397762165, "checksum": "087fabf9563297a6eab8bc39b68c0c6d15169032001d3a17c9bd964080759f2c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00003-of-01024.json.gz": {"num_bytes": 395307518, "checksum": "1e5b89200528320e354f60be0868a3ab6dbbe667a6b16b48e4739b988a6360e8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00004-of-01024.json.gz": {"num_bytes": 396280504, "checksum": "8291badbe84854960c0ddac3d6c226cb519268d1b3fd267bd72cfb4f10800de1"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00005-of-01024.json.gz": {"num_bytes": 396636600, "checksum": "c74226ceada7d78e3e7a2ad931d0a99df93f4cc4377ec69d4f1fab4164c3d845"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00006-of-01024.json.gz": {"num_bytes": 395364336, "checksum": "4e52e99dfc4e55c41226978b4dbf48fac2f886b9b0446bc3bd576f32bdd7cfea"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00007-of-01024.json.gz": {"num_bytes": 396428805, "checksum": "283ae93ecc3f8daefa9c47651ded763dc5f339ddc619c8cb5e32dce9cb9cfe4c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00008-of-01024.json.gz": {"num_bytes": 395030041, "checksum": "d3fc7fffdf9c2172d233bea3bb7dc485d753319e6196672d0186b8ba04a1d903"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00009-of-01024.json.gz": {"num_bytes": 398255693, "checksum": "61e10cef5c2cab162fb1d26f97fd9d76b30c9ee989c01ef8597d2a4e35b303da"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00010-of-01024.json.gz": {"num_bytes": 397825333, "checksum": "f72040887c2a2c17564c2c6a9a4b5ff95fce6a0eed4f0800cdeff8277af651ff"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00011-of-01024.json.gz": {"num_bytes": 397877458, "checksum": "ee34ff11164e10a86f76593205cb13986c70ea3d3a8849174a6dfb5b4ec91262"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00012-of-01024.json.gz": {"num_bytes": 398317059, "checksum": "7a3ef558efaca3e5d19e9ad02b47dd61f9639dd806130b62d66e9c3341c0edce"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00013-of-01024.json.gz": {"num_bytes": 398518794, "checksum": "f5a6c18992ab2b59a9c02469d20768bf5757624e03bcaf92957ce736a3a9edb5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00014-of-01024.json.gz": {"num_bytes": 397026214, "checksum": "c174b625c1534c69814f8e4879169b58af96f801dbb433113740af0d78535abd"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00015-of-01024.json.gz": {"num_bytes": 395621683, "checksum": "4e8e52a602d4eb4b27104780f4a36617505505fb66a82f36e90631a4e668f5b9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00016-of-01024.json.gz": {"num_bytes": 398138551, "checksum": "a3e7a95b16f09e09e45f1c3bed3524415581e21b065d8efcc66cece705dee4d2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00017-of-01024.json.gz": {"num_bytes": 398720813, "checksum": "79cdb89052e8dcecd1f1319e47f4c4ae1d350ab81777a9ba8077cebdb558e795"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00018-of-01024.json.gz": {"num_bytes": 398538940, "checksum": "8da6aac3a794ce326b5a3971fb75a2ee848f008940d4f1bedd724ce7c5874278"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00019-of-01024.json.gz": {"num_bytes": 396834319, "checksum": "b57c93502949dad9001e89847947f6c65943927eb519e16de4eaf5590b235faa"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00020-of-01024.json.gz": {"num_bytes": 396402861, "checksum": "05e14c7e21df3d4af7be7a597fa22463868464d6475282376536e12e82367401"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00021-of-01024.json.gz": {"num_bytes": 397560852, "checksum": "756d15d8b07414dffd7cff3efde606aa62cf8f73b85d8e1cd17408d6a339414b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00022-of-01024.json.gz": {"num_bytes": 397210987, "checksum": "60aa08d9c5d813d5f2448d910bc23a705cdd0828a9403c18ec223e53623889cb"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00023-of-01024.json.gz": {"num_bytes": 397563062, "checksum": "bd865213ffb2b40c2cd3eb16724b68c0f37e29f68215990dc84d91852c7c0d72"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00024-of-01024.json.gz": {"num_bytes": 395799120, "checksum": "08ff3615ecea3eb5b55703e123475c95afbecfe7107eedf05750147c9ffd12ef"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00025-of-01024.json.gz": {"num_bytes": 398336372, "checksum": "e3e30b97e585fd881b3a1b006775854a11a2b967d992e7eea886338d8beefb13"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00026-of-01024.json.gz": {"num_bytes": 396819084, "checksum": "fddc9e1a8405c5e05e63ce98b19c7833c0fd46392b4b55532b317e7f81426590"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00027-of-01024.json.gz": {"num_bytes": 397912380, "checksum": "d3e597b3a96b993840e47adb761cce2f2ae1c96aefcbd6c250198dedaecde15a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00028-of-01024.json.gz": {"num_bytes": 399078461, "checksum": "abd6d2341b6c61cdb89b80a8b9bfd938bb6d8a423a89e6a9f997c22c6479d537"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00029-of-01024.json.gz": {"num_bytes": 397303107, "checksum": "ee35a3af1056cdab79b644f6352150aeb6fb19a630cd6bc893a072e35fbfbad2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00030-of-01024.json.gz": {"num_bytes": 396602401, "checksum": "1d04d4bc295aee2ab80b24f587f8c483599db7d5a8157acc99a1d8b001f8353e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00031-of-01024.json.gz": {"num_bytes": 395941329, "checksum": "cf1dd244555511245c0e6a5b1dc9c24f747b8377674aa3690677ce08ebb8c26f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00032-of-01024.json.gz": {"num_bytes": 398049663, "checksum": "c83e5572647eba5ab14fdc4dcba8efb6981740b99b8f634e2c6b1942a051c249"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00033-of-01024.json.gz": {"num_bytes": 398044404, "checksum": "b76815aadcf4ad802071428864ce0b406cabd73dfc2be5e20b44885ec6a85419"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00034-of-01024.json.gz": {"num_bytes": 396885224, "checksum": "da00d92418fbdb9799d8f16977b3a33f67cb98a31808544cb68cf3b42ea9adf1"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00035-of-01024.json.gz": {"num_bytes": 396185021, "checksum": "265ad43ce00666c83fd441d35ff29ba1ebf7d62442cc3e3c176091b4c725ea9d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00036-of-01024.json.gz": {"num_bytes": 396702503, "checksum": "4733156df48f2dd0f2e859fef28f56d12a84e8012085ca9318073ae647b0fcdc"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00037-of-01024.json.gz": {"num_bytes": 397582277, "checksum": "7d62d03c3496ee2e17ab6b9635710efef9e4cefb88ddccdc16ed720a414c38c2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00038-of-01024.json.gz": {"num_bytes": 396186761, "checksum": "670affddf8fcca6933af3f5b30efd1bf490c3e38c3e90f2e8e9a464994d613f1"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00039-of-01024.json.gz": {"num_bytes": 397056953, "checksum": "4acbd97f9c8fd9a930a6f4284a11cfe37f6cca3b5858ae3c2cde747dae35e0d2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00040-of-01024.json.gz": {"num_bytes": 397809786, "checksum": "d350e48a36bb1ba3125f72a07ed8024d26eae6d89ecac686ac0bdf3d5d89e1a7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00041-of-01024.json.gz": {"num_bytes": 396944358, "checksum": "817a58dc40440b8b1f54d129db08ae9124e0293e5a0e45f034fbffb2140d90c0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00042-of-01024.json.gz": {"num_bytes": 394327995, "checksum": "6bd6bc1269c2dd81db466ae9c41f76b8b8cf71cc7bd6e131452fa1a1318ff459"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00043-of-01024.json.gz": {"num_bytes": 396476043, "checksum": "f3525d9c861d984ea0cdacba7fddffaef058d8f95aa99ef1f09f9f0792fde5e3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00044-of-01024.json.gz": {"num_bytes": 396893614, "checksum": "292ca2b6b9ba41567fe7cc60e5424aa1f3e431ac874d06ae8eb98794563a7d35"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00045-of-01024.json.gz": {"num_bytes": 395885483, "checksum": "ea2c8fac41ededba7da8bf2bb48463d83f148e5c0970a689876d4932ab18a3c7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00046-of-01024.json.gz": {"num_bytes": 396963386, "checksum": "97672d9bca357cd2721f51301aa37d37a271dd3ca7487244c057570b995da66d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00047-of-01024.json.gz": {"num_bytes": 395856712, "checksum": "52c517670ba4eefb262cb71373d6370f86ddeb0aea7391a47a22d52a55bff7a8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00048-of-01024.json.gz": {"num_bytes": 396091027, "checksum": "49f5b68e29c55eb50da941eab1cf446c7d8c9d0b30290318977edb39ef0b887f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00049-of-01024.json.gz": {"num_bytes": 396892998, "checksum": "82a51eb6f301c00d927ca7920338247038cf4e9e0072d74c02bac897701f5859"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00050-of-01024.json.gz": {"num_bytes": 396308050, "checksum": "d72f92ecd27b716cd90cc4abe562d25fe6d49740b4a3d1fb9beac2526a61988e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00051-of-01024.json.gz": {"num_bytes": 396137777, "checksum": "a956e4d086077f7ab309ff10b0eaf4833e4d3ed74435293e96588f4361e1536d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00052-of-01024.json.gz": {"num_bytes": 398302544, "checksum": "5a54f7faa07661ea6a5f0585ca49ad66c8f7025fd9627b3af832dc886d50f78e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00053-of-01024.json.gz": {"num_bytes": 399616791, "checksum": "7f8fa496d50a0b7c399faff4c1864e24717b3f9c86b2552536c8f91e3e0cf9d6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00054-of-01024.json.gz": {"num_bytes": 397332881, "checksum": "ab862f26b4fa38b6c16d8cfd0d63a9f0973827e45915e85aefb95d4e182b7b9c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00055-of-01024.json.gz": {"num_bytes": 397075146, "checksum": "cb67aa9229bec8b88e496829aa0a60ca1c3ff4a2293632cf7782b69aa71aebfd"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00056-of-01024.json.gz": {"num_bytes": 397827600, "checksum": "2f63e3ec40d32237d4a50c873b966d7fc2c16ef5c04a2bcfc33328b128654e7c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00057-of-01024.json.gz": {"num_bytes": 397533583, "checksum": "7c90bf39bddf8ad0c6a8bb3dff02caea8bbc2abbd76047c5d523930d2a00dbc9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00058-of-01024.json.gz": {"num_bytes": 396411363, "checksum": "ee6059f3c8a2df34858a0110a06ec4e9673555fa56c1a2b40930337ba5b1b39c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00059-of-01024.json.gz": {"num_bytes": 396735510, "checksum": "d9dbe2421edba1820294e757d88aa25455db42ce8992f8933b51cd84cfc35a36"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00060-of-01024.json.gz": {"num_bytes": 395694553, "checksum": "b05d6502fc95587fa7047fac64978d6be13761dcc6954629332812e5937c2731"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00061-of-01024.json.gz": {"num_bytes": 397740757, "checksum": "39303faa5dc33995dfec683b44fc24066ecccdf6b5001b9c0644d8e9899d45f5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00062-of-01024.json.gz": {"num_bytes": 397358263, "checksum": "fe27dd467cc2c34abe5b0bb34473ee68859f2198eeb78304e1d2e54460a67383"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00063-of-01024.json.gz": {"num_bytes": 396826654, "checksum": "1da2c414bd03e5547d8c9c7447e42b8dcff5f6ca8ba35c53076f2895e8ea63f6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00064-of-01024.json.gz": {"num_bytes": 395781869, "checksum": "af96de4d6b5bc1ab0527efa33a73d7eb788dca15829acbb7291ce72ad05e6c66"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00065-of-01024.json.gz": {"num_bytes": 398192274, "checksum": "7f46ccfc1703fee106e932bc9a1bc5dedf7de944172cfa34ec9b31413bf0bbda"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00066-of-01024.json.gz": {"num_bytes": 397133438, "checksum": "dd3b67d8578927d7474dae76bdca35f35a2aa125fc50873e4a9f6e73d7a81831"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00067-of-01024.json.gz": {"num_bytes": 397204214, "checksum": "4cdc87a7c9fea33e15d638e5c921f45149212769bfba5f59f0a5943398ca0d55"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00068-of-01024.json.gz": {"num_bytes": 396489592, "checksum": "64d175c23574998f8c5d28ce3d3f3934144b1fd4f6527ede1aa3420c28bb90d0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00069-of-01024.json.gz": {"num_bytes": 397697351, "checksum": "3329857f531c9fa22d98bd567638f0564f73062da1478ca84385246f71baabff"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00070-of-01024.json.gz": {"num_bytes": 398449973, "checksum": "bd13494aa03a95d943a01f3436f62c46ee3390b30f6ff0fec0636f3c0b09fa1b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00071-of-01024.json.gz": {"num_bytes": 395498960, "checksum": "5e69529ae82c305acbf1f58a7021b4e3fc67285a871dcbcaaff0781d0e721070"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00072-of-01024.json.gz": {"num_bytes": 396170387, "checksum": "9b9c7e11b9bb2cf6ea0fcdfd58754f522a95070feae74c29559522e12e1b41f4"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00073-of-01024.json.gz": {"num_bytes": 395915819, "checksum": "87a2069589fee8de23730b8b994ba59d63d5128175b5326ba0a8c8ac9e01a3dd"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00074-of-01024.json.gz": {"num_bytes": 396986018, "checksum": "e073efb3f00db65c1ee14e8bfa6e8c807f7827d0f3dd4d4026f823bc6f61b1cc"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00075-of-01024.json.gz": {"num_bytes": 398555103, "checksum": "a1793748c7979e241ca34291c843ca3cc90dd7643f04810b6cd324220efbd6e7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00076-of-01024.json.gz": {"num_bytes": 396357420, "checksum": "7b1cd69788ca9a7e614de70a8b908183f41f316eaadf3b0236a7c4e126db9844"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00077-of-01024.json.gz": {"num_bytes": 396666167, "checksum": "aec828d3c2a1f7fa970de328a8fd1a85a90493dbcbec4f50816ccbc2275a1fac"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00078-of-01024.json.gz": {"num_bytes": 398167446, "checksum": "e14bdf5af810574aca7c6f3daa67e503f24ab1705435a62129c66c248667ee97"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00079-of-01024.json.gz": {"num_bytes": 399696096, "checksum": "b63756f81b8b19ecdc9bf227045df10840cbf973b60bd8ffdf28f58a53cdb028"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00080-of-01024.json.gz": {"num_bytes": 398755610, "checksum": "dfc118f680b79260e7ece75f27c0459484eb8458f2422df9f1918f726b54ccb6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00081-of-01024.json.gz": {"num_bytes": 396606787, "checksum": "17d6a503947f5132728f53ea62fd093f55bf2dc6a32316a5c0413353cf13eff3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00082-of-01024.json.gz": {"num_bytes": 395714484, "checksum": "8ca41818ee6a0ffd5b00714779289c18cd97d620258c5d3d741c482b72344300"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00083-of-01024.json.gz": {"num_bytes": 396807173, "checksum": "12d87c0a948f32f788497858751c3ef22f289136e6ae58518a97a2e976f5cdc8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00084-of-01024.json.gz": {"num_bytes": 397241529, "checksum": "7c3da4ca4d2b2077f0ab7be511038255732fc88d954f2f17cb0f3ab144216206"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00085-of-01024.json.gz": {"num_bytes": 398357369, "checksum": "26df55183e78f8d69fb16e21d07edf98659b69bcb3c48f340da6a5bc44007f4d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00086-of-01024.json.gz": {"num_bytes": 396997317, "checksum": "09f0641e9075cb88800d0eaae3f7b99b047552edbc71d1fd2d8594f645d22c2a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00087-of-01024.json.gz": {"num_bytes": 397978000, "checksum": "c9437ef5f58a46b8a6d8efcae37fa658da3f2c4f1cad0f9cf47fbcd09bb82f8c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00088-of-01024.json.gz": {"num_bytes": 398468913, "checksum": "be187fc14017f666b84ed7049c169c1a28654441c2f523eee8b655b3b9d9ba8e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00089-of-01024.json.gz": {"num_bytes": 397071121, "checksum": "637c3f964ee2c750a0a175f2e5d24b786a37d37701f10616b448804d68b72f4e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00090-of-01024.json.gz": {"num_bytes": 395753807, "checksum": "8eef7ff1a8080aebe5226cc3539baac46ab64d93f8e3ffb6e8b7ab3346e151dc"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00091-of-01024.json.gz": {"num_bytes": 397039764, "checksum": "a2904ae5bf69b393a697afd62ae9b8a560c1f076e8a141e6f3feef29cb5d1352"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00092-of-01024.json.gz": {"num_bytes": 397058578, "checksum": "eb4d7e2712a9983bc1581133fa8eaa2e1d28b314861833bd8d810d615ec1ed81"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00093-of-01024.json.gz": {"num_bytes": 395855981, "checksum": "5c9a7573a5644d89d46666306d333ff1e4af3213f287cb9adb48ef87a023d479"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00094-of-01024.json.gz": {"num_bytes": 399516118, "checksum": "de7ae1508815e48ba031762c084cf6946b084871463821407090d23c197c6474"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00095-of-01024.json.gz": {"num_bytes": 398236235, "checksum": "616cef1f21ef078ffb9fc2b4148735668debdd15a8bc1be281183ba3659e9fcd"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00096-of-01024.json.gz": {"num_bytes": 399526010, "checksum": "eb754381b8a6f3c74dda5ee5852958f7b69c707a3908cbaa9410c972e002a0cb"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00097-of-01024.json.gz": {"num_bytes": 397935028, "checksum": "6d6d2ca80708b7c6ad4240a042dddc2170060e8976c2e7b4ace446d2f2395076"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00098-of-01024.json.gz": {"num_bytes": 398645934, "checksum": "568db6971230fb42df8973ecb5a2a6d77204aa8cf0bdf47b386c04370da8dfd1"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00099-of-01024.json.gz": {"num_bytes": 398110916, "checksum": "9bacb381e3b06976619e816e40ac2ccd3bcf3cb9ecd30c294b388cfb75c8bf77"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00100-of-01024.json.gz": {"num_bytes": 397631228, "checksum": "7d515ac0f767736600a216ebe7280b9751f16e70df969ba601d1aaae15f201e5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00101-of-01024.json.gz": {"num_bytes": 395102356, "checksum": "87c5c81e154e136f3e090ba91682ad54fe678653f86f6f32002ae5ec3c9aa743"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00102-of-01024.json.gz": {"num_bytes": 398926159, "checksum": "2df85a9ac13812c3870180901dbba99b52e53fc045da019160a3f06d0dfa5e95"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00103-of-01024.json.gz": {"num_bytes": 398383820, "checksum": "8134d12e84ed4a58a5f8f6eff8a4349f7d6ded6a1d7539b5c23193571569d6c7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00104-of-01024.json.gz": {"num_bytes": 396628542, "checksum": "208f0cb3365b0243d70e7b4e52ff977e9b11d8e451adea521a5bf6e10cd40ee0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00105-of-01024.json.gz": {"num_bytes": 398737797, "checksum": "855ac7b8cb621a240319ef00197d2f20338d17db71a1aec68fb66930bc17c59c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00106-of-01024.json.gz": {"num_bytes": 397281064, "checksum": "544d5d91d066f2450bfe622ce55bdfe16a300aee9c05aaffae8a645966bc695e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00107-of-01024.json.gz": {"num_bytes": 397919761, "checksum": "f4af405c0f19c9139d93b3073f3fe328be998c9dc6f74afc7e21ad068964b92c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00108-of-01024.json.gz": {"num_bytes": 398810219, "checksum": "bdfce29353c6caa33b178bdebbf7e48526c391bc6c71180e3fa378b723879563"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00109-of-01024.json.gz": {"num_bytes": 396605124, "checksum": "ed6acc172bc9af0e31170f5533001a8fcd344e6732a4b3a714b7ad43740f25f4"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00110-of-01024.json.gz": {"num_bytes": 397491755, "checksum": "428b6c91f12c4f7032fa692bbe887f1a4c02635eb88b91d876da4c71f3da5e4e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00111-of-01024.json.gz": {"num_bytes": 395754897, "checksum": "a723863559edf291fd8a6c2736cc1cefed70dd3c8625b967df049ce0d373f68a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00112-of-01024.json.gz": {"num_bytes": 398567649, "checksum": "a90ddc9ccfbca20b9c75bd2b7d63ee6abd03236a0f0dd2827eb9f7350d9c3931"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00113-of-01024.json.gz": {"num_bytes": 396706569, "checksum": "479052b6b9edcc2bbda40b982976e7e28d84fad7b2dce46b017f4e3d1f61e0d2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00114-of-01024.json.gz": {"num_bytes": 397384355, "checksum": "a95984e4c261a3057d1bc51939aefd9413853111e19030b19c5d26f778be00ba"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00115-of-01024.json.gz": {"num_bytes": 397702826, "checksum": "5eaf7fc2c9d4b2ee3e216c215da7f4fc7558e89d6993033b95a940a78061ab05"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00116-of-01024.json.gz": {"num_bytes": 397252590, "checksum": "268033cbbdf3be9790cb6010791693f1b490af06f9fef91b0b307420a4e30a08"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00117-of-01024.json.gz": {"num_bytes": 395506730, "checksum": "cb80908eee1054ddaf7e2e5d66c9a41505025c2b6dc7fe6aa287db0a9f3829ff"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00118-of-01024.json.gz": {"num_bytes": 396452136, "checksum": "d75bf895c88ff2e9c4031c1f65b067222cfbb1a937d685ab4dd33369f5f5ff7b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00119-of-01024.json.gz": {"num_bytes": 396777389, "checksum": "2c00362f4d99cef2bae2f13f17b79ec56a5ef8aca18ffd56a12fea2308e5017b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00120-of-01024.json.gz": {"num_bytes": 397730478, "checksum": "e31296949f7ce2e2a74fd2443552cb64b9f3cddcca691097a56992f51033fd11"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00121-of-01024.json.gz": {"num_bytes": 396593647, "checksum": "c2f0f81e3c835848a47532d8fd1c215a624f47740196a7bb45b5099916853014"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00122-of-01024.json.gz": {"num_bytes": 396576172, "checksum": "72edb7581a623e20f26cae4885f3b9d7f329581921253ca4d7ceedfbca17b7b9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00123-of-01024.json.gz": {"num_bytes": 397378329, "checksum": "4f045ce7bd077b7f878012aead8c51073022448de66d2e35a755d4c8c4a6f59d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00124-of-01024.json.gz": {"num_bytes": 396545003, "checksum": "dc7949657328520d31a27d8e267c2ab07cd4e8639036d4b1bb59454c309f862d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00125-of-01024.json.gz": {"num_bytes": 397630505, "checksum": "530bd95e5ef9a1d5989c595e60e0ab11583e0f42d16b2bd37c49ed09a67af207"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00126-of-01024.json.gz": {"num_bytes": 395483747, "checksum": "d9df071edec6959ba842509f72ad43be3ea3f529b60d48f3dfbf390908887a5f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00127-of-01024.json.gz": {"num_bytes": 397295159, "checksum": "02b61f5bc7d1d241484c4f04fd517960ae755a69f35192bdd5bb471baeba5614"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00128-of-01024.json.gz": {"num_bytes": 396276865, "checksum": "0c7d618df232c36ba018269ddf3b2863cd6d63bb7fabeaae33fd508715bd8ce2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00129-of-01024.json.gz": {"num_bytes": 395314703, "checksum": "03443afda032187d2dc2e696ce6eaecbf2219e6dabbdd593379e97c0e00e3112"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00130-of-01024.json.gz": {"num_bytes": 397411481, "checksum": "8969873d5efd3df0cef1742e4bc67f2df7a5b5d9e641f7a12e77c7e8e96a1bf1"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00131-of-01024.json.gz": {"num_bytes": 396925311, "checksum": "31adc39ea4eda8667662608bdad6bb32bbc82b1ee1ad53ceb4df50924a933bdf"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00132-of-01024.json.gz": {"num_bytes": 395826124, "checksum": "d2f035ba2c388fec2d847bd43449c885eadd0bcab5fb8afdf031a53e72c4ec32"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00133-of-01024.json.gz": {"num_bytes": 398892794, "checksum": "b7ed60983058a5f9f0ef72602789f50359f415ecbe60dc967e7a869866d833b6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00134-of-01024.json.gz": {"num_bytes": 398206890, "checksum": "9ba78624879aabb72bae0b4119fa2625793915382031ed897a0b4c3f2863b8aa"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00135-of-01024.json.gz": {"num_bytes": 397161888, "checksum": "9fa6fee55f5e8f887dcc64d94cc65ada6f283a580edc7926cb159b80d0084ea8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00136-of-01024.json.gz": {"num_bytes": 396185585, "checksum": "81a1fcafcedfdd9bcb32d2467d9c963cc7d8b2f32e13e52ee04db41b0d3f5483"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00137-of-01024.json.gz": {"num_bytes": 396933735, "checksum": "c7558304b614e1cff13b0f6e967fc5ef77e4953a1eea1f39ed925c33076d7723"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00138-of-01024.json.gz": {"num_bytes": 396371698, "checksum": "3e896da8bf296403f7b4061ba0b24d3c3978993de4854fabd688cfce9fbf7bba"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00139-of-01024.json.gz": {"num_bytes": 397289537, "checksum": "1a5ffa3aaf565ccf4db7444983643ad06e386938a0a2d313aecdb972c36111e4"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00140-of-01024.json.gz": {"num_bytes": 396983259, "checksum": "4047916916fd9dd7b76a8cbc595d52803344467135f744b23bd10296004a47d7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00141-of-01024.json.gz": {"num_bytes": 394947050, "checksum": "7edfc9e5870d80d470e3797e8bef5183e9d170eab410ab50957e946dde2e8199"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00142-of-01024.json.gz": {"num_bytes": 396852755, "checksum": "4affc3a24616858fab84211e3825e90a1ea7d9c8f2cfabbe9a5c9b24c21a116b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00143-of-01024.json.gz": {"num_bytes": 397579248, "checksum": "d5aa9ba68e9b30576bd640f647d4069b6c56db276cc5229573440e4a38a7f1e9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00144-of-01024.json.gz": {"num_bytes": 398800367, "checksum": "fa104e63eb7a8a6b066a5f00bf05b3ea095bad35a902bc728251f096173f1417"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00145-of-01024.json.gz": {"num_bytes": 396709510, "checksum": "b615ecd58821b1697c82094cb3435375924263827c342ab1b87e53907d4aa63b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00146-of-01024.json.gz": {"num_bytes": 396042389, "checksum": "6004c782f3235490865b6634b2c4840a989745b70ef2da674e75c62aeedf8a6f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00147-of-01024.json.gz": {"num_bytes": 399840661, "checksum": "5e8b46726f7ff2c3dfd381fb252f1b4bddf9436fd9ffd10fa300cb0fbe76998c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00148-of-01024.json.gz": {"num_bytes": 397098215, "checksum": "0851cb274aff2ec4f781c82af11c94f8938a797aca5097fb0089299cb4c75aff"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00149-of-01024.json.gz": {"num_bytes": 397540697, "checksum": "7cadf4ef9b0e29d9e8f68474464dc072b78e909a0f03c74e61b67912ff9b551d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00150-of-01024.json.gz": {"num_bytes": 396347701, "checksum": "521e4f67d12ae47b8f2a02b6f77e0c85cdf9a0efbcb45602d09ae116110ebe66"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00151-of-01024.json.gz": {"num_bytes": 394890490, "checksum": "2255bf3e1940ea28da9656028dee26865a9ee682cbaab4d5aeb34c081062f8fe"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00152-of-01024.json.gz": {"num_bytes": 399584675, "checksum": "f8ca4aaf5706ffb0f5518c7461d9045d18c645df068aa436137299e5ca77df82"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00153-of-01024.json.gz": {"num_bytes": 395606567, "checksum": "24f0e81dc3140f063ac89173fc262b01f2420133025b114f29632262cdd2e7fa"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00154-of-01024.json.gz": {"num_bytes": 397925578, "checksum": "5f40a87b15b0acebbd324e7c5cd2c0f31f911558d57f774f278634db94f2d5f7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00155-of-01024.json.gz": {"num_bytes": 395428741, "checksum": "36281c154f187a09a83822878da815cd9b7f659a41cd90ac64653b437e798c72"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00156-of-01024.json.gz": {"num_bytes": 396799274, "checksum": "0fb66965107e54c9fed0013962763e874b940b0e174d775b21fa5e688fa53b33"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00157-of-01024.json.gz": {"num_bytes": 397321211, "checksum": "014d1443a4940fe95089bf87e245817d3a90c50e3e371a703098f5b9c3f6c759"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00158-of-01024.json.gz": {"num_bytes": 398736992, "checksum": "f912d27d68318fc0089fbaf8e0481ebe8dc5d2963cb89ed315f3bec637460bfc"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00159-of-01024.json.gz": {"num_bytes": 397250687, "checksum": "1bfd02a301b09bfd53058522d0613e1fbecb788d3173eb30b58115cd1cbdb477"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00160-of-01024.json.gz": {"num_bytes": 397492158, "checksum": "149a7bd76e9ea41185d99d21df870ddd4f32857fdd628cee927d6bee7d6a527d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00161-of-01024.json.gz": {"num_bytes": 398383574, "checksum": "0c385b4c9b33574cdc75070309a0aed46aa7b2e3b8754a7692035a3c5a04f916"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00162-of-01024.json.gz": {"num_bytes": 397126197, "checksum": "5c012b2a6bbc9413914ed1420b6150a5549cd74185bf2788d8809005034d433f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00163-of-01024.json.gz": {"num_bytes": 398201223, "checksum": "79448c338e86cea2609399705268fc6011cb21c4f0aff82e3fb7660391ce85c4"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00164-of-01024.json.gz": {"num_bytes": 397914908, "checksum": "dfb89631dce146ab4713a03f184e864472eb133b2cd04db8b4bccab688e9e287"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00165-of-01024.json.gz": {"num_bytes": 398142696, "checksum": "74acc88d6612aae7bdf5187d3b9eddcdb04cf60f1cc350661ffa50219a747f9f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00166-of-01024.json.gz": {"num_bytes": 397533050, "checksum": "757d23402b3a155cfcb6b30bdc305c8014c9b64ba4e067753664670c2c5e9534"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00167-of-01024.json.gz": {"num_bytes": 396241119, "checksum": "521bd7a9dcfa0390c35e50a3d0cde3ea627ca538dfc419a97ed83b251d8a3005"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00168-of-01024.json.gz": {"num_bytes": 396041761, "checksum": "dc540ec27d5999f6a4c71f075ae1ec64ea84415c720cd2b6ef3fdac925e576da"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00169-of-01024.json.gz": {"num_bytes": 396350882, "checksum": "36d5d35075a82038dfdd5abd29a839f4e9ab79d51f0bbc635d3dcf3f5f1e2732"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00170-of-01024.json.gz": {"num_bytes": 396885157, "checksum": "db9a3f6a7e085007eee381357ea9e4d5d6f702580d38220860967ec441ba3525"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00171-of-01024.json.gz": {"num_bytes": 397266368, "checksum": "7f8098cb6532bc888d3c1f0ea5072cf8419ce1689b9ffe1c370ca20071e7e1c2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00172-of-01024.json.gz": {"num_bytes": 397140430, "checksum": "90ae7e2551b1f3bf2e5ccf4fb3fac8fa3512add5e299ba7c90319611baf8c840"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00173-of-01024.json.gz": {"num_bytes": 397069631, "checksum": "a86f5ab72e1a9b1d491988154fd6400e6ee8c74378a9e64276df438a3c4edf9f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00174-of-01024.json.gz": {"num_bytes": 396743897, "checksum": "451cfe8e14c17113a2f6673ece27e01f8d54bed1b57d1b20cb84f125879939ec"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00175-of-01024.json.gz": {"num_bytes": 395780705, "checksum": "3252e9781545bc3f9f19ac6e8fdb87d81cdc5a94838798daf6037c9f4f473db4"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00176-of-01024.json.gz": {"num_bytes": 396205053, "checksum": "49d1648d37150b90632a6459828eedd82deb2fce7f108bf4e1b050f2f9ad1668"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00177-of-01024.json.gz": {"num_bytes": 396248718, "checksum": "99346ccda762ae85038a10baba937ef8ef668a0beab483c4005dce77e331768b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00178-of-01024.json.gz": {"num_bytes": 396634813, "checksum": "8d3bb1610ce79cf359d75f32e7624b6203140ed3eb276362b040615e9ffd4b54"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00179-of-01024.json.gz": {"num_bytes": 396524113, "checksum": "971e5c9499425294cf5945436b2ee419379a75bdd72d4cd6a33b1d17c17de298"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00180-of-01024.json.gz": {"num_bytes": 397938782, "checksum": "dd6b3e60219788b82ab3fc63a9e65f38f64aa2f7b294135ec2d16b36350f1f40"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00181-of-01024.json.gz": {"num_bytes": 399155769, "checksum": "c6a806d627a9d197789bfc6257a92b0223ca51e724c3c2ad10fe2397dbe30848"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00182-of-01024.json.gz": {"num_bytes": 396136228, "checksum": "2c48e3237253eaad9afc121e6946a9e1856bbe82c5a7cb287b05cff3e6ea8e8d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00183-of-01024.json.gz": {"num_bytes": 397083292, "checksum": "52645e03ab47da01bb40226eb90042be914f1170688ae940314871e16cbb1037"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00184-of-01024.json.gz": {"num_bytes": 397402964, "checksum": "1edbdb41edeabc108f0147e18b439a75e390e0a843ed915f1cbf73a7c7f7867d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00185-of-01024.json.gz": {"num_bytes": 398411052, "checksum": "ef071e52174a19597e567696262470906275c2cd1cbbb0b1e98864999ea2d463"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00186-of-01024.json.gz": {"num_bytes": 397122443, "checksum": "0d87080bc08f7f8a1952a7df57ce2bdbf61e40c05b61937c8c19ae0ecd952b1b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00187-of-01024.json.gz": {"num_bytes": 397244868, "checksum": "4aed75ea9f885fc3dab599c19c7bb98f7d57ce2b2ec11ac8ab3258fa479fc0db"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00188-of-01024.json.gz": {"num_bytes": 395677432, "checksum": "342882e436ea826cda9fd38c0caca68bb35444a2a07596f8de0e53a3e2169f59"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00189-of-01024.json.gz": {"num_bytes": 393653750, "checksum": "22ed9e389f6c8410c9bde898d97ad798c236c2da4d0b2c76b86d013f8686da03"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00190-of-01024.json.gz": {"num_bytes": 395437920, "checksum": "b3f9ba5834d4f0280d6defd3bd50fdf961bee6be4c71ed47046cf4e115acab01"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00191-of-01024.json.gz": {"num_bytes": 396944861, "checksum": "4e7ed636a60edc44b5ba709dcd83bf4263ad8d5a06a02827d3d27191bf3731a3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00192-of-01024.json.gz": {"num_bytes": 396611165, "checksum": "4fea34466d9b470bf0bc44455183b2c61994c4e71e4bfb684dff3b5e3870d1e4"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00193-of-01024.json.gz": {"num_bytes": 398283211, "checksum": "4c4e6d31f455831330971ed1e0c33221203401b817adbda5b53de16f8299a9ba"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00194-of-01024.json.gz": {"num_bytes": 398915952, "checksum": "dfd0b1ceb2a437da8cd38c9c791af809e94f2e36ab4399b2a45a5b916f4ccaa9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00195-of-01024.json.gz": {"num_bytes": 396352694, "checksum": "0ccd90ced34b3ff28c21d015a87eca3f31eae2bf31f11f25ac073139f9d50c22"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00196-of-01024.json.gz": {"num_bytes": 398582922, "checksum": "f22e59765cec074a0c687c500f4e6348250d0e418d12dcba211e39c133aaf290"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00197-of-01024.json.gz": {"num_bytes": 398839554, "checksum": "95fa68cd75d77a1b5bb526dd5ef16a2f04a3520604f734baeb6e2d95608b5973"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00198-of-01024.json.gz": {"num_bytes": 396202192, "checksum": "f0e6343e8105178b38f75eade6774aa6e85b62a271622fcfcbe2745f1cae11ec"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00199-of-01024.json.gz": {"num_bytes": 398029364, "checksum": "4c58736410c8d3c7174ce011e2f281cb16e4949d756ff4ace86b4a9d4795c04e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00200-of-01024.json.gz": {"num_bytes": 395867629, "checksum": "1cb798ee6609e670053987d881d130d5b73db19d9f37fecff7a6da41152aba05"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00201-of-01024.json.gz": {"num_bytes": 396858169, "checksum": "7357eb22b2aa75c55885252c62d12e08cf8f7ef285c0052cf1d706c3f0f74fef"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00202-of-01024.json.gz": {"num_bytes": 397955766, "checksum": "8901d0f27c4c11916cda7cf806cd00000771b6351954c8503bc312cca5ad3a10"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00203-of-01024.json.gz": {"num_bytes": 397737882, "checksum": "ed51917fc8936701b681cfc49ef95b2dab451ca597e76b34ba90be9405a1a0b8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00204-of-01024.json.gz": {"num_bytes": 396094006, "checksum": "88692bb8da78347cb97c0e0849d1a10a97b1686cde1f75626236b89bd507e2b0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00205-of-01024.json.gz": {"num_bytes": 399027636, "checksum": "fb17fe19d1f0fcaa43fb31a3ad9b105b3d93fa287351c7f93fb599edb7f40bc3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00206-of-01024.json.gz": {"num_bytes": 399406254, "checksum": "668d2a9927080b686a4d728236e4cfc780b262f9045dfe9575cfc48cb69d6adb"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00207-of-01024.json.gz": {"num_bytes": 396291803, "checksum": "928f451dddfe42bb2ca791dbc61c36ddc618006ef709eaccbc2beb665c8427e4"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00208-of-01024.json.gz": {"num_bytes": 397807368, "checksum": "11e8627b758588056b61d31de07c50092222013a38ba802b7a9ae34b6b8b84a6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00209-of-01024.json.gz": {"num_bytes": 398085408, "checksum": "d49d31d1719698ab7a2b9ee91d887f3192c8fc1b6108152a75b39de2a0ad25a6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00210-of-01024.json.gz": {"num_bytes": 397670254, "checksum": "049b3294c3e22e6db6c115979a4a55f0650966c600ca17250e91b241cc97bbd4"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00211-of-01024.json.gz": {"num_bytes": 399643598, "checksum": "7772f26fd90f47033670e7f1d3f6fe092116486bb9a991577f9560b54ed3832c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00212-of-01024.json.gz": {"num_bytes": 397390768, "checksum": "7a24e4a70f43f6227fe6491fcc7bb6b2a19cae203521c803bedf8882c995d7e6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00213-of-01024.json.gz": {"num_bytes": 398657925, "checksum": "21d0ee8d1a01957b56ac503aa88c6f3269b4e4692762a3f929fe0e7069be8c0a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00214-of-01024.json.gz": {"num_bytes": 398282324, "checksum": "ede2d9824d8f99dd578a36ea82caae942ebcafd99f308cf5d0ff8aa4a56f0a05"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00215-of-01024.json.gz": {"num_bytes": 399178235, "checksum": "82516fa361dec02c7ed59ea2d0510d9ee4187609b449dca649a04141b12bc037"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00216-of-01024.json.gz": {"num_bytes": 397630870, "checksum": "4a6d5e60354b7b93f005010c6fc55c0a81596e98a116cdeec99e1ab4e58fd03e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00217-of-01024.json.gz": {"num_bytes": 398628848, "checksum": "02dffb623b628a3a3ea38084fe6bb840aafab8419feed3d1f2bd3598cfa80aab"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00218-of-01024.json.gz": {"num_bytes": 395087998, "checksum": "e1e9a7ac7a922d6a9bb90f82cb48dff11ab7208dac08511e9613cd2726ca67ec"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00219-of-01024.json.gz": {"num_bytes": 397622792, "checksum": "955afc7d45a080ae137e9dc25ba3d85629a6a14c3d9bbe4065aa37d710345b7a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00220-of-01024.json.gz": {"num_bytes": 395112655, "checksum": "a3560918bec20087e9908009a362957ecb06401924789e20b36c26e363db5ae7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00221-of-01024.json.gz": {"num_bytes": 397132000, "checksum": "d8459bb5b6fb6b341b24fe517cfc5dc099765ad70c3383bae913229e06cf99e0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00222-of-01024.json.gz": {"num_bytes": 397138513, "checksum": "20d3c6219921dc9c2928d637000e488635fd9a12b5636de5a6a7e52c1b67d781"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00223-of-01024.json.gz": {"num_bytes": 397167661, "checksum": "43a18accd194646893324537991e0162f6f98a9cec5ff59fe8fb510d81d707bc"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00224-of-01024.json.gz": {"num_bytes": 397905941, "checksum": "a516485cbefdef2e31a493cd8827a5f936f10674ff3525b71d414e17f48241c3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00225-of-01024.json.gz": {"num_bytes": 397218123, "checksum": "791c85c78c5e7f3557855a1fc71acd860521710515b89f92e54e02960549f46e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00226-of-01024.json.gz": {"num_bytes": 396619135, "checksum": "52a36037696e6245efad80e00d1f123c36dbd79e7ff52b1fb99f579e712d2b30"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00227-of-01024.json.gz": {"num_bytes": 396654998, "checksum": "e31123ab579fe95bd50afa10d52a51e9c15a4af28c06583fb5aeac4e3418f129"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00228-of-01024.json.gz": {"num_bytes": 396899165, "checksum": "86481361fff334dee3183fac8ab3f346e44ab3e6e7b35bbd7e6e062b2d2fa0d7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00229-of-01024.json.gz": {"num_bytes": 397489378, "checksum": "bbb717711fb4c78ebe8a0476296a21a50285ec41d9fb9f08d5d66d899577e04a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00230-of-01024.json.gz": {"num_bytes": 397462301, "checksum": "054414aac29b5c8faee71a918f2586ad3fce8ee44c71e7a2e2af4b91e0169523"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00231-of-01024.json.gz": {"num_bytes": 396097584, "checksum": "8136e320fccba75a493954fefbb560f92532be44a6e0990404edae659d48ce1e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00232-of-01024.json.gz": {"num_bytes": 398984795, "checksum": "3d9362aab157beef3b5fcd4a0a0236d59de635a565b1c86423f45b26e8b437b5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00233-of-01024.json.gz": {"num_bytes": 397258012, "checksum": "e1a532922477d17f7cbea7db72c2391d26b4db580e526ebd5a90be23607a8d31"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00234-of-01024.json.gz": {"num_bytes": 398350453, "checksum": "c464829565bcaafdba165b2d886be4580f3c0a516b5417853ffc4fe30049cffe"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00235-of-01024.json.gz": {"num_bytes": 397147353, "checksum": "573a6a1d33ccc6c5b605d381f04d73989504bb6d24514b938e92c3d4f61501e8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00236-of-01024.json.gz": {"num_bytes": 396963006, "checksum": "21318462014bc185d0da7cbd342fddd07521401ca2b73e47eb5cb4bd42a82bbe"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00237-of-01024.json.gz": {"num_bytes": 397087111, "checksum": "49459c97b078726bf8377748d4bb2066bdfa47e2717315a9b3c8075cfc4b9b10"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00238-of-01024.json.gz": {"num_bytes": 396984031, "checksum": "befb46e9f928876edc580c60ea4242f63cf6df77c6c107fec6e4280d279e348d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00239-of-01024.json.gz": {"num_bytes": 395915197, "checksum": "dc5ab17e04e4f2678771094af67909dcaa8be36a6cb047cfa66e75f986c91312"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00240-of-01024.json.gz": {"num_bytes": 398321096, "checksum": "25b92f7a499e9aaf0496a57f6292a7f65941b34dd6c78f14b08358d180070029"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00241-of-01024.json.gz": {"num_bytes": 396626980, "checksum": "1ae21ee5585ec718763a3c7bd70d9338aaf77d0e02f92a41f6ed213d1eefa5b4"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00242-of-01024.json.gz": {"num_bytes": 398220596, "checksum": "c29f98174a0c02a817d5cfa3ebb2a92d5f49df8a34fa40abd360f1b39b4bde05"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00243-of-01024.json.gz": {"num_bytes": 398250083, "checksum": "819387c95ea7183b1f9e1e78d077de65023c4809198ef3a0c946f46f8b6c19b4"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00244-of-01024.json.gz": {"num_bytes": 396943969, "checksum": "7a0b0b984d7afc4181827705212f917cf4ac12412f640a2c8120513763cdb390"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00245-of-01024.json.gz": {"num_bytes": 398365865, "checksum": "a424157137a5eeca89819d600deea2a1619ea8f5ae1ed395c88ac600a85e3afa"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00246-of-01024.json.gz": {"num_bytes": 397285385, "checksum": "73029f721bdaccd9d126e871973e70a551f48f077f5903656b305ea9885c4798"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00247-of-01024.json.gz": {"num_bytes": 397132841, "checksum": "b223cf1270d2c728592ec65b09599bbdef8d64f7df2eb525e114f86268500daa"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00248-of-01024.json.gz": {"num_bytes": 396316645, "checksum": "94102d9bcc086ed5b203bc0c6b830dd245c9bf6c695b23b19922b2a98eeb6a52"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00249-of-01024.json.gz": {"num_bytes": 396644237, "checksum": "36be793f4d76070ba1c696b3274e6dbab43f415c8fbaf752145cc99af6558680"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00250-of-01024.json.gz": {"num_bytes": 395860541, "checksum": "313febcf026d2cd1495fdd3d5ba3b492ce5d5749153e189672b6d9dff3e26a61"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00251-of-01024.json.gz": {"num_bytes": 396709140, "checksum": "7e2480b3d5869ba35007c40e18585f3fa208cdf8e004078cc8de4fac36773507"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00252-of-01024.json.gz": {"num_bytes": 396508847, "checksum": "25df46ae56c0d4a6f945922e31fc697d12e0b7c525be9bc2b8eced802641488d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00253-of-01024.json.gz": {"num_bytes": 396364816, "checksum": "6b2125b9eab9bf893e7f8913a6beedbeeef5de53893fbd6172f706e33bab5177"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00254-of-01024.json.gz": {"num_bytes": 396122930, "checksum": "7947e5152c5305863e2d664622e3de49f9386b4384eb09630c5bfcad21fb458e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00255-of-01024.json.gz": {"num_bytes": 396929803, "checksum": "a1ec8c609ac969c24e2524f0f3dc31ef43ca0147ffe66569d3135e4f28394325"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00256-of-01024.json.gz": {"num_bytes": 398432943, "checksum": "3fd0373f5a8974a3499c436d96ea73be95f5619b8388dc316f51aff01e9ecad7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00257-of-01024.json.gz": {"num_bytes": 396003748, "checksum": "516cf3626076f083962983b2d6c596ef355609492f2e81c6c3cdec01acf8c5d7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00258-of-01024.json.gz": {"num_bytes": 393890690, "checksum": "700760a7764f890c8aae337e7ee458c8467eb9048347edd237e341dd2bd5d236"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00259-of-01024.json.gz": {"num_bytes": 398130606, "checksum": "d868f8ef5e1cc971ffd00908bdc7eace32ec151d7405d7cac5fac22df9ea10c0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00260-of-01024.json.gz": {"num_bytes": 399765969, "checksum": "7d5eb3b88eb8a0291ae70c1997458cf5aecac645397e50a67fab3d1193064353"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00261-of-01024.json.gz": {"num_bytes": 397418895, "checksum": "ca607c9e13d7cfb73a29ee3131f77e6bef3130d8627037cef9f57ed459185f0a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00262-of-01024.json.gz": {"num_bytes": 397925991, "checksum": "ca789394ab4398c41490ec6147a41ffc8847155ea9ff74d7ff8b3402ed0634e8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00263-of-01024.json.gz": {"num_bytes": 397082336, "checksum": "aac81d1bf0ade80758c14d01842b9b06c89ebf2fcdb9a06b1472bf2f70bbc348"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00264-of-01024.json.gz": {"num_bytes": 398101079, "checksum": "3cf56a2989b5c3f26ba94124cc534f5c9ae9770bdc6a3431dd745603b480ab19"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00265-of-01024.json.gz": {"num_bytes": 396949669, "checksum": "d4f252a6c2f43833d6d89bf69337449b4cae5dc88fd08fb20b35fe7194a50ddb"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00266-of-01024.json.gz": {"num_bytes": 396242007, "checksum": "71c745968d8ee4a0d64f38930a76e65d68ea094ba3e0b963d5d6878f65f51b34"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00267-of-01024.json.gz": {"num_bytes": 398342031, "checksum": "706a560c862979594265925c3200d4bd0981a9eaa279841f2cba673634f7074b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00268-of-01024.json.gz": {"num_bytes": 396399468, "checksum": "eb3dea553c37f220b3b9b5f377d5a4ef94243b3c0b6b46981e3e5b7ba5b4a935"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00269-of-01024.json.gz": {"num_bytes": 397181296, "checksum": "4f0feae035dacaeb720ca3b6ea17685144895a0d78cfa358e30983f8d6c4ec76"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00270-of-01024.json.gz": {"num_bytes": 395712883, "checksum": "6e0f6de1e5a5c6d4bf23d0539ee72ecc2b4285da2b0f1ec2cdcc443d2e22aa88"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00271-of-01024.json.gz": {"num_bytes": 398066980, "checksum": "4c5cd1ef1917ed762d7d8c5c54e1da05db74e45721697df8b0626e0aeac96966"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00272-of-01024.json.gz": {"num_bytes": 396667308, "checksum": "77a33c37a5d88e419e2b31cf560d53f129a38e5bc2306b5baccc187b7e94e589"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00273-of-01024.json.gz": {"num_bytes": 396020214, "checksum": "b18e40c00b8e0e02dfac40ea0519964e231c8a2f28bc1294b044fb090f41a9fb"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00274-of-01024.json.gz": {"num_bytes": 396300833, "checksum": "34c8945a6ebac564fe87881d6968d05363a89985f297692a3df7104128b9c26c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00275-of-01024.json.gz": {"num_bytes": 395206463, "checksum": "1e41d7e2a6117224dc23fbaae8e9d20df9d7744adb4687d2b0e570bf8d9e47f2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00276-of-01024.json.gz": {"num_bytes": 396667995, "checksum": "45973b91c2f1140f79265a24f484fc6d6653f43f83d5bd2d18954892dfa4dfae"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00277-of-01024.json.gz": {"num_bytes": 398134029, "checksum": "b7da91889b6695cf01bceddfc139b23f9465bda5cad54088b84a1f5a4d7a4f9a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00278-of-01024.json.gz": {"num_bytes": 397422615, "checksum": "e794a2903bda1f3c082e8f590383c714a518c202ecb99eda5513d6b320f70e86"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00279-of-01024.json.gz": {"num_bytes": 398776175, "checksum": "a5528d3e33151138ef9bdc2433744f1797de2b20673a570de5bd4d81b306354a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00280-of-01024.json.gz": {"num_bytes": 396208086, "checksum": "1be2d8c3d0eca510fac7b06a5401b2b8873bc6dfbf85a3c736301756f9681309"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00281-of-01024.json.gz": {"num_bytes": 396893734, "checksum": "1db3e9017561d38a91c417ffef875b7a948c4f64c51b90b0983c71bc9d950903"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00282-of-01024.json.gz": {"num_bytes": 397411883, "checksum": "4e23d39fcec2c310cbde3fdc5d9c185046086877ac03bbf9d772b092614f93da"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00283-of-01024.json.gz": {"num_bytes": 397906911, "checksum": "850eb5e60b84bca4d2f10b2e511fdb2661e3d08444a07db1782ad85c754fe808"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00284-of-01024.json.gz": {"num_bytes": 396043261, "checksum": "fea24050c6aec13eb706a6f3854b4debde62b1b842f2992fc027820c66218b0f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00285-of-01024.json.gz": {"num_bytes": 396961329, "checksum": "6052f82887cd2362320f72f6545d2e5b5a775e9bef95783c9b9995ecb7a5ecc4"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00286-of-01024.json.gz": {"num_bytes": 395697481, "checksum": "f4361838b5b679c8306447364166c1c3083af392b4c8793399c122af09c7312a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00287-of-01024.json.gz": {"num_bytes": 398773520, "checksum": "9add91f23f31ff8c5d8d84e6a0af75fc6fa08ceef8ccd9b633d8c49aa1d0104d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00288-of-01024.json.gz": {"num_bytes": 397684645, "checksum": "64dc94555a122353c3a3c9999e67d17b0e4b682096ba80be2258c791ce1c2b9d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00289-of-01024.json.gz": {"num_bytes": 396655864, "checksum": "2472c76b1cbcfc3cb82126795673126e8f532119a03722a304396ceee9b7db3a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00290-of-01024.json.gz": {"num_bytes": 397415313, "checksum": "960b71edbdc6a6a62a0d3cc1069bbbfb11893cc017aba543e10c9a23cb759d1b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00291-of-01024.json.gz": {"num_bytes": 395617977, "checksum": "96e582d7a750bee597331f373ec2e16d3a9686f48a49d39765d39550c8cbbad8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00292-of-01024.json.gz": {"num_bytes": 399332500, "checksum": "cd6ec4941aa5babbe274684945bf899447ec2459b8f7076ec8c74d2b3fe794c5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00293-of-01024.json.gz": {"num_bytes": 397021546, "checksum": "d0d0c4d80e75c5d02103b49027d9e2e6f7db74c12f8b53f600d7fe420b2d0a7a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00294-of-01024.json.gz": {"num_bytes": 396272726, "checksum": "caf5708a6989f867ec6c4c56f338aca9f3a43a1806a27ef473d9b0f219001cb4"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00295-of-01024.json.gz": {"num_bytes": 395233811, "checksum": "a7b5f904e34c0b370238e6beb19149d4bb96d0cce43a1eca3bfaf181952ede53"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00296-of-01024.json.gz": {"num_bytes": 396480926, "checksum": "4fcf284d98c2f7b63e47573e9d084eeec2516fbfa62be42c3ff94e1cf518e313"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00297-of-01024.json.gz": {"num_bytes": 398883718, "checksum": "c1cb458076497e7dee645f50281d1af2fe5dad556d28a2cbbd73abe6537c8a9d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00298-of-01024.json.gz": {"num_bytes": 398733629, "checksum": "4a612c715025292e62860fb0018e9fa2d3fade692342746d044be6297e25a034"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00299-of-01024.json.gz": {"num_bytes": 398155026, "checksum": "d33f4043fad9551f92084a45b7f54d920ded9d6fec271cbbf85f71b021f9ee4f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00300-of-01024.json.gz": {"num_bytes": 398612975, "checksum": "61b1181b796a2f40db3cb6954f2890397c3722c486dccd4075d74679cf61a70c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00301-of-01024.json.gz": {"num_bytes": 395385748, "checksum": "95a78e9d3cece0620430c85822fedf4021ebd88ece57d6714933c268d3b6af6c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00302-of-01024.json.gz": {"num_bytes": 397620059, "checksum": "321aed402a5e779febe9766294ad040a3f8dcf57bae68648c03d3c59023aafa3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00303-of-01024.json.gz": {"num_bytes": 396549027, "checksum": "4198f6a2b5bdaf90ac4251f013908123a5964429870ccd6b245a9069278c4e17"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00304-of-01024.json.gz": {"num_bytes": 396596460, "checksum": "74a6440e93d18d0d6d0622ab7d8832d7ccc91c03297faf20c8090d16f7c042d6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00305-of-01024.json.gz": {"num_bytes": 394881271, "checksum": "654deec494bba4eece19c27140426049574cf529c93ccb422fcc09fe4496af15"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00306-of-01024.json.gz": {"num_bytes": 397760377, "checksum": "e0840cbc94db6cfc35df66d413a11261756392dd59b0fdf89d9ff166ec76f3e5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00307-of-01024.json.gz": {"num_bytes": 396671816, "checksum": "31ceb8cfcd09fda621a9a483b09dfb43f5436e867363f6736ea3f710a6af10fa"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00308-of-01024.json.gz": {"num_bytes": 395961013, "checksum": "8c1e5acc3f964eaa5aff300731a74dde84ed0671cd764b121ea638fb08c3dd0b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00309-of-01024.json.gz": {"num_bytes": 396035179, "checksum": "7d555942b1bcb2518aa5ff9c0549d98fabe7bb563cdc6c73d3f11e6a0bc502b4"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00310-of-01024.json.gz": {"num_bytes": 397140669, "checksum": "859eeb7a9d2ed03d5299bbf7f1c3e719236477950d7601112a458ea5a2adf7c9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00311-of-01024.json.gz": {"num_bytes": 398170419, "checksum": "1e7661637b0a4445119ba403e4f8ede129c829fb7d1907ca7660870b536b8b29"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00312-of-01024.json.gz": {"num_bytes": 395605627, "checksum": "87a3ccd2ac9deff1ac4a5dd02bba269a48692d4598c5899630e8d2e4136dbb99"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00313-of-01024.json.gz": {"num_bytes": 397081206, "checksum": "c6952116cf573a6e20c849cf1b7d8d0edf3b9d00fc7e717e7bacde915c4c52a8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00314-of-01024.json.gz": {"num_bytes": 395555727, "checksum": "762066fd85c596ee01b3b8070708517cc5759bb1e3c4bb65f4645fd62b550d13"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00315-of-01024.json.gz": {"num_bytes": 397871218, "checksum": "814f19cc5e81144f5bfd7037f5f522dd5c44faf150c10337c675174a5965a5b9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00316-of-01024.json.gz": {"num_bytes": 398577523, "checksum": "27643c7c3c0a1a78c9003b936ea27785709a2df80d09817278a179eecaedc352"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00317-of-01024.json.gz": {"num_bytes": 396388623, "checksum": "5f840180e2017c41c6b1c865784788dc3b002478a9ecb43c3859174af788ba5b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00318-of-01024.json.gz": {"num_bytes": 396173471, "checksum": "2aeab99fbc84a2640a05081e2c7438451e75f76cbece3cbe5d82e85463a61966"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00319-of-01024.json.gz": {"num_bytes": 397912127, "checksum": "fda805ed19f4b996b048386f4bd73924dc965a069e85b8b4452a54a1372375fb"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00320-of-01024.json.gz": {"num_bytes": 398765416, "checksum": "bce244d024c076911c1c6dbd35609be5442c8b0440690e2cbb342ac64bdc494b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00321-of-01024.json.gz": {"num_bytes": 396005962, "checksum": "763584ee096223b8aeffb1576ec6e4f3bea674ec4de40fa163c2f2221b3701d9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00322-of-01024.json.gz": {"num_bytes": 398615672, "checksum": "5c12ec1d0c450fb7515c586f24311bad145050dfc64180d65bacbd346c2ce9c4"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00323-of-01024.json.gz": {"num_bytes": 397861187, "checksum": "93326f43273fb963593e0b1caab1e9588387291c23d5c14b5ae40b46b199998c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00324-of-01024.json.gz": {"num_bytes": 396679008, "checksum": "6ebfe6e28851e6d79cfdbf370602373fc2136e88936eece302ecaa8ef8251827"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00325-of-01024.json.gz": {"num_bytes": 396358086, "checksum": "51190fbfd48479842ec3c7d910b5519e01ff797ca0143c39be142c1650c5e893"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00326-of-01024.json.gz": {"num_bytes": 396490692, "checksum": "f4d9bbfd1bbc6e939fce9a2df26e45c79be73dbe2650fe79af395bdaa39cd121"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00327-of-01024.json.gz": {"num_bytes": 398354656, "checksum": "c70c824b6c16e5fad922ec9b8d363d97bed90501522b641b0eb0f66b8c086325"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00328-of-01024.json.gz": {"num_bytes": 397326336, "checksum": "7e6008433a0e5bc6eed28a13b9dba17246e7d65ca96c31092086c3546a3a397b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00329-of-01024.json.gz": {"num_bytes": 396390524, "checksum": "f379d844a35172424554bb82a65c790c354b76c0e7abfd868225d1968017d1a5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00330-of-01024.json.gz": {"num_bytes": 398259199, "checksum": "ea15be4a83c3de66c42410e13e5ef9c93baf86099a8eded1c1d10b0cd5ad0f29"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00331-of-01024.json.gz": {"num_bytes": 397618860, "checksum": "7b6aad6224ead9ee3a0c860cfd991301ef5e97093b23c76d713e73f4911d0e44"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00332-of-01024.json.gz": {"num_bytes": 396743573, "checksum": "bc5333d383020d2296aa0f6ec940ab586a367efe50d1c597f9db55ca72fa66e0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00333-of-01024.json.gz": {"num_bytes": 397460128, "checksum": "095b3a85a9598009638622ca21cb00142efa0d68196c8c3a8bb922cccb465e8c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00334-of-01024.json.gz": {"num_bytes": 396900262, "checksum": "6f005575f4843b84f4512e1b7c1b748edf497e4e9f55eaae47f9b4637161ccab"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00335-of-01024.json.gz": {"num_bytes": 396106895, "checksum": "66bfe399d0859f71c20db01de53ca7bf997b33afcd3d181f181d9f265a2c2fa2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00336-of-01024.json.gz": {"num_bytes": 397732616, "checksum": "1f1e0435de870b98b119e91edd4a0d32d078dbb810f919a70b85360cd860f0cc"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00337-of-01024.json.gz": {"num_bytes": 397834763, "checksum": "1db4bcdaa6fca612c3f1b38dad6d5402679ca21aa6a545850d61bcda10103697"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00338-of-01024.json.gz": {"num_bytes": 396712179, "checksum": "810c104a8862699c490fc8625a7be4115872fe2de4d8c061e095dc5a81eb4d19"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00339-of-01024.json.gz": {"num_bytes": 396838831, "checksum": "9bbc616d5c4aba46475957a22544dbdb0557f8de31cdf919718fbfe55bc70ac8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00340-of-01024.json.gz": {"num_bytes": 395587861, "checksum": "48c8411ee2b5fc8cffe1589ed204d0ac8a12b5b3bb1857373f84bae984d49e8b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00341-of-01024.json.gz": {"num_bytes": 398093153, "checksum": "4ff8ba83e489580da2401aaa23ca3329befe8fc08b6f299b612950c358688604"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00342-of-01024.json.gz": {"num_bytes": 397248009, "checksum": "c72e063f95d10ce661b4bc97538eccf6da6ad493b7e54da555a46e4a47aabbed"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00343-of-01024.json.gz": {"num_bytes": 395939409, "checksum": "249eb2080c55402aab34a31a442b06bcaa25d2df3f4319ea1a5f50dc6bb709b0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00344-of-01024.json.gz": {"num_bytes": 397608807, "checksum": "8cc57604fcc5fa920b0d16df6e8d8b7f4ca88c0c76c86f9ac81f42a615b330e7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00345-of-01024.json.gz": {"num_bytes": 395751274, "checksum": "13fbc76e49a8b856f7563b945bef10d786a86caff63b4cebea50416ca34932ad"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00346-of-01024.json.gz": {"num_bytes": 395516794, "checksum": "61d43da2e3e7770016ba7235eaa74a1e6a180e64cd2cfacefed5c34e8b72eca7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00347-of-01024.json.gz": {"num_bytes": 396180000, "checksum": "4a0ca2103de168d05d0090c8800d47f216cc167a9cfe9e736403aedf040c5e46"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00348-of-01024.json.gz": {"num_bytes": 398461180, "checksum": "a56396961496499ac289a85d126b916132e787d0dc4fbd9961aca7dbbc7cfcff"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00349-of-01024.json.gz": {"num_bytes": 398049366, "checksum": "ca012572c575f6a8e6ad6453296ff93f22118995c17928e76b655da44ce5810b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00350-of-01024.json.gz": {"num_bytes": 396532962, "checksum": "bb35d17862201063b46d8745dc182756d1bb09e809c4c355452ab1967e655491"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00351-of-01024.json.gz": {"num_bytes": 396576223, "checksum": "19ea45ab2fe5487d2a69cca7c9a1db7a09c8d5dfdf130412bbcd241cc60a61c5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00352-of-01024.json.gz": {"num_bytes": 395956381, "checksum": "bb5869b8649fffadd5f1945ca9a79588e84081a8fc45b7e4cb5507149b5be2d9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00353-of-01024.json.gz": {"num_bytes": 398903623, "checksum": "cb16a7ecadd28a8b5622c4e581f463f0ae2fe20a3e6582fa6885d76e7523715a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00354-of-01024.json.gz": {"num_bytes": 397316693, "checksum": "42aea18548695c458ddc229d8c837356845609aca3bb64ce6e07b185443b9468"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00355-of-01024.json.gz": {"num_bytes": 396240550, "checksum": "1577d76807548d83427293b9f534a3261fb72a345569f0491a1fd2691047bd92"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00356-of-01024.json.gz": {"num_bytes": 396132315, "checksum": "b6e17a39292e082e517082b23b381305ebe889c2530fb5eb74a2683d36d07a86"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00357-of-01024.json.gz": {"num_bytes": 395948117, "checksum": "524ebed10c881f52f155db5d6690806f5a97aa8f811deadae916323b50427ed5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00358-of-01024.json.gz": {"num_bytes": 397397242, "checksum": "8e23d852bc3a0dda4684d5fd511003ad6f18232e5f54e32638c8db62e9d18c6b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00359-of-01024.json.gz": {"num_bytes": 396141321, "checksum": "345c34dafbc59f5e93355c8b2e6fcde6bf59bc9e1ebbf5cb962d54228e6d3204"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00360-of-01024.json.gz": {"num_bytes": 397258644, "checksum": "51db06055d95e2b43fddebf8c2b7d76b7572745f129d89fe005f8e5d3f12b758"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00361-of-01024.json.gz": {"num_bytes": 397913411, "checksum": "2c0f6054fef084d3e7cd10e2de0b1d3a48dc716af1e9146548195df128bdaba9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00362-of-01024.json.gz": {"num_bytes": 397722576, "checksum": "664b390b20498eb6e78fc09604b3a947fc1847a01e3eaae4c7861d1dde3b90fb"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00363-of-01024.json.gz": {"num_bytes": 395416894, "checksum": "c57529884c6d4977a279a097c0dfbcc31d52048cdcf64950182c743583d7989a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00364-of-01024.json.gz": {"num_bytes": 397028679, "checksum": "ed4f252d63c679f6e3f35847e0871c3360e072b0d6963f662d7e808b6615457f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00365-of-01024.json.gz": {"num_bytes": 397574891, "checksum": "68e8e44a531d98897245fee90ad349f4fdee891b2f68dfda78a1dedcc9474326"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00366-of-01024.json.gz": {"num_bytes": 396905692, "checksum": "9e88b888d85633671e009ed7093763b934a42054ed6a1252222dc64781a20e22"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00367-of-01024.json.gz": {"num_bytes": 396802011, "checksum": "2abaf3f3946788258b8543fa2ccccc0c20e6980b9d26a38decd356e67f575fa1"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00368-of-01024.json.gz": {"num_bytes": 395630737, "checksum": "b4960e3395d8a1bf8350f57e5f6280b00443a4c6b85e6fd47478fbbfc1733caf"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00369-of-01024.json.gz": {"num_bytes": 396228047, "checksum": "08e8210426e6c6ef9746675592a3eea4a92eff9aa4bb7ffc6bf6ba54bc411f72"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00370-of-01024.json.gz": {"num_bytes": 396548482, "checksum": "10e0305ac4d1e410d749637e0c03386d969563f8eb73bbbc376fc1d21025e4ee"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00371-of-01024.json.gz": {"num_bytes": 397344482, "checksum": "03df0f4aa5c377f6b45db3c3b863240bfb1211ddb226bc055433fbcd9ee8e873"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00372-of-01024.json.gz": {"num_bytes": 395872223, "checksum": "9b70549213cb01595179928cdb020daaf7bcd2085c5e947d111f3cc66e406d2c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00373-of-01024.json.gz": {"num_bytes": 397399096, "checksum": "945c204cdb107669a8d1252a91323eb300c902bdd6c6a8167a90805ec02cba9b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00374-of-01024.json.gz": {"num_bytes": 397755002, "checksum": "8353d4383f73caceb5d112f260b37d1349dc7898af2d05b98ffe17d22aea97ca"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00375-of-01024.json.gz": {"num_bytes": 396534763, "checksum": "a3de41388a6d8ce3b605c6586e47b74a565dd2f54175551987bda0a0ff95036f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00376-of-01024.json.gz": {"num_bytes": 395594630, "checksum": "7cadf813f2b31a1bfe44fdfc84aef4eb65e889c2616c56b189890734c22b731f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00377-of-01024.json.gz": {"num_bytes": 398241040, "checksum": "15df154b52cb4d9314dbc4ac26ca4b4df7125b12131d538fd480f8a6b3fbdfc8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00378-of-01024.json.gz": {"num_bytes": 397217224, "checksum": "208ce680427f62d78dad857bee91122a79f968589b4e44f2f89919e91f4dea30"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00379-of-01024.json.gz": {"num_bytes": 398504097, "checksum": "0052fe7f27e720423b6143f401b8618428d913b22fc2af2950874785e2ef7528"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00380-of-01024.json.gz": {"num_bytes": 397494149, "checksum": "15c4f07a2629c7bd79b243c97367e3e18de02b5ab09eccc0f85b1eba0e0b071a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00381-of-01024.json.gz": {"num_bytes": 397190859, "checksum": "77c71b4a79ac2f462040ea0e8408fdb8f719fac0f09fadb760ed00b709e9dea5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00382-of-01024.json.gz": {"num_bytes": 398126420, "checksum": "aa44d029398c33f733065c489ab3ded9395f6e53263407173b6e9c27b6fb9c45"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00383-of-01024.json.gz": {"num_bytes": 399108296, "checksum": "f507161fbe96f8abe9dedccba2458448719e6b153bcc1256ecee6b4b9c82256e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00384-of-01024.json.gz": {"num_bytes": 396156787, "checksum": "83c236bbc8508fb81992c837751a4d8ad4b9bc138dd1f4bb5c1fcc68203e12da"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00385-of-01024.json.gz": {"num_bytes": 396878483, "checksum": "df45b4749951a46695f88789fc536617ee3470083e55562292f606e09185e4a6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00386-of-01024.json.gz": {"num_bytes": 397495799, "checksum": "a8240c9e7266e47bda8880e38ac8a5afa8541aed4b989d6642b31497716a51ac"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00387-of-01024.json.gz": {"num_bytes": 397062301, "checksum": "e6fd54ea6f17d5570fa4cc97554813a7a33bd4e44cbc456b27b0c87c1af22c60"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00388-of-01024.json.gz": {"num_bytes": 397074091, "checksum": "fdc2a134df4a669deb839f26947c86b7e7a4bc7596a6a1c25562cb97fbb6b089"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00389-of-01024.json.gz": {"num_bytes": 397056868, "checksum": "e7390f0007582a3460fa67375b2628c85a1aa85954796d8e6584fadcb35761cc"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00390-of-01024.json.gz": {"num_bytes": 396404332, "checksum": "820a97060abd3172852f38e1636706c8389adad8495de56f4c3a2c3ba6008235"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00391-of-01024.json.gz": {"num_bytes": 397125489, "checksum": "68732c5ab9f4b6945e79ce2a1b45b97a97822d6a107aa79aa9135f29d91173ab"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00392-of-01024.json.gz": {"num_bytes": 394992472, "checksum": "c9d1e8cfd481631a76544e5880ceee9990e7553c88c5978a91b48ec8aa47717d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00393-of-01024.json.gz": {"num_bytes": 394778146, "checksum": "7a5ec4f0878f676a3ac2c417f512186066d793f28d611f97135c3626b3b60fdd"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00394-of-01024.json.gz": {"num_bytes": 397024190, "checksum": "44e32db5a39684ab1789cfe97b6e9cbd3c539390e7a4c8ec9298e7177945452b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00395-of-01024.json.gz": {"num_bytes": 396537190, "checksum": "601ec281240753ac5793ec7cb83802a788c4d88e56dfd83e6c875cf2ef9bd8f1"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00396-of-01024.json.gz": {"num_bytes": 398049705, "checksum": "b1024b69e191b2c7073f5f4f3ea51e8710be54db8603ce8aaabbfb919ea6694d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00397-of-01024.json.gz": {"num_bytes": 396670567, "checksum": "11357bc600f9b0c443f124c7fa4046d10cf03e19016e5ba8cdde884d2ff76c9b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00398-of-01024.json.gz": {"num_bytes": 394706629, "checksum": "778eca6d845b9a7d49e22941b959a95e5e4d2d9714720f27b810230d136acfde"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00399-of-01024.json.gz": {"num_bytes": 398257272, "checksum": "27c2a30af83975d32469e85fb2e27953a3aa9f97514f621063325cb9af1829fa"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00400-of-01024.json.gz": {"num_bytes": 398732278, "checksum": "aff9a39748526a03d3476288cdbce122c3683baf113362e9085895609d03c3c8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00401-of-01024.json.gz": {"num_bytes": 396372632, "checksum": "a6af262bb962eb1c45d2003ee1bb2be1a3a12cb3e53d4ffe58b4b68dd852957f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00402-of-01024.json.gz": {"num_bytes": 396783625, "checksum": "db9aca12012da21fc5a0619a47e9c3075959786d6d6d74f6a244af1cb33c402d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00403-of-01024.json.gz": {"num_bytes": 396950960, "checksum": "b3566f7b9251f6aea9343d1344151f10fc104464f92e8f10a97742defffc2244"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00404-of-01024.json.gz": {"num_bytes": 398481154, "checksum": "897904040b5887620b9996cf89656f5bff329a430a8c3dfd6802d0c879675376"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00405-of-01024.json.gz": {"num_bytes": 396065216, "checksum": "45e0108549ab06d9a8ad5c45dc53250798d0e58f7e940080a754106801250009"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00406-of-01024.json.gz": {"num_bytes": 395637879, "checksum": "bda70f3a19b19e2ffdd1c3a26b959945b447acd450cab49e72ce727d2218af5f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00407-of-01024.json.gz": {"num_bytes": 398356109, "checksum": "1df9e8b4715d9a3f02a0b06aef6095f81d38acd1be0b4fa402acaac0258c3116"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00408-of-01024.json.gz": {"num_bytes": 396041456, "checksum": "e89ebf354280543204e78f4308a8f8751cc26094524628cd8e9cb691d9911b82"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00409-of-01024.json.gz": {"num_bytes": 396254329, "checksum": "15729474174d6a5adb5935f25afa6de2f03a8dd2f73b780e23795ede92f5762d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00410-of-01024.json.gz": {"num_bytes": 397850848, "checksum": "98f1b8fc845e0005b76d7eac70a430ce98e6989569344ea92266f8391b1396fe"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00411-of-01024.json.gz": {"num_bytes": 395527322, "checksum": "52b2e31f2adb61c8e703c6758016cbfc650f8104dcd5f78867c81434be155ea6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00412-of-01024.json.gz": {"num_bytes": 396155992, "checksum": "7b6b4192f9bec4fdeaf9d6dcabd9cbba6b4c8ebb42d26730fea21bad139823c0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00413-of-01024.json.gz": {"num_bytes": 395766377, "checksum": "775d1fac6b1708ba0384d922640b2f372b3ee146fc79fbe692ff69a7c6c699b1"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00414-of-01024.json.gz": {"num_bytes": 394860848, "checksum": "0386d8a8e0cc9d5d613b1f84085791de57ad05751d94d25681d86dff5cec1afb"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00415-of-01024.json.gz": {"num_bytes": 397566065, "checksum": "1957b0d185943b1952dc66e78f0a7d449f49f8f55fc0978bf77e8dde10f4714d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00416-of-01024.json.gz": {"num_bytes": 396297306, "checksum": "3f8796934edb79d172e682511a5ed7666aa09ff541ce55e2c66406bdb6eeda9d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00417-of-01024.json.gz": {"num_bytes": 398314475, "checksum": "8da08075b966c04aa7859275eefd34c78cd2b9edc366684733d027ad6d619ba7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00418-of-01024.json.gz": {"num_bytes": 396296110, "checksum": "efe43733ebfc7b65c646aee68b883cf40124c1446a28e70ff2bfa9e1bb1377cc"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00419-of-01024.json.gz": {"num_bytes": 397614415, "checksum": "c0f02d78715de9c3ea0c684dad36a506386081fed2011ec298ca0ee623c7792e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00420-of-01024.json.gz": {"num_bytes": 395133656, "checksum": "6237f5797a35dcdd89a0b70cac4dedcfb3fe418560f8dbbf6cad685f11c870b2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00421-of-01024.json.gz": {"num_bytes": 397061849, "checksum": "ee37899a6a49269026633ec79577491ff4b11e219e0236dcba68eb168279067b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00422-of-01024.json.gz": {"num_bytes": 396539584, "checksum": "e5914a4b97c27da82eaee2f4f67a165de946bb38a00d6126b1527f5eb1200417"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00423-of-01024.json.gz": {"num_bytes": 397715346, "checksum": "b99e628f8790a7baa8ee7828e31f2ec72374f9a8390c1d64c9b8092b10d9c7fe"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00424-of-01024.json.gz": {"num_bytes": 396335469, "checksum": "9cb3b9eb00760bb68f3df4b66b96f1e5798c338231500472fd64c49cd87c6599"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00425-of-01024.json.gz": {"num_bytes": 396714466, "checksum": "f28d4901ccde8eb7afcede9732ab94fd18c49e0e3731659ef587058d6ea2ab28"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00426-of-01024.json.gz": {"num_bytes": 395566563, "checksum": "9ab75a89a425ce974fd36e936476a30db913c2d7c9ca6e5522b91ffbcbbe30cf"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00427-of-01024.json.gz": {"num_bytes": 395379035, "checksum": "5e1ca658bea5ba5506afbb9ae5a5da4d35cdc3a215478c68e11652a7d5d918f5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00428-of-01024.json.gz": {"num_bytes": 396419259, "checksum": "d740b37b576bcde0e1c8eee27c3bfb3b58c1a0d3c5b471001804b2a37f277ac9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00429-of-01024.json.gz": {"num_bytes": 397116774, "checksum": "d1c10b0ba72aa2d4cb4640d1263c32868190942b1e93b4bb4e9798e25f10ba67"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00430-of-01024.json.gz": {"num_bytes": 396634586, "checksum": "11dec038b4c1c35d32d000915812b6ec8da9abbbec2e15f7493551198b6a1ef3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00431-of-01024.json.gz": {"num_bytes": 396704705, "checksum": "efdfdef444cf68fc05090107033ffe2ac906b6efe2fc138e90f47cd4bd0b6204"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00432-of-01024.json.gz": {"num_bytes": 396264701, "checksum": "fa649c2e2dbc992408c3a60327e5d5ace4697c84010446bb286e544eb6c604be"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00433-of-01024.json.gz": {"num_bytes": 396887722, "checksum": "3d5fd3fbf209dfff2057143a3dcf7eceeccb1e85967a9a85a992f465e3522335"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00434-of-01024.json.gz": {"num_bytes": 398856291, "checksum": "ab6dc5343b052da901f4671c1cb3173850fbc6bbfac2623ca14936b2b83d9667"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00435-of-01024.json.gz": {"num_bytes": 395888569, "checksum": "26abd1e2263af02f998705501bd02ead2edc3d7f68fadc7b198e7fcf4dffc454"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00436-of-01024.json.gz": {"num_bytes": 396976077, "checksum": "a5dadf6ec93e8dcd62b0e1de3cb03c866147bafe0da8e631341663ccc03bb801"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00437-of-01024.json.gz": {"num_bytes": 395809168, "checksum": "7f98e98270f9b88570b5e498511ee65d07428db604af349ef9107dbcf65ac4e5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00438-of-01024.json.gz": {"num_bytes": 399136723, "checksum": "0e03ec507b90b38d5b6d7dfe27d40e127efdc9a0bae349bea2e743375ea29b9d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00439-of-01024.json.gz": {"num_bytes": 396435416, "checksum": "5f868ba66ea32a23be4a926fda0a86d0d2ab4948326e1ebac615fa16a2a6864d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00440-of-01024.json.gz": {"num_bytes": 397487165, "checksum": "d30005787e7472313982cf2860e0a0764900b82a7bf616da27e6c1c3298eb215"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00441-of-01024.json.gz": {"num_bytes": 395968030, "checksum": "181461b447d88040130c3348ae7d22f220e0f97ace030d6f54301a9a3d483fc7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00442-of-01024.json.gz": {"num_bytes": 396909150, "checksum": "0854cd3454047e0c6a0746ef21e0cbbb22fbdf4349c2e668f4fa1e49add183c1"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00443-of-01024.json.gz": {"num_bytes": 396271897, "checksum": "2493db29dd3cadef3719576c34213496eff807df5ae8cf538f13e84d403fec77"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00444-of-01024.json.gz": {"num_bytes": 395540084, "checksum": "5e717d9e0c1b6f728df0f206e422a0958a537dddf31fffa4d699e5bf4b3c2b16"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00445-of-01024.json.gz": {"num_bytes": 398750991, "checksum": "b8af9d413da48fb5f9a9174b12ad253b2eb2c1ed7709cab710d66710841568e3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00446-of-01024.json.gz": {"num_bytes": 397575547, "checksum": "2bad5a914cb9f2e5e99d76afbf85eef66c18e7c1cf2e11c5d455792ae86ab441"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00447-of-01024.json.gz": {"num_bytes": 398035036, "checksum": "d834925674a33ed5eb8fcb335fd81b95e4ab882010e434e3fb9323e0f23be2bc"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00448-of-01024.json.gz": {"num_bytes": 398658613, "checksum": "16f3ac40180e47b9b97998f5d1d7c0e9336e2fee5612a3397fd161937f7a2b07"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00449-of-01024.json.gz": {"num_bytes": 397934476, "checksum": "09dd3d5a529f62b10d1ec97f37ed142315190fb437be3f50987ee955b11f7672"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00450-of-01024.json.gz": {"num_bytes": 396444119, "checksum": "8a25c11e0adc5fdf50944767fbfbf01a9c35b3c0e07205c7c06288d1f68b4c10"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00451-of-01024.json.gz": {"num_bytes": 395963541, "checksum": "f3ac2e295ca4b3ca1f55c8b500ea2588f1519163cec381297ad4bef390fbbe1c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00452-of-01024.json.gz": {"num_bytes": 396594911, "checksum": "25a57709e934077c2972f0f8a1a9db7afe9b7558ab023bd6ee5224b2f8cd770a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00453-of-01024.json.gz": {"num_bytes": 396745507, "checksum": "75c1a4803bb58efe5df885bccd13596d46dd1f3ea30899a7e83812167b990bde"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00454-of-01024.json.gz": {"num_bytes": 396193342, "checksum": "c151679573ea5f5b52e26e8b50da7e14760d1ec15c63a5b864b648190efd48f4"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00455-of-01024.json.gz": {"num_bytes": 398096160, "checksum": "7f86270b13ee4133adaa06de809f26ef581229407813fca05db521d9d36880dd"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00456-of-01024.json.gz": {"num_bytes": 398965570, "checksum": "d5b292189c5d318e0ad622eec1e764993084d0477147f51f29acd637935fec5c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00457-of-01024.json.gz": {"num_bytes": 396672892, "checksum": "8b490f615b3ed701390ed671d5645dec4aa3fc576a032da8f9d434087c1eb8c0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00458-of-01024.json.gz": {"num_bytes": 396911580, "checksum": "8bcadc16baaa4e36fe17ffc0862c264230385e18bbd861671ad5fd8cbb86404d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00459-of-01024.json.gz": {"num_bytes": 395969213, "checksum": "b8ff8371a01d7bd1782044058ee0f53d4d1275ebca0870ba16104c1c4b12f07c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00460-of-01024.json.gz": {"num_bytes": 396928338, "checksum": "23dde1fe55277467d6d2385684b71e90e9066e6a3c349a1da30a1487e87c8539"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00461-of-01024.json.gz": {"num_bytes": 400009637, "checksum": "34b98d46d207c5b6ea7416fab6f3cfcb1444cdc19376464ae9abb9296fd14c3b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00462-of-01024.json.gz": {"num_bytes": 398107677, "checksum": "2031735c0f38ce43e37a5bb1b9728fc37c758fc4af71758c3d3b9535716a3253"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00463-of-01024.json.gz": {"num_bytes": 395503017, "checksum": "7820184904183fad9a61b6c638df9de11d4624bb3aca08885b842255172cecee"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00464-of-01024.json.gz": {"num_bytes": 397493281, "checksum": "b39b1b1e6686014a3c62e74912ec3b915dfc161b62e2d1108410354e6dec760a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00465-of-01024.json.gz": {"num_bytes": 397080149, "checksum": "a65cc7f590cc498da334d5a8653e818421e09e5e6ce2e8bc2a29ac67a02c3d43"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00466-of-01024.json.gz": {"num_bytes": 396633690, "checksum": "15d891873ba02923893cbc8c42adc0468bb39161f898a810037cc2e9f82e0796"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00467-of-01024.json.gz": {"num_bytes": 395045117, "checksum": "711686ff5478ec35ccaaf1549b7a33b941e322585f702257dfe2d31630245ba9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00468-of-01024.json.gz": {"num_bytes": 399486439, "checksum": "59c4599c8610f4c54778daedbb358f5e26fa527f8f94c3364b70565ebc90571e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00469-of-01024.json.gz": {"num_bytes": 396170105, "checksum": "4263dbb03135c2d8b16fb323208f98fe1a1ff1223e76a7ba085f881411a0ab95"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00470-of-01024.json.gz": {"num_bytes": 397479432, "checksum": "2db90de8f4d2bde9af453478ed4667166f636af701bb487095311f99b28e59bd"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00471-of-01024.json.gz": {"num_bytes": 396679096, "checksum": "caea3c4744adb89f006d9b0d9ef93241a55c1fc165cb0cd62b6d07fa3a40cdc0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00472-of-01024.json.gz": {"num_bytes": 397080237, "checksum": "34995676d953f4c95f8bd4f54fba8f92b86189cd73298ab77ee2702611b86e5e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00473-of-01024.json.gz": {"num_bytes": 397881706, "checksum": "c0fc6c68ae509d8273e7ca0efbe24f1452a57dcb000f44f550fe9600fd305e62"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00474-of-01024.json.gz": {"num_bytes": 397705270, "checksum": "50aeb620f8c03a2e4f2346a0c79a4509adfae084ffbeff0b86d8892b858a821d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00475-of-01024.json.gz": {"num_bytes": 397201717, "checksum": "4fa508d23abd417bdb0b0e7a61f9aedfb770609214cd85b10b4bde7ced7f12b4"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00476-of-01024.json.gz": {"num_bytes": 397522775, "checksum": "27da6164865687041e4f53d9ecec2edc877b147da5b424acbac2c69480132a08"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00477-of-01024.json.gz": {"num_bytes": 397323156, "checksum": "e40115fc4901a3930494652ce9ee7abb0c3f41abc6d6c58c81fa75a0ee752db8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00478-of-01024.json.gz": {"num_bytes": 397380721, "checksum": "79a16b7016aed0eec375ca383eb316765687f12421f786b2e133faa5690ef197"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00479-of-01024.json.gz": {"num_bytes": 396828680, "checksum": "08185ce3c3e5b01552be7d8f08ed5b27a6b1b121bb2d7d70a78b7074fee02fa3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00480-of-01024.json.gz": {"num_bytes": 398678311, "checksum": "37a5804dafb2f4aff9e393af5b127c3577ab8a5dd23f1e41f2304b25a4c428a6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00481-of-01024.json.gz": {"num_bytes": 397654112, "checksum": "47ce12535b753d8936ce3b569675e76cb6f638bfb74a93caf201f3ffc409d71a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00482-of-01024.json.gz": {"num_bytes": 396387301, "checksum": "1d07828a199bb1e1c0c8342ba99e484093557188370d1ced90803c2615d24b7b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00483-of-01024.json.gz": {"num_bytes": 397178863, "checksum": "b6499612fac654798010e11c27ee8a25fc05d1dbed8aaf2338fd0ea377dc4732"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00484-of-01024.json.gz": {"num_bytes": 395826769, "checksum": "ce197ad5a226249bbba53c34b9f3c83508b542853748c3094a5b98befb537f2d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00485-of-01024.json.gz": {"num_bytes": 397100006, "checksum": "f483044a4a0418b695e0b989f0fd03bfa79df01b649991f2356443bcb29d0820"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00486-of-01024.json.gz": {"num_bytes": 397658615, "checksum": "297beef7b85dc128a6a58d834c5fd1b24bd7fe84c7a317500461720c742235f1"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00487-of-01024.json.gz": {"num_bytes": 396904673, "checksum": "06751938694fad1645ed575208e8e2c1efebb7165b4feb2d0ea871dc348741f8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00488-of-01024.json.gz": {"num_bytes": 398019631, "checksum": "eb58bf8b011fedf15835841317e445e9e757c9939b4453a013233f020f98a697"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00489-of-01024.json.gz": {"num_bytes": 395822836, "checksum": "b339e33e7affbdaf691852d3668ff79adf8476a3c33eb86ad9f4ad4a6ebbf3dc"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00490-of-01024.json.gz": {"num_bytes": 398410737, "checksum": "4d8356cf804474538772c5520e77e75ac750dce3e6b103c9feab49ccd46a58ff"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00491-of-01024.json.gz": {"num_bytes": 396607853, "checksum": "1757097fb884d03aa288a05870016b1c2b9f1700ac5913d85c9821cf2e367702"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00492-of-01024.json.gz": {"num_bytes": 397612443, "checksum": "92e98e431a378e0402d81299c49209c66d39b0ba7ae63711f8d6ecf542f5fdf7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00493-of-01024.json.gz": {"num_bytes": 395595466, "checksum": "d839e1763aa6ebc7cbcf1b870d947ba45b0b4ac95b0adbe4941a0b121690a311"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00494-of-01024.json.gz": {"num_bytes": 400397068, "checksum": "31caeb5f0ef694c06ce434df44c01f4a91fcd48e4acb4f1bf167eae6e59a02de"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00495-of-01024.json.gz": {"num_bytes": 396458630, "checksum": "26291dfcae5145cdc306317ecf95851a3f693b4a7c6e132e55384ec69d85ef3c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00496-of-01024.json.gz": {"num_bytes": 395037560, "checksum": "b32344b92f81006ad9e2e471f5ef8133e87924c5150145b13d51c3d7a0f68c46"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00497-of-01024.json.gz": {"num_bytes": 396247929, "checksum": "0396f0bb16b06ff130e955f260233ec868ada1daef6e8cbd480ce388628d49b9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00498-of-01024.json.gz": {"num_bytes": 394798084, "checksum": "28d43d4e7bbce4e20167741ea2bbc3f17981aa51f9c040cfc41c522e732c6d32"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00499-of-01024.json.gz": {"num_bytes": 396699883, "checksum": "c6f6deff919b375fb08c74e159c25aa66362e4cddb0700f9b1e0e2701293ae70"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00500-of-01024.json.gz": {"num_bytes": 397014521, "checksum": "7ee22957fdfad0880f132f47860612331afce7a48975b9312233ba8ddf537bed"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00501-of-01024.json.gz": {"num_bytes": 399063718, "checksum": "ec94186b620037002819cd40347e6aaf67cb847848483790cd687222c9addbbf"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00502-of-01024.json.gz": {"num_bytes": 396938850, "checksum": "a218de10cee75c4bb5a7102fbe208e6e65142ba5f960ecdc2b56b6f85fa30840"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00503-of-01024.json.gz": {"num_bytes": 394631309, "checksum": "8189de9454986f63253fa1ad44c63d5c2f692ff4bc3a848c7c2fd02e08f4e1b9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00504-of-01024.json.gz": {"num_bytes": 397884411, "checksum": "b7b268545c27573840bf8a6abb7361c209f92f9b5f0f8028fffd49b0c773854b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00505-of-01024.json.gz": {"num_bytes": 395784113, "checksum": "b9f1610be9f045c15e43a7343bd2918743a71585a7122a4e781533dd39a73132"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00506-of-01024.json.gz": {"num_bytes": 397939195, "checksum": "f07b77d1be71c5922321e8683140f9a63a90903f1fbd1515d908807e12fc4597"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00507-of-01024.json.gz": {"num_bytes": 395925741, "checksum": "23e9927e9e83fd03e9d99c3fac05f1bf63d6c296a2b02d1aa208798d27d8dc1c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00508-of-01024.json.gz": {"num_bytes": 397426015, "checksum": "f4b8a74c610cea50a6b144337f65fcfed11fff21df6683503f25d4b82e29a4e4"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00509-of-01024.json.gz": {"num_bytes": 399072341, "checksum": "c3069ae9658273cbaeaed1730f171837c8d3042e31d1093cf0f519f601309a41"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00510-of-01024.json.gz": {"num_bytes": 395859781, "checksum": "e5863648f64423397ca1a7838df18aeddbb3d5d3a2551321fd99a480508fa86f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00511-of-01024.json.gz": {"num_bytes": 396948832, "checksum": "a2209ec05a794f083cf163c102c6ddd8d5e5627674686950e17e586128a81e60"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00512-of-01024.json.gz": {"num_bytes": 396585426, "checksum": "1c6fdb002dab490e6ddd7fe6023b2124bb944b7ebe95ee3b7faca9a92f4b5de3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00513-of-01024.json.gz": {"num_bytes": 396789970, "checksum": "83b02c0cf9ffea9d021adc102269c30a33ab3a803d331ba8d39aaa9b3b7acb43"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00514-of-01024.json.gz": {"num_bytes": 397131474, "checksum": "783f25460641cd3532c3bb3920c7d3f0c68b5e674d44cba33b1ed755608cf8ba"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00515-of-01024.json.gz": {"num_bytes": 396127068, "checksum": "61e5b9947f77d929442f23fe84465d88044631aa1eb6438a0b86372cba7286fa"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00516-of-01024.json.gz": {"num_bytes": 397526020, "checksum": "539b032f528d1ec3a8e8420514ef2118f05482297b052f6d28876a8bf776a080"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00517-of-01024.json.gz": {"num_bytes": 397748661, "checksum": "03b85a51aa7bcde672cc017fcbb0f11976cbd1447fc0ccb4f4bc822b2b04b27b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00518-of-01024.json.gz": {"num_bytes": 397915751, "checksum": "80dec6dc7d15459c113c16f23978c38cdc1157ca18468d8a00e0d2192bb2ffd9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00519-of-01024.json.gz": {"num_bytes": 397847480, "checksum": "7125e7915fd03c6312cfe448e4e7a8629249765c13d8558b17c240c2aef713b4"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00520-of-01024.json.gz": {"num_bytes": 396232144, "checksum": "27974f9766c18fd0b652c94eafa3493243c8e1b25b6e850e857ab6246b193b48"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00521-of-01024.json.gz": {"num_bytes": 395111538, "checksum": "61406e92a8f9a6ab800b3dd25cbac842e3487a4c7db7b1bb2070a41d627367a0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00522-of-01024.json.gz": {"num_bytes": 397690206, "checksum": "b2e29801d120132a5fbbd3662a54290e46ff5e178b3146ebfc2169facf72e7e4"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00523-of-01024.json.gz": {"num_bytes": 398274007, "checksum": "79905dbc45756c9f1c225120709d39cbf3caf435e322a531a4add690a1d0440c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00524-of-01024.json.gz": {"num_bytes": 395689218, "checksum": "1dc3086cb869abb13862970186f6a77cb29b687cd49518173f639c148d937f6b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00525-of-01024.json.gz": {"num_bytes": 397979085, "checksum": "6958bbc6029c00229fb0059d016a6b7a2bd21cfdc69392893423d2657c35c7c5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00526-of-01024.json.gz": {"num_bytes": 398473877, "checksum": "895f42c4e7569f0db3832af13e56499f65fff74e93fc0cdf60c1c4b4b08881c9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00527-of-01024.json.gz": {"num_bytes": 395879939, "checksum": "e84e72048b56878b1ff904ee83d92c208e15b16663b99a9d763edc23c2e0e55f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00528-of-01024.json.gz": {"num_bytes": 396472889, "checksum": "badcc3cda339c61936591e9333787ea032c42d7ff2288fdaff791bdc8504ce96"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00529-of-01024.json.gz": {"num_bytes": 396983038, "checksum": "ad20643f9d50c7c508fa136ceed0039ce39708e0e7a5e743c1981f1000bc3c4e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00530-of-01024.json.gz": {"num_bytes": 395774249, "checksum": "9453fa3fd296150b436f0146171ea8317512c6735ee9434622a83765a5d9e310"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00531-of-01024.json.gz": {"num_bytes": 396171120, "checksum": "3e3c230ab6beda13e4dd4747c7c6291e57b1ccb4a96ac2edb46ffdb4c3cb05b5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00532-of-01024.json.gz": {"num_bytes": 396200411, "checksum": "e9b52c3dad233fd1c4310cf5f76c2e6d0788ed084abcf931f99ab7002976d75b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00533-of-01024.json.gz": {"num_bytes": 395580851, "checksum": "e135cc4420d9f4d17ab523f7db8c559021a46a9a6bcdd21a6c4075047465906e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00534-of-01024.json.gz": {"num_bytes": 397459281, "checksum": "bb4f32ee1c1bedf4582b0f4f9ec7644be73fa25bf18cca7506e3c26e98818bad"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00535-of-01024.json.gz": {"num_bytes": 397344480, "checksum": "3766ddf8313c5cee08a575fa96bdde06a5b293f1964e58293ea583d72bd18e20"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00536-of-01024.json.gz": {"num_bytes": 396588089, "checksum": "56d236a4250f9488d80b93c0c005962d018da256ea5632c7e16ae26c54188749"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00537-of-01024.json.gz": {"num_bytes": 397606873, "checksum": "d7ec24ef99de2769937b89e0ca7e291eca2bd0438d501d9228d5ab035f49d83e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00538-of-01024.json.gz": {"num_bytes": 397608864, "checksum": "1a60378a0f1a200b11f85577bbd0f373ae47022eab16fad53da492ca1ed35bfd"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00539-of-01024.json.gz": {"num_bytes": 398377669, "checksum": "787d263107eb09e852b015c17d1d0f54d8b93e78292c0c1e60cf99f27535c608"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00540-of-01024.json.gz": {"num_bytes": 398516980, "checksum": "dce03ef0813ef66e27df8730da7e341b49bf7e684bffd3a9cf700905501d1d72"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00541-of-01024.json.gz": {"num_bytes": 395557685, "checksum": "e4035222d65124bd3e33372b76b65c2dad9e696701607ceeb5968d483595645c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00542-of-01024.json.gz": {"num_bytes": 395725875, "checksum": "4e7ae0b1c0c4d514e0208e21336d095fea5970475077d6690a917faadb2b72b4"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00543-of-01024.json.gz": {"num_bytes": 397625187, "checksum": "a96ac467b6ace74a08f7dbc4bb8e3fc57fae36abc8975d6b60a7b7353ca9ca88"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00544-of-01024.json.gz": {"num_bytes": 397078230, "checksum": "337470c84cde5d02bc6a89003a6796de9e63db269e7800637ef2d220d75bd3ae"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00545-of-01024.json.gz": {"num_bytes": 396145060, "checksum": "da65d66aa4cfff77c754f8017eedd92cb82494b9425c2d5c5491d64603b2231e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00546-of-01024.json.gz": {"num_bytes": 396093007, "checksum": "399f7b70d1c1b45ce315f396d5fa0db2c69e41c522b0514e19bcc6802b953b1f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00547-of-01024.json.gz": {"num_bytes": 397457696, "checksum": "47fc8fd82271e6b1fb074512da45dc005e22cb7f0aca3b7b621ea87613aeff9b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00548-of-01024.json.gz": {"num_bytes": 396246097, "checksum": "3108770b39746852d7c048d9a8777722480505bbf4592732c7d1f231e2505c55"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00549-of-01024.json.gz": {"num_bytes": 393096516, "checksum": "9bb2b88775593afe4060349985ff4417a37f1ba9b4ef33399c58644c01a92b89"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00550-of-01024.json.gz": {"num_bytes": 396631619, "checksum": "cbb55d645d145ecc2ff9b96524463f82d5548c0bdf42381fc6faaad256e7ead7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00551-of-01024.json.gz": {"num_bytes": 396806780, "checksum": "ece03d7f12daa39473b6b8d5faed08a3f751efb9b1ee99f69c5188633d4a0f43"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00552-of-01024.json.gz": {"num_bytes": 398608968, "checksum": "7fbbde9c39d67d8d7f9f16c0848188b743c6ff5bc44e6339d5fd88c32e1aafef"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00553-of-01024.json.gz": {"num_bytes": 397696672, "checksum": "85f9c5c5fbcfd06f715b520a1a3a63a014b1831d2f65de5f02cfea49a18ddf63"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00554-of-01024.json.gz": {"num_bytes": 397122204, "checksum": "78e3d43c3d2b71d8483788a085cd5706648767de7a2fc4aab707d6a05257ff00"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00555-of-01024.json.gz": {"num_bytes": 398704893, "checksum": "113e5fd99ada6ca96c086487b6e4012bad711d1d482d580e22d3af5b9d118572"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00556-of-01024.json.gz": {"num_bytes": 398099675, "checksum": "c7a816f8f2f74b4554ac17ffc41e67ebbcabb7c8b0c94292b4569bea372bea3d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00557-of-01024.json.gz": {"num_bytes": 396538561, "checksum": "7af6d2c9886481a0d393e026739b5ad7d0fc358ecc216d2fc124160402d4b50a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00558-of-01024.json.gz": {"num_bytes": 397660839, "checksum": "c1033428189671d4e1ba55c822040f307748c6ec31b80be3e4ed8e7a4325066b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00559-of-01024.json.gz": {"num_bytes": 398754128, "checksum": "69c9f88840166363f2b7ddaef05ac9d10441fd184d8451abfde76eb105572342"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00560-of-01024.json.gz": {"num_bytes": 394988981, "checksum": "a2dc4fc315a0db8f1a868d631d2941ab2806f44c2ae698e94bb7e8308bd67c70"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00561-of-01024.json.gz": {"num_bytes": 395801300, "checksum": "dc1b2b4594e3fc7f8795f7649d1c524405edce56d617f1e214692565de8c8937"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00562-of-01024.json.gz": {"num_bytes": 398322250, "checksum": "c23404fef6a6b5b887cc2dddfe341e983939ae36078d62842919a3739c96b43a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00563-of-01024.json.gz": {"num_bytes": 397584845, "checksum": "c909fe429772c8198f904496ea6cf239d669c6c787889cefcb7623e08a988db0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00564-of-01024.json.gz": {"num_bytes": 396436964, "checksum": "8e7cb1863057a3b9929af4da29b4e1cca1f71c254f5eba91a657d9e8c1fd6dea"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00565-of-01024.json.gz": {"num_bytes": 396486039, "checksum": "23ba56e78c4edc4d58fd7fbfcf784b29037204a641e43a9894c95c68bdb982fc"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00566-of-01024.json.gz": {"num_bytes": 395358745, "checksum": "71259a300ff096b49e3461c91824a8185037ca85ef2018dff2617f335ab304b6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00567-of-01024.json.gz": {"num_bytes": 396405726, "checksum": "d9b56ed523376681dd81cb9831727467461bdfb87c80d3932937338370093033"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00568-of-01024.json.gz": {"num_bytes": 397509797, "checksum": "c650aad13a48d5b0c51162ad19c9eb3135559d0a3318dba701a90e8138a8cd24"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00569-of-01024.json.gz": {"num_bytes": 396514261, "checksum": "d71e4126c2deffae8ee55077cee9dd2b70ce27adec767bce06e02afb23b42416"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00570-of-01024.json.gz": {"num_bytes": 397072833, "checksum": "519a32e1bdf7f5b97e1a438242a79218317e04e44021dc61aa65c526d35ce8ed"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00571-of-01024.json.gz": {"num_bytes": 397170114, "checksum": "919a9659156cafb26b87190fc00b9d33c4fd536dd35544cbef8e5ddc018ae365"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00572-of-01024.json.gz": {"num_bytes": 396475017, "checksum": "3d7e4e548f01c9ad5fc99b4342cbf9a9004737058dd93aae8b7d95b2c00856bf"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00573-of-01024.json.gz": {"num_bytes": 396749955, "checksum": "032f8e37328c9f0fc046e5a6ff5a79cbb744f3100c4cbea78e397c449471bb10"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00574-of-01024.json.gz": {"num_bytes": 396036505, "checksum": "8e795341527712be32a69307ce8cbd2d6195c6b2fea596d326a279734505198e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00575-of-01024.json.gz": {"num_bytes": 396722381, "checksum": "45a43576cfc61842bde146eaa566b4f22a128c3c2eb8f30c59a6b6cae4bcd4e7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00576-of-01024.json.gz": {"num_bytes": 396163377, "checksum": "38429d2d6176ee42ddd495e052c01735a9a7f0076cde107d24a0a9c7a26bf2a1"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00577-of-01024.json.gz": {"num_bytes": 396813305, "checksum": "eae77c319bba236feaffc9f74eaa38e911fa48eb06f4794c9b1a6d17edab91a7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00578-of-01024.json.gz": {"num_bytes": 397797226, "checksum": "1dd2b3d7e99fde8903bc12625568ec4fc6fe653737b3af5e9c71432e311cf5f0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00579-of-01024.json.gz": {"num_bytes": 396012631, "checksum": "d9322e66701b4ada3788b91a07e87b03af6c91eb4cfaaefee23c0330987a1840"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00580-of-01024.json.gz": {"num_bytes": 397943129, "checksum": "23deb32e1b0f07a55a5cf1572cb8e313ce716c748a07f58bd90cbae97290d0a0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00581-of-01024.json.gz": {"num_bytes": 397614648, "checksum": "6193f8b848c7930fc04b9f2429dbccf36f1b291271b3eaf646c655433bf3ff9f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00582-of-01024.json.gz": {"num_bytes": 396659280, "checksum": "40997ef02c7040356cd1c5acd8e6a5121e00b31253713cad4f529ab2922affc9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00583-of-01024.json.gz": {"num_bytes": 397686445, "checksum": "5cd21271e4ae036f8d1e0c320330a6c93a8b1ffbb9293a80c56c2d7f123f9ee7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00584-of-01024.json.gz": {"num_bytes": 395500815, "checksum": "c25befb7c735b2340b092a04375d2109c1b876d2b0057dd8d4ed4beac87118ad"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00585-of-01024.json.gz": {"num_bytes": 398413461, "checksum": "073f632e95c218fdf17274fc21915c94f56bdfbb58a6b1a0550de249ce4d2129"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00586-of-01024.json.gz": {"num_bytes": 396849745, "checksum": "647cbe9bd7709c0d8a01485096fd88ad0fc09b27de324eae141a8d841536b71b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00587-of-01024.json.gz": {"num_bytes": 398567154, "checksum": "557af97a8d2b2656149bc25ee5b362116d173e6a48911b860ec10d512b4b763d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00588-of-01024.json.gz": {"num_bytes": 398086388, "checksum": "9e9afa15ee3534e497c9fc7c8cd967388183193dade3d1ec82a8e2b0e82c5118"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00589-of-01024.json.gz": {"num_bytes": 397335823, "checksum": "ed8a1d0b9c55f465b5d4a4e5ea022f6d17aaa8b82569be7cfec55629c1bf26c6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00590-of-01024.json.gz": {"num_bytes": 394931693, "checksum": "3fbe539fcf64f0d914c19b383de9953b0605d4a69f48801145f0db1972f9c6b6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00591-of-01024.json.gz": {"num_bytes": 397828770, "checksum": "9165de8866384d3d03c3876c39c96706e33a24b9f95acc09999c2dbfb85cd9cf"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00592-of-01024.json.gz": {"num_bytes": 398782493, "checksum": "433a9cb730d7ab024b56ad662a3ea53633f7ff26c625051c4c02f252beeb87a6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00593-of-01024.json.gz": {"num_bytes": 399264489, "checksum": "4a7e5f40aa8b692cfa0519d33a868e9a05e579ad430204bc13c48b533eadc5ce"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00594-of-01024.json.gz": {"num_bytes": 396629833, "checksum": "521d5e90550dbc97ab26a18a0b75da81e38ce2083ff5fd93340fded2e54e1ca1"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00595-of-01024.json.gz": {"num_bytes": 396916313, "checksum": "30c9be1d99ce0a41b214fdbd5115988c82ca317d4aceb30c19fbca05e0a409e0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00596-of-01024.json.gz": {"num_bytes": 397013253, "checksum": "b16bd9d7d893b4a71056575fa0799bef96120c03cfc6e2a88c292469a67f2614"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00597-of-01024.json.gz": {"num_bytes": 395980036, "checksum": "3bd15089b6fff342df2b3109d7ebadca35cead4f44ca5b1b55e55d8892aab82f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00598-of-01024.json.gz": {"num_bytes": 396295935, "checksum": "6252d951a9570baea9767cf3350a6d09ac5a5fc34ba80eae3b5c40adb8361ab9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00599-of-01024.json.gz": {"num_bytes": 398608239, "checksum": "b265a385cdd5e64d1fb2ffce739e72f2fe2cc8944621f20e2084dc52b91cdd9d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00600-of-01024.json.gz": {"num_bytes": 396563743, "checksum": "43d12028cbe738e8f450911f6a55dcb00f8742cefc2a2c4da5f9e9220b0572c1"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00601-of-01024.json.gz": {"num_bytes": 398256993, "checksum": "9368dcfc581e6d572d899ef25b129bc0268901a2fa009500174a0985bcf330df"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00602-of-01024.json.gz": {"num_bytes": 396202546, "checksum": "3cc57d7afd161fcd411f73da8369d98db4c6d8e30643ee01450adef21e8ea3ea"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00603-of-01024.json.gz": {"num_bytes": 396338425, "checksum": "cc21fc5b8ed6e5115bd8924954d685ed52cd5b773ab63d37188343443c95851a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00604-of-01024.json.gz": {"num_bytes": 397597307, "checksum": "d24f6d807ae35037e695e19917ed446f74448166fa464c862e31fe7ba2bea196"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00605-of-01024.json.gz": {"num_bytes": 398278313, "checksum": "99166183c752aed8d0f2cc9c010f1ebdd4fb93d40e936fd6c082eb3542baa956"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00606-of-01024.json.gz": {"num_bytes": 396590468, "checksum": "657ce79340c15524a5897459a6cf712fa4127def2445f7eb3de21c9b46db3794"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00607-of-01024.json.gz": {"num_bytes": 396603228, "checksum": "3705441435f18d1e4aeea9e794e1216fcd29b48213763a554808e3d3697951a6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00608-of-01024.json.gz": {"num_bytes": 397280580, "checksum": "be0bef2c16e9bdd0387276402dc99fe5a9a0a7a105a44e88bdb783139f2de474"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00609-of-01024.json.gz": {"num_bytes": 398284528, "checksum": "3a7c7a8cb01f6d7589152a1483682a5fa99e119490f3e70d8a02f582f2e2b19c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00610-of-01024.json.gz": {"num_bytes": 398872039, "checksum": "c349aac5b64227397ec2870992ac9e4fac9fe39f1fd4e0a7b8c727e171655e14"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00611-of-01024.json.gz": {"num_bytes": 398736440, "checksum": "63ca5eb2d27632b3b4dde8e40f9925e71e21ef737262bcda7a99324a67e0fab5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00612-of-01024.json.gz": {"num_bytes": 395170895, "checksum": "3b4bb3e14ee981a9edb9828ce40b86b5d83dfafcc1a5e0e02642cb40924bd6ed"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00613-of-01024.json.gz": {"num_bytes": 398443337, "checksum": "e95adbd7d55024b7e62145860f217a6f04f5fcef79ac23e92dd9e14f9a0b2a30"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00614-of-01024.json.gz": {"num_bytes": 398854661, "checksum": "def8cb789f8f79fa169e855816c5e4bc7d5c253e565502691a9abb826d7436d4"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00615-of-01024.json.gz": {"num_bytes": 395505189, "checksum": "6775ca6aa4f834289396a438906b90936ed0ff6390213dac2b0861f40d7761e7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00616-of-01024.json.gz": {"num_bytes": 398999454, "checksum": "6cd5efddacb09cc80ec1eb79f93b562044787903b3cb1c879be2acec64a9dbdb"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00617-of-01024.json.gz": {"num_bytes": 398570431, "checksum": "26d1f587377446e8b1499be7a3b6776d437baa40353fb04c591203a420eb0cc2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00618-of-01024.json.gz": {"num_bytes": 397064982, "checksum": "e59a87fd1cd3d87fff4b15c3a9331521d7587ac7f4a7fd51ec3906b484ef9ad0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00619-of-01024.json.gz": {"num_bytes": 396676338, "checksum": "8077c3a15d93579d0fbf00bd9d117bf4f50092c5be3acf46c7d4433ef7be9dfc"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00620-of-01024.json.gz": {"num_bytes": 398186471, "checksum": "ee3fb91d7797ebf1daf8dcb81563b7dae7b161d97732efd35e3eb6ebea732ee2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00621-of-01024.json.gz": {"num_bytes": 396467968, "checksum": "386adb83129a7306ef4da37c1cbedc39b3971e7633d516d406a982f307577e67"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00622-of-01024.json.gz": {"num_bytes": 398293882, "checksum": "b708cad0e04c56174d0feec84d7224a4490cb8db023d38e57398cad89b78568f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00623-of-01024.json.gz": {"num_bytes": 397396780, "checksum": "c50c4568c6f103b3e6a3702cbd915ecb530df954df808156bc38a98f36a0b944"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00624-of-01024.json.gz": {"num_bytes": 396971282, "checksum": "11351ef83c9fb883d6c0f484af5c10f0d686b7ac4a2f08fae9ac3d9837df0a0b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00625-of-01024.json.gz": {"num_bytes": 395882440, "checksum": "dfa97ea7949c9bbf7af43d43ac5c8d0034bdbd1ad572895159b7c7846ab89676"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00626-of-01024.json.gz": {"num_bytes": 398292846, "checksum": "fbc9c23dc286ad6fd7f01f344de97ef5789733af581de278488869bd36f3b246"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00627-of-01024.json.gz": {"num_bytes": 399890427, "checksum": "f43bbde36b8bd34ed9998b99b42c85434b8bbc8bbaa1cf5b38cec6393099c23f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00628-of-01024.json.gz": {"num_bytes": 399589466, "checksum": "c50058a4937912b678d33d34ff91e2287e8701365f4f71fce61f9002652556cf"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00629-of-01024.json.gz": {"num_bytes": 397355095, "checksum": "051c4631d0587b6f65827410ad2f2121c05c849a009274415bc5e7f72db42d44"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00630-of-01024.json.gz": {"num_bytes": 397860559, "checksum": "07b48a86a8a3245fe5b78f6943c8970c839942b8d86abf173507225b0d1520d0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00631-of-01024.json.gz": {"num_bytes": 396161304, "checksum": "70a03f0308105de5266c4a40803b51f99888b362b71409719b7f71f73761b590"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00632-of-01024.json.gz": {"num_bytes": 395620184, "checksum": "c6923984c419f08bb4e6effc27dd25dd986513034338debc9b238592dad9f607"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00633-of-01024.json.gz": {"num_bytes": 397572527, "checksum": "900fc701703234031e825a1eb2d11b364f1dda97eb0c7943e17ef278695f7bea"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00634-of-01024.json.gz": {"num_bytes": 396215174, "checksum": "0cc838e395581933123fc57c6690afbdd2be1b67d213336d9b8c08b3876f8458"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00635-of-01024.json.gz": {"num_bytes": 399176005, "checksum": "5a3daa1bd0be8c997da56257f063a7d1c7b2b271648a46615b26ca4beeb42863"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00636-of-01024.json.gz": {"num_bytes": 396035356, "checksum": "9d21ce1c8b5a7c1330cc95b1f45286fb8578d5dcec0686724ff6e25a97f38a7e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00637-of-01024.json.gz": {"num_bytes": 397214839, "checksum": "83cd34e1ba09c268b515fda7699e12bfa2531fb7e60e2f861946ffdc01e54a04"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00638-of-01024.json.gz": {"num_bytes": 396292535, "checksum": "82a7bae9a7d35fa707bcb6d90f7b244f1509e112dfdbd604c9be1f8b8ce7150b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00639-of-01024.json.gz": {"num_bytes": 398009954, "checksum": "b6d7ebd102c67960413caf5fcdc5b4aea728b6d3d6369ab8dd3cd6bee6c769de"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00640-of-01024.json.gz": {"num_bytes": 397558496, "checksum": "151c55d019fd84fdc0eab73d24984e5d88ac964c86f89a361a03dc776a22b5b4"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00641-of-01024.json.gz": {"num_bytes": 398031508, "checksum": "e0e87304a8ac408adca2badf2564ec52caf155295ea303a121c30f3b1ce797b7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00642-of-01024.json.gz": {"num_bytes": 396594124, "checksum": "73d08c99b6b96d96b82d88267b2a392a7dda2084ba5142b8eefd0d23212702d5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00643-of-01024.json.gz": {"num_bytes": 394552252, "checksum": "ebccf3b935d63c30f626d317af250b6bd0f04ef5e1cced829287ba64fbb0d25f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00644-of-01024.json.gz": {"num_bytes": 397586341, "checksum": "674c0965a9a880c057b6f2dbb785a4a6ae048954d44ba4f5266dd5e65095d06e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00645-of-01024.json.gz": {"num_bytes": 397950976, "checksum": "7ac8d4dacd682a2977818f01d860c3dfa5a5e5a78f7d2d95be0353a675452e93"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00646-of-01024.json.gz": {"num_bytes": 397511840, "checksum": "452a9cc03facf9151552f914f9a8a3507a96fd8ea40f7d04951a29ecbf6aa1e5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00647-of-01024.json.gz": {"num_bytes": 396692070, "checksum": "5a795a238203444596c711bcedc634e653e5240c9a800a9884c51f878340b494"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00648-of-01024.json.gz": {"num_bytes": 392707626, "checksum": "9cc366c37950624df6af318ee52a97d32a40e278fcb519cbe8545b04bee3204e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00649-of-01024.json.gz": {"num_bytes": 396283284, "checksum": "4ddeec31a30b5c563838b17e1115ad30041e08c70a94f299ea324ee4b71fd82b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00650-of-01024.json.gz": {"num_bytes": 396349662, "checksum": "f5bc63114ec9d73d6cea7f8e38a95031ae2bcde849b27440afd840a3e72aac13"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00651-of-01024.json.gz": {"num_bytes": 397187042, "checksum": "7199c0242b2654509af187c9c8bbfc22cc5067aafa1ff69949b1f0e5b718425b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00652-of-01024.json.gz": {"num_bytes": 396263026, "checksum": "c9e62b6df7213ea5b71913fbf736403f33c51e5a868bf1035cebcc39d80635bb"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00653-of-01024.json.gz": {"num_bytes": 398689010, "checksum": "f3bcc9eca4d71043e920db6399a032f916c23b1da329d2ef86434a74f8e7b318"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00654-of-01024.json.gz": {"num_bytes": 396938678, "checksum": "fb41df26e1f68e1e9d12ae8740535ca66e80910320be2270d680fec40d6fe9a7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00655-of-01024.json.gz": {"num_bytes": 395995226, "checksum": "018b40ddf6d88c4c346c8018439d16f6ca66ee0720970e84ddc34b1010ae35d7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00656-of-01024.json.gz": {"num_bytes": 397860049, "checksum": "8f3847e9bb5a8145e2959b340f86cc06f85e6646f32d5d785c5c90ec11a9f404"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00657-of-01024.json.gz": {"num_bytes": 397142407, "checksum": "a1ae8735a39bd099dac2e50c22e312f1a010f2644774ef53c995f3437c0a5524"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00658-of-01024.json.gz": {"num_bytes": 397827609, "checksum": "f6154377cfff2453392fb899f81514a7c0ffd40dbc35d8842d61a115d0aeef35"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00659-of-01024.json.gz": {"num_bytes": 396861858, "checksum": "4299633524667921549573c469a73e33abae89d107375d5ccc6a6d987c2a2a26"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00660-of-01024.json.gz": {"num_bytes": 397773823, "checksum": "44eaf6c1739d8a9c13c54750c473ac04aaf9d2223d8893cd8094f1769b1f6f8c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00661-of-01024.json.gz": {"num_bytes": 396311257, "checksum": "18edb60444b660c7cc68dbe59ac71989be0e20ff13639725a5f05e4d4d512514"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00662-of-01024.json.gz": {"num_bytes": 396176936, "checksum": "7b60541181fbb92f361fbdf0bee80d086c75279610aab792a7b3877d49a3e1bb"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00663-of-01024.json.gz": {"num_bytes": 396274985, "checksum": "59e057ee5f5e8c7267138c18c5c88f3ca24d30f86c484e4bb0c0a4eb5169c4a4"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00664-of-01024.json.gz": {"num_bytes": 397483935, "checksum": "585f45d3ac3f88c3bf1c86e01daa46537f8f5c5165521412de0e67393cb6da33"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00665-of-01024.json.gz": {"num_bytes": 398831104, "checksum": "e403d2f4ff6e74abc9639749f93f77cc868453908c10821fea7fafdbcc981a06"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00666-of-01024.json.gz": {"num_bytes": 397668116, "checksum": "f9bbafa396a466b24630a259a01804b2857c1dde2fa3cec60b2967a88ad9f528"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00667-of-01024.json.gz": {"num_bytes": 398123165, "checksum": "ed693d5ecb9dfcaf545e831b5769b877e927125794cae61a0ec7821c3c85dfe6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00668-of-01024.json.gz": {"num_bytes": 398152096, "checksum": "51c33c07d503743704f564bc6a372c2f6f8f13a1ddd00b0b9a2c44c94cc57444"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00669-of-01024.json.gz": {"num_bytes": 397927981, "checksum": "d356b5268ba39e38ffccd20e95803f3218407e0a1ca3b4d1165ff82796ec1bae"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00670-of-01024.json.gz": {"num_bytes": 399074605, "checksum": "bb96ea8154ae01275a9197709820e670c4e6212c740e92a7f1cfb7c618a49bea"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00671-of-01024.json.gz": {"num_bytes": 397864381, "checksum": "afca3dbcaefdc368e996259fd595b77fd98a885ec005a93069a01b83227c827b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00672-of-01024.json.gz": {"num_bytes": 396077133, "checksum": "3da96ebd1b28b55b03bbab8e85f78295cffdad9020f869cb456da27058ffa090"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00673-of-01024.json.gz": {"num_bytes": 396943842, "checksum": "6a4c344a8af68a95e20d58b64fff8fe616c2a406cf26f642cdfea65fce5883d1"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00674-of-01024.json.gz": {"num_bytes": 396975969, "checksum": "e6b0f7727d78143fa180abb76e617b37660b35f6323f19bf1dcbc78fb9374508"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00675-of-01024.json.gz": {"num_bytes": 396692800, "checksum": "e4ed97b19c6d83e618a3fcaff75460d828ca419b1e62842a1493b0ec4c9703e5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00676-of-01024.json.gz": {"num_bytes": 396514400, "checksum": "a5672f1561ab85f071395de43e702791aaacff77a9f67f6ec9e14b12aba675b2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00677-of-01024.json.gz": {"num_bytes": 395939125, "checksum": "3dacd3bb90b5e645d1b9a962d8df87f571b0fcf227996068535bb98a68f9191d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00678-of-01024.json.gz": {"num_bytes": 397022852, "checksum": "c1a0ef31342161369b7fb709be17e3c86191c1a52cb04b704fc58190818302c3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00679-of-01024.json.gz": {"num_bytes": 398325372, "checksum": "47ddd1056ad977407f61b2eac3ff803d17b1aa8fa0719279bf911caf49bbb7c8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00680-of-01024.json.gz": {"num_bytes": 395502228, "checksum": "cbb93f322d684ed558cbf8d92b9f83958ba772fe4177093a334b4596343f3cd4"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00681-of-01024.json.gz": {"num_bytes": 397981781, "checksum": "9ec2dec493733846a1ec9f68ff5130cd461d7ab9c07b22d4aae94463bcf03146"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00682-of-01024.json.gz": {"num_bytes": 395265758, "checksum": "7731cb9a2898c730a650e5d1b358886ed562228928aefe55d991cfaaa61a9a99"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00683-of-01024.json.gz": {"num_bytes": 398783283, "checksum": "6f2bb48070e809ac17fc90e1117d63bd8c7cd0079d9e44c9f262c4ce60f5d373"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00684-of-01024.json.gz": {"num_bytes": 396160769, "checksum": "fd07413637b97b68cb3a7a6cb86c4656017b7841728e806485ae196294e79f8c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00685-of-01024.json.gz": {"num_bytes": 395594461, "checksum": "939925a9169da729891fbeef926f420b80bcc60e0f170bcf9a2095449a22d424"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00686-of-01024.json.gz": {"num_bytes": 398275260, "checksum": "13836c45719ba10f2d581cf17cdab1daa4cc207a49db2b4786b451605842ac4b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00687-of-01024.json.gz": {"num_bytes": 395256765, "checksum": "0c0d0e6c1e3cb9a024c184a8510066a005c031a15af74d117d0e736a358a91d0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00688-of-01024.json.gz": {"num_bytes": 396635904, "checksum": "2462e084563f8b8de68c6e826289949ff8ebf8cfaf323344c07ab93e56373539"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00689-of-01024.json.gz": {"num_bytes": 397749444, "checksum": "d03746220f3374c80102ed39d8f6ae0daec40fc1b23312c08ecdee82a65ac6df"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00690-of-01024.json.gz": {"num_bytes": 399380060, "checksum": "217d032ecce8d0b7e448befe83aa051a3bfab8cb0e167d043b6abc833f5e9b4a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00691-of-01024.json.gz": {"num_bytes": 396975651, "checksum": "354fe9bc07aefc55cbbf8752f53ad69d45761da928bc8deb6fee1de9e244e93e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00692-of-01024.json.gz": {"num_bytes": 399720848, "checksum": "21f88940b6cbceefd66ea5e8d466467806370ae24a5833ca308cd840daf5ff8d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00693-of-01024.json.gz": {"num_bytes": 396787846, "checksum": "c8d28980ffa1eff4459d2fbf0043a1f8eeaf840a3b1d1ea4989b2192c7a82041"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00694-of-01024.json.gz": {"num_bytes": 397945967, "checksum": "1936570da24c4bab9fe0559826f1cc509c4ab6eb3679e26d697efa6e7e5c8a81"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00695-of-01024.json.gz": {"num_bytes": 396349049, "checksum": "8e497506f84513272a8a0694e7d4efb004b1e3b515887e3b5762f59b6c659dc3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00696-of-01024.json.gz": {"num_bytes": 394901418, "checksum": "9e1d6cc187ff67ee734bbadc6cbd57eae05634a448edfde184fa8d6fc3259836"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00697-of-01024.json.gz": {"num_bytes": 399142528, "checksum": "9584496113a8612620748aaba35e185b8f47b7c96b4ff0dc7bfdd6024a3faa14"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00698-of-01024.json.gz": {"num_bytes": 395923784, "checksum": "83a3c57b3870ed9beeaf3ec8ab694e0be458106f3128b14b2a44a036e89d32b1"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00699-of-01024.json.gz": {"num_bytes": 397137494, "checksum": "0befea64fe749d79592e337bc359bcef70ca8816d0126ebf89d4b8fbfbdcbec6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00700-of-01024.json.gz": {"num_bytes": 396554785, "checksum": "34739b543636aeadb6dcce3e7c97ca49026cc9897c13add6b592fe60e5c40338"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00701-of-01024.json.gz": {"num_bytes": 398091188, "checksum": "c9bcc7c9e91de707ee548e67452d6970af2e19bef91f966b19fa71504e5305fc"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00702-of-01024.json.gz": {"num_bytes": 396039798, "checksum": "fcda5f8ddc5ed163db84aa70c565f8181731af9a29918a2ece0436d3146d7125"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00703-of-01024.json.gz": {"num_bytes": 396889704, "checksum": "c80445d442a766d2e87ecf5804e87bf7f8b23c2238476fc2b51f657400739306"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00704-of-01024.json.gz": {"num_bytes": 399465260, "checksum": "0bb73674d579523fcbe079fbea7190138911711f023404ae46ea7b685fc09c73"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00705-of-01024.json.gz": {"num_bytes": 398579507, "checksum": "97d6fd9cea2a47913c6ee9d1e34c3440858f25f3d670cc81c8f83f2346fce6e2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00706-of-01024.json.gz": {"num_bytes": 398761590, "checksum": "2f4836001b8b80066ae09b6e385ed0048770c13ba2410e0f0309ab4b9200e37d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00707-of-01024.json.gz": {"num_bytes": 395576626, "checksum": "8e0c0c635a7a7c32d4fdb1a7906ee95a9f334a55b2ff3881cdc7d5e816a9c817"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00708-of-01024.json.gz": {"num_bytes": 395930921, "checksum": "e6978b92f333230972e2b4c31cb86b5286fb899948c7680c7a9cbe75a9d60296"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00709-of-01024.json.gz": {"num_bytes": 395734676, "checksum": "13071a3527071f06570c6cfa485073f2f3980c83cac782db6bf66a75dd865df3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00710-of-01024.json.gz": {"num_bytes": 396501107, "checksum": "6562cb3675a42a58b8c8b2a232043adf532fe49420e30c3c237a6d8889a8de30"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00711-of-01024.json.gz": {"num_bytes": 398422179, "checksum": "f38b59c4739d3c15e5bf5dbc0965d1a5dcc0f49a3c89eb7a6822003aaa1ae7c3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00712-of-01024.json.gz": {"num_bytes": 395905103, "checksum": "500b4914f3c42d5e24ced7d36dbd3143c49e4fd5dfc3d53a172d1a55ae738889"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00713-of-01024.json.gz": {"num_bytes": 396009909, "checksum": "4f50bfa762db1435a89195fd180615e9f569c1668e128d343c87c40ac5cf60ef"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00714-of-01024.json.gz": {"num_bytes": 396963447, "checksum": "fd9eea7dfb93916a3798a8b69d29fb5d4bf0fec448b8a24427f729e7a41205e8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00715-of-01024.json.gz": {"num_bytes": 397474378, "checksum": "3c61bcf6f24e21d2584bb4ae008230540d9a375e35f3c4ba1668621b80d85c5d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00716-of-01024.json.gz": {"num_bytes": 396285471, "checksum": "c554e562a369d9696219ea8b0e363907c50f626d7c410a26515e07de801da74a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00717-of-01024.json.gz": {"num_bytes": 394827995, "checksum": "f8b4678c21d93c19d50cb576f0910050d24dfd606238bbf8013c45f98defda12"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00718-of-01024.json.gz": {"num_bytes": 395517823, "checksum": "1bf63affd6914d98e197b6e1ce526cae7754ecdc750184154d3cb8e3bdd21a9d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00719-of-01024.json.gz": {"num_bytes": 395561934, "checksum": "c04b162d984ff2ada9f39aa6c0fac04a1531fbde05175f856d2e3ca2797a448a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00720-of-01024.json.gz": {"num_bytes": 396227762, "checksum": "25da2ac7c1f3cbc361807f67e8826ffa95f4caa25f81f66832cbd0a08f1a51f5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00721-of-01024.json.gz": {"num_bytes": 397716450, "checksum": "28180c6396deaf34e2a197f5cad1b53ba1c9532db8b5c21dd7d81332b2793181"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00722-of-01024.json.gz": {"num_bytes": 398022279, "checksum": "9c3a8038a7f9431b90f67ea0d3b77353d0508b09865f49af575b6aaf5e32d6b7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00723-of-01024.json.gz": {"num_bytes": 398064523, "checksum": "4b18959f604bd5f379a73b52947261cb8d63f2243f5afeb5807a13669ef4a800"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00724-of-01024.json.gz": {"num_bytes": 394747045, "checksum": "615f13a1b2a6942931519b7a7f6aba286f6045aad65b041c2c6643ce906de1a6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00725-of-01024.json.gz": {"num_bytes": 396726374, "checksum": "4099a416eccbb56818efda68bd027c993c1a5fa1a8e722bc268041fd3f804cfb"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00726-of-01024.json.gz": {"num_bytes": 397361407, "checksum": "152d5e2bad0de3b6b48fb26066891b160ea79c4c382ce6aec6047196e3b08ef6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00727-of-01024.json.gz": {"num_bytes": 395542925, "checksum": "ce1d46b0cd7d9e4075db3feab71d2f72939817ebf45819e73ec277c9cc07307b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00728-of-01024.json.gz": {"num_bytes": 396647931, "checksum": "c859626b14584c1bab396c867ad5eb11ff3af39628206b03612ee2d2b3058497"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00729-of-01024.json.gz": {"num_bytes": 398272080, "checksum": "758fbdc5bf6d66a36d69d31141742b2a917bf0341494b844f22ab82cd54e7ead"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00730-of-01024.json.gz": {"num_bytes": 395977662, "checksum": "56a7fcb59ece26d4b19be0bd5e6c2d0f05e4b1b23e8ce7b4fab064a29b229c02"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00731-of-01024.json.gz": {"num_bytes": 397530948, "checksum": "bf0f4dc8796a737daf80b977a6e3656cb1e244fc40d6df92852da45e53e6cfdd"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00732-of-01024.json.gz": {"num_bytes": 398314575, "checksum": "1862bcc85d48f59283eae56836e5598f20287ce36a185252abb24bcfbd1377cc"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00733-of-01024.json.gz": {"num_bytes": 398547748, "checksum": "476389cb582df3c214f3f5a45268bdb47b581a432c08723bd811daa5f5990083"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00734-of-01024.json.gz": {"num_bytes": 397380175, "checksum": "2b6fd36a8f8bc3edfcd8a486de44d2f3132f7b8f4bb2d4c93453dbf1a1b6667a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00735-of-01024.json.gz": {"num_bytes": 399584382, "checksum": "3e0a067fef0b40edcd23ce6680efc07253660b8c00699630bb7629b9d803a198"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00736-of-01024.json.gz": {"num_bytes": 395312038, "checksum": "e4f92413c837d269481ecc0b5d0fc87548bd2ae718ef7f9bff18674ece289bc7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00737-of-01024.json.gz": {"num_bytes": 396820243, "checksum": "e61680c57505f027ef8cbd28a45e706936befa2ab40a24a63e638019a1717b63"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00738-of-01024.json.gz": {"num_bytes": 397691872, "checksum": "d3acc0c9c76ef2df89f49896744dac53f488f830d3d42f0c481f2321ed60fa67"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00739-of-01024.json.gz": {"num_bytes": 397912166, "checksum": "18d281ed9831f28c4c54256a844ab2cff7a5b681da1b7c8eab2565b106381aa9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00740-of-01024.json.gz": {"num_bytes": 397093867, "checksum": "6a65230910384587f5e7f34b52c2a6d9a86a8b1f7a23d26f890b6e810c051815"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00741-of-01024.json.gz": {"num_bytes": 396371058, "checksum": "26eb40e98075ab716b4edec76d1723a679e648258d6812119b46f7522dfa9b07"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00742-of-01024.json.gz": {"num_bytes": 398346941, "checksum": "466043ec98eb806916806cff7495f0bae89cfeb2835204ea34328030b92a27f2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00743-of-01024.json.gz": {"num_bytes": 397366055, "checksum": "d98d31aaadf95dd0d1cf0548db515c8e77c95bbc4b611ae9ab5650429c171889"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00744-of-01024.json.gz": {"num_bytes": 398722902, "checksum": "a43c80ab3bd8d12d12b4ea41d9054b90214fd3ea2ef957f317d6ed6fa7b60e34"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00745-of-01024.json.gz": {"num_bytes": 397562514, "checksum": "1e6dad94e0f90bfa0fdc5557c58873aaa95fa9ce1c7b70a1fe76817289cff78b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00746-of-01024.json.gz": {"num_bytes": 397731351, "checksum": "21fefd6cffa9032c9ca7cec91cd775c83bbd37419ae236eeec9589f8bc4be0dc"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00747-of-01024.json.gz": {"num_bytes": 397781450, "checksum": "b84c74bf1caecf92777fb85129bb009eb3a27fbab1b97af567f36a8bf100e704"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00748-of-01024.json.gz": {"num_bytes": 397425031, "checksum": "fe9bb225f6d03b44e552ec985c844e5012e90c4ad99f699ec4ed4297db91349d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00749-of-01024.json.gz": {"num_bytes": 397925850, "checksum": "3913b2955fee02e2ba716d843559bc4bf4e85a2884ae4495446a379f857a30e1"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00750-of-01024.json.gz": {"num_bytes": 397089489, "checksum": "773486144d3008cb3207c3c8b65fe6081c9e64dda09728d3586bc82e6bb73fca"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00751-of-01024.json.gz": {"num_bytes": 394819424, "checksum": "d728b117a7b74150b03ed7d562514c2e45ccc03b0bceb120eddfa8333166a923"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00752-of-01024.json.gz": {"num_bytes": 397199683, "checksum": "6c10c3f4e3737db6a70375bd605139de61ae8b09a1aa91dd1cfdb82c183f0cb3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00753-of-01024.json.gz": {"num_bytes": 399197199, "checksum": "101c4ed5426b586a4aeeb7dbd377306eae9eec2eaf934e79d25583abff70b15b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00754-of-01024.json.gz": {"num_bytes": 396415619, "checksum": "732f4dedcf1266bcabf15a6a1cdead617ea37d428d8cfbccb5a9dd7521133075"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00755-of-01024.json.gz": {"num_bytes": 394564662, "checksum": "a23f1bb1de23554efff68e730d85802a6491936fb54e256744af641f97ec155b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00756-of-01024.json.gz": {"num_bytes": 395577258, "checksum": "2f4275994a103dca517d4eb3656009c8138930079e00303c7b8746ab6094fd19"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00757-of-01024.json.gz": {"num_bytes": 397161772, "checksum": "ab16360173283b22a7e19d181fbf55a6a8d07f0d9007b51aa159c1e81661f5e1"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00758-of-01024.json.gz": {"num_bytes": 397545456, "checksum": "ff5a6292bc557aa9895de39697e8aea5843fa5a00c83c7983eaa36640d446ecf"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00759-of-01024.json.gz": {"num_bytes": 395470957, "checksum": "66a64accfa6c281d2bdfa7b6846397f56c2d4f8a22ae8925a07af853e42f5521"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00760-of-01024.json.gz": {"num_bytes": 397328304, "checksum": "46778c90bcc6da96cf02e66956a1bcabcb9a95bad538cfc0d5190db473a278a9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00761-of-01024.json.gz": {"num_bytes": 397706141, "checksum": "4825f25d6e1d13c70e6e65ce13ccd7b1922344c48ee2806952f3ba1b6e26d3ae"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00762-of-01024.json.gz": {"num_bytes": 396983663, "checksum": "25e1645f05d342b5f872ca809b36d516c7336c22035bfa86cf295d0865e08789"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00763-of-01024.json.gz": {"num_bytes": 396355038, "checksum": "d4c3a92808f0bfb042423cd4166abc57d20603ef07a0f0912058a718a38f26d0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00764-of-01024.json.gz": {"num_bytes": 395434042, "checksum": "aa4384f587fd64c24fad9a27defb0345eb44cc536b3d45c710017d225c191ded"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00765-of-01024.json.gz": {"num_bytes": 397204482, "checksum": "cf419554f6c4f6201ebe92e7a232013e5949910f3d54f5cf3d1d65845685c7ca"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00766-of-01024.json.gz": {"num_bytes": 396420917, "checksum": "32076dd8004ebe35f46d6e790fd6330ad1d7df2b7ae3c4ede325b0da73a673ad"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00767-of-01024.json.gz": {"num_bytes": 396840905, "checksum": "08e5fd0fc1578a337f3dafdb3c718ade437256119e1968e9f958a8ea9d052c81"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00768-of-01024.json.gz": {"num_bytes": 398085225, "checksum": "3579e0756bb6cbf1eddfca27de5cf067a212d683134bc6f8c26a79b7d802bfce"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00769-of-01024.json.gz": {"num_bytes": 396879117, "checksum": "0913c93203a084521212e473d08c1d11e8136a8e37f1891330fbce0397bd431b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00770-of-01024.json.gz": {"num_bytes": 396386647, "checksum": "6c12ab51c92b9c92336a6142a1a4e2f7c3725beb7e61dcb004551d13e8d5488e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00771-of-01024.json.gz": {"num_bytes": 396279989, "checksum": "752deaefbf22dd1b1adb36561e8524c1dc555fd105bf3acb78611be9bce72318"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00772-of-01024.json.gz": {"num_bytes": 397850815, "checksum": "4f1969284d1f448caf0bff5d05eeb995cf2339801f6a71e01286f4f7f387c564"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00773-of-01024.json.gz": {"num_bytes": 399466666, "checksum": "20ba552cd30349bc8a2c0b6a8701d4587a005e7ebdf6e3f2a3bf95462c304447"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00774-of-01024.json.gz": {"num_bytes": 398051538, "checksum": "1f66196e8fbf0ebef977f235d2aacb7245f4033b53ecf75ada2f8007465a629d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00775-of-01024.json.gz": {"num_bytes": 399284061, "checksum": "97df92baa605c34ce857d380f1ca42f9e2a0de499ccaa9bab26a5c449451d1ef"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00776-of-01024.json.gz": {"num_bytes": 396710162, "checksum": "4b1ec54b82c8e5d969d3000ce547f4c20df16d9cc0b889b2b58c8839e9d8e27f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00777-of-01024.json.gz": {"num_bytes": 397265441, "checksum": "03827ccc3c5bebbd12a04019e9797945c55becabf7f9c1f3fe5353513f5c5a38"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00778-of-01024.json.gz": {"num_bytes": 396050013, "checksum": "54aeadf4fe16949b2ee9438feabe979570e7587bb07b3c57e47422f662191936"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00779-of-01024.json.gz": {"num_bytes": 397124991, "checksum": "913e268b5474a8b4cf1426f5a0a06c7f437eeabbc35f0126481328b419f85bf6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00780-of-01024.json.gz": {"num_bytes": 395196367, "checksum": "4c1a4f296916c30103a5dacacf8a167e43bb424d085ed3491b19f0ec1985d9f9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00781-of-01024.json.gz": {"num_bytes": 396578403, "checksum": "a54f26c233662299ec8f0ae1bd266879e93cf4676707b0955114a1a80e2fcf61"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00782-of-01024.json.gz": {"num_bytes": 396142106, "checksum": "3713c6b725afd833063402e6577bc0ed003a87720f700f9272864c2360bfd260"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00783-of-01024.json.gz": {"num_bytes": 396470511, "checksum": "fe9d904a07ffb2581b6734c8dd847435b867d3043ce4b4840b1c54374919d757"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00784-of-01024.json.gz": {"num_bytes": 398156228, "checksum": "af762a9ff3eeb7ed4a56f54702911f0c190b97f8efaa02cb89b1626a1c44c9f4"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00785-of-01024.json.gz": {"num_bytes": 397185035, "checksum": "6629e1827aab88f55d53de24625f8362daccf910663db8584d959aa44f8043a8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00786-of-01024.json.gz": {"num_bytes": 396556703, "checksum": "ce51603900ea0aad8981fbfa8d05d684bfef5360413dadc6933246c2dc81c413"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00787-of-01024.json.gz": {"num_bytes": 396214799, "checksum": "6eed5802b89d63eea115cbfd9e00f6d1b4970bb3600a887b904b548181a4acef"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00788-of-01024.json.gz": {"num_bytes": 397965162, "checksum": "eaa948fdaa744576f006bd70d54f129968772a479fb0bd8e946d7605857545d2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00789-of-01024.json.gz": {"num_bytes": 396280999, "checksum": "e0b80ec73507f96310abf070e5cd17d5a67ffb4a337820a8b79a02afe81a0b99"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00790-of-01024.json.gz": {"num_bytes": 396224660, "checksum": "2b4a06fb6f68c773da34f8d4c33d7746b6a3206bb242042841e5e007fe3cb6ea"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00791-of-01024.json.gz": {"num_bytes": 397681975, "checksum": "1b167c20d0414d970cda74cd357cf07d69abd1d3fb0f57222028b369551d513b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00792-of-01024.json.gz": {"num_bytes": 396210611, "checksum": "ab55128753a1e58d1032b8fd747c48158a721b12e85990627478f22b78e156ff"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00793-of-01024.json.gz": {"num_bytes": 397534599, "checksum": "e7476bde08e0065c523d09932cf2cf6ffe8ba023ae0ee435238efb5dd6f93d7c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00794-of-01024.json.gz": {"num_bytes": 396536137, "checksum": "6228922504b2d3ebeef4735abdff06cc786d6533a6c150d50f34042aeeae1544"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00795-of-01024.json.gz": {"num_bytes": 395235406, "checksum": "9dae151c15898d7991417596a364e30f00e0ff6280f1505953e6de40c2e228e2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00796-of-01024.json.gz": {"num_bytes": 396226178, "checksum": "1dc8decde490324087fcd06e4b1e17117606f2d61a80d506d89a12cce11ba291"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00797-of-01024.json.gz": {"num_bytes": 398556774, "checksum": "a454758e8cffccc88f83517a241f2457e683647949cde6aaf1e217de42f6a52b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00798-of-01024.json.gz": {"num_bytes": 396109677, "checksum": "3daa6b8602517b9873db96522a2852d940d52cdf0fa86f259ac41a9cd688751f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00799-of-01024.json.gz": {"num_bytes": 397930210, "checksum": "09dec669699a437d6fb78b3f2705028fb380b2eaa20ee73b77270216a48b8a95"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00800-of-01024.json.gz": {"num_bytes": 394545441, "checksum": "726f99301047519de253e3edbaef5f4a4f95e3850b1b98e01c7864499dad7833"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00801-of-01024.json.gz": {"num_bytes": 395867151, "checksum": "a97ef657bd8ea718427ffc686f55fc1786f0834755fce3ea3ae8402d9f75c11b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00802-of-01024.json.gz": {"num_bytes": 398573429, "checksum": "20ee1f30272a0d5db74e8589be12c17173580cc9f14b039b3d33f3197816ef95"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00803-of-01024.json.gz": {"num_bytes": 398084513, "checksum": "31d1a8f6965d3a8cb7e28fa8bf2cb9a5609d4a129dbc630a8e2a939f475b2003"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00804-of-01024.json.gz": {"num_bytes": 397815811, "checksum": "edb758146d462848bdb113df90fa4b9f451eca6658cbd2cab147c8b0eaf88a70"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00805-of-01024.json.gz": {"num_bytes": 398641802, "checksum": "b916bafa7269ad4ed09c58c74dc3f098b529444609dafc57e6e4056aa6496ee9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00806-of-01024.json.gz": {"num_bytes": 397993720, "checksum": "92fcc5881ca81b808c14f8c9960d873be70f857f95fd1e777b1ae1d4c62bbbaa"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00807-of-01024.json.gz": {"num_bytes": 397743279, "checksum": "79aca62194176964b66a90dda7631d01acc2a6abea1ba19a90076139e390170a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00808-of-01024.json.gz": {"num_bytes": 397076817, "checksum": "a469391e432dac6967e841d46eaeabe9429849492a3df5e91431777fe9b9f164"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00809-of-01024.json.gz": {"num_bytes": 395533122, "checksum": "1278d928e105ea7d9c397ef1da79dcc8791dfad9177727aba098bd451734ce45"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00810-of-01024.json.gz": {"num_bytes": 397468683, "checksum": "5c6f3e7550827de9d7028decd82320a55722785394ea4951ee78f3ffadb2d4e0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00811-of-01024.json.gz": {"num_bytes": 397348260, "checksum": "8c1ece72814dd82bf1bb663b76a40c58129c08540195f9b2134eff5837faa366"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00812-of-01024.json.gz": {"num_bytes": 396753479, "checksum": "b3770924d0576f7cd1706771c411f0f288277c6c6c922dc7af4017b665109a88"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00813-of-01024.json.gz": {"num_bytes": 397977743, "checksum": "864040da6f03f4d2ed2a9eae4daedf304e0d27196f0b522cee4e8fee55f9ea71"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00814-of-01024.json.gz": {"num_bytes": 396168620, "checksum": "542986bb3b75ffcfc853af11a80edb6a31e12527d2588f1c5b2119fe35d3f150"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00815-of-01024.json.gz": {"num_bytes": 397639162, "checksum": "a617c2f27306ce5de74ab756cbf74707fddeb0aa92277b66d0cd65be230f386a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00816-of-01024.json.gz": {"num_bytes": 398296204, "checksum": "174a2e77e6562384cc4e7459ebf536db5cf4b530e4f1d7714e60d082ac7a19c6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00817-of-01024.json.gz": {"num_bytes": 396112543, "checksum": "95af2c4f32efb4ed2a41cfa38dd2be09d51d4b0dc53ca8763309503f0276d56b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00818-of-01024.json.gz": {"num_bytes": 398371592, "checksum": "67789e3525f2daf6af2551df12a50341c3ef51c89a9c714a8def76209b5b7460"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00819-of-01024.json.gz": {"num_bytes": 396751420, "checksum": "07431a263e2bb92c048fadbab74ce1399f76fc57a04d7f9e90cb33aa60a4c5e9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00820-of-01024.json.gz": {"num_bytes": 399213859, "checksum": "83c03df95869973c2ed46c909c0e92e7ecd75317c06b09e447a62b592421d1c7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00821-of-01024.json.gz": {"num_bytes": 398408628, "checksum": "b5cb8c52a8713c5291ccf29c171e9bd9b57a54211392a19e8f31182d1053a032"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00822-of-01024.json.gz": {"num_bytes": 395429180, "checksum": "8c47bf7a0d2b9c84d255df0e7da058fba2b4ca6da3c20cbdfe5a686e01cf5c45"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00823-of-01024.json.gz": {"num_bytes": 395437149, "checksum": "62818e45f34e70728494c74daa583e30c70aebf91c2f057470039f6d35059691"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00824-of-01024.json.gz": {"num_bytes": 394503147, "checksum": "e9fd88994b23531ba26e6859ec1985798a2ab9b300c2fdb1e202ac553ab305b0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00825-of-01024.json.gz": {"num_bytes": 398841091, "checksum": "77ad5a9ac5e3c1d1180981bffbbdbf8a429854001d990258c615e0e16c8a9f6a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00826-of-01024.json.gz": {"num_bytes": 397404278, "checksum": "06a39374c1cda19cc4b034c4877e1fd3bdc84290fdb621fdcdc77f3c5eea9a47"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00827-of-01024.json.gz": {"num_bytes": 399316947, "checksum": "fd27a73b130c1cf8256f22212e23799d0dd31281cd29bcf9bb658bcda457b66e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00828-of-01024.json.gz": {"num_bytes": 397514415, "checksum": "3e7d199d05f885e8bba769d21a55a3f2ef2114b66ed738428ceb506fdf272ff2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00829-of-01024.json.gz": {"num_bytes": 397251538, "checksum": "91650563e9520b2d1ec2cd726304b781b4156ffb68bc172635a53f425fa6bb0a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00830-of-01024.json.gz": {"num_bytes": 397653118, "checksum": "893ef017cbf7d46c99d9c69ba74344cfc2800bb23faf93e7400c0c282422945f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00831-of-01024.json.gz": {"num_bytes": 397299276, "checksum": "4eb3c91e52547f3b4af586f5bbdb0cdaf6a345b202a09c6aabff5c5f628b2948"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00832-of-01024.json.gz": {"num_bytes": 396915924, "checksum": "9fffd46fc1f1bce010484f2850102e2e153c5695c277efb67f65811630c2493d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00833-of-01024.json.gz": {"num_bytes": 397652261, "checksum": "3b89df9375a906c96eb1e21a6572a07de2f5d875996c01c744933984edb1af1a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00834-of-01024.json.gz": {"num_bytes": 396070735, "checksum": "b758b4cbfdfb799a8615ec9c3678b27dcd9b1d63af4f272879e0dae84cac9d63"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00835-of-01024.json.gz": {"num_bytes": 398028152, "checksum": "6e07f1e6a099aa496fef3015514fe5f3cc665c742f8a783389c7da4ce0e0e72d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00836-of-01024.json.gz": {"num_bytes": 395941604, "checksum": "6bef1291a741ea5976749456185a3e3a03c3fcc9ac00370f28672ab39c552db8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00837-of-01024.json.gz": {"num_bytes": 398655070, "checksum": "b0b7e1c826302417630c3e1b1877bf106beefb5a7a11feb9bbf1ac3712714fed"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00838-of-01024.json.gz": {"num_bytes": 396374435, "checksum": "3e9bdde8b73397a5fce143e91c92f9e66f46b45edfb30da1cac400b9aa7b2ecc"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00839-of-01024.json.gz": {"num_bytes": 396388725, "checksum": "4154322b97c600742660125e6458787e603cf1a44b49267f4d1c569387fd132e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00840-of-01024.json.gz": {"num_bytes": 397564603, "checksum": "f9560028196fc934378389e355101e5e7f8fde9e5c921722704a18b24ebc5804"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00841-of-01024.json.gz": {"num_bytes": 397001678, "checksum": "0dad99ac959765280e6bf6d9d1a1468ef9dc9cc781e8f5bb832f7295e4e79f69"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00842-of-01024.json.gz": {"num_bytes": 397139167, "checksum": "e81fd683da081349629a0a7ae8ff7813351ed23caf4ef87041b64524034abc83"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00843-of-01024.json.gz": {"num_bytes": 396044889, "checksum": "d8e3a5b4148c7e86dea50ee5ba89ef55629d3550fd926c41754e5a26e7e52c36"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00844-of-01024.json.gz": {"num_bytes": 397365441, "checksum": "c4d2ffe853b55464961b707b6d0264d6852817077204a0380c906184c077012c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00845-of-01024.json.gz": {"num_bytes": 396477802, "checksum": "7b3c4d435eca57a0fad05c106ec5928750aa01d95047618a3bc84e5342e912c4"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00846-of-01024.json.gz": {"num_bytes": 395983616, "checksum": "bdad2ba411291435ac0cdd083e46aa8369499f014a788fa85ed8c419fe9cb2de"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00847-of-01024.json.gz": {"num_bytes": 397646062, "checksum": "3f6bddcefcceaa4184161432e4f0b9292ae4fe7dac3079d4191a31a38f48c7bf"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00848-of-01024.json.gz": {"num_bytes": 395958111, "checksum": "5ed10d926e5fd1dcbc777df82391eb3ba57276c7303d488d6f3591022d20cc4a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00849-of-01024.json.gz": {"num_bytes": 396960036, "checksum": "ab82adc6f66ab0403cbbb38859009a460e6c8c38c789bc2b2420da8b87096a9d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00850-of-01024.json.gz": {"num_bytes": 396603592, "checksum": "5a6aa59a01504f5655d429dd5cb3ebc39e3994b22cbaeb5b09ceb29a26b94031"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00851-of-01024.json.gz": {"num_bytes": 396511886, "checksum": "f1954da7e217d893a0237a0f431dd2a9071723e543bf0f4943ce38fab048a44e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00852-of-01024.json.gz": {"num_bytes": 397626831, "checksum": "f5cdcd7ec4f3c855a1006f9278ed4df50574a3fa7aa1c5a2e255ea5fa1a770cd"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00853-of-01024.json.gz": {"num_bytes": 395811873, "checksum": "24b1033da877ebddc09cfe2d3325868448dab9083b5147d6cfc4fa63ab402a94"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00854-of-01024.json.gz": {"num_bytes": 396513614, "checksum": "419952e0bc38cce474190c0b9ea581ccbce77da5e045dd60f5ff1fa1d2833d19"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00855-of-01024.json.gz": {"num_bytes": 396493352, "checksum": "3d2b529871c625fc9c1c59b9d5cede2a77e609041f1ea044d68ac16e9fa6a30c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00856-of-01024.json.gz": {"num_bytes": 396852729, "checksum": "a3b56e6171fc2b14ebe67f6a71af688ea6135597bb8f8cf83e2fb460727aa5eb"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00857-of-01024.json.gz": {"num_bytes": 396428653, "checksum": "de550a5d608bffde45c149bc0d4c1165cbd3b5baab3d3529f006a02aba6d53e7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00858-of-01024.json.gz": {"num_bytes": 397039613, "checksum": "11374c2685676ac2eb3dd0d281b44b512ff1d2968ab320d9c857b44304eb8ab8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00859-of-01024.json.gz": {"num_bytes": 396515194, "checksum": "64879e565e5c467e630566ab75524bb300d58798c814637ffebd15646544cd5e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00860-of-01024.json.gz": {"num_bytes": 397764125, "checksum": "7e22be61b3413c8fca2414087655b7ef7bef2ab5ee373fee74d13c8fb991675b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00861-of-01024.json.gz": {"num_bytes": 395314420, "checksum": "29c451c69c8c05f6eee2741b9ef6c241f551257a45da8342a1d6bb341f80314a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00862-of-01024.json.gz": {"num_bytes": 397763845, "checksum": "679668616899f548fb35da32c3e5f121002670cc3296c0c90f5bf45eb3ea1d79"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00863-of-01024.json.gz": {"num_bytes": 397356206, "checksum": "43c5b3af2173d4293396f336ec363aa2f31580b65128f44ca8bb891f2022859c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00864-of-01024.json.gz": {"num_bytes": 395463092, "checksum": "77b7b6299955f4869e5db994fa6b20fe3007cf8cf2b6609442fb1ed49284cee6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00865-of-01024.json.gz": {"num_bytes": 396909291, "checksum": "7eca0e82842b52f99640ab574e4b2446309aba6ac262f980fc6d249a337d06a4"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00866-of-01024.json.gz": {"num_bytes": 397587651, "checksum": "931014d99ab2a765ebf90e876694647c265ca5e6bf2b459eb027d6b06643a8ac"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00867-of-01024.json.gz": {"num_bytes": 395992645, "checksum": "0976a5389aed40e4bca89cf22382cf121390c75bd755437be474c097c8fee0ed"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00868-of-01024.json.gz": {"num_bytes": 397789857, "checksum": "6ffd848d165290a746a21767e79a9f046b70534aaf7b14fc01f9365e4e3f7d93"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00869-of-01024.json.gz": {"num_bytes": 398124116, "checksum": "5fb85058bdf40c0ee6cf748cda7483b1b3cfad18c26a90c2150c2a3f30ceeeca"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00870-of-01024.json.gz": {"num_bytes": 396432487, "checksum": "89d50aaa3620eac4ad593a403ea637b2ff090361ead05c3aa8c7a3351c66ad65"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00871-of-01024.json.gz": {"num_bytes": 397484772, "checksum": "490f4104981a9ab3ef04600a4865b9a2a18239e335d7fb7fff79ec1b7a225318"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00872-of-01024.json.gz": {"num_bytes": 397240896, "checksum": "d344994866bc49475f66e9937636afa787e1ff560e3f62dc1a0e4d0220d6ed39"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00873-of-01024.json.gz": {"num_bytes": 395450398, "checksum": "5d3b320aab1f7f09450531649666ded1aba8a9bbcf0f47992c43cb40a6d7a929"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00874-of-01024.json.gz": {"num_bytes": 396365056, "checksum": "346aae20204537ba2f4a865ca80b5d1c6da1e3a3b78d306d7570a69f185cc4fb"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00875-of-01024.json.gz": {"num_bytes": 396679348, "checksum": "ba81f9c1650d30853edbb9886dde84658c254dee5a3ac1062484f7194cd413f6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00876-of-01024.json.gz": {"num_bytes": 398278881, "checksum": "88fb38aad7cadd76c818dbe7a372144dfe17d110f7d2123a80d14686fb43a6dd"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00877-of-01024.json.gz": {"num_bytes": 397051868, "checksum": "049e4a62056c98284b35d10a74ad5ef7014265a6dccb99a71f93a409933a685f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00878-of-01024.json.gz": {"num_bytes": 396132123, "checksum": "bb7b97a82bd6d31612de66a03af35d404b15808b925e7fd94bd0a8e9e928b927"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00879-of-01024.json.gz": {"num_bytes": 396520374, "checksum": "2a56fed53aa022e6a7956f604d54d99af89a15b6c7fc6b037f94d347f1d15f51"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00880-of-01024.json.gz": {"num_bytes": 397004524, "checksum": "1cadef434909d4508a9a6bf40d6a9323256f3089615a5d2963c83040d5f549f8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00881-of-01024.json.gz": {"num_bytes": 397336334, "checksum": "0e36dcd0eb1773eec15ffd0fbbe8951343bb6961dd1838b51e74da2e055db176"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00882-of-01024.json.gz": {"num_bytes": 394949798, "checksum": "78c99406cb921c2b8f5b86e4e7eeed24c799678732e5a5450db6b12b7ceeef61"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00883-of-01024.json.gz": {"num_bytes": 398647721, "checksum": "f0e7a0a9970c7fdb5f629771e76bb06bf62b79e9cbf5008e866f954dd436401b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00884-of-01024.json.gz": {"num_bytes": 396040500, "checksum": "05272a55eb2840f94a7dcc30a8d09b957511b983b0fc3fa618a8995bc594d055"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00885-of-01024.json.gz": {"num_bytes": 396460591, "checksum": "27511aa50410260d261866dc970b897b10a95dd4dfd92b0bc3a5fc41e6c75335"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00886-of-01024.json.gz": {"num_bytes": 396149133, "checksum": "e66ba9c7ceca631a4b43ecff1e151524a209368f298ca83624476ee9144cc3cd"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00887-of-01024.json.gz": {"num_bytes": 397164216, "checksum": "95e341054bd8a21e7f49e4a5aaa5fbe51517ff631e66e67ff1cdaea6e3178002"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00888-of-01024.json.gz": {"num_bytes": 398216402, "checksum": "6fef57de31fa1692d8a4021b317554688657fad3f55dc144e2971d63083e7879"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00889-of-01024.json.gz": {"num_bytes": 396976936, "checksum": "36da1bd0eaa27ca6e8510a3c005695fbbd7b0fedf63f077e3787590d4b1af625"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00890-of-01024.json.gz": {"num_bytes": 396903125, "checksum": "6bbbe5db2c0938efe5f8afe7b30765f45cedc9fd4209bb7826c489381175bc5e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00891-of-01024.json.gz": {"num_bytes": 396404354, "checksum": "47601b1b1a0a725c32ae0c32364f7ac188b7e8c68d29a2dffbe1a4dbe39393f4"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00892-of-01024.json.gz": {"num_bytes": 398144052, "checksum": "a7b6bdafa5a226c22ccdf97c873e4915ed8dd8b59e2820a4dc62f600b4710175"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00893-of-01024.json.gz": {"num_bytes": 397990484, "checksum": "12f08cfa1fb4f94a3d7d9584cc3f5ae9fa518cc095e4cb07939d02ecfb7ffd9b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00894-of-01024.json.gz": {"num_bytes": 398271782, "checksum": "004bf46ac7c8d7770b458ec341322f5cef643926aff9255954f08faa1dd43d53"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00895-of-01024.json.gz": {"num_bytes": 395489909, "checksum": "3ea14b3dbd7a4c9cb7aad83d1311d335714aaea5b2dd0374debd63c56d02dcbb"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00896-of-01024.json.gz": {"num_bytes": 397589097, "checksum": "c0f1c7e54bf7a808f66d2acc9aec79f1ce936ba480f5d1e379c6853714413175"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00897-of-01024.json.gz": {"num_bytes": 399215096, "checksum": "20958123acf2d578448a5166f1209b0452db33ed395cfe512015106bf99ad31d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00898-of-01024.json.gz": {"num_bytes": 397044516, "checksum": "46c5145069d861c04b2ac1afe80c4c4453f91869f6cb6a1d9f7b648f1b08942e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00899-of-01024.json.gz": {"num_bytes": 397687759, "checksum": "2a3923d8ff2ce0eab5978a8e0198bc2d1512cfa19c69e673e048b8eaa72f82b6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00900-of-01024.json.gz": {"num_bytes": 395192267, "checksum": "9cc72deeea7fbc0fa3782c41938d66315923dd9f53d89f47c00f85f93e454ce5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00901-of-01024.json.gz": {"num_bytes": 397806320, "checksum": "8cfff74f280636416f523c271f75e5704a570db4cddb8a70d033158868c21347"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00902-of-01024.json.gz": {"num_bytes": 398450537, "checksum": "7df8804eb5ecb79177001f9ce3c66f0ad20cccd8151e817816e9342d07c392be"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00903-of-01024.json.gz": {"num_bytes": 396733151, "checksum": "89551a52d1e97b4ec3007f8c43191c1ae1475d0ba5b48d20818a12c85b0add74"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00904-of-01024.json.gz": {"num_bytes": 397497719, "checksum": "2bcde59dfaa642722969d1401a4ce43a35c57930bb1d664371efece1e2e91c32"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00905-of-01024.json.gz": {"num_bytes": 395760696, "checksum": "ec844272b0666a455dfe0cab065e00df44e8da2156a03797100418307c96830c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00906-of-01024.json.gz": {"num_bytes": 398496346, "checksum": "ff68909d470edef08929a91068e1de02841c16a000fbbd17ef042cb76f1fff37"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00907-of-01024.json.gz": {"num_bytes": 397085405, "checksum": "a9b26676af61a6a1355225bce5bbcd67aeaf0fb7dc2209f30235b275536baa85"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00908-of-01024.json.gz": {"num_bytes": 397037103, "checksum": "e86688677a46103b0b224333faf1b4f89da062e4ec0ee35752c91ff9772697c7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00909-of-01024.json.gz": {"num_bytes": 397394775, "checksum": "93082177607900bfce7fc53f1665a831093bb50caea33e014f327181579c0012"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00910-of-01024.json.gz": {"num_bytes": 396668466, "checksum": "dcfe639607c18a309e2c91864a6912dce3851abd62bbed3ba16390899e637327"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00911-of-01024.json.gz": {"num_bytes": 397926997, "checksum": "aa995c38d953237b1d6d53be7237958a00ca2dbab4a753c7c4404849fb416d5d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00912-of-01024.json.gz": {"num_bytes": 397810240, "checksum": "e3f17ac285e8c9b04713713a957602a63e176f476d4a67018012e9cf2a3e5a84"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00913-of-01024.json.gz": {"num_bytes": 397143597, "checksum": "4082ab833be47cf881693ea4442e3940625e0d2c1117e15234886fdfa779bce3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00914-of-01024.json.gz": {"num_bytes": 396398347, "checksum": "7c62dfd17b21ff64af640e4aca8fea0240998596d11ca551a3ab045d5041fcac"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00915-of-01024.json.gz": {"num_bytes": 398622100, "checksum": "69abe67cda4b1613d5f741804ccdb294cd5f457027818d9366db8cf2f5f40871"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00916-of-01024.json.gz": {"num_bytes": 397387266, "checksum": "6effa83cbf3345fd7e41e432ef82156bb1334f2cf17589bce313aebee9727131"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00917-of-01024.json.gz": {"num_bytes": 399730979, "checksum": "f0d0ff1ae76a84c07647fa1517410533862f1927fa85dbf38017dabf4607bc1f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00918-of-01024.json.gz": {"num_bytes": 396895902, "checksum": "84cc56e725be31047d0b6a025cfacefc462f4a1a546feaa34af95a6f25a4e1a7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00919-of-01024.json.gz": {"num_bytes": 395247578, "checksum": "daa3156989ddaa9a7eba228848697ccf6a385679359ab765881d2293bef107aa"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00920-of-01024.json.gz": {"num_bytes": 398305242, "checksum": "2a9e02ef643962f6009e42304b983c87bae7b74c1edcbf8e6808b320ea7ea776"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00921-of-01024.json.gz": {"num_bytes": 396446011, "checksum": "f83526ad11d81820fce4231e3303d613dbbe56a8fae878d9442c8d7e98023437"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00922-of-01024.json.gz": {"num_bytes": 398010331, "checksum": "e47cb9d7550644ef807c3ea9e19ca4aa1df54eb908b54651bf0e17f0ded9157d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00923-of-01024.json.gz": {"num_bytes": 399160018, "checksum": "470401e5b0777096806113a36dcb92b8d453d6e8f5f4f0b15df2788e382ca03f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00924-of-01024.json.gz": {"num_bytes": 396880756, "checksum": "c86e546c68bf8458951fa723c086d6efa5b210f53cd4fcb2de4b9efc7a71a275"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00925-of-01024.json.gz": {"num_bytes": 396806561, "checksum": "5d9b1105c0053dc9530c911046f4da458f41d92c771282d0df8a3a22838feaec"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00926-of-01024.json.gz": {"num_bytes": 397479994, "checksum": "c3253305ac4ef226501e4fd4a6acfc6067a76c084ad852eb2a9f5916aa3d51a2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00927-of-01024.json.gz": {"num_bytes": 397083225, "checksum": "8931df0ee597f72ea3592d0a4d236ce655a92cf4e7eb9298145f496246c18c21"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00928-of-01024.json.gz": {"num_bytes": 398000839, "checksum": "5e29e75231bdb413dedd1211bd87e9fc3f4ab8bba41999afc1ddcddc16f4599a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00929-of-01024.json.gz": {"num_bytes": 397731309, "checksum": "03f7a9199b7927a6d78a8aa4eed32c250d32dc409e3bb2847d7db948ee63d46c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00930-of-01024.json.gz": {"num_bytes": 398133003, "checksum": "b22a79dc228697394d0ce25b7d31112f9e1a6508cdc4b57af35e84e65167bfeb"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00931-of-01024.json.gz": {"num_bytes": 396694508, "checksum": "dbbc65db3d442f9ace85498a3b27bb598c20cea171b3de17d409f9b989c262d5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00932-of-01024.json.gz": {"num_bytes": 396255463, "checksum": "02af4162b084004e99dc6862c88749545593e342a83523597cada140e57a0ab7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00933-of-01024.json.gz": {"num_bytes": 399013035, "checksum": "dc4d3b4f03c36a8f1393ba15195c3f64b128862b812839689fa387e708ffabaa"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00934-of-01024.json.gz": {"num_bytes": 396593138, "checksum": "02a5a8e02b2636c9e912a9ef8a79ececde4f4fc92bea74e59791d181bec104cd"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00935-of-01024.json.gz": {"num_bytes": 396748502, "checksum": "05d1d6290580d5c74b906ab03fe6773ecaaa1ff3be84dfdef48d1a2e7f5e1120"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00936-of-01024.json.gz": {"num_bytes": 397737673, "checksum": "351d3543b1457da9719061948a1b4bdd79be8a0b786ecd6a9a8cc0db49cd2181"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00937-of-01024.json.gz": {"num_bytes": 395377872, "checksum": "d431b01bddcf911d7da5bad74a78d0d1527d60d9720f77868ef08e1a65850986"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00938-of-01024.json.gz": {"num_bytes": 397193715, "checksum": "bff5e755b174e3608ba72b39898a2bb5e9ca6d3362b70bd66143566aeff52690"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00939-of-01024.json.gz": {"num_bytes": 398044482, "checksum": "03facf22c376f03a8078e99d1dcc1c22ed5d7e179de472019cae894f40c7a4ad"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00940-of-01024.json.gz": {"num_bytes": 398894204, "checksum": "3d3a2125262ee8ca498cd54db52fe626d010a2a93c000ea2b45f931e491ea9e5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00941-of-01024.json.gz": {"num_bytes": 396758197, "checksum": "b3957de08e7779d8ec23af02a6d709189796314c70a99f46c90d0bfbd14ad561"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00942-of-01024.json.gz": {"num_bytes": 398181993, "checksum": "74aec8dec794c79683dfe43d8aece4c1c47c5389aa6d4bea847ac461cb5ba21f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00943-of-01024.json.gz": {"num_bytes": 396271547, "checksum": "231f63d05f81d249f618768c9f712cc31314dacf55a6004902a0e7d0bfb13724"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00944-of-01024.json.gz": {"num_bytes": 396603419, "checksum": "d5661730f3ed6cc5bbc5d935a6f1ac7d241b40c52dc83775a421e7a1a672f518"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00945-of-01024.json.gz": {"num_bytes": 396596660, "checksum": "3b5aeb0786dddf0b9cabe2ca071283b276822e2861d8688e38f927595c159b02"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00946-of-01024.json.gz": {"num_bytes": 399900563, "checksum": "6d5549970af2c6987583477991552e1944b411642782c07d17eb52f91e714a1b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00947-of-01024.json.gz": {"num_bytes": 395391489, "checksum": "f5544ecb42c385cd5d5120c82140e4a36051f6a401d89ce30c8f2fc08cd69804"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00948-of-01024.json.gz": {"num_bytes": 399257562, "checksum": "1448cca7f1b9824adcf8437a33d14a7e95b705396611f82e7aba9a69e0a25118"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00949-of-01024.json.gz": {"num_bytes": 396371965, "checksum": "a7eb228f1d1ff2744af3d1a1358a94611cd92c25d81edac0e209b9f81c8a0a60"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00950-of-01024.json.gz": {"num_bytes": 398022110, "checksum": "8651693d2180e518039da487f638c532c53f6d79a33356922b2d8706aa6a83cc"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00951-of-01024.json.gz": {"num_bytes": 396224338, "checksum": "c46bc8aa1621153fbd913b5d0b23a82352a28b36ec997c4df4b92dcc6ef26895"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00952-of-01024.json.gz": {"num_bytes": 397581207, "checksum": "02775930e3c420978a9d2785ee0137c3963dba7bc34538b2155eb38dd6ee89a0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00953-of-01024.json.gz": {"num_bytes": 397045599, "checksum": "9d54940cb594de6e0f8593f64293e96375f0a5c56f3569c72720476bcef1f1a5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00954-of-01024.json.gz": {"num_bytes": 395457873, "checksum": "3c12a1c3061164f345d9e402bed28be9af84ef56d5df1b22a3cf9f818ed47ae8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00955-of-01024.json.gz": {"num_bytes": 396450938, "checksum": "45db78bea4fae6cd69d900c581fccda873d2aa9f24ac5e9dfc18b486c15c3788"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00956-of-01024.json.gz": {"num_bytes": 397120474, "checksum": "7db7ea23446bd8a66737546c5daa0c2dec7bd5c4743f52eb53685ccbf54d9b17"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00957-of-01024.json.gz": {"num_bytes": 397403279, "checksum": "89de2950bc3f7dd4f95d8a0b7cba19e9678bfbc23175bc22d9f9599ec1ad9cd0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00958-of-01024.json.gz": {"num_bytes": 396861933, "checksum": "f325478647cbec9d79bff2266672144147276a82f665d3014c5d2fa9c112c387"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00959-of-01024.json.gz": {"num_bytes": 398439950, "checksum": "70d786bb337c012269caf6aeea3bf9604d279d3e4335294c72ca6cb5a9fbd951"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00960-of-01024.json.gz": {"num_bytes": 395684257, "checksum": "e1d170b0a4d6954a920ef3923688a7dbf40398609ed2ae04b2635df9ceb07821"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00961-of-01024.json.gz": {"num_bytes": 397526287, "checksum": "47b90e3747f35bf67c872d65d843f6dd9bfca15dcb769b31bf3586c6645858bd"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00962-of-01024.json.gz": {"num_bytes": 397473683, "checksum": "d0ddb2c104f515144265bd3eed526a65ada46f848183688b420694751b113272"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00963-of-01024.json.gz": {"num_bytes": 397964876, "checksum": "74725b631c1699b1166589eaebb66374c031b170eab3ab359230cd4a23a8ae79"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00964-of-01024.json.gz": {"num_bytes": 396523661, "checksum": "fa0d49a2cc726628d9a1b5ae2ace52ee90401af8ae15add27c3f4566dd99a79b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00965-of-01024.json.gz": {"num_bytes": 399289514, "checksum": "11fb1878a8b204181f7f776a764f5e9e577d0fe62d4b2e4ce2164ce9fcc30b8f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00966-of-01024.json.gz": {"num_bytes": 397411408, "checksum": "5646014ca3c99f53bd13183187b1e6e8f84cb6c846d6f1f3a3c82edb4accc47e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00967-of-01024.json.gz": {"num_bytes": 395095282, "checksum": "b799b17f36d85235eaf1bed9f4f760a22b75fca736744218e44fae5917a2286c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00968-of-01024.json.gz": {"num_bytes": 397189410, "checksum": "8d9748f5a92a9e0b836fe74b962bd2da04b62a0a2943ea5e440cef19166a5479"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00969-of-01024.json.gz": {"num_bytes": 395651742, "checksum": "f42c71219641fa302692698b4944864f27b7f87d4477a86babe23745dad72715"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00970-of-01024.json.gz": {"num_bytes": 396180197, "checksum": "383d9586f27579b4a97c5901013b3e025f10dc813047d65158d6621430803aec"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00971-of-01024.json.gz": {"num_bytes": 396574555, "checksum": "d2c9700fbac454d3b3a42b2a3c4eb0111eb7cca7cab3d545b0912aba60415c91"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00972-of-01024.json.gz": {"num_bytes": 399639122, "checksum": "5d59e643bf20156a28e5e9dfcd811c5a6c3779e1875f375db09a0fa1871dcc90"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00973-of-01024.json.gz": {"num_bytes": 395456709, "checksum": "8b22e82588e30f30f664895b9716cbb0cf38d5ff4331d3be31ab25663c634a00"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00974-of-01024.json.gz": {"num_bytes": 396693438, "checksum": "5fba4f9d634d968f15d5d4fb29d253646494e3e125aaf1c2f8fab38a7e60180b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00975-of-01024.json.gz": {"num_bytes": 395697641, "checksum": "b4c5fceb9fa2397a9b7c75249bd3386b8dbf999d5b52521051a86e067d698448"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00976-of-01024.json.gz": {"num_bytes": 397172005, "checksum": "093aa01a944a222828656d31dacd8ecd57a24a51d361a8742514bb6af009dce9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00977-of-01024.json.gz": {"num_bytes": 396182407, "checksum": "1beef6e248c00abee5f8952641b12d3f5b12d58adc05c8d461c0a073a6ca9b39"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00978-of-01024.json.gz": {"num_bytes": 396180428, "checksum": "0f2bb125af300de2c9fe347899673a4bd2842ba8298146bfe94c9eddc41893cf"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00979-of-01024.json.gz": {"num_bytes": 396479117, "checksum": "1fe9d0e54b9be79722e6483e386801263ca51d6e9ad925dabbb58a38c4df877e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00980-of-01024.json.gz": {"num_bytes": 395119279, "checksum": "0f262ff2d4701497f6fd6d4f9d3cb1aa3a730ad6bef1961d890a3b0cb4747ee8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00981-of-01024.json.gz": {"num_bytes": 398285798, "checksum": "a295b85e63c176cecd9f5222ba417eeda307e41847eb38c61dec9b83101a8256"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00982-of-01024.json.gz": {"num_bytes": 397811687, "checksum": "2a3a0e0f454dd72a68ed1dd71c508a9b24fb2349ffdfc588cbfcef728cbaff05"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00983-of-01024.json.gz": {"num_bytes": 397069906, "checksum": "5b4256392755c4dd79cd37cd6ede645a9a549c4436acd27495e974ebe1d80bc7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00984-of-01024.json.gz": {"num_bytes": 397670152, "checksum": "68d4f5dbb3fa349a6811edce8056eb297e771cb9c9939c3a84d30c6ba3ad9dc2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00985-of-01024.json.gz": {"num_bytes": 397949975, "checksum": "6ba478b8a1ebf3b1dd67ed7b4a055cc9cc3c01bc90c1852aea8f5a99f6c07e69"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00986-of-01024.json.gz": {"num_bytes": 397730984, "checksum": "a39a23589cc434e573613e3ead44f33adb005c2c13cea8b33601647c97300fce"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00987-of-01024.json.gz": {"num_bytes": 399173506, "checksum": "eab46d9d0a0cf05dc5ba475017d98f02f1cfd756c8e707d9823a0463713ebf23"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00988-of-01024.json.gz": {"num_bytes": 398674037, "checksum": "88749d380aac85314df66448542b696e9ae6f61f1b27dc395556737f59ad9024"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00989-of-01024.json.gz": {"num_bytes": 395313344, "checksum": "bc565b662396e3ab4e108635e01873014515663bd5216926a59ae80f6cd4273b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00990-of-01024.json.gz": {"num_bytes": 398567254, "checksum": "e9b9bd97a30ccac353a2386babbd01c3a3bbede8c07bc28d17aecc7ef5af6330"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00991-of-01024.json.gz": {"num_bytes": 396958611, "checksum": "505ab5458d5e52d656048284fd22cc0fcd16e49ba19331669239be37645cb04e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00992-of-01024.json.gz": {"num_bytes": 396102263, "checksum": "59ac5b2b04f224be04a4ceac6a16e29a33681f19cd40cbce3d3e8eb961b9f33f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00993-of-01024.json.gz": {"num_bytes": 396935362, "checksum": "c804f2311de9f7ae5691280e16261b9f8385ef9a71929b2111dfade532b6bdd7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00994-of-01024.json.gz": {"num_bytes": 398832432, "checksum": "594727bdc3756e678bd4d156216712ed6c8fc98d3f8e9594cfbed10b2e414554"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00995-of-01024.json.gz": {"num_bytes": 396699737, "checksum": "bb3c73c6d48aebf9c60cde56944faa5bb6727db4cc48ae23d67650742462c42d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00996-of-01024.json.gz": {"num_bytes": 398059244, "checksum": "ac1a7e6e2c2a5468c704f5a2318b5617dd4ce140b98271e2034e00015db6cd76"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00997-of-01024.json.gz": {"num_bytes": 397439167, "checksum": "ce9664b29c86c05d3541aee377acdca7a32ef8f0220e0b4b6bf18276b692529f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00998-of-01024.json.gz": {"num_bytes": 397383159, "checksum": "1b4db1b59255f106dd2af7510112eef6d6b611d9f9e000a0e585b623fdb8ae98"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00999-of-01024.json.gz": {"num_bytes": 396339114, "checksum": "ee5e1508704b03f0a9cb3c4bfb578c08fb83a4d20760e3b40f101c58cbbb3ec7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.01000-of-01024.json.gz": {"num_bytes": 395172166, "checksum": "f8cbf0bd9c2b90e588942048848fbfa1a20cf775364cb9c84b4d5dd7cf19e603"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.01001-of-01024.json.gz": {"num_bytes": 396629363, "checksum": "7cad3f9a28e5988ef91073c48e9d85ea7030289690f817545cfa9f1165dd33d9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.01002-of-01024.json.gz": {"num_bytes": 396507390, "checksum": "b4ae1017913509855d6d8d4413ff3de4a8d519d91f354b6e5b5267219d20658b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.01003-of-01024.json.gz": {"num_bytes": 397652598, "checksum": "0c115446c159d27e6e1354173ebec29e6dff5f38c4d2ddb46c07c450523309c9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.01004-of-01024.json.gz": {"num_bytes": 397408971, "checksum": "f0b559a832a9ee50225fe1417d936d6b898026d80a105b976deaeae75f9e30a0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.01005-of-01024.json.gz": {"num_bytes": 397753911, "checksum": "e001c9285ade7de6ac23716b596ddcc733f05bd6abd7e1a67874894c93fbd43a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.01006-of-01024.json.gz": {"num_bytes": 397962701, "checksum": "acf13433824104e4bfc3a8aaf8805eb16712cd97b2dc1d48e7d771bee4bd41c0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.01007-of-01024.json.gz": {"num_bytes": 395966285, "checksum": "4c6069f6a95d036fd3e05a4246db932ad5ab89b9470274f23a17df0b77b9b717"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.01008-of-01024.json.gz": {"num_bytes": 397075505, "checksum": "9b3b9c0cd4ee02e18a5d22142183874586da8fd23b4f97033e354f9681d150a2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.01009-of-01024.json.gz": {"num_bytes": 396881470, "checksum": "14d2d7cf2ebf3b2c73bad4a6099fa1d2b1cb341b100976b03232fb664a7d020e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.01010-of-01024.json.gz": {"num_bytes": 397471393, "checksum": "01e6f56bebe0c874d82135f551a6b917759c41af48d127df181267dc9b8f6486"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.01011-of-01024.json.gz": {"num_bytes": 398092801, "checksum": "ead5b6b13bd09136fccd9548c224398401bda0ca7ff62ca4db852760760f13d3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.01012-of-01024.json.gz": {"num_bytes": 397831436, "checksum": "daa2d1507f9b56de0c4aa9d86d93259c1e6f73f0cdfd553ce075a16807dbcb56"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.01013-of-01024.json.gz": {"num_bytes": 395098326, "checksum": "c2b21a1a56e9879335c72008919e8f7998dcc1e8df2258fdf2196ea86194e3cc"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.01014-of-01024.json.gz": {"num_bytes": 396164077, "checksum": "0df125946c83c66c6961eae2aa45ad7eea7038d808281d633ce30686a8245e01"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.01015-of-01024.json.gz": {"num_bytes": 397895284, "checksum": "f6f6eee8fc113b7e717654b9305cc5129c3ee1ce9f263b91f0202762f078a526"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.01016-of-01024.json.gz": {"num_bytes": 397723033, "checksum": "48426df1f4665d3179251904c96a0e73c041ed5b57885b4dd852809e632685b6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.01017-of-01024.json.gz": {"num_bytes": 396761053, "checksum": "f33cf2d744585e0338b29a5a5638752123b7b59f9ae3b723cf7e7b536f9f80ed"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.01018-of-01024.json.gz": {"num_bytes": 396562520, "checksum": "72adb0869cac573282c4bd938cdff556f659540dd4a0a6663711974cb2dc147a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.01019-of-01024.json.gz": {"num_bytes": 397564701, "checksum": "3b64235effaf41ad61698b2c28f4d73ced1b6ec6b6d79e0f52314176fa0feb12"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.01020-of-01024.json.gz": {"num_bytes": 396053080, "checksum": "b16b9f815823d176f94388d4c482652ac656aa763ec738ccd8c8a2a3bdefc1e9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.01021-of-01024.json.gz": {"num_bytes": 394731398, "checksum": "f4c0044abadd339055bf13843938eef4c066856757250fc15f77060fc0881ba6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.01022-of-01024.json.gz": {"num_bytes": 396548645, "checksum": "5ecd8432526eda57065e6161f0618a19cd5993c7dfe86575775f1bf01836f750"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.01023-of-01024.json.gz": {"num_bytes": 396863581, "checksum": "c6cd29b8f6067152ccd584ded81df1f9cb905515d48815b8a546d104ec7a3565"}}, "download_size": 406611392434, "post_processing_size": null, "dataset_size": 2059256402722, "size_in_bytes": 2465867795156}, "realnewslike": {"description": "A colossal, cleaned version of Common Crawl's web crawl corpus.\n\nBased on Common Crawl dataset: \"https://commoncrawl.org\".\n\nThis is the processed version of Google's C4 dataset by AllenAI.\n\n", "citation": "\n@article{2019t5,\n author = {Colin Raffel and Noam Shazeer and Adam Roberts and Katherine Lee and Sharan Narang and Michael Matena and Yanqi Zhou and Wei Li and Peter J. Liu},\n title = {Exploring the Limits of Transfer Learning with a Unified Text-to-Text Transformer},\n journal = {arXiv e-prints},\n year = {2019},\n archivePrefix = {arXiv},\n eprint = {1910.10683},\n}\n", "homepage": "https://github.com/allenai/allennlp/discussions/5056", "license": "", "features": {"text": {"dtype": "string", "id": null, "_type": "Value"}, "timestamp": {"dtype": "string", "id": null, "_type": "Value"}, "url": {"dtype": "string", "id": null, "_type": "Value"}}, "post_processed": null, "supervised_keys": null, "task_templates": null, "builder_name": "c4", "config_name": "realnewslike", "version": "0.0.0", "splits": {"train": {"name": "train", "num_bytes": 38165657946, "num_examples": 13799838, "dataset_name": "c4"}, "validation": {"name": "validation", "num_bytes": 38165657946, "num_examples": 13799838, "dataset_name": "c4"}}, "download_checksums": {"https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00000-of-00512.json.gz": {"num_bytes": 30085821, "checksum": "6666a680b0a34eb8756dcb5fd2b12f0078237f3502e8a513bd3e5b71bb92be00"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00001-of-00512.json.gz": {"num_bytes": 30065900, "checksum": "61c3f9ab763067f76d9bea349d86efb97af7539d481b5d2807f362204971c327"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00002-of-00512.json.gz": {"num_bytes": 30028880, "checksum": "3aa4405d957ed42d10d643efe7c0f51b05e8f29cf4ad8783448083c1cd3f2a24"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00003-of-00512.json.gz": {"num_bytes": 30136880, "checksum": "f6eb49e4c0d691e67fe96ddeb3f8370c5e63a7297a31a8da0c58f5cb3a9f6061"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00004-of-00512.json.gz": {"num_bytes": 30110499, "checksum": "6e0908780f555f4b74c6a5055e2c9708333a8466f0b8723a8ea38cc04828ce44"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00005-of-00512.json.gz": {"num_bytes": 30097927, "checksum": "a333562df3fcd4c5ccf51b4c00e11f6619ac4a28a878383aefad277bd30131a6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00006-of-00512.json.gz": {"num_bytes": 30013820, "checksum": "7c436cd0993077187988239cf74c3e64de440dacad62ba4b02bd4ac0a8d219b6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00007-of-00512.json.gz": {"num_bytes": 30557005, "checksum": "dc9e43681c404fef1741e9608295b8dfae0953473993f3fc44fb83af07a6b82b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00008-of-00512.json.gz": {"num_bytes": 30369535, "checksum": "8de7a4005acdb60436b4e5d7274084e28df3aee31a5457c6837452094544c541"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00009-of-00512.json.gz": {"num_bytes": 30033048, "checksum": "32310a6c74cbee1dbb8b196e0cfad41f79e88e48d8f04c88692d42506113b903"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00010-of-00512.json.gz": {"num_bytes": 29948345, "checksum": "b7df217de849e26ecce5ed7a35b6e6238fcc1c08e969023f209307842dd496c0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00011-of-00512.json.gz": {"num_bytes": 30558885, "checksum": "82e5428aaeecf27141a7105e48b78dc02516ae6ebc3d6cd4ef13963316279e1f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00012-of-00512.json.gz": {"num_bytes": 29888513, "checksum": "f3d7e496b7c85ed7d020c8f8a24a0b27f9b2535abdb22b45c08441a29398c44c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00013-of-00512.json.gz": {"num_bytes": 29936292, "checksum": "bf04d82f0cdddc09ce4aecd9f71910b9858badaf6456253d43d89e6a8c56cba7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00014-of-00512.json.gz": {"num_bytes": 30169338, "checksum": "15b4611513154de0dfc1c9d470326fd053adf70de814ecfe8ba7ccee66de947e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00015-of-00512.json.gz": {"num_bytes": 30071363, "checksum": "887bdea83bdefc50786c93e8014d1d49999f8090ff15168598c884cd0724fec2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00016-of-00512.json.gz": {"num_bytes": 30451660, "checksum": "288ad0d553d54052354be506f87878fa7c54b0fa65811c6e456b3262e1d117e1"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00017-of-00512.json.gz": {"num_bytes": 29940254, "checksum": "b13ad58ae9f38598cb9d560e3ab34c1d0200db73fe86da12230e50086b532463"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00018-of-00512.json.gz": {"num_bytes": 30282186, "checksum": "5a67e71955ab2d8f6531bd3949cd8ab71f4ff91863ea5a6ec3e7b33c31a05dd6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00019-of-00512.json.gz": {"num_bytes": 30373907, "checksum": "a70682315a0cfe0af815c7b2abbcd63310fabbc33ad6e19daad19f1f51506955"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00020-of-00512.json.gz": {"num_bytes": 30104199, "checksum": "980e544ce130a06e9e99ec906342eb0ab8aeaa96ac26eca01c56ebb463f5d688"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00021-of-00512.json.gz": {"num_bytes": 29733696, "checksum": "a69729b8f3ccb9db12476a31917783c1c6e036e7bbbb4089f430362aef71f467"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00022-of-00512.json.gz": {"num_bytes": 30012894, "checksum": "589e698fe450e22cba47813a5a28da5393e79702a528f6a8469f72f6d630caad"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00023-of-00512.json.gz": {"num_bytes": 30024851, "checksum": "2a7b036c38fb4d2df6535631018c23d001931e5bf8d8a815fd5b2f9343ec4529"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00024-of-00512.json.gz": {"num_bytes": 29906809, "checksum": "7e512306cb6ebb0b0c3e96ceb16dade9e1e1f484e754bebd0078e7f545fc5b6a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00025-of-00512.json.gz": {"num_bytes": 30332268, "checksum": "b636b91fcd9a91ce05b8cbeea6f591a0e916175ab23b0cfaf688171c8a98ae8c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00026-of-00512.json.gz": {"num_bytes": 30288490, "checksum": "9e2f8e2a37dcfe66873cc5355740448ef75a1de2deeb2d8c047c3c3a7ee485c0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00027-of-00512.json.gz": {"num_bytes": 29897688, "checksum": "882616d1e8ca66c0b6e7aa2ccb18d9239021603ab1b9486638a9a3447ddebe0b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00028-of-00512.json.gz": {"num_bytes": 30201690, "checksum": "0312b12f50c64fbe7b894a28e0940089ad57af95df8116cd7d43c0435ec2e79b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00029-of-00512.json.gz": {"num_bytes": 30237920, "checksum": "1e8677140186b219d32e764889dcc344ccac9db51685363324d1bc13ddef2bb7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00030-of-00512.json.gz": {"num_bytes": 30048903, "checksum": "43558e81c291cbf53a5b6a016aecb0e07e26a98b8fb32f4a000037b281afa363"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00031-of-00512.json.gz": {"num_bytes": 30294528, "checksum": "c33ae8a2fad7e5264d093fbe89ed1611357110a4f0f26dd5a93a4dc15560f205"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00032-of-00512.json.gz": {"num_bytes": 29868168, "checksum": "5dc2a8f96db8da87607efc0b708e6a2172530f0c9b43665dc01286109b5c55bc"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00033-of-00512.json.gz": {"num_bytes": 30105916, "checksum": "c4cdc2b39a86eff251f903d7f3d39605b721615aeffa6a2753f3588b7dbef6c4"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00034-of-00512.json.gz": {"num_bytes": 30126174, "checksum": "6d874182112b0881dc929c0182a30ec4f9f1633372a2b822200a7b1faaf4f1bf"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00035-of-00512.json.gz": {"num_bytes": 30084101, "checksum": "5bea17f0cd4dd888f5d8a2d4092138e4777d80493a1f410d618d4cedf353b914"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00036-of-00512.json.gz": {"num_bytes": 30095974, "checksum": "6e7f42f3012d8ca7500c7e2ec82d27c26b3cd8bb5b8b66a7fc8355d77284f433"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00037-of-00512.json.gz": {"num_bytes": 30239345, "checksum": "54ee45bf25152060679bab3e5fc6f5cb5a3add6acd2664cb152f88c223f83239"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00038-of-00512.json.gz": {"num_bytes": 30247683, "checksum": "f738a2f0f156f7bd897d9d822748d4192a5fe46b566c7288ed5b840c4ffeda64"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00039-of-00512.json.gz": {"num_bytes": 30057005, "checksum": "60235900d69579334660c153c4fe384c08f14f4e729a06a1e8247e8b4ab8a213"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00040-of-00512.json.gz": {"num_bytes": 30185136, "checksum": "5a059d64fd6a1b42a2faeb4088db327c47f9e8328737ab74a0e0457f84433374"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00041-of-00512.json.gz": {"num_bytes": 30314653, "checksum": "2cfdc460c8dd0fb4766191ef2aec0af856af7c95d11eb3f1d731f63b71db4daa"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00042-of-00512.json.gz": {"num_bytes": 30123256, "checksum": "64e59b8ebde3c12b0a1d218a302252b96aeb5bb4976927463101a9509579ec22"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00043-of-00512.json.gz": {"num_bytes": 30057043, "checksum": "edd200b97394f15f9cf0a6289406a83b42c3d6f961456f031f5814db4f6d482a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00044-of-00512.json.gz": {"num_bytes": 30029900, "checksum": "1b2980f21ee5cffb271591adc8eaa414438841426442f194b5f4b703356f4e5e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00045-of-00512.json.gz": {"num_bytes": 30367170, "checksum": "83967210891345b831956722e8dcd29cf55fb17b786c85c2dd2778528ab4d1c2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00046-of-00512.json.gz": {"num_bytes": 30105866, "checksum": "6921ac4854e2eacaeb4be07669faab85f2bab33f744c7efae1ce17be25176bb5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00047-of-00512.json.gz": {"num_bytes": 29957618, "checksum": "e8eba2ba9f51e76a06a2df43b6b120c47b6e41f61e46a2e3331518ebb2d0c84b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00048-of-00512.json.gz": {"num_bytes": 30329887, "checksum": "6af9c44a53d7eb9df9d86ee4d895fb9f7f2b9b3863fd30aae325e79fb792a10c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00049-of-00512.json.gz": {"num_bytes": 30116207, "checksum": "57dc1e94f73b55e0be5690b01d61188a62186ea9f5f85b556ecef3bcaa36fb92"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00050-of-00512.json.gz": {"num_bytes": 30236341, "checksum": "eb75bdf0e63e798838b3d7abfc6a3bfab5de2ba39af833c38048dfe39c1175b1"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00051-of-00512.json.gz": {"num_bytes": 30357091, "checksum": "f48b1f5e07311ca9d69787019a56ad849932e6868d1f7778681cf7e4cc9fc562"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00052-of-00512.json.gz": {"num_bytes": 29944959, "checksum": "debf9490c057f11e404898b4a57cb424c1eb523fa90bb7899b1317f970481638"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00053-of-00512.json.gz": {"num_bytes": 30240416, "checksum": "9e847a5c6eb80e5c045fbb405729c695911674bd8d29b1d0be0791303d02f41d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00054-of-00512.json.gz": {"num_bytes": 30174556, "checksum": "65a80db1cdde9153e08277ad2d9074dfba1682c0f771fbb9f4aa8f88ca557f43"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00055-of-00512.json.gz": {"num_bytes": 30134394, "checksum": "beb8d280d322520ded21aec92ae087867d0bce64aac4e243a127a88f143ff578"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00056-of-00512.json.gz": {"num_bytes": 29891026, "checksum": "82fceaec35a2456487a59ae652d72f41a940d2d6bafdc4f05a6e02bcd7ed4dc9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00057-of-00512.json.gz": {"num_bytes": 29920525, "checksum": "e4fd55ba5fb2825ef4209aec87706ecdd3db040242c6aacfc82f350765fbeff8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00058-of-00512.json.gz": {"num_bytes": 30060421, "checksum": "3cfc894a1853e3d1f2daa314873b7919fa52b7208b590637f8face6536305770"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00059-of-00512.json.gz": {"num_bytes": 30038488, "checksum": "4f06ab7b5ce8e8c696445db4a3e32896b6396e3f67d7414a593e7398d752e564"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00060-of-00512.json.gz": {"num_bytes": 30129718, "checksum": "7923385ee0c6801073feb10437ee3c59e5f5dfe82c2311ad8c4ec670dcc0ec87"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00061-of-00512.json.gz": {"num_bytes": 30130505, "checksum": "5cd682e148b8488775622098214fc2009ef9c95355f46341bd78434f1b560fa2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00062-of-00512.json.gz": {"num_bytes": 29968130, "checksum": "53562fc23501f3a1d11c8ae6a59e719d6f4e67db8b8ea1d55e2b1b80849afd08"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00063-of-00512.json.gz": {"num_bytes": 30116532, "checksum": "008cc5c0cb7d60e84ffdfe2132f6bb49aafbb31083fd026067b3859326ca64fb"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00064-of-00512.json.gz": {"num_bytes": 30236194, "checksum": "8f9eee169071e80c94c248f1c37b7fa631bd75a7f6e401f6a963aecd8815910b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00065-of-00512.json.gz": {"num_bytes": 30077312, "checksum": "8c5e18ea3575cd350e98d062ef88d3fd1df068e4bd410be8732723bda03656c0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00066-of-00512.json.gz": {"num_bytes": 29920862, "checksum": "e377b8112dc6ff6834607c27b927636429e887f4ab8edc0824363941b7bb311d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00067-of-00512.json.gz": {"num_bytes": 30278223, "checksum": "ec2c2ac74cc3f4f814d645410cccda266151949dd36aae518b8082b948b47edb"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00068-of-00512.json.gz": {"num_bytes": 29940464, "checksum": "ddfc16a17cabf48a2c59fa8ef25ccd12d899d3462d08b45f2a301567ccc105c4"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00069-of-00512.json.gz": {"num_bytes": 29903118, "checksum": "66d9d1791cda56607b2561199503cef216df86b28d4519d5862905671a4ec4c5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00070-of-00512.json.gz": {"num_bytes": 30082323, "checksum": "8072d3bd5e19c005493c0332b73ca5be253397f54be90be1bb7b2ef8df7ad117"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00071-of-00512.json.gz": {"num_bytes": 30128276, "checksum": "b7c68af5a6dcac3fbb3dcbe12123d1045a79baf657a8b3bdada60c1a97404c48"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00072-of-00512.json.gz": {"num_bytes": 30458419, "checksum": "cfe5c6ae2ad1531271b0039042e033bdd7caf9604bfa219980ca27513cea755f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00073-of-00512.json.gz": {"num_bytes": 30366974, "checksum": "a132f5e85376b0d0a06c6ae6af9c226dcbc98394461578c4fbc6cd439ba6e721"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00074-of-00512.json.gz": {"num_bytes": 29987779, "checksum": "f905e808b50908a7d2a7f0944e7e6c01ffd97ec16e5f0b6ed7169a60d66b0100"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00075-of-00512.json.gz": {"num_bytes": 30070204, "checksum": "b57458683803936f6bc03b06fc26be9d1a09ba09517b5c1518676f468e404595"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00076-of-00512.json.gz": {"num_bytes": 30129238, "checksum": "81e88ec53e39d6191e40e5852564f592b745abf99c71ff78302292632f636792"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00077-of-00512.json.gz": {"num_bytes": 30051399, "checksum": "218b0f6e219e42113e35d99458861f8511266dee6c17d9e2780a17af8877f822"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00078-of-00512.json.gz": {"num_bytes": 30144230, "checksum": "c0a337619559362e0e1cd0fe87c9ced5c987313a7f3cb65eb44f8b861c41c616"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00079-of-00512.json.gz": {"num_bytes": 30544297, "checksum": "27e257efda6adbce01585b3b6cdeefa95d31f607012fed5dd4310bfb5a790ba7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00080-of-00512.json.gz": {"num_bytes": 30188866, "checksum": "26411f1a0a7b299d0bf6cf78db04b0bcc617894cd87d59e54614f3258dd393ee"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00081-of-00512.json.gz": {"num_bytes": 30418881, "checksum": "87a659f6b24560a754ccbfb6aee019484e48e3ddc7955a6c7a18aa9098952cfe"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00082-of-00512.json.gz": {"num_bytes": 30086460, "checksum": "708fe5108042b957688817625c84059c11700b18ddcea3814b86b6c8c66af8a5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00083-of-00512.json.gz": {"num_bytes": 30138639, "checksum": "8d8681519538afdb7622b677ca5d3ae2a643382bae9639e3ad90c82d36477653"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00084-of-00512.json.gz": {"num_bytes": 30228150, "checksum": "db708760b9d45e0b20c8dde9b0008f01761d9bb0f37a194845b4d097a60e477c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00085-of-00512.json.gz": {"num_bytes": 30004564, "checksum": "19ba55c7cbc44ae30a6497373fc15b548e5c45667f790c392857f6fdaa7e2bf6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00086-of-00512.json.gz": {"num_bytes": 29696360, "checksum": "4cb07dd259a084818f9a79a4fe4fb7b24ea1adda0cd4fd405ba003e7bd481f12"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00087-of-00512.json.gz": {"num_bytes": 29927300, "checksum": "7c3c07dbc9c57881a3c1abab85a927f1ba609c58da9dcec22d7415079cd336b6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00088-of-00512.json.gz": {"num_bytes": 30038333, "checksum": "59158c87d7e9e5011516f98dec1313758072ca6685c7ad9df5ee4a075d9ff8a2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00089-of-00512.json.gz": {"num_bytes": 30223506, "checksum": "d3f39f7e90b4a82257779290a3f2de5619049d69b2169577f1e3c81791d85419"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00090-of-00512.json.gz": {"num_bytes": 30266969, "checksum": "88ed3237aadff809cec186fa378e176774d3f32aef1a6d8bfdbc530f64e8aed4"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00091-of-00512.json.gz": {"num_bytes": 29885840, "checksum": "b9a247993a8eec31b3f853d1329ae79da29397dd27eb4acdc196b71c091335e3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00092-of-00512.json.gz": {"num_bytes": 29942337, "checksum": "3d83cc54c06cad8effdb7a38ed6666b5d912e6fffcf4c82471af064b0aabe05e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00093-of-00512.json.gz": {"num_bytes": 30129376, "checksum": "d72ed9855fa86ceb4089435da3d78e8d4151b92185f828329b534d1adf3821db"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00094-of-00512.json.gz": {"num_bytes": 29613450, "checksum": "f61f74aa65a81616b97cbc34a8be1b563f83f69709642b8156eb76cdda02103f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00095-of-00512.json.gz": {"num_bytes": 30469526, "checksum": "926d1ba2e4b191e75b0bce0cbe4c15f95f244445ec03a6095c009c34e36f897e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00096-of-00512.json.gz": {"num_bytes": 30126036, "checksum": "e74818ad94e408498644dc71f1ed967f356f539418222f1dfea467a21c99badc"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00097-of-00512.json.gz": {"num_bytes": 30374980, "checksum": "d9cc8827ee38bddd1a31e48b2b0064a567520e3c0f2e1be745acef57d267e4d5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00098-of-00512.json.gz": {"num_bytes": 29928579, "checksum": "090ad37fd9eaeb53308599f2da1053b19b1c6478adaea5a8a1c35d6c35340111"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00099-of-00512.json.gz": {"num_bytes": 29901456, "checksum": "c0e7d9a7cbc3b9b940077508441e471a1eb70e822479fcad726b900e6c196382"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00100-of-00512.json.gz": {"num_bytes": 30033459, "checksum": "b62033de618191de3200205e6e40725baf045e403060d10417211d47854d6bb0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00101-of-00512.json.gz": {"num_bytes": 30280468, "checksum": "8726d092785856ec690dcd8a9edcd968cd04af1cfafe8a83192e3c0782f02b4a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00102-of-00512.json.gz": {"num_bytes": 29805195, "checksum": "248edf4dd6c9a1137c7b45ab0b5a05a5fc93fd14cec17a5da4d758b9f7b359df"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00103-of-00512.json.gz": {"num_bytes": 29995494, "checksum": "d66b75c3f08a0db141d2c0162eb3dbc351e656ba1ba480e77eda051435d1390f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00104-of-00512.json.gz": {"num_bytes": 30318447, "checksum": "09bd2068c20d33783f39322c95756fd3dbd0da91f4380fae3822cb33b7d06779"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00105-of-00512.json.gz": {"num_bytes": 30209523, "checksum": "0a399ecb1116890e1a0189cd2842d64d8ed53213b1623ae38229a6ac4f5c1c76"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00106-of-00512.json.gz": {"num_bytes": 30476739, "checksum": "540f682a7c977d20f920b5af1ec7e40c14a0d54f1718b43271e22dece9cdce16"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00107-of-00512.json.gz": {"num_bytes": 30203291, "checksum": "0dd51deb74ab391c54b20862f7df561f74d00be2ee4fc13987f91771870c099b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00108-of-00512.json.gz": {"num_bytes": 30265100, "checksum": "172b09a108b154014077a415f644cd16db6a66f178bf780c120a6c4fecc3c0a8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00109-of-00512.json.gz": {"num_bytes": 30342649, "checksum": "214a8f147f2d77ec0f3889b0a2d782e5d44230878359e695e9523561e6723a1d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00110-of-00512.json.gz": {"num_bytes": 30152418, "checksum": "dc0d34ce7918b80ecef3528ec2b063edf7b12223c453ac7fb9d39232fecd81d7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00111-of-00512.json.gz": {"num_bytes": 30160329, "checksum": "d0594cb69d26f0e853575d86f92b1aa233b5bb236804a2f496a792fa031014ee"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00112-of-00512.json.gz": {"num_bytes": 30428351, "checksum": "2b0542d973bab88e696fb9efbe042167600da397d776ef65344dce868bbcb0b9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00113-of-00512.json.gz": {"num_bytes": 30200133, "checksum": "10dcb929692795fefcf4623040191d9cb6199fbb3b164648b62b9867e8392379"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00114-of-00512.json.gz": {"num_bytes": 30205273, "checksum": "f16631d5bcbbe133a01675286ca7667400ecc7e6df13d728015381d21ec71cfc"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00115-of-00512.json.gz": {"num_bytes": 30164849, "checksum": "bed27819db4bb7e02cb42cdda18acd232659a2eaa43eed910ba26d686cb3f837"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00116-of-00512.json.gz": {"num_bytes": 30117752, "checksum": "4eb4bec7adac3c2f431d356212f8a9d47136f0011f5f9e71dd29d82b1b823e2a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00117-of-00512.json.gz": {"num_bytes": 30062588, "checksum": "79639624734885b3051b10f052f5486d7124bbc4bcd18d99348f3683ee2fc54f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00118-of-00512.json.gz": {"num_bytes": 30125828, "checksum": "e922a4a5332a4182ddcf6ac8ba910024fe4fa878b524f7368b27373f75bbfe44"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00119-of-00512.json.gz": {"num_bytes": 30156741, "checksum": "a44aba8779b99ace2f212789389af058d12dfb0706221b296676d5e10528dd78"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00120-of-00512.json.gz": {"num_bytes": 30489925, "checksum": "82bec41bbea7bc5ddb67b3bccea51122da7d0922768f8bda7a0c9d489bd20cdb"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00121-of-00512.json.gz": {"num_bytes": 29606989, "checksum": "b49238f5b75aaf876657826cfbd4346d250f564a86bdb010aa1e85b44a969229"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00122-of-00512.json.gz": {"num_bytes": 29770557, "checksum": "0803ccbd505db47cd09b20d86cc6ad459c7a8d1c583a5ee756b0397369d8b6fc"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00123-of-00512.json.gz": {"num_bytes": 30248121, "checksum": "d73a1bf285a0355bd61a25891cd8c5fd9da66535ec515dc7e1602a769b994727"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00124-of-00512.json.gz": {"num_bytes": 30131013, "checksum": "65d2dcc7e63a28e1911717d149b907d0c74fda6e36db2840353a0290f7880324"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00125-of-00512.json.gz": {"num_bytes": 30348971, "checksum": "5dee3c7afe0364ccb8e36647d01e78ffe61690f29f29aa033efac9a0413c2a47"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00126-of-00512.json.gz": {"num_bytes": 30370074, "checksum": "1dc04b3755291842711623d1d6cf042e2d66987103a0c708f01c9136a8c42db6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00127-of-00512.json.gz": {"num_bytes": 30320846, "checksum": "e31a27ba25bdf13e6f929fd38d53409dd3f50be78ad955b69b1956709de5aedb"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00128-of-00512.json.gz": {"num_bytes": 30076235, "checksum": "122ee9d293428a7a823c17b3a432b5b2198fa2a68bbb246b97e981bd09f78f0c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00129-of-00512.json.gz": {"num_bytes": 30569486, "checksum": "918bf43ce3ab54d535dd02cbcd09f1081890be3287e23fd81bfa032beec61ebc"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00130-of-00512.json.gz": {"num_bytes": 30280169, "checksum": "ab0a53e8c10dfdd139281175b5fcfe3090fa238fcb383e27b1dcdfdbbe8a879c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00131-of-00512.json.gz": {"num_bytes": 30338899, "checksum": "e54771e12a6f3583c3accf9bcc01b598819231f367e7f80cbd44cf6683c5c852"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00132-of-00512.json.gz": {"num_bytes": 29969011, "checksum": "f69d7052ca7657fdebe547a6e196b109285d5d4e4f1a68f3900a37ba6fecc22f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00133-of-00512.json.gz": {"num_bytes": 30179558, "checksum": "cf2130dedafd8f47e97661a5b1555813433e3f7293b5c5cb222cf551d90a0604"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00134-of-00512.json.gz": {"num_bytes": 30080257, "checksum": "1a32902fc21633ae8d41e4e5518804f4c719dc8729b866ebc32d3c36fdadbc10"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00135-of-00512.json.gz": {"num_bytes": 30284972, "checksum": "6e3a78e7a530d91ee4578caf462a4c685a5f221f0cd8eb9639c9067e2b655a7f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00136-of-00512.json.gz": {"num_bytes": 30130265, "checksum": "defc57340cbaa5f325994a91b5134789c84a76a4ca7b9fdbf993b0e634735f05"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00137-of-00512.json.gz": {"num_bytes": 30146793, "checksum": "7ce5035f452eb2e1adeff36d0c6d6d65c245d139a86ef48bbe10c5275975183b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00138-of-00512.json.gz": {"num_bytes": 30180265, "checksum": "298849a53a8ea0e68d01cc137195bc36d686077bed722e1198337a1dee3c51cf"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00139-of-00512.json.gz": {"num_bytes": 30398387, "checksum": "ef2ac4b8f195141a79a357d934d5d97bd4d2c64027ec7509b5873a4ae32fcb9d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00140-of-00512.json.gz": {"num_bytes": 29652990, "checksum": "290f1c99b696e345aaa6ac6d5a882a87dcf5d3939b08ba859a359d2459498785"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00141-of-00512.json.gz": {"num_bytes": 30083642, "checksum": "fb6a38388a25261d86fbd8ffea63e06bcbcbd6846a4eb6f13fd09d7fe5a1fbc3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00142-of-00512.json.gz": {"num_bytes": 30131064, "checksum": "b61ccf6166ea4b777629bdc07d543f299bf7569deab18228ec5bb9edc8cd3eb5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00143-of-00512.json.gz": {"num_bytes": 30244435, "checksum": "22812c50efdfcf2c0fdcf593639dfea09ffee8068321c30effc669c8234d4f3b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00144-of-00512.json.gz": {"num_bytes": 29725094, "checksum": "79cfa65a3115193629d16606643d90dcf27d3108c320cc9e364ba19fdb9fb1d6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00145-of-00512.json.gz": {"num_bytes": 30335033, "checksum": "e836f0bc9acba85fd1721d19cc24054e97defb0d12678bdc0d086f40deb9b1a6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00146-of-00512.json.gz": {"num_bytes": 29905680, "checksum": "bf684871a235078390d6c6bb03fc2d5bbffec2b095806df652a19baf5e67135d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00147-of-00512.json.gz": {"num_bytes": 29852459, "checksum": "0e716de5b3b09ec287b039be0f0dd6edd7d541aa6d3f9d2be18768e1cd5f4cd8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00148-of-00512.json.gz": {"num_bytes": 30364788, "checksum": "4cef624e6b7c2b73dbfb47227e31681223a5a9369c4b7daef8606b796f010dd1"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00149-of-00512.json.gz": {"num_bytes": 30096278, "checksum": "fb448ccc7412f5ca8667004a70f3dd6e1b5e6cb7f6facc06564bd22b1d815593"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00150-of-00512.json.gz": {"num_bytes": 29776995, "checksum": "1e14268cf723bc7336b33896537643d21dbefc1f05ffd5201feb5fb1130f9683"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00151-of-00512.json.gz": {"num_bytes": 30205172, "checksum": "797224cf74063fbcaec741535278ccce141e6dbbdd69a2191d07f89816ab14fa"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00152-of-00512.json.gz": {"num_bytes": 29845034, "checksum": "77eeb2353f544c714deea68d4a781b498c40d7c1e27db3aade4987b381ca29c0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00153-of-00512.json.gz": {"num_bytes": 30258796, "checksum": "0fc581e92e70dda031d72a4aa0bbd65b1e9b28884f0ef5dd5e895cbecb270609"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00154-of-00512.json.gz": {"num_bytes": 30249734, "checksum": "ba10dd0a24bded170541e23078264b82b35bc99e402db594e2335e31905ededf"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00155-of-00512.json.gz": {"num_bytes": 30198742, "checksum": "fe285ac893126062bcbc20df75a9f65c57d3a7391354fa7e62b7f6a7122d6e77"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00156-of-00512.json.gz": {"num_bytes": 30168323, "checksum": "d21826b71bc85dbc496dd947ae9ee79d62885cffb3fa7c47409feee6ab247f17"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00157-of-00512.json.gz": {"num_bytes": 30241978, "checksum": "fc41765301b62849eda0b7b08f792e45f03db458fb92063af70c43d7cd0d0bb6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00158-of-00512.json.gz": {"num_bytes": 29959715, "checksum": "1eded3ce0bc099c7e198e9277719d578c3fb6c425bb2110cb0ca6ce469d1d19f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00159-of-00512.json.gz": {"num_bytes": 30109595, "checksum": "eccaab5b694c2f0017fe1d423637872d5587f6deb316796f7c0ff5517fa28178"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00160-of-00512.json.gz": {"num_bytes": 30201741, "checksum": "4ceee71372da6112101665f5bbf942a85f065feaab924c6e3f83498169bbe255"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00161-of-00512.json.gz": {"num_bytes": 30176266, "checksum": "6ed829daaad190b2d50b626d840edb750a063afad95315ffe7604a193183a489"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00162-of-00512.json.gz": {"num_bytes": 30018118, "checksum": "dcf8509a55213425a41706e5209ad411afb715fb9cd8c1a8b8edca23fab7d6cd"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00163-of-00512.json.gz": {"num_bytes": 30236016, "checksum": "d93cfaabcc7197637f233896b5799527f27d5b2dc60f0f0411ee51f05f09c500"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00164-of-00512.json.gz": {"num_bytes": 30150055, "checksum": "cc7de5ed3c774ff1dc350fbb5167dc1610c4f9a0dbc7c5d60ed4cf08aaf23ce3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00165-of-00512.json.gz": {"num_bytes": 30348056, "checksum": "b41c4a3b7b4e96262fe5c87d06fbeb000dc48cc1d304a475bb4f4e1af84a9afb"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00166-of-00512.json.gz": {"num_bytes": 30015834, "checksum": "0a0821b7628b9b019995a9f34223e2960ded84331ce1bb55089838becb8a170a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00167-of-00512.json.gz": {"num_bytes": 30282254, "checksum": "1285af56d024efe2166fa892878d471948e1d4c996922c7673e3c0f7f0f76bef"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00168-of-00512.json.gz": {"num_bytes": 29815124, "checksum": "29ec54ed647725ca3b9aec3bae341151a8e2b708cf21cd87b4389329298442b8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00169-of-00512.json.gz": {"num_bytes": 30346843, "checksum": "1791e3f8371a63f9f849b7bf430e70d3f4011dbdef572c166cc5d49d06162fd7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00170-of-00512.json.gz": {"num_bytes": 30175685, "checksum": "de8f82986addfc64b88fd3041d7ee6fdb64e6f770758146dc4c9309df348e965"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00171-of-00512.json.gz": {"num_bytes": 30145505, "checksum": "0dda47f679666862de6343e1109ed92866a42e8fa129ee69e9f0b73f18b6aecb"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00172-of-00512.json.gz": {"num_bytes": 30009998, "checksum": "2990dae6c16b7d60652439bed8b80ee4cf93972f33d8511d3d6aabaddfeca5cd"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00173-of-00512.json.gz": {"num_bytes": 30062185, "checksum": "e154a969bba2bf9430e0c8307561de78599fd2bd527cb1f15bbaf8f8e88cdf23"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00174-of-00512.json.gz": {"num_bytes": 30055129, "checksum": "e714ae153e8a927c88fe577d4c27017985d3ed7f3d0f5470f9a5f25c2e901a9c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00175-of-00512.json.gz": {"num_bytes": 30091082, "checksum": "5f47c663d1e15d94fb0057d303048be990c713f3285ada2c6233137b1d84d60f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00176-of-00512.json.gz": {"num_bytes": 30235767, "checksum": "20b05e4e99e5a05f6a4c29b304803b895bb8816caea6203643723ca587d66128"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00177-of-00512.json.gz": {"num_bytes": 30071950, "checksum": "29294e4b224df4695c9342c6f23d5495de9a0ca6a1be7217aa2211506e8ac7bc"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00178-of-00512.json.gz": {"num_bytes": 29932121, "checksum": "6022ed3b2ceef02324e40d3c7407622c95ead2cd3d3c41ab15ff9dd218265673"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00179-of-00512.json.gz": {"num_bytes": 30119251, "checksum": "42fa0aa883d9db4303a4981e4e308b2432b031fbccc98c3e1994ec775ba8023e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00180-of-00512.json.gz": {"num_bytes": 30175456, "checksum": "6fb2ebd61524846f6b1f746f9c6356045623beb4b685fe265a23446037c9cd9f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00181-of-00512.json.gz": {"num_bytes": 30029564, "checksum": "b779d721bb135fceaeddebb0dad1bdb43c9067a5e8595b3d544dfa7a084eb9f4"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00182-of-00512.json.gz": {"num_bytes": 30437016, "checksum": "b388fc0e862d7f6bb5b879ff7c69c301038faf5b542f6b40cbea4e2096a41e6a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00183-of-00512.json.gz": {"num_bytes": 29994048, "checksum": "8208eeca7bc76f8b1786c95939d321ca0c7ae190b1f12dae86738810e412aa8b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00184-of-00512.json.gz": {"num_bytes": 30338616, "checksum": "49859e75d999f65de99f9236e649a81989360f0328ba684671057b0dd7cf5e79"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00185-of-00512.json.gz": {"num_bytes": 30088874, "checksum": "ff6d32fdd471d3076a9367c175baab84a5d699ccd6dcfe00c755f0b714ca6074"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00186-of-00512.json.gz": {"num_bytes": 30193681, "checksum": "82508ed104fc57de3062258eaea57854ab9e1934437a88dc0d8a9921f3641bbc"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00187-of-00512.json.gz": {"num_bytes": 30171163, "checksum": "409d6576b25ad27455c755e5484e3f51d5d9788962efabe1c32e06bb3febacab"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00188-of-00512.json.gz": {"num_bytes": 30060432, "checksum": "fae94de96fa2962ef51e2ea90a5f760a5cee5de249bfd9f56d7c7b4e5c20f6de"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00189-of-00512.json.gz": {"num_bytes": 30180741, "checksum": "25293d5cba09980086f380d9e9ab44543adbbdcd05ed08601248b3a2b16d118c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00190-of-00512.json.gz": {"num_bytes": 30207152, "checksum": "ccfee160de15df5d88f0ff5a898a0c5b2d0ef4ebd6e6832715a9ef8a9904f88f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00191-of-00512.json.gz": {"num_bytes": 30143987, "checksum": "4c579619e465d9d97451801147202826a3855e772ea6dc4e9968e43ce2b8c05d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00192-of-00512.json.gz": {"num_bytes": 30072097, "checksum": "9c32ecb6d4ec9feb27c5b642879b464e68ca8804db161219503f624e7ca1166f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00193-of-00512.json.gz": {"num_bytes": 30172886, "checksum": "8442ddc3843c72aa169ca67801ff865ff85e4183beb38faa664f4f1d1c22a5d8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00194-of-00512.json.gz": {"num_bytes": 30037105, "checksum": "2942ecacb22cb9a2953c68f21ddf3368cd47ab1f2b2d8e1f5c76b1c849b28d91"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00195-of-00512.json.gz": {"num_bytes": 30014854, "checksum": "9e5c6815a5734403a7062bb27b2565d433a3520a401c836ac3f16e743a1dd949"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00196-of-00512.json.gz": {"num_bytes": 30020510, "checksum": "792712f0073c158b5f96f7a99d97970fca3819b69739d34d7d2b7f4b8b407b7f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00197-of-00512.json.gz": {"num_bytes": 30072566, "checksum": "3ece37e2d0d0b26fbd839b5d3facdfd70844945a06867fb68b141f6b1378462b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00198-of-00512.json.gz": {"num_bytes": 30036679, "checksum": "c3f37a9b89987dde4578b394b5c3916c2d4fd87e0902309b4c81af19b1d2d5ea"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00199-of-00512.json.gz": {"num_bytes": 30195178, "checksum": "ae01bb5515097a083afd498d8530e788d99671e7cf802c4402957d6252b2ec77"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00200-of-00512.json.gz": {"num_bytes": 30064374, "checksum": "2399d4869f3a8bb4a9adced5ec548a9a3fde1d4fbc4e3abd9a0a3b495fb9a8ef"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00201-of-00512.json.gz": {"num_bytes": 30136711, "checksum": "5c922040697bad8d7807d79f34f2b667eea63ceefba89b2d413fcd4d66497607"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00202-of-00512.json.gz": {"num_bytes": 29962983, "checksum": "e4df518d612a8614de73d5944a31d22ad06ec9ecd26fb52e500df71fe363c1be"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00203-of-00512.json.gz": {"num_bytes": 30178998, "checksum": "e84a98a176451fc82d940a64cdec821e320a648780edba6466b74a1966eca47e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00204-of-00512.json.gz": {"num_bytes": 29988832, "checksum": "c6dc56388bc7c57cbdee8280895ab80da7b4d49c9a0101a685229c50cad2e2e1"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00205-of-00512.json.gz": {"num_bytes": 30229414, "checksum": "e7e5175b6a7372377ba3a0db439911e189db459787d48588183ac1a0198c5fa7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00206-of-00512.json.gz": {"num_bytes": 29914929, "checksum": "eb263433133660ebe219cd5817dea3b546ef2fba0e15396b2768d7091117cdea"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00207-of-00512.json.gz": {"num_bytes": 29912800, "checksum": "7f8a5f62ba5912b64af5b02bd987b4d81727223ef8eff110022e89d01961366f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00208-of-00512.json.gz": {"num_bytes": 29900590, "checksum": "bc2af142244601bb7a96859dfd9885196940e675ca217cfc7c73ac9c614ea938"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00209-of-00512.json.gz": {"num_bytes": 30242768, "checksum": "fa51a4337faecfc790ca925802f87f10761552e16578b880ced80497f62bba60"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00210-of-00512.json.gz": {"num_bytes": 30039857, "checksum": "3adf7482ec6a3ad106c8edca3645a94032c33f84fcd26bd9876f2b8a1f6b5722"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00211-of-00512.json.gz": {"num_bytes": 29846856, "checksum": "8e931aaa9c1f069c0eca0b4605277610df9d2d0c07a0dbe6191fb7081b0e642a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00212-of-00512.json.gz": {"num_bytes": 30022172, "checksum": "21c8bba1c83544c27977b22b077fd77f8df9cd06bc4eb5e9e9a532c511498d36"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00213-of-00512.json.gz": {"num_bytes": 29877918, "checksum": "b64ebaa088df5c6230e69f207267a038705c38f4d327970e9117979e1c13d1ed"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00214-of-00512.json.gz": {"num_bytes": 29906552, "checksum": "55d833a2b78ad564e6532d1acd14511e8b48d703030e3bbc92d7c835c1ed38c7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00215-of-00512.json.gz": {"num_bytes": 30075441, "checksum": "999c77c136d3df83601e33c823f389b133f33c4c0b03736ceace617b526cb293"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00216-of-00512.json.gz": {"num_bytes": 30507152, "checksum": "0b23d4e57eaa101c78bab46151add537668d2722bf0c50470c1b434ec3389ae1"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00217-of-00512.json.gz": {"num_bytes": 30044236, "checksum": "6abacfd53e231a38c714d436018cef9a58f53320026c2ebb27d6caf08f02d7ac"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00218-of-00512.json.gz": {"num_bytes": 30047926, "checksum": "01120ef69493d84c44d112a41c69a851edaf89232679366e812f240fd26a0e47"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00219-of-00512.json.gz": {"num_bytes": 30349211, "checksum": "c4fc219559f0f076f634fc6812d4b13c229908c1ae45c3b74c059fb3b8124f63"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00220-of-00512.json.gz": {"num_bytes": 30063445, "checksum": "11f712439d54ef062cfa1225328fc4faaef5f6c9c0b0d87a0a81d25a71350e28"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00221-of-00512.json.gz": {"num_bytes": 30115660, "checksum": "9a344857ef4f9d141b57df38e25f717153b773436d72c23e10289ffe67c315eb"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00222-of-00512.json.gz": {"num_bytes": 30134562, "checksum": "227cd1847a948e388b404b5cda9289f05510d4e22f0ae5ec4d5a87a8f7f98a45"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00223-of-00512.json.gz": {"num_bytes": 30120819, "checksum": "e0029aa6b612a98f76e37d82107fcb90f2b57ae8d52beea172b5153b76334f20"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00224-of-00512.json.gz": {"num_bytes": 30371365, "checksum": "1ce5242d163ca12dbb22655eb841bf80750b552353af4f84973285d823d0add5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00225-of-00512.json.gz": {"num_bytes": 30319212, "checksum": "71cb82bb95107a7e0b7777a5fcaa0f76b465ba828ac47401babcf7289eeb2335"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00226-of-00512.json.gz": {"num_bytes": 30020940, "checksum": "b7b8d98ade41f52ece23e896bdc4c19ad034a92ba18adb5fac85c7271afbfa65"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00227-of-00512.json.gz": {"num_bytes": 30109958, "checksum": "b2ec382f44caf4e8e46fef2faf6bd2e4000420e6da2eb12a5d9f6e7efb4e1564"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00228-of-00512.json.gz": {"num_bytes": 29940895, "checksum": "ff86264683d0fdf9d689aa30e7889c4ceed21098b7c60a220db92d396614cb1d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00229-of-00512.json.gz": {"num_bytes": 30080588, "checksum": "3a5502cedd61501055eb16adb6ef861c75880524c5468a69cd346bc03e98e219"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00230-of-00512.json.gz": {"num_bytes": 30376399, "checksum": "6d3a4171a1febe9149f6900e3cca5a38046ca9d59214b548a4ef9de7de754bbd"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00231-of-00512.json.gz": {"num_bytes": 30031670, "checksum": "a2c8d9bb3eb260d5d8a7dcafc4703540332e2896e5127372d380d7efbd567a3a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00232-of-00512.json.gz": {"num_bytes": 30132612, "checksum": "c9dec917eff4d72c684d6f8373ca66839061e29d25f0aa5fd6fb7de5c30df469"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00233-of-00512.json.gz": {"num_bytes": 30178285, "checksum": "1eb83b8eb7e72b2b3e55420436bb17521b989d0627da46f8cc61fe9f420fd464"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00234-of-00512.json.gz": {"num_bytes": 29991258, "checksum": "5e14e2a9e8c0aba73feb9134c694e99baf57357bb524877322ff5181eedef1f2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00235-of-00512.json.gz": {"num_bytes": 30045172, "checksum": "50a118a072498b5338802cceacb97a9aa9242252e8d76d305cf5f0d928fd4af6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00236-of-00512.json.gz": {"num_bytes": 30403542, "checksum": "7d7605576975232579e422a1b72625ad6f9d714d27770725dc7b99ba258e1985"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00237-of-00512.json.gz": {"num_bytes": 30242989, "checksum": "22d152fa02c5a959e978ea4887dd873dfef7267af0a577b4d796ff0cb52d5c56"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00238-of-00512.json.gz": {"num_bytes": 30214634, "checksum": "6d0af6f396fa21867e899a7678c633e47bfe79bcbda29b8072c5d32ab20a9aa3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00239-of-00512.json.gz": {"num_bytes": 30255546, "checksum": "d35a93632638b6283053b121f0f30d47ea20b2747d871c3dd0beb13f4ffbcad9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00240-of-00512.json.gz": {"num_bytes": 30347604, "checksum": "fd052d532fcfe811d96f8433f79a684f68f76ec42bd959c76ae3b63aec0b2c3e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00241-of-00512.json.gz": {"num_bytes": 30135691, "checksum": "12c80c41dc4d6313bce4a171999ecda93ffc59f2c70cca363bce214cd12dc9f7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00242-of-00512.json.gz": {"num_bytes": 30229834, "checksum": "fca5b81914ac0c5fe0b0c1a554a1e62c64af5c98740df1f8ce8f48f2a62b6a48"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00243-of-00512.json.gz": {"num_bytes": 30053753, "checksum": "ba41c505579524e9d244354a70060c9a0131007e0b129f03e628bb7b7b512ca9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00244-of-00512.json.gz": {"num_bytes": 30216889, "checksum": "54a391c1d2de7627e739f3cd94eeccd50a80d56a40606f7c5392f6098df456cf"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00245-of-00512.json.gz": {"num_bytes": 29887569, "checksum": "c3263ea7e16e0036961dad28fef57ce4f0495219e59b4e800af82b67b3c6c506"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00246-of-00512.json.gz": {"num_bytes": 29906815, "checksum": "a3dcc92aed81708434edee84397010eae4ffeaa38b39aaf3919256f72deee625"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00247-of-00512.json.gz": {"num_bytes": 30074896, "checksum": "019e983a95908651bfae83e37bda5200b3888b03ab235fc8db2d5b16742f028f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00248-of-00512.json.gz": {"num_bytes": 30108081, "checksum": "6f68835ec02cf899f8f44a795b1e3117956ff5bb6c8946435d9861ae7a112df3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00249-of-00512.json.gz": {"num_bytes": 29957882, "checksum": "9bed6b7f56d93fa3973d4f177dde0973fa0eb6fe17d8d85279d865531613f963"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00250-of-00512.json.gz": {"num_bytes": 29822284, "checksum": "1848bef8d11360df55a576c64147e519327b1178f77d3ec14ab9522b33b1c423"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00251-of-00512.json.gz": {"num_bytes": 29956462, "checksum": "425f69c361a8671cf571df577ac0cfafb4894de494360084b7cbe9cb8869bc3f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00252-of-00512.json.gz": {"num_bytes": 29733712, "checksum": "7198e831e75eff1e116513f9cbe098c071f051c545b41d1943211a1d996a3c67"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00253-of-00512.json.gz": {"num_bytes": 30450662, "checksum": "0452804e723c919bd3c84217bb1dfc8764112fd70c5581f84520df7592f28ae9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00254-of-00512.json.gz": {"num_bytes": 29944765, "checksum": "dbbff2253d70094537de481344e5706315271fdfce7ebaddc8d277ed05ddfe24"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00255-of-00512.json.gz": {"num_bytes": 30321363, "checksum": "79173dd85d535cee71afb52f7775bbf7289509bc555efe21a8700d36f7e5da25"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00256-of-00512.json.gz": {"num_bytes": 29982818, "checksum": "bacd191568e72da06c564fc7476225ce83440de6aea6c85ebe7f5279f1c15846"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00257-of-00512.json.gz": {"num_bytes": 30338592, "checksum": "998287203665559c27a66e889611ed716b7a389e403b2e857086f548b2c47b39"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00258-of-00512.json.gz": {"num_bytes": 29911193, "checksum": "ed9829f41a71cc187d0ddfeafc9cbde8e362b52914c988708a1a5ffbd3c152af"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00259-of-00512.json.gz": {"num_bytes": 30227794, "checksum": "2fe86814499a3379601a179acca1d440b3c79467827ce9ef9787e1ab311904e0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00260-of-00512.json.gz": {"num_bytes": 30206902, "checksum": "c4efdad05d3f5e9f27884399ab0ec82081c26486e87f0ed5408a9eb80b223daf"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00261-of-00512.json.gz": {"num_bytes": 30035514, "checksum": "e47675a956a626a32b1870c61e6f98c3cfe9cc571901cf477abae982b4e63c96"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00262-of-00512.json.gz": {"num_bytes": 30406718, "checksum": "ae19c1389e26562322f745bafbd7839e7a95b3169743d48baa7ae7f2db2a0b5e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00263-of-00512.json.gz": {"num_bytes": 30266531, "checksum": "289c9fee87f12ea22ad5329f80cb379e5e9c22c5cb6639077748958228c62bf7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00264-of-00512.json.gz": {"num_bytes": 30100823, "checksum": "7c65dd5d90c6df49ca2dcbfdbf1b9fbb0789cb32043795942d88c5f2d7a99869"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00265-of-00512.json.gz": {"num_bytes": 29957109, "checksum": "e3a1b501b2cc3f5f2667ef179d7876db602daedefd0cd741c0898679b24984e6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00266-of-00512.json.gz": {"num_bytes": 30196603, "checksum": "9337dd8240f168da5f6a8b57c5c169a2a400a9a160eccc8a6e44e7b32004ff19"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00267-of-00512.json.gz": {"num_bytes": 30304605, "checksum": "513eea4e78c399cc045e25f13bb5f77ddb6c9b606522bed8216945c529894e8a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00268-of-00512.json.gz": {"num_bytes": 30312562, "checksum": "0503c5bf6848213c5fcb81a5c94307fc010d910a8989e104ad5fedca58c76f7e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00269-of-00512.json.gz": {"num_bytes": 30045257, "checksum": "59bd3011d12d7d70b5fd64bc2dd2016b1a9ca6f0d210dbb3e6c202bbbf74ced5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00270-of-00512.json.gz": {"num_bytes": 30027628, "checksum": "8d3ecf4c61acafc49b624d08b6aa31340643e030f6c2248f689e8a17d355359e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00271-of-00512.json.gz": {"num_bytes": 30014730, "checksum": "b2e4820a0a7287786f802b3b40602c8ca77c7813b5f50db8a336b89b89bbdf37"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00272-of-00512.json.gz": {"num_bytes": 30145705, "checksum": "20c73e4a9056a5201621a4799b86c323c5136af43caa63a74298a5c3bee890a6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00273-of-00512.json.gz": {"num_bytes": 30165945, "checksum": "8f07a91b6b40444635d869b94558fa68e3593626808bc6122d4e17403cf76101"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00274-of-00512.json.gz": {"num_bytes": 30097947, "checksum": "9530522c841d8f09ccb89f4f0238f7b9048c211e85b27449fb3c09d3bd2bab7b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00275-of-00512.json.gz": {"num_bytes": 30296359, "checksum": "51a358db81805a20df4f920baacf3adea05209282f800fbedfc7fa49638a072e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00276-of-00512.json.gz": {"num_bytes": 30311407, "checksum": "a51253cf73fb200053eb5fd5eca398a7a070fcaa27fc99b23389d09eef7fe5ba"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00277-of-00512.json.gz": {"num_bytes": 30372345, "checksum": "cc4f6d9040d8c4909d4ea5b661a7e54ba4775ff1c7c55db1ff686a56d428e2a5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00278-of-00512.json.gz": {"num_bytes": 30379507, "checksum": "1052defa657524e1211e67d775a32243b164eda431c4c6ed351f0c6727f21b16"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00279-of-00512.json.gz": {"num_bytes": 30195406, "checksum": "6f4fdc92c516ad779fd521afba7d8d5bcd40672e63028f43f70fff4d7605f5ba"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00280-of-00512.json.gz": {"num_bytes": 29902057, "checksum": "c26f89efd0977465f45fe321036d88e2d6ca3ee1edc4bafe4b40ad1895cfc0e3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00281-of-00512.json.gz": {"num_bytes": 29779702, "checksum": "094139d741b7a47faaaaf50093ab4edbef6ad1943985c6f453ce45a67a95b190"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00282-of-00512.json.gz": {"num_bytes": 30063500, "checksum": "280d69bfc795f1502a9e744d53d1a189051a1e771042721f8e6f74f6559e25a7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00283-of-00512.json.gz": {"num_bytes": 29956350, "checksum": "505e49b7eeab46c77a324959eeff103f8899da1efc4d0fef5c0e6c6f8879a721"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00284-of-00512.json.gz": {"num_bytes": 30146285, "checksum": "9b075f2cfdb9a90fcdc7f779a52b0c5dad36385214844d4fd9df1e528ae78b6a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00285-of-00512.json.gz": {"num_bytes": 30160056, "checksum": "d9b9f3cbb9ce2a0a0a1a2f7ce91e98621d48a7a900c278aeef437dc6c0a7cdf0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00286-of-00512.json.gz": {"num_bytes": 29844025, "checksum": "6de9ff1013484662305e414725be2d0a4a1873a941250b95b80b5dea8919cf95"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00287-of-00512.json.gz": {"num_bytes": 30089218, "checksum": "444ff132c4a5330653b7319d34b2c7f4ae3b960d8b510cbd7389e3881f65ac5d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00288-of-00512.json.gz": {"num_bytes": 30092170, "checksum": "46dc5b3b84e4387ad718fdf96b751354d7048e898ec664e0d3bdfc21ee841ec2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00289-of-00512.json.gz": {"num_bytes": 30365397, "checksum": "b42e35746112198143ac18509e4f0148772db75e19f5eea9ed0d7e2849dbba48"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00290-of-00512.json.gz": {"num_bytes": 30275920, "checksum": "25d99877235c4b9dacd5d1dd7e9d16bba76cdf6cb1725fa617209142873dca0f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00291-of-00512.json.gz": {"num_bytes": 30125784, "checksum": "51da68b6f2751a83e2534c342b6e9d69c419fb606b44c42b872d69f5f726df3c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00292-of-00512.json.gz": {"num_bytes": 30201021, "checksum": "1e0a42b5e7ea7049c3c86b96d37c5d1c36f3ba2e2dab02145a897ef056fa6a87"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00293-of-00512.json.gz": {"num_bytes": 30124224, "checksum": "8c744f5c6eb92c0de70649cd773c0ad147bc7a1487b2ae7f1107bce9d19da601"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00294-of-00512.json.gz": {"num_bytes": 30074708, "checksum": "b3cfa4c4408c1a9f39b48e18a62e112ec3c132b226efe0850f9e58e2a517aa97"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00295-of-00512.json.gz": {"num_bytes": 29990007, "checksum": "012f63e147d22e34249e930975a2d8958a8d0b17350a9f6e368d702189b40d5b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00296-of-00512.json.gz": {"num_bytes": 30093755, "checksum": "5573859cc485ae4535b83fd408dcc6a82f644832c93e6125db9a16dd6ded338f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00297-of-00512.json.gz": {"num_bytes": 30078472, "checksum": "25e694485171ba1347ccbd7916c1b87a0d46acfd13795a8aabb1cb57b5eb1221"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00298-of-00512.json.gz": {"num_bytes": 30327122, "checksum": "6d6832cb3b1c86b6392bc9ca52f69a0bb16bf71c3c7664d9fe668ee259a40a30"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00299-of-00512.json.gz": {"num_bytes": 30214180, "checksum": "9f3c3d87a525874ea117e36e0b30d7f5cc6c64564506808058a0788d74943634"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00300-of-00512.json.gz": {"num_bytes": 29895171, "checksum": "e99d296965da2f731ea660889ce834cd1d21edf427298bab3a059ff3ebc64a2d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00301-of-00512.json.gz": {"num_bytes": 30131063, "checksum": "e5eeb0f237cf986134c946bb3c2a4b5483fb9c88b3c2b16b9db26135043036d6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00302-of-00512.json.gz": {"num_bytes": 30184609, "checksum": "4ac9bf5ca6fac7f7293238852424340326347ceaa6f5dfa6fddef8003421bebd"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00303-of-00512.json.gz": {"num_bytes": 29956412, "checksum": "559019fe1ef1f7e77ac53ad98b3556965ebc524ecb80bbc3f26255d5ae6e3609"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00304-of-00512.json.gz": {"num_bytes": 29974071, "checksum": "3c54edc4b6a7e34048cbbadb55cb3b16496a4e6e7334b4ede4e1368daf4c5301"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00305-of-00512.json.gz": {"num_bytes": 30338106, "checksum": "1c91c0c5bcc2bec0a698318ad6f576a06db7885c20ed7f36782427b80580a75a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00306-of-00512.json.gz": {"num_bytes": 30178986, "checksum": "fff99f2758c2de57ccbfbfc6388f67e624d00d4a6cccb5820a7a8f5fcf02d386"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00307-of-00512.json.gz": {"num_bytes": 29493455, "checksum": "5d08c6e3909e21bed456ff9d06c983f14d3a277cb399a91047a692184f87c4c3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00308-of-00512.json.gz": {"num_bytes": 30228844, "checksum": "04bffac195e24383d06b0ab9ebf019959a4e7abe8e8e6a0cdfbf0a8e7c23c899"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00309-of-00512.json.gz": {"num_bytes": 30351688, "checksum": "3ce14d5104d1318c6a16d042735f0a71f4452897de60d17408181ec5b135bbb2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00310-of-00512.json.gz": {"num_bytes": 29993012, "checksum": "afad2f39bf4cb932e50d9a0be93940b423e7abcc3d67dac15b1939e4e40f4ce4"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00311-of-00512.json.gz": {"num_bytes": 30448951, "checksum": "a049c31ef6304084d33cb7bdd2e21ada0c60b40b1002b2369e60d36a5098c4b0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00312-of-00512.json.gz": {"num_bytes": 30034189, "checksum": "557d1e88400a6d1d8ee4d717a959239edacbdd3e18d8cd20c5c85b77174dc302"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00313-of-00512.json.gz": {"num_bytes": 30066486, "checksum": "e4823ea1e9a59d5db84564a5b90c28fd8058450f238c60ad689ffd6b673d65f8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00314-of-00512.json.gz": {"num_bytes": 30397706, "checksum": "1b4c0653e7ccf7fda0a53d8cbd5ddd57322ac83822e9d05bbdb9eb8ac979cf50"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00315-of-00512.json.gz": {"num_bytes": 30219107, "checksum": "9c364c9cab4ff7acdd1818b13de2f36713df8fa6c504ba15cdf47fe8e3c30206"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00316-of-00512.json.gz": {"num_bytes": 30098661, "checksum": "84dd8a8739b5abc39d8180f0894b1fbf2930d6d333d7c86b646f40763327397c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00317-of-00512.json.gz": {"num_bytes": 30178992, "checksum": "16e4791b4e5ab3719dacf79fedb0b88ed54346372874c37ccb71d86bc419edc3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00318-of-00512.json.gz": {"num_bytes": 30022982, "checksum": "98345a826aab12bdaf5e639205d5dcdc1da8fecd7cafc1982df89ac8d4df7ebf"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00319-of-00512.json.gz": {"num_bytes": 30360409, "checksum": "d53a39019a1627b42ae6bff68e283d37d0bb5f48b328c2c5cdcc1a3897f4e992"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00320-of-00512.json.gz": {"num_bytes": 30347267, "checksum": "c343a0eedf58484055e58762802ae8cc05f2cdb0b923785c493d056a2cbdb015"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00321-of-00512.json.gz": {"num_bytes": 29967877, "checksum": "cc5795d254ad749ccfe613034927bdf95529545ae1f277b694dd24a5996aca83"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00322-of-00512.json.gz": {"num_bytes": 29885538, "checksum": "d5eaaa1eea983bd37ed34651e6c16b746ff7c92e48038b234149fa6d04d3d866"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00323-of-00512.json.gz": {"num_bytes": 30308848, "checksum": "a42cfaef5e088fd6b24dfc121084a6cd038f5b0bfaecb9f33997ab22a97fb155"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00324-of-00512.json.gz": {"num_bytes": 30351634, "checksum": "0e2e6933f93466e9c8fe966f7770fe4c34caf182c713dad3206f4132eed1d41d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00325-of-00512.json.gz": {"num_bytes": 30077168, "checksum": "77cdbf7040ce7f38d735fef41813ce63aaa16fcd87fce80e6ca6bd56d350c369"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00326-of-00512.json.gz": {"num_bytes": 30031750, "checksum": "8d994c2dc1b766e3270dce3f0b8f6f8fe22d5c1e0e9780e1bfed52c1292b8641"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00327-of-00512.json.gz": {"num_bytes": 29845765, "checksum": "f6279e351d016769d6fb5482d01a15ba054d5fe6f9f1c4e92c0663cef0083002"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00328-of-00512.json.gz": {"num_bytes": 30253188, "checksum": "2ea84aafd94d1843a2cc4428279dbb079c6ae0aae6c00f90ee4b5ace3c827afd"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00329-of-00512.json.gz": {"num_bytes": 30124922, "checksum": "49e3d91126d53eada7bbd87bfe9eaae74f059c69cd70a3a3b8101f49c1aca154"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00330-of-00512.json.gz": {"num_bytes": 30026414, "checksum": "07442fc4f7fb1732362293bc15a6754d70ecf4743392cf89c4497b3cd96269fd"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00331-of-00512.json.gz": {"num_bytes": 29961847, "checksum": "f437c6f5f758a5d32c8fc949037060259162864c29aeaabf37032e79f5a1cf0b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00332-of-00512.json.gz": {"num_bytes": 30167166, "checksum": "96018497eb6dec020436c1333ff81980a64fb615997855fdd8cf35fe3f658db6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00333-of-00512.json.gz": {"num_bytes": 30192963, "checksum": "1c12ea6b9031049dbc84e4da6b5fdedf480e989385d758c88322c415a1cabbb0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00334-of-00512.json.gz": {"num_bytes": 29847008, "checksum": "c269285f15f626b4b15a7d1705ffa08e3f4d49ce13de8174b72f9f6276a1c6af"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00335-of-00512.json.gz": {"num_bytes": 30262244, "checksum": "179ee564e6fc644d9ee139bdb02d470a1172221b0f6e510ee5935683500f8257"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00336-of-00512.json.gz": {"num_bytes": 30262910, "checksum": "317933afdd8dc8a3a355e44ee3d84bbab12a2f30c98ea1172dde7074ed4c0557"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00337-of-00512.json.gz": {"num_bytes": 30155329, "checksum": "c5b850399252ec41b0fd9cb2da87ce25e5a44df9f44c6ed9d8c559a5729e5a0f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00338-of-00512.json.gz": {"num_bytes": 29952961, "checksum": "48083123ba97a6212e0501799bd01936f0795bdd4d9c2710b9aa67d54b29037e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00339-of-00512.json.gz": {"num_bytes": 30403399, "checksum": "313b60f985dcf591f34d351b758eedace655b6c6d3946dd2ddc55f34a9a97ae9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00340-of-00512.json.gz": {"num_bytes": 29917484, "checksum": "2c72290f3bd51dea2a2877d68a968dc2b75dadf99ab3cc2230e41be45f3515d3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00341-of-00512.json.gz": {"num_bytes": 29905522, "checksum": "1acd83a0da4a7a4912b589dbeb68b37396d0454371b2b71af4ae18b854d482ce"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00342-of-00512.json.gz": {"num_bytes": 30022369, "checksum": "8756be42335bba12d06de63e247659f8d603a092ff342360dfed645aec135c47"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00343-of-00512.json.gz": {"num_bytes": 30229313, "checksum": "863e29987a3ccfa08e14ae987c81367a53b9fe08795184db086117a9555e058b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00344-of-00512.json.gz": {"num_bytes": 29924335, "checksum": "aa9003a7cc3527fb658fd807c78890587a8b35634a1f0838bc221a6374205d20"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00345-of-00512.json.gz": {"num_bytes": 30229482, "checksum": "a7e88b015bcf7761217e9b3ffd413f13cac48f6afe083353436de6cbd0d0018d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00346-of-00512.json.gz": {"num_bytes": 30029147, "checksum": "b862ea62ac032c203c0038c061a44edabe4644be03b876ec7322e96762374940"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00347-of-00512.json.gz": {"num_bytes": 29808182, "checksum": "62915b86cbbf61a76f73d05509a8e839aae0b965134ef79022377625df7ef741"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00348-of-00512.json.gz": {"num_bytes": 30091116, "checksum": "6c384c2c6bc8340b88e085f8bbc2616be68c96fa7b8b88306b4500367d053a49"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00349-of-00512.json.gz": {"num_bytes": 29867618, "checksum": "bfb19508ecf8bd4d9a8847f0edab5acde6896182c27da706a6f2863bec43c152"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00350-of-00512.json.gz": {"num_bytes": 29723106, "checksum": "a645c62c94de9018175f15a0b38aa8bd2484601ee189b7c27d589288eb5af97e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00351-of-00512.json.gz": {"num_bytes": 30047620, "checksum": "991061a23834e6bb3dc0595cf0e8328e07746d10fbf7a7ba397c1410cb66175a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00352-of-00512.json.gz": {"num_bytes": 29808328, "checksum": "6c8e377a6cc82e81d66e2be3d23c1cdd42480015a68a1db458d542b7ff64ab7d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00353-of-00512.json.gz": {"num_bytes": 30040117, "checksum": "ead6f32d98a91c47fb9c21334143f02181efb0b831705baeebb9820d069598fe"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00354-of-00512.json.gz": {"num_bytes": 29953984, "checksum": "ba349e503d017abbc1c83da2314c0a4892a9f3e5e480173812578f44d9b5904c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00355-of-00512.json.gz": {"num_bytes": 30179912, "checksum": "2bfeab794bbe0432db52cc595d25864b17fdb0744a80d6d907f6f2ffc5c56b81"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00356-of-00512.json.gz": {"num_bytes": 30312163, "checksum": "d0dec696d28c601d3a1f75b0b6e6e711e00809f0d5ea915f63cb6d9b7adcc597"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00357-of-00512.json.gz": {"num_bytes": 29931515, "checksum": "d43c75371e32d0c1e65f43acc00aac3ca43762d4c6eb6bb61759ac5fca593a99"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00358-of-00512.json.gz": {"num_bytes": 29739788, "checksum": "96fef1b4a5d6a080ff5d4a10bc90911dcb2ddecb4be91d0c9620e6d2484e3ee3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00359-of-00512.json.gz": {"num_bytes": 29913841, "checksum": "05b065d2d13b787ddee4707be7e2be46173c23794b9e8c773d0da743f435db17"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00360-of-00512.json.gz": {"num_bytes": 29805295, "checksum": "826104b9f4c2634d128f15564bd4990057dfbbb4066f2a082039d243bab56935"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00361-of-00512.json.gz": {"num_bytes": 29839676, "checksum": "ee5ba4cb14ecee0c857828a866615c6bfe45f67b158173dcac44146a02d97738"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00362-of-00512.json.gz": {"num_bytes": 30154783, "checksum": "d67b49e6fa5dc293fbd3057b7ca0beb7e0bd1ff692cdad7f2dfb7abadc1f4599"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00363-of-00512.json.gz": {"num_bytes": 30126118, "checksum": "6940704da6cde5822d48dc806280b8d57e0593ba299731e68ca9c2a4f7cf65bd"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00364-of-00512.json.gz": {"num_bytes": 30184894, "checksum": "e740b4a0240e691f16a423fd658aa3c7539986695418af3b5a171a48524db74f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00365-of-00512.json.gz": {"num_bytes": 30386766, "checksum": "5a6a9461ef9ca579a849f6bef4d6225504a885aa797d3b2236ed8df6f5ea72ee"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00366-of-00512.json.gz": {"num_bytes": 30208411, "checksum": "8e0ce2447dfadaa4d41b991a2ce1be63b409e58e88944594dc8591bf9ab41403"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00367-of-00512.json.gz": {"num_bytes": 30266003, "checksum": "04ea00b46a583edea7740d74d719ef7f303b7f3873365b9ff4e94f08ef80832a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00368-of-00512.json.gz": {"num_bytes": 29993752, "checksum": "38b1a55dd4ff1b504d2dbc0b2ad54fe43ab16c8bdba55bd97f4a55dafa8c83dd"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00369-of-00512.json.gz": {"num_bytes": 29833222, "checksum": "a25c405918920ed00edf5f3007cb8895b59fb67618dfea266b048273303b9592"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00370-of-00512.json.gz": {"num_bytes": 29988999, "checksum": "2812e6d9865d77ca8ac2d1499ba86be1ceed868a1da2bd13fbd0967058a3516c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00371-of-00512.json.gz": {"num_bytes": 29866636, "checksum": "ecd1d3bdc41c3f41f8c9d3a63c75766c173f70ff117af748a08c221ca4273b18"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00372-of-00512.json.gz": {"num_bytes": 30296883, "checksum": "723d2c5ebbdd95ab84c53e458d81944b6907d08c7aec67300f012880624d0010"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00373-of-00512.json.gz": {"num_bytes": 30310322, "checksum": "ae45d088521f2faf9852cb169962176e84bbb81d5ba157d4228d348f7fcf60f4"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00374-of-00512.json.gz": {"num_bytes": 30340527, "checksum": "9b09c9e1b424fd05540b720c5a85f71eea43d743dc4ebb318e839125ccac9383"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00375-of-00512.json.gz": {"num_bytes": 30193692, "checksum": "c3ca4bb179cadf872f25f1cdb5c3667933bb8dfb7af21068a24b1b09c961dfa8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00376-of-00512.json.gz": {"num_bytes": 30184130, "checksum": "5d801f4bc20c4c6d8821ccfff06cb5dfe4214e571734feacbea3325462afa280"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00377-of-00512.json.gz": {"num_bytes": 30259301, "checksum": "ebf08508c24e29a8a14b72248f090d765b02ee7a31296811d0391f2a2e73c046"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00378-of-00512.json.gz": {"num_bytes": 29650049, "checksum": "c13e994e68b938ca069d2d412e7891cbaf2ee205d65b1c17c6acfea01adce157"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00379-of-00512.json.gz": {"num_bytes": 30265211, "checksum": "667da6f0650dd684aa50bc691b5783968ae8cab847dea14fc8d8bfe203e351f4"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00380-of-00512.json.gz": {"num_bytes": 30429631, "checksum": "7cf0e9ae00bec72f571d152730107efdd944176818600517fb2d0412a859d366"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00381-of-00512.json.gz": {"num_bytes": 29889471, "checksum": "f781b3128e92c54365be7771695555378067a65fb922e04062ab6f3f092ec827"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00382-of-00512.json.gz": {"num_bytes": 30029894, "checksum": "2d133def2bc4b840312ebe5c466c9f22729b67aa4c2a41dda2e6a9a55ddcddbb"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00383-of-00512.json.gz": {"num_bytes": 30249255, "checksum": "e8610abf7e2bd70b1067a1b2dbf392ac32be156945502629228969974d3899b2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00384-of-00512.json.gz": {"num_bytes": 30362665, "checksum": "f217071bd0c1b1bddb3342c85064d7ebb54bcde2512997636f0638a0b3641588"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00385-of-00512.json.gz": {"num_bytes": 30080234, "checksum": "2db4b15c7391b6e6d3791721ee574d09101df597110feebc59e4f0aff4df6c26"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00386-of-00512.json.gz": {"num_bytes": 29897704, "checksum": "035daed74487c5262b8cfbefdfaefd17f2834c7b4a1d293934d755e059b58f5b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00387-of-00512.json.gz": {"num_bytes": 30072139, "checksum": "73013fbd06eaf94a7c8a0f0de420f83bed56655fb2d4e5d93972e8ca1847d130"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00388-of-00512.json.gz": {"num_bytes": 30123843, "checksum": "5db846c3d0b36774ce771ddfa8c53a915767926a2ad48222256d839326336f19"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00389-of-00512.json.gz": {"num_bytes": 30278955, "checksum": "9e4c590e67b2fbd357af955e39864ffe73dda201d76759935fda80b10b463500"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00390-of-00512.json.gz": {"num_bytes": 30013591, "checksum": "90974ba6eff489e0f4f52187b6241120740c782945e86525cb5d1e551a54e322"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00391-of-00512.json.gz": {"num_bytes": 29925212, "checksum": "10fcd62813434e2557b5861fd8604f534952561065bee9dc525b1cd3f5b2730f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00392-of-00512.json.gz": {"num_bytes": 30016498, "checksum": "da88b36bd3f15551d8fad115a86f111cc5c3d9a3c6fa9497214aabec7bcd6aad"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00393-of-00512.json.gz": {"num_bytes": 30061083, "checksum": "1ed9881020f240e1277e6513bc2abf24ea48e9cb0046d7e87a6d3669c8b42a0f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00394-of-00512.json.gz": {"num_bytes": 30043459, "checksum": "a35c3de1b0c982df8471705574e6eb7cc730fff122ff17d1381f2c7b9f20d6bd"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00395-of-00512.json.gz": {"num_bytes": 29921106, "checksum": "f4cf52f8d6a1288773cc366469df140f885b233fb6aa1cb75387a450d88ec94f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00396-of-00512.json.gz": {"num_bytes": 30024980, "checksum": "5ebe04e54e4242d52aacb4c2e107dd10e609d5a7a6ff0425d9952bed98ef4921"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00397-of-00512.json.gz": {"num_bytes": 30096825, "checksum": "3ac381004d8257aa50fb28f0fd2171abbb93ad825c3f43422b9dbec6e1c6f31b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00398-of-00512.json.gz": {"num_bytes": 30059739, "checksum": "40c38af325f4d01ae7c74aa9cd8f8d1c96c6af851175f80d3c50d85c5f5d3585"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00399-of-00512.json.gz": {"num_bytes": 30049826, "checksum": "2ba0109b2d5b88422250bcbd2494cc6e11528710f38fa6e83a1f699b840b68a7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00400-of-00512.json.gz": {"num_bytes": 29953506, "checksum": "010610ba3af3dbfbcf2fac93136b7066fc58eb914dce9ae999722d0cfec4d331"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00401-of-00512.json.gz": {"num_bytes": 30271141, "checksum": "29587bb4be2c367f6479705b5c3c28716affeefc857ac1f77e4c33e55264def0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00402-of-00512.json.gz": {"num_bytes": 29861236, "checksum": "8e399149c335ec599f881fada448c9b4be22326357153c74b0de627078f1d43c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00403-of-00512.json.gz": {"num_bytes": 30175831, "checksum": "0d2800836914a1e2ef4a1aaea6e70d19699fc2555582ec670223177cac05a4fa"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00404-of-00512.json.gz": {"num_bytes": 30097682, "checksum": "f9665e9199978b123feb962ce347b30cc1520626c32dfef0ca3cd8895a45e445"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00405-of-00512.json.gz": {"num_bytes": 29810961, "checksum": "8ea29cf9f7774a16a4c2aaeff1b6353de2951073676a9c411f19b0a5fb755b07"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00406-of-00512.json.gz": {"num_bytes": 29963498, "checksum": "90b10c91f6e0006576ec9b426c424e50fc1726c25ae8eb91bf91bb9001ade2e8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00407-of-00512.json.gz": {"num_bytes": 30089554, "checksum": "cfa905514e4f19c4eb82e438f5eb987731004476f026f4bebbeeafbe519ec85f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00408-of-00512.json.gz": {"num_bytes": 30148002, "checksum": "dddada59e2ef306cdf83b7c9ce3c912792237852053a4ea683224438a242c5ff"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00409-of-00512.json.gz": {"num_bytes": 29989174, "checksum": "907667ac304b6cca7100a9606e915c003fee43f1640d5b01405beb16eac4c379"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00410-of-00512.json.gz": {"num_bytes": 30519580, "checksum": "acd5cd2ecc46927046c81c9bb3459dd72a98e346ebb59c13c0db08fbb60961a0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00411-of-00512.json.gz": {"num_bytes": 30408107, "checksum": "6a9c2d42717f853cd4a76fc5275e95e2a584b7465c6059f586f6a06417048a42"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00412-of-00512.json.gz": {"num_bytes": 29699198, "checksum": "29e76bdab47496ed61a102edd3c61c20e60ab52abeb8e6068f7aa4ad1868f4fc"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00413-of-00512.json.gz": {"num_bytes": 30065457, "checksum": "b4a33941d0b994b82e3be351542cb4a832742e050ebbd71481e7ba34c8dcbc3b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00414-of-00512.json.gz": {"num_bytes": 30342960, "checksum": "4ba7edb3c77a45f0e4cb7e969053db6f44ce8c0a8ef262582512814b1161d9ad"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00415-of-00512.json.gz": {"num_bytes": 30201576, "checksum": "25cb4eb4bdf3cd1b29289a23696be8bd41c5f577294e94607bea7b91252a04fd"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00416-of-00512.json.gz": {"num_bytes": 30021170, "checksum": "60472bd2a2896bfb57baabb583fc6cdd402a1d776f6a4c9bb58ed556e67cd76f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00417-of-00512.json.gz": {"num_bytes": 30237505, "checksum": "aea8fd33c2acf1cef890549b1f88b18a2eeb37f6d4dd22b552f735811ad0b8a1"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00418-of-00512.json.gz": {"num_bytes": 29999334, "checksum": "93583d771ce7f0e1d044de2919a3ffdd48b7b7dab0cd3b6dc459200dd53d8762"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00419-of-00512.json.gz": {"num_bytes": 30194801, "checksum": "cd36e129487272742f3e60ab6512dd79b3d1ce3c22490d2e47c00c2ae595cfc6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00420-of-00512.json.gz": {"num_bytes": 29903898, "checksum": "6f18a5ffc7efe5f555b02d3a31ed43714e09e73f7462206220d70450f47cd6f6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00421-of-00512.json.gz": {"num_bytes": 30015573, "checksum": "cfacef2cffd953425eaf4d7b2b6cf5d2637bf5d58c6ed2bd0002442795c7d36c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00422-of-00512.json.gz": {"num_bytes": 29966521, "checksum": "14f646b15948cf586ec1abd4bf4bf45bf180913e4d09049fa779bc7a196e455e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00423-of-00512.json.gz": {"num_bytes": 29972805, "checksum": "ad7d4ab443c7a8122976570891a225a44ff86d2299d70706066633a6204eb0de"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00424-of-00512.json.gz": {"num_bytes": 30317886, "checksum": "37c8bf3b535ea4053aa2424c846e3449f9eb27d5ff999e1e93b6cee0aa975333"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00425-of-00512.json.gz": {"num_bytes": 30059310, "checksum": "674ca5eaf6a88f76881c8a1c48e1e0f93794785ee5ea17fb70f49228d7f39614"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00426-of-00512.json.gz": {"num_bytes": 30182498, "checksum": "988d08cd18162d9a309155d2e75cd4980f76ab4c73ef8286edae94ca4628ebcf"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00427-of-00512.json.gz": {"num_bytes": 30253874, "checksum": "aa8c08a684ea0bbfda9297aea07429172a2fa4a161268b964421796173275b35"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00428-of-00512.json.gz": {"num_bytes": 30055421, "checksum": "b1ed26e826bee7fcbc31cf1c368c9a63eeedbea1c2fd0fb07370b461a03d1a7f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00429-of-00512.json.gz": {"num_bytes": 29830674, "checksum": "3efdc67ad7a108416dae47886e542da5c2ab1cd7e1aedd25c1c5d4e0607572f6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00430-of-00512.json.gz": {"num_bytes": 29938000, "checksum": "3221ef5e4c28d44c1da4fa04689f318217991c07aff4fdee5e1091fe8e1162ac"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00431-of-00512.json.gz": {"num_bytes": 29829687, "checksum": "225f4e22df1b45a7dc9fef2f5a44da8f8ee25608cbe34195e21b49c8cd10f3ed"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00432-of-00512.json.gz": {"num_bytes": 30006209, "checksum": "9fc53637db7b16c8cf6f824adf21d4602efab715ad78eab62c4be7981a8bbc1d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00433-of-00512.json.gz": {"num_bytes": 30656456, "checksum": "6bf7b701dc18f68d0facd7cdea49a26cdcfdd7829d5346eefe555485cfa7f336"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00434-of-00512.json.gz": {"num_bytes": 30138891, "checksum": "793532f72aa41c1dd7c549e9597fe8e73796c53eb5fe410a73de418ec446d686"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00435-of-00512.json.gz": {"num_bytes": 30430276, "checksum": "0d13d345ad12999fb4e7a9675e08bb1c90980fd193ed8530e4258e07bd6ea754"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00436-of-00512.json.gz": {"num_bytes": 30173309, "checksum": "fbce5fadb4b49bf833f77337929d873b2b25c3b564f7622f3672dde7a044e5d0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00437-of-00512.json.gz": {"num_bytes": 30142240, "checksum": "76c34800a3223f5fe0f1960f3d3c9dd9ecdc2e652493d71ef245415b5027c902"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00438-of-00512.json.gz": {"num_bytes": 29979673, "checksum": "4784c3787d24b9d46ad7c835683c6506c2e55c84835391e2aca0355f032a1888"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00439-of-00512.json.gz": {"num_bytes": 30169105, "checksum": "5012d03e637769d7494bd3cef0a8dfc8b38c995e0d5780089c15d6b1495b3a8e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00440-of-00512.json.gz": {"num_bytes": 30107004, "checksum": "529beaf4ad0251e35be574b1f623571526ec91a588ebd7df43e9d1cb99445f53"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00441-of-00512.json.gz": {"num_bytes": 30324563, "checksum": "f5e5fbf5e329f5bb0e83f758b8fc76516d65c3f91ad97e328187eaea83e4b667"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00442-of-00512.json.gz": {"num_bytes": 30335681, "checksum": "b8a26ed60f87a87347886b4467aa576ec5e8c106931589a1aa821b99fdabdb54"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00443-of-00512.json.gz": {"num_bytes": 30155655, "checksum": "e27bfb813fd6aba96ada81b095a559f0b7847cd25f7f8973663b19cdc5b8985a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00444-of-00512.json.gz": {"num_bytes": 30340540, "checksum": "705dec13ba2824d45e801bc2cf3e709d6492b1ff6de2f9ddefb5a57dbdada4ca"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00445-of-00512.json.gz": {"num_bytes": 30248960, "checksum": "09a6b83910369cf269c4f095607fb2f0ac0ec7e25b501f577fe13920a8573ee0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00446-of-00512.json.gz": {"num_bytes": 30316703, "checksum": "8f88b794c08bb492f50073337a30aafac0d05819505b507ab283dba0cf17d125"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00447-of-00512.json.gz": {"num_bytes": 30184407, "checksum": "38c819df823197bea6d647c3f78bcc15024aabba814cae322c1663c45fa8382e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00448-of-00512.json.gz": {"num_bytes": 30238484, "checksum": "8c0abfb8dca37a179b01dadd2227206cbe6e5b916d0111c0b00d2edc3951c7f6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00449-of-00512.json.gz": {"num_bytes": 30143151, "checksum": "9731e9644e5615d5d5ebdbacc6efa6382df856c8763b7485c9a5838864c1332f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00450-of-00512.json.gz": {"num_bytes": 30122606, "checksum": "3b746f616f21c91277cde8e6d0d7f792ead7874de7ecdf11830a4a56db3dc799"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00451-of-00512.json.gz": {"num_bytes": 30128179, "checksum": "d6cadfc64ee39c9beb93f0bf8c169ca9d9053e0f76e1c9697841438e20dddef3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00452-of-00512.json.gz": {"num_bytes": 29979326, "checksum": "42de19ffc3ec821fbf5ff686d1b36d189ad9ee5c4553a2ff0d003ee1a754c9c8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00453-of-00512.json.gz": {"num_bytes": 30118272, "checksum": "22f9b2d3a9f089f1015f74d1ca0aca8f2a4970595326d964817177cbe6859271"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00454-of-00512.json.gz": {"num_bytes": 30018294, "checksum": "17c16895edccbb8b40fcc52cbafc0c15957020eb530e071dcce34544d5958bd1"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00455-of-00512.json.gz": {"num_bytes": 30155903, "checksum": "8b9d49837b309c3389d03dd3bbae92395bf7086134fbc69d28d9fff60a90d4a3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00456-of-00512.json.gz": {"num_bytes": 30282104, "checksum": "ab63fd2efb0cc883d303241b3488a8135a196db7edc844458cfc1483898ceb3b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00457-of-00512.json.gz": {"num_bytes": 29920723, "checksum": "dbde2eeef90144b209ef5afa6d5165ad638ae57d919926a379a10fccf6850a61"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00458-of-00512.json.gz": {"num_bytes": 30163167, "checksum": "800307106f5861e0bc246bcaae214e6dadeee849905cac184ecfe6d0b560fa68"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00459-of-00512.json.gz": {"num_bytes": 30248893, "checksum": "3e78d327a9463929f33311e18116f5d1d2ae4926f7a600378875ba854cf5ee47"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00460-of-00512.json.gz": {"num_bytes": 29840067, "checksum": "047568a5dad00b04ca1ea4aa262c7a4af9b61e87bc4ea02ffd5c6c8c049bf8a5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00461-of-00512.json.gz": {"num_bytes": 30179062, "checksum": "ed8abe7b465bc19150b831632cb7afa298d6cb4beb9b6043a35a0f8afb5f730d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00462-of-00512.json.gz": {"num_bytes": 30266398, "checksum": "d7b74f5c1c1f7bb489700adcfb7e48400c4fcca7669e2d56396d9fabb5a63b91"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00463-of-00512.json.gz": {"num_bytes": 30158800, "checksum": "224815aee29f6d04ddbc7457c84338eef9b127a767e7b50ed77283ff166d4f93"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00464-of-00512.json.gz": {"num_bytes": 30393915, "checksum": "0dd019fd2c19936ce2e6410b65872f630131c5da7543c8e66fa87547fd1a2209"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00465-of-00512.json.gz": {"num_bytes": 30148939, "checksum": "6d74dc9d74d28c2b8ba8d43ba3d594af0cb176cfa7bf738f3933be2a9c37bb85"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00466-of-00512.json.gz": {"num_bytes": 30268228, "checksum": "0e201327066f28c19b082fe35e4fb3bd76c8fd2d32236d1d6e2309489152aa66"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00467-of-00512.json.gz": {"num_bytes": 30121937, "checksum": "7352e5a9ee66dcbeed2c9e1fbe6c9355f0e5dd1b30b592a9fd5690958945e5a9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00468-of-00512.json.gz": {"num_bytes": 30004669, "checksum": "53876848336ac57c082c9d5735bc1717f69ef38688b221d5e5ab9cd9cb4ec620"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00469-of-00512.json.gz": {"num_bytes": 30049860, "checksum": "a5a720b38f106dd5d2a2b7647748b52b4531ac12294e3b0d8dbc92062639c0c3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00470-of-00512.json.gz": {"num_bytes": 29961380, "checksum": "9611764fc4f84b92e86fa6f9ea41464f6c26b07d1c51241b627a3d155e99d163"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00471-of-00512.json.gz": {"num_bytes": 30449164, "checksum": "db508df549d518c3e8b99b2f0098ea93fead1e632f53d8ae2cebff1d3476577c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00472-of-00512.json.gz": {"num_bytes": 30312620, "checksum": "1993b5e292c6c60a3373aabe896f1a57afaad73fdce0ec60e30696368f7c0afa"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00473-of-00512.json.gz": {"num_bytes": 30406764, "checksum": "913045c61fb5a145379d9fe08c91ea63092b197400c0c87bfa65af91720b563c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00474-of-00512.json.gz": {"num_bytes": 30078563, "checksum": "c495119e150b083d709ca915abd760683793361ebf3e079b04efc9b7e1900379"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00475-of-00512.json.gz": {"num_bytes": 29860761, "checksum": "50bb5f40d2e91ab136aa63063fff860529c8961f2a38500a645b10339751589e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00476-of-00512.json.gz": {"num_bytes": 30199778, "checksum": "c969cfbb7ed7716f665b336b2ed9f7b10b532c7adc6d8a347964831a39cfef0e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00477-of-00512.json.gz": {"num_bytes": 30130742, "checksum": "54c8b89102cf882eda5208544a6c5d317c1defa8d997f9450ebd576e58f91830"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00478-of-00512.json.gz": {"num_bytes": 29901444, "checksum": "f669299d794ecc0523c64ad31af8fcce5cf3f880e87fd73f4c3f434425e9b238"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00479-of-00512.json.gz": {"num_bytes": 30587214, "checksum": "25d0fbd9027deaf140650f0b82a2316c37939f199fe7633b9f643684404f2029"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00480-of-00512.json.gz": {"num_bytes": 30145237, "checksum": "68a29728290e1199ce8d1ac060365bc443ea67c24292b2b04f1b4ca44ca7238d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00481-of-00512.json.gz": {"num_bytes": 30204159, "checksum": "1605034b89e33f6794c901adac1eb200bb489f76b9bae6bc56b01e9f6ab4c254"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00482-of-00512.json.gz": {"num_bytes": 30430794, "checksum": "2dce9df095e89ea6645fb599f518612511a62b6c475808ad004c32968b19bae8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00483-of-00512.json.gz": {"num_bytes": 30102412, "checksum": "c7c626977521b0d1f5bcc02c484b3eb4f517ba71006a4802df08a0f4cfb8ea9e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00484-of-00512.json.gz": {"num_bytes": 30171871, "checksum": "519ed997f1f1f1de7864b0bddf202b25e25bed349f63593a88337262d7705968"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00485-of-00512.json.gz": {"num_bytes": 30049539, "checksum": "8d2314fd3239ba3dfa99962c1d0a38e05edf9194e1faebae88f6b19ecab8fbf7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00486-of-00512.json.gz": {"num_bytes": 29949995, "checksum": "a7521e09cbe77098c23172427bfb931dd50f0c9d58b034fd1621687849a8d379"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00487-of-00512.json.gz": {"num_bytes": 30345072, "checksum": "ebc6254a4d241afb886b8df20819301121fcb234a32a1dd4ee8ae49571081f92"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00488-of-00512.json.gz": {"num_bytes": 30300622, "checksum": "509bba28ddf770d38554a2e846f2ce0d2af59e3662a6d6ec4dddb75fb509f8d5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00489-of-00512.json.gz": {"num_bytes": 29949909, "checksum": "996e61f8e674b0a016a568630ee13a7473f99a919437c225a4198d232861e628"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00490-of-00512.json.gz": {"num_bytes": 29995429, "checksum": "9730024ad352eb12f74ac446ed32b9c57898658954be5dd639184fc5264527cb"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00491-of-00512.json.gz": {"num_bytes": 30293919, "checksum": "65b2a7de3284e892441b0fe8e850d89de842355d78fa9944358b1ee5912a948f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00492-of-00512.json.gz": {"num_bytes": 30115831, "checksum": "26b535c3175bb86ef721593f81d9cf006d4c3749f156c63ccd2a2c04e1201236"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00493-of-00512.json.gz": {"num_bytes": 30187809, "checksum": "a0918223c5523da20bd8230de1985b0a3cbb1e239af3d62a83d720a3a528c567"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00494-of-00512.json.gz": {"num_bytes": 30149878, "checksum": "6e9a5e329f834e41b4a8a9a6809df3243e5bffc580327912288ad7f790b43ab7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00495-of-00512.json.gz": {"num_bytes": 29711944, "checksum": "3b9ba9d667e1241692ff9a654a68e98e8e94e32244a9419b2542137b63fb4705"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00496-of-00512.json.gz": {"num_bytes": 30114815, "checksum": "24b78cc36bb0abc67c998320e7029b6e7bbbee267a367eb538f23956c13f27a9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00497-of-00512.json.gz": {"num_bytes": 30048480, "checksum": "29c3606acf298498fc3498bd769544e2879afbd0d5c46cee298cb25058694aac"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00498-of-00512.json.gz": {"num_bytes": 29934973, "checksum": "8afaffea92dfad745be8aa8cd3de0ee97cbcc26fbad6c71d56683aef6a27055f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00499-of-00512.json.gz": {"num_bytes": 29796509, "checksum": "9cbbd8f6d8fe92207c4cb2f0422284726deca1bde7f30cb01cce7fcd4665b380"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00500-of-00512.json.gz": {"num_bytes": 30221736, "checksum": "902904aa9fadaecbe698402a27b4e68b00813e67b79f84d4c696cd9c72f08f55"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00501-of-00512.json.gz": {"num_bytes": 30108320, "checksum": "76e848f8dbc082158fc5d3a2f7c10cd6e03585667c00efc639f2c6f47d44aeb2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00502-of-00512.json.gz": {"num_bytes": 30381907, "checksum": "885bbc9788235abf33728737f72f267e60d1f5d4a77493cae76f161651d89579"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00503-of-00512.json.gz": {"num_bytes": 29983805, "checksum": "5134934392b13e3f84dd32dcb1c59f4d5416d6dfd925bf896f3eb61881d82136"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00504-of-00512.json.gz": {"num_bytes": 30041413, "checksum": "4978245a7f545d676bad6edfdfe60ffdad94de47af0fb10649fa39e9b068939e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00505-of-00512.json.gz": {"num_bytes": 30021620, "checksum": "64933c28ea3f608326f1c6ef56170886767f1ab4f9ecbc4bf3263c7043901fce"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00506-of-00512.json.gz": {"num_bytes": 30260343, "checksum": "84667dbe68ecf1f9bbdaba0e73eca6fe0444f6594a1e9a4b46e9812ae7bce7d0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00507-of-00512.json.gz": {"num_bytes": 30173739, "checksum": "dd6d44e4f344f3ab1cd61bacced7b5f1429cf6823fc9282452a539012bda028a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00508-of-00512.json.gz": {"num_bytes": 29903443, "checksum": "4afc46096ac2697867c3a75896c5ceb36617c4c21a749dded58a1ea4565e41df"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00509-of-00512.json.gz": {"num_bytes": 29862664, "checksum": "74a720dc16b389e8122d61aa94bc12a5bc4253ca6f39679781c938e2eb556878"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00510-of-00512.json.gz": {"num_bytes": 29744368, "checksum": "6a302049e7a1668c5fb2e4b5afca518fa53ba1a9dc717015ecb5768e85ec4139"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00511-of-00512.json.gz": {"num_bytes": 29896714, "checksum": "48b89e909c0e33fd59c9623f8517cdfa90fa35a4641f999c6f68e1cc9f2a309f"}}, "download_size": 15419740744, "post_processing_size": null, "dataset_size": 76331315892, "size_in_bytes": 91751056636}} \ No newline at end of file From c7ab0a459fc9624def253235f0e92fc6448b7bd1 Mon Sep 17 00:00:00 2001 From: Quentin Lhoest Date: Thu, 1 Jul 2021 14:14:40 +0200 Subject: [PATCH 03/19] dummy data --- datasets/c4/c4.py | 2 +- datasets/c4/datasets_infos.json | 1 - .../dummy/en.noblocklist/0.0.0/dummy_data.zip | Bin 0 -> 5689 bytes .../c4/dummy/en.noclean/0.0.0/dummy_data.zip | Bin 0 -> 5689 bytes datasets/c4/dummy/en/0.0.0/dummy_data.zip | Bin 0 -> 5689 bytes .../dummy/realnewslike/0.0.0/dummy_data.zip | Bin 0 -> 5689 bytes tests/test_dataset_common.py | 34 ++++++++++++++---- 7 files changed, 29 insertions(+), 8 deletions(-) delete mode 100644 datasets/c4/datasets_infos.json create mode 100644 datasets/c4/dummy/en.noblocklist/0.0.0/dummy_data.zip create mode 100644 datasets/c4/dummy/en.noclean/0.0.0/dummy_data.zip create mode 100644 datasets/c4/dummy/en/0.0.0/dummy_data.zip create mode 100644 datasets/c4/dummy/realnewslike/0.0.0/dummy_data.zip diff --git a/datasets/c4/c4.py b/datasets/c4/c4.py index f88959ea5a3..01838eb53e8 100644 --- a/datasets/c4/c4.py +++ b/datasets/c4/c4.py @@ -74,7 +74,7 @@ def _split_generators(self, dl_manager): for index in range(n_shards) ] train_downloaded_files = dl_manager.download(data_urls["train"]) - validation_downloaded_files = dl_manager.download(data_urls["train"]) + validation_downloaded_files = dl_manager.download(data_urls["validation"]) return [ datasets.SplitGenerator(name=datasets.Split.TRAIN, gen_kwargs={"filepaths": train_downloaded_files}), datasets.SplitGenerator( diff --git a/datasets/c4/datasets_infos.json b/datasets/c4/datasets_infos.json deleted file mode 100644 index dfb882a7201..00000000000 --- a/datasets/c4/datasets_infos.json +++ /dev/null @@ -1 +0,0 @@ -{"en": {"description": "A colossal, cleaned version of Common Crawl's web crawl corpus.\n\nBased on Common Crawl dataset: \"https://commoncrawl.org\".\n\nThis is the processed version of Google's C4 dataset by AllenAI.\n\n", "citation": "\n@article{2019t5,\n author = {Colin Raffel and Noam Shazeer and Adam Roberts and Katherine Lee and Sharan Narang and Michael Matena and Yanqi Zhou and Wei Li and Peter J. Liu},\n title = {Exploring the Limits of Transfer Learning with a Unified Text-to-Text Transformer},\n journal = {arXiv e-prints},\n year = {2019},\n archivePrefix = {arXiv},\n eprint = {1910.10683},\n}\n", "homepage": "https://github.com/allenai/allennlp/discussions/5056", "license": "", "features": {"text": {"dtype": "string", "id": null, "_type": "Value"}, "timestamp": {"dtype": "string", "id": null, "_type": "Value"}, "url": {"dtype": "string", "id": null, "_type": "Value"}}, "post_processed": null, "supervised_keys": null, "task_templates": null, "builder_name": "c4", "config_name": "en", "version": {"version_str": "0.0.0", "description": null, "major": 0, "minor": 0, "patch": 0}, "splits": {"train": {"name": "train", "num_bytes": 828589180707, "num_examples": 364868892, "dataset_name": "c4"}, "validation": {"name": "validation", "num_bytes": 828589180707, "num_examples": 364868892, "dataset_name": "c4"}}, "download_checksums": {"https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00000-of-01024.json.gz": {"num_bytes": 319308785, "checksum": "8ef8d75b0e045dec4aa5123a671b4564466b0707086a7ed1ba8721626dfffbc9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00001-of-01024.json.gz": {"num_bytes": 318039285, "checksum": "b945059cd1a343cabe311881b7840a6f0363f570e745a0eff0e687e266f6b55d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00002-of-01024.json.gz": {"num_bytes": 319748667, "checksum": "2967dc7e587ced6ecb9ba617ad2d4c44901467969de5bf5b0f5a9e5b70555d75"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00003-of-01024.json.gz": {"num_bytes": 318564193, "checksum": "b79d9abef5741578929be0d59db9ca652a8276207ef18a944b7a5f11fef5beb6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00004-of-01024.json.gz": {"num_bytes": 318579884, "checksum": "cd9f98eac2bc6062f55d9a36bd744cc924a78ea2fd998830e0034e4456f5d014"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00005-of-01024.json.gz": {"num_bytes": 318003681, "checksum": "8ac5907a54dbc7ab9c14624448c7c3f6afed33af9d0a855f1eae955e62e255b9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00006-of-01024.json.gz": {"num_bytes": 318495137, "checksum": "8fd9b9a4b74c9414466b245ebda7db041e7bd8603971de51b5db782bd758aac7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00007-of-01024.json.gz": {"num_bytes": 318417273, "checksum": "41dd377a1ba6b72eab0260c39c626fe45ab6b649d42d57b311d3ba21a0337cd0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00008-of-01024.json.gz": {"num_bytes": 318131845, "checksum": "64da652c235f089a0b52f6db5883ef5f1e9c31edc4c950332b34dd12439c99a5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00009-of-01024.json.gz": {"num_bytes": 318185592, "checksum": "807a548efbb10153c9eff0df5733a97a1b51ab1743242530de1b02a8ea17ace7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00010-of-01024.json.gz": {"num_bytes": 319045292, "checksum": "3bd0f6f664069c3bd964ce48ceae60ba47b55b54745a4b00c207bdb3a1926b17"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00011-of-01024.json.gz": {"num_bytes": 319686980, "checksum": "5baa0c010083459ba58e34b4e93bb758caa878f7db6fba0528921329fa1a6cc5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00012-of-01024.json.gz": {"num_bytes": 320119088, "checksum": "fdee7442c06856e2c4b7665cc51978e9011b5e0a2112c30dd15bc9e53818842d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00013-of-01024.json.gz": {"num_bytes": 319474856, "checksum": "a4ab3b24087781c3577945492525696e182ffd7ca5265b958f49803a02867ecf"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00014-of-01024.json.gz": {"num_bytes": 319693210, "checksum": "62215b2451e71b117018ef73570c944aff890624b384c538950b64c37f184c49"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00015-of-01024.json.gz": {"num_bytes": 318427305, "checksum": "9893c9f413a1223e7b535527829bcd6df3219929fb1abf8f2a114dd8f6ea0919"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00016-of-01024.json.gz": {"num_bytes": 318785714, "checksum": "bd0ade8b8a57348952ca31c39efdab538f54c852941a225ccd13d0a7170724e3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00017-of-01024.json.gz": {"num_bytes": 320134331, "checksum": "4132cfff3f5126d9e783191a5ccc34e5d85938bebf0b8489657805277a227202"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00018-of-01024.json.gz": {"num_bytes": 318653930, "checksum": "4675ab1d77da3d676d9743dca15bfce8478498f7738f79816a25ed790d28fa46"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00019-of-01024.json.gz": {"num_bytes": 319468974, "checksum": "1d2f3a6aeb0f6c159295f283d302794cd3eb944cff3fe68691997bb2dc4c7780"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00020-of-01024.json.gz": {"num_bytes": 319109754, "checksum": "b5f26d832a0ec9b0489a27169d94496f5ea33c7fb046868c565c7b5a2407221b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00021-of-01024.json.gz": {"num_bytes": 318514423, "checksum": "428da5a8d4585de16f6b3f30865a5ca7a8d1ddcd3b6002dcc1283368b0c3d60a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00022-of-01024.json.gz": {"num_bytes": 318715623, "checksum": "9bc4812ba5e08c0b2d83cd3804129ba3d77cf84ba3d8828159788ee02e155a51"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00023-of-01024.json.gz": {"num_bytes": 319874293, "checksum": "38843ab4f5c60ed2b9ec0cdc65074eaca454014d5702edd809a266190689d2c3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00024-of-01024.json.gz": {"num_bytes": 318105764, "checksum": "4fa0c7ec94445ea57dcecda7864b1346275e711c9820c2c39dbb9fdb95c97674"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00025-of-01024.json.gz": {"num_bytes": 319122521, "checksum": "0758514fa2e2c133c995c00d5f4abfc14b66582a4eedd0e721bdd95c4632a755"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00026-of-01024.json.gz": {"num_bytes": 318116783, "checksum": "56a73b9a556d6794d9c706e1b1c7e729fa13b711ddc25dd403b110eb5ed857f1"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00027-of-01024.json.gz": {"num_bytes": 320171191, "checksum": "fea1eabb734cda33d72f3d959234a240080b4fd42cc70494814a8429b087f9e1"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00028-of-01024.json.gz": {"num_bytes": 319047090, "checksum": "47d1c385952d6c18c431a7294339a030c213b8832f970ac987965b621c8181a1"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00029-of-01024.json.gz": {"num_bytes": 318705639, "checksum": "3c744d3dd915ceef3a93fd18c3ff5b117fb5118d1ced2089979b6cafc81c4525"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00030-of-01024.json.gz": {"num_bytes": 318327902, "checksum": "7f6959020242fdc841adfc10c102bbe79e2ef8502a09dac8451e0cec6f2add16"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00031-of-01024.json.gz": {"num_bytes": 318990600, "checksum": "e56f29011594c765192c34298558e7227a829313196748f9a16ec34ecdb76d23"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00032-of-01024.json.gz": {"num_bytes": 320451482, "checksum": "9ea843dfd85e449439f3106d657762daff8f326730fefb342455c43cb48144e3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00033-of-01024.json.gz": {"num_bytes": 319878207, "checksum": "2633cdb7b058f126173608897f69add614659b0b21cf54ecc8a2f4a79bc16073"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00034-of-01024.json.gz": {"num_bytes": 318701510, "checksum": "853c4b9ff2d79621ed27a6be826dae198af609d9f9dbd1c2773b778241cf6137"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00035-of-01024.json.gz": {"num_bytes": 318529104, "checksum": "fb50dac3f35cb71472464f511e6b8aee72ded10b3b6896d0d1f74a18ded2b8d3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00036-of-01024.json.gz": {"num_bytes": 318849657, "checksum": "5cef5cfd50cfafd58feb452b85324a3d8198fca48789f0ce69227755e72d8e53"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00037-of-01024.json.gz": {"num_bytes": 319621215, "checksum": "f0b67abf30e2d58d291aa9bcc9c8a03668afe819549802e4e591a261c171d970"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00038-of-01024.json.gz": {"num_bytes": 318135467, "checksum": "991bad578a83294d34a1b11649af07339aa8cb26d49330afa9fcbca0b87942c6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00039-of-01024.json.gz": {"num_bytes": 320131759, "checksum": "abbbc21f81555e94484e6afe1975e13f67af19a820cd6f8d090c987a250bd4fd"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00040-of-01024.json.gz": {"num_bytes": 320214476, "checksum": "48020d2656709899abd2572b3424c0455df3c1089a69fe26b776aeb24f0da0ec"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00041-of-01024.json.gz": {"num_bytes": 319581259, "checksum": "db6fb8db7162ac87ea002c153ef0c54322f24c8f7ec263cfa290ac8c3683b194"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00042-of-01024.json.gz": {"num_bytes": 318100985, "checksum": "d499cba2383b16bb0f26b98416211eabf2599641ecd6708a5ef487692ca9e791"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00043-of-01024.json.gz": {"num_bytes": 317803029, "checksum": "dc6f1ccc3fcce79b16c5157f7125942e351d74744efc593f8372f8a408720340"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00044-of-01024.json.gz": {"num_bytes": 318837063, "checksum": "6170fced793461bd687640a658a085d02f971c2e609f6ff33b90df944fb56409"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00045-of-01024.json.gz": {"num_bytes": 319659188, "checksum": "b2f79e8600815578ec326cfc6c5242c2827cedbfac51772fdcf15ef5d027aa38"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00046-of-01024.json.gz": {"num_bytes": 318771753, "checksum": "e4b4a3e53ee66c280a5e7ee33602ea0e910903748db8c2adbbec4b48bab1580e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00047-of-01024.json.gz": {"num_bytes": 318088661, "checksum": "bf8597fc359d8e9c721fd1d98b8ff3db5c011afd0fec9640670f31c7a7dddb79"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00048-of-01024.json.gz": {"num_bytes": 317777133, "checksum": "369db8e9646b8229a23044a7257c2face97b8e05738f0413b581892876f268e1"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00049-of-01024.json.gz": {"num_bytes": 319329891, "checksum": "5cb2aa0432984b355b0ec6aad92f926b2fb75aea2a0e08b97f4c6a62838e6cc8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00050-of-01024.json.gz": {"num_bytes": 318172322, "checksum": "11a7cc48539ac97eaec87beacef9d9bbb71fc875a0bff0c9ff096044bff46a44"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00051-of-01024.json.gz": {"num_bytes": 318704544, "checksum": "ac2beee992c2b1ae8b1f162054e843e2b971bbd7cec45a0a7a7b7795fcdc7c26"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00052-of-01024.json.gz": {"num_bytes": 320806303, "checksum": "3a591fe9993c3d98a9e7949e98ca215ce164cd313fe53f3ce762c91b5fec7c53"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00053-of-01024.json.gz": {"num_bytes": 320565764, "checksum": "60e67c8e6f3bfdf8b490ecfe62c79a13c5d04d393fbac712a6cda49fd78e883b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00054-of-01024.json.gz": {"num_bytes": 320425170, "checksum": "d69305c853e9e516f5fd4e2a9afb1939d829925f71102d8aa09387ded5d000df"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00055-of-01024.json.gz": {"num_bytes": 318713224, "checksum": "e01737df8097a1526d6c31d37d7aeb1b92c0a7253b39f6964fcc897bf0eba9fd"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00056-of-01024.json.gz": {"num_bytes": 319441227, "checksum": "fe516c8c0a9e59f9f035ac5fdd13e973d25dd6635eee05d648740d3e8c1fc742"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00057-of-01024.json.gz": {"num_bytes": 319821142, "checksum": "7e058ed9072e968e9c8b92f9b50dab318515873cca6c617b544dacab5a2f018e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00058-of-01024.json.gz": {"num_bytes": 318643105, "checksum": "3479dc5a5b111b7f45f87e5a91c433907af97dbe15b9db1637bad666dcbdec40"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00059-of-01024.json.gz": {"num_bytes": 318053548, "checksum": "8208b0943f59b5914fa13d29108ede31a8d8d34bc6d603a2278ab8b80d28b1d0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00060-of-01024.json.gz": {"num_bytes": 317935826, "checksum": "71324b62706aabd6faee682205cdedcd10dad289579b534d0e53f8d9b92bf2c0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00061-of-01024.json.gz": {"num_bytes": 318870698, "checksum": "cdf0abc5804f0991871de48b249e30b666cb96f2254762a570c39904c5780f8e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00062-of-01024.json.gz": {"num_bytes": 318945246, "checksum": "5ac676e16108446bd2980f9601c787eb754811a68e92ab6403c333820a6b9622"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00063-of-01024.json.gz": {"num_bytes": 318827790, "checksum": "a26f7cfe123cfdf3db7687996d0163212e70ff7635872b0754c03cbd5c31213a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00064-of-01024.json.gz": {"num_bytes": 318914155, "checksum": "858a145617a5902ab02bc77e47ee2f036a6211384c4f2285767c7558eb93e245"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00065-of-01024.json.gz": {"num_bytes": 319794084, "checksum": "52742215df5aaca43bed5405a397571efe7c22107ee2caa8c05e3ed229796efa"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00066-of-01024.json.gz": {"num_bytes": 320294453, "checksum": "5b11cd54de0e95a75e53e4e32f72912cb01053d3fb609de6b7a45afafab414d0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00067-of-01024.json.gz": {"num_bytes": 319468309, "checksum": "4c6c69b3eba9bcd6786d7dce893340f2d7093012ead04f3539352beccd2794ef"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00068-of-01024.json.gz": {"num_bytes": 318800742, "checksum": "ce94afc3c612e9de423a412147505ad7757216100becba2677bf5eaf443c4b6f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00069-of-01024.json.gz": {"num_bytes": 319416585, "checksum": "ff3084a3e5a3960425a5c605274684c42fa638f99045527f77e74d165e52b6ea"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00070-of-01024.json.gz": {"num_bytes": 319165846, "checksum": "04c368b05f0ea42b3a51ed9bc0e817894f205c0ecd74084da015158d509ff2a3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00071-of-01024.json.gz": {"num_bytes": 318017381, "checksum": "e8320e9982fa377b07c5b3e8a4451ac143b05ab7a4a03f748034b37fb998bfb0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00072-of-01024.json.gz": {"num_bytes": 318874499, "checksum": "920f8d5ef2cae6bdbd52f724d0952e04146ff29f4aaec4dbf10bef7b66a98f40"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00073-of-01024.json.gz": {"num_bytes": 317890112, "checksum": "06a41bdb7bf0d52e2fe8e71f594de8d36d77880639ffdfb41e883237f76e8a0f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00074-of-01024.json.gz": {"num_bytes": 319201956, "checksum": "e0267d6782d30f1619a82c49c20be1c8b5424e653c093e4652a5c8ed117c6533"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00075-of-01024.json.gz": {"num_bytes": 320575937, "checksum": "42108758abc3c3197e7dca8293eed3800f3e79ceae80d3208d90c7a9fd205594"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00076-of-01024.json.gz": {"num_bytes": 320070510, "checksum": "c904b6e6041e23edeb1d88b7b69f07a339b7ff9835d0c22e0b6c354519369842"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00077-of-01024.json.gz": {"num_bytes": 319042024, "checksum": "1eb2b70ad4d12b7587eeb1ce86477817ad992c08fecafe5ccafc26af6b5657f7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00078-of-01024.json.gz": {"num_bytes": 319997520, "checksum": "070370654960e02f766c10321546b280e9933531b796c252a94999d645f360b2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00079-of-01024.json.gz": {"num_bytes": 320736487, "checksum": "3aa4f007660706563030b590cef9be992c18ba7ec1876210bc92665ec42c4be2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00080-of-01024.json.gz": {"num_bytes": 320082337, "checksum": "3b54eaf407bb593c2b16df99690446f26497530d21cf433a7d525e0eaebe9c3f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00081-of-01024.json.gz": {"num_bytes": 318008114, "checksum": "d01975cdbd4360331b1a0f55e9b7e731d7d9fc70c7cdd0f33f1c772eff7aa03b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00082-of-01024.json.gz": {"num_bytes": 317829809, "checksum": "2a65dd37027fae03819ea5a5f6c3b16d921706ad758442881dc1d15b08bc5048"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00083-of-01024.json.gz": {"num_bytes": 319265318, "checksum": "e14cf18c687f7eb304df6abef7235e263a5736c799d742524205dead2abfb043"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00084-of-01024.json.gz": {"num_bytes": 319166958, "checksum": "1dc3fa8702a4477e3a3128440b68d4cc17e6d2ce7f3c53da28d50a57b8332020"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00085-of-01024.json.gz": {"num_bytes": 320338078, "checksum": "0222db7b1ae14c9b10aacdb05d055d1432b6d035e3937df5640facd242c52aea"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00086-of-01024.json.gz": {"num_bytes": 318941314, "checksum": "55ddf7a27dc91bf8d932a5efec4aa458122ee337f2cb050e2c4b0ae8e770f3a9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00087-of-01024.json.gz": {"num_bytes": 319218368, "checksum": "c61552d76bedbfa750c599a674d6732fb224c8a1e6c6583fca7ccabb20532920"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00088-of-01024.json.gz": {"num_bytes": 318974308, "checksum": "693fae3d50068ec39ad27a14335372c3e1530138cc65931edac5268dd62b7e96"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00089-of-01024.json.gz": {"num_bytes": 318781044, "checksum": "2d90b9318432a2313dfaec542c8b91431505035cca7416a63e3197ab26ad6e75"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00090-of-01024.json.gz": {"num_bytes": 318569651, "checksum": "ee674beda8ed39395e69c899f666990c5190dfad5494867e51fa727e4d38d86a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00091-of-01024.json.gz": {"num_bytes": 319683433, "checksum": "add2489350310ce500dde6637518c747c156f95f079a34367842bf875a8fdf5b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00092-of-01024.json.gz": {"num_bytes": 318734793, "checksum": "5cfd4f25e9effaa2f7381bfcf49f9263e10619811aeaa32a77d3fdfc13517006"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00093-of-01024.json.gz": {"num_bytes": 319161014, "checksum": "bed8774909bba5ac656ebaad6e5cacca9e5ea12c80a41fd5689e6798c74f3c89"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00094-of-01024.json.gz": {"num_bytes": 320143246, "checksum": "96abe370925f6962b4e75da530b5234eec21fab820d6cb02ae59b6070ab63859"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00095-of-01024.json.gz": {"num_bytes": 319707377, "checksum": "37b68cd632e8f86f364fd61c9581f48ad7602122b7f33c55103ac5bd727f015d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00096-of-01024.json.gz": {"num_bytes": 320159279, "checksum": "fb93c7467f0361c1d4b186d5e25f4bce4f237adb33b4e0ef56f57831b4f97f81"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00097-of-01024.json.gz": {"num_bytes": 319841818, "checksum": "7f4d4a9536e37a0c2b9a1806fcb472784ff4d3840aa57e9603e74233b877fbac"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00098-of-01024.json.gz": {"num_bytes": 321001731, "checksum": "239b9fefebe3815c8d785bd48086013d1a6dcd76c142786502c674d2d874fb11"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00099-of-01024.json.gz": {"num_bytes": 319475885, "checksum": "0a610d25a547839b8b6dfc2fd964e3ca64b23f0edc52d311c89dcb5e8a44a2c5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00100-of-01024.json.gz": {"num_bytes": 319515329, "checksum": "f24d17cbd27296a15f51b9edc713c74a6997bbe82267403fdb6282404c2f4e6d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00101-of-01024.json.gz": {"num_bytes": 318803422, "checksum": "54b8b0c72ffa325abce3dd15bdcd0856b5594500c37f4bc6a6327721ba91e4bc"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00102-of-01024.json.gz": {"num_bytes": 320934688, "checksum": "24b99b4afa3b631a718a487d679026c91e2c936132df01df969e3173b49e091f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00103-of-01024.json.gz": {"num_bytes": 319835920, "checksum": "a2c68654ba81fa55bc24beb4319c8905f7b532fcb6793a6a311344d4f98a82b9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00104-of-01024.json.gz": {"num_bytes": 319402378, "checksum": "27764d82793e35b8a7be3a3fb0470d018243a89283b5501c0b76056de1879389"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00105-of-01024.json.gz": {"num_bytes": 320100928, "checksum": "3bb2499337ebe52b63a5f20ec6ca6283971937962439699bd5e483cf80fed02a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00106-of-01024.json.gz": {"num_bytes": 318707110, "checksum": "83510312aa188431a8dda8746903d70cfc7ffdf5437e44c1f74b7670b78bd52b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00107-of-01024.json.gz": {"num_bytes": 319904239, "checksum": "40d42c39dea8e4898efba1886aa3be67742501f7a51d5bc635b03a2c6c2bd63e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00108-of-01024.json.gz": {"num_bytes": 320050265, "checksum": "88ce3ddae88e8024e76614a1b701c157f66fe39c6f0852a4869c5063876f6e87"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00109-of-01024.json.gz": {"num_bytes": 318053254, "checksum": "865a124b663037f36a5738f25c82f8bea2ab54d4bbf8255ca0d1d00d76f8b250"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00110-of-01024.json.gz": {"num_bytes": 319794699, "checksum": "b17e210c8ceef98219ee12eba5dddd2001ded0d417c93955743c238360d96e76"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00111-of-01024.json.gz": {"num_bytes": 318761540, "checksum": "05be318a057bb33bf9d7faca58569cdb0880fe8eeb0fc3f57f5999d5f2af55fd"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00112-of-01024.json.gz": {"num_bytes": 319121509, "checksum": "858dce8e43b06a0c1e26ab3e4f109814b6cc50c6b0e4d146ec79fda001ad471d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00113-of-01024.json.gz": {"num_bytes": 317916736, "checksum": "2e3968e48cb15a3326457d5a6ad49838d20d38c8138c529eee51f94e6bf269e4"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00114-of-01024.json.gz": {"num_bytes": 319319540, "checksum": "b72dc8207d93848f4fcb265b3e618d0eb8649445f7b9187c5165f4adec3e0708"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00115-of-01024.json.gz": {"num_bytes": 318863372, "checksum": "85ef0bf3cb12bc2fede4158853ed2259dff5d25adf99b43e8c35d7e0b9d4fdd3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00116-of-01024.json.gz": {"num_bytes": 318898370, "checksum": "a0c82c8b48e086be7396338cdda0fed52e8c4753f04fd086b9472c1bedfb150c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00117-of-01024.json.gz": {"num_bytes": 318153138, "checksum": "531d5d03fd8099806d92fbff2a48a0d68dcf46325e732e698e9c142902d152f5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00118-of-01024.json.gz": {"num_bytes": 318966511, "checksum": "24b1c5ebbd07d50043be0d5d5c5427e042bdc53280825260226a2823e9b7546b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00119-of-01024.json.gz": {"num_bytes": 318733748, "checksum": "ce1fb1192b770e625430798aee94c93bd748ed474ff815a7f95cadebb826161a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00120-of-01024.json.gz": {"num_bytes": 319672996, "checksum": "4c2a6874921ac4a626a9c8ac4c6e91dae58f1f5b52e79124b3abf254b7433119"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00121-of-01024.json.gz": {"num_bytes": 318779046, "checksum": "029d3ab92f3e1724e3708790148e63b4c211d2ddfd04e3d194b24145e97c922a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00122-of-01024.json.gz": {"num_bytes": 320861175, "checksum": "4bb595140e5cf92147f99b58d236634ddfafbc0b160b4c88b337255482611ced"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00123-of-01024.json.gz": {"num_bytes": 318338141, "checksum": "d508261be287fa3d27e5f44524e22870269054213b61011ee8a6728a77910cc0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00124-of-01024.json.gz": {"num_bytes": 317655056, "checksum": "7612cb9fdd9f4b3a4f8958087ace120d4a73cf26bd16289bb20fc871f5744f2c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00125-of-01024.json.gz": {"num_bytes": 317524610, "checksum": "049ebe4971811bb1fdcfd10cc264b2074b3ace18536340644e718dcc3cf3affb"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00126-of-01024.json.gz": {"num_bytes": 317902192, "checksum": "d97bddf003b8f647c587fe9a9a9aed75ea604478e0b550d501ad7f07b6061b86"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00127-of-01024.json.gz": {"num_bytes": 319243191, "checksum": "6da4c882f88816a452af54ed217f84d6e4601c11a8e33bd47c49c0a1ea04f49a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00128-of-01024.json.gz": {"num_bytes": 318045852, "checksum": "ea43f63e6ef3bb5723ce75bb51f7183a525d8ccb00c93f49aaf2d9b560f7bdbb"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00129-of-01024.json.gz": {"num_bytes": 318436174, "checksum": "72ceb525367d6e8d1c0fca94d99d4fe5353ead08a5d52bf00e30e3b596fa90a2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00130-of-01024.json.gz": {"num_bytes": 319017217, "checksum": "92f1b2687bee78441eeb4e05bbec2a491469b23c3aad0d951fbbe35a3c27998a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00131-of-01024.json.gz": {"num_bytes": 319237739, "checksum": "0fd07585a82b7d71ddabbc315195c84e2fa78a8319de7dea971cfcc9b38707b7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00132-of-01024.json.gz": {"num_bytes": 318123742, "checksum": "c9f5604ca28ea2a9ae5267db50f6e3d1e576841abe840134b3817f370c057073"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00133-of-01024.json.gz": {"num_bytes": 319009751, "checksum": "7ec982de577e0eeff57dc60346ce35a7b35b3c4f037987316cfc071b0ed58a87"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00134-of-01024.json.gz": {"num_bytes": 319750057, "checksum": "2619d265d76d82f6b84e2686371e5b6d6c08058cbd5765dd2906af9f549af092"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00135-of-01024.json.gz": {"num_bytes": 319068231, "checksum": "5e1bf5b09f2cd132a7747116442d6f26ce0002eaeb9f56fb02bc00e3abee8716"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00136-of-01024.json.gz": {"num_bytes": 317800994, "checksum": "80ebbf64fbd91215da553e3a8d9442380cee6c3b09fbbf8353a0817993d15862"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00137-of-01024.json.gz": {"num_bytes": 318954070, "checksum": "3b5d2ccafe526a19c52ac0fee50109b6a95ac3c8f7f2272a9a0302c4219e82f7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00138-of-01024.json.gz": {"num_bytes": 318452853, "checksum": "2dd88569a62003383a3bf70d68143f16f234535469bdc8ab01a8764f6babb5fb"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00139-of-01024.json.gz": {"num_bytes": 320013821, "checksum": "f32ca62f6a9d2c8a72901e6f2c08880c2d1907f52beb4e8fdc30f4c02c7ad10b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00140-of-01024.json.gz": {"num_bytes": 319510423, "checksum": "7799838d8019d7cd71a505951f155bdfb862b4a3b3b77e182c706a624617169d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00141-of-01024.json.gz": {"num_bytes": 318339814, "checksum": "1601f6dbcbf4e7f1db119b232e862f3c9fe29e9abe5827177458079299ed511e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00142-of-01024.json.gz": {"num_bytes": 318438444, "checksum": "71d891be156e1b608733a3abe8f8dab7a6213c02931117b99889bc3fe8329d38"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00143-of-01024.json.gz": {"num_bytes": 319413540, "checksum": "88fb2e7c3d426a6bb5775041658c07005a469306af0d97df7d68f148b64cbfe8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00144-of-01024.json.gz": {"num_bytes": 319901095, "checksum": "2734ff57f4265653b0b1f292f513017ba791c3091cf8ac0bbf6d75d0074e3386"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00145-of-01024.json.gz": {"num_bytes": 318500183, "checksum": "da2e6747f7230af5941c6bee262a606b4f7792da359dbf7516d82d8301cdf90f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00146-of-01024.json.gz": {"num_bytes": 319315120, "checksum": "6daac97153d51addc8b1e43b686e3d641666df3a106270a141d734079db2ad35"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00147-of-01024.json.gz": {"num_bytes": 320621434, "checksum": "fb2584e0ce366ad30c8110591484b84798e9f06e8a27cd864e7800b8d5e2d225"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00148-of-01024.json.gz": {"num_bytes": 318269045, "checksum": "1c963c0ceb6cd776822352b186ae7e3d829ef334efcba0fbdd9182dde4deed05"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00149-of-01024.json.gz": {"num_bytes": 318576426, "checksum": "6a21397e0104c7fe0fcd9f1d43a8e546000596d896a95eb9b6c4ab92235e6a49"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00150-of-01024.json.gz": {"num_bytes": 318447048, "checksum": "075b113a73e6e21d7cac49391ee559ee8aaa2bb3338f709017077a4007a7bbb5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00151-of-01024.json.gz": {"num_bytes": 315388730, "checksum": "bd47e3ac0209676d8a32490eb20ca8c07ca3c45c2beb88dae18b5c8d925f349a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00152-of-01024.json.gz": {"num_bytes": 319701880, "checksum": "241d9cf003f49d95168ebdeccd8209230507d4dfd0d170fa1b57d2355240a95d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00153-of-01024.json.gz": {"num_bytes": 318370254, "checksum": "3aa86900a749224dfed8a67960c166e43c3b9ef3ac7b49d28129b496c7193e30"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00154-of-01024.json.gz": {"num_bytes": 320064875, "checksum": "3160c723cea6717fa9f5a9eb627d76107040d084a64106973099fa0e8de48758"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00155-of-01024.json.gz": {"num_bytes": 318089754, "checksum": "5b6e76a85bb1093eaba698864a54a938329b04494f9f72c3c3bbb155174da5e4"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00156-of-01024.json.gz": {"num_bytes": 320049467, "checksum": "cc013e8aa7c1cf7fc28ebecc64d893d03b092a09d725b5e626851de0b311c814"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00157-of-01024.json.gz": {"num_bytes": 319931950, "checksum": "2a27b4c29455bcd813a84aa3a54100d16cb6bfed25171aa3c552ea452ae569e2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00158-of-01024.json.gz": {"num_bytes": 319963615, "checksum": "e477f769ea1513cf607932a29d793fdf1722cdea757e00c814dad594329cfac7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00159-of-01024.json.gz": {"num_bytes": 319000491, "checksum": "ff5d09415753c2aa4b51196e8f4bd6c77ba100ab281314aede118f501565cea2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00160-of-01024.json.gz": {"num_bytes": 319069618, "checksum": "e08c35aef8a20dccad80f6bb1579d6d2ce80113c8bf8459730c69fb7048c3cc9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00161-of-01024.json.gz": {"num_bytes": 318750642, "checksum": "13eef84873b58e29894f9bf68a4de72a530c1bfc80a5654262fe71420292b8ad"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00162-of-01024.json.gz": {"num_bytes": 319847814, "checksum": "a8579c6bcc906fe018881a8474724576c3d0f7f1787f1568b79e5accbd9f962c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00163-of-01024.json.gz": {"num_bytes": 320370365, "checksum": "b97a74837ab9f659c13dcb4deb53c600584beb9e5ceed29e99974c4953f644c9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00164-of-01024.json.gz": {"num_bytes": 319894618, "checksum": "9b63afffa2b84c91b749991ddb384399f1d408bd7b6b643e7329e49531ce9a53"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00165-of-01024.json.gz": {"num_bytes": 320166197, "checksum": "5b2414477dc4e2b080b34f3b98672bfe3de6028e7ad83c323a7dd1ee08c05a0b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00166-of-01024.json.gz": {"num_bytes": 319612575, "checksum": "2cda682db53000c14fcb5d251bae4f50c8c4159348f8594c3ef020260f277a99"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00167-of-01024.json.gz": {"num_bytes": 319183884, "checksum": "5c406d7a8a404436039fde7c2019f0174ff8855caff319fa62bb7960d341b41a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00168-of-01024.json.gz": {"num_bytes": 319396348, "checksum": "df6a422d57a2e1443d10d61b13ab2c5227734195c82b43e1ead2db723cdea293"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00169-of-01024.json.gz": {"num_bytes": 319452933, "checksum": "81c81138e7163072e3779dd10ea8af7dff12b705fa008665298e08cfc2699f03"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00170-of-01024.json.gz": {"num_bytes": 317748609, "checksum": "6586ae8862b8ac925f424afb6ba779e95a147323fb83fc8c4bb0813877b17718"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00171-of-01024.json.gz": {"num_bytes": 319052376, "checksum": "8b3cd21d8ffbe963ce935ef9e0b6efc45f4d5abab703fdfed19a1309b700dca8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00172-of-01024.json.gz": {"num_bytes": 319068859, "checksum": "a42f5f5a10bfc84d51dd0855166959462faccd6a182af4c5d2115ff9995f5324"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00173-of-01024.json.gz": {"num_bytes": 319142377, "checksum": "e26514c5d6cea27c0cf7fcc1daadfa6f218ef9e62039c6d6fccfc31660c0c96f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00174-of-01024.json.gz": {"num_bytes": 319134484, "checksum": "75349aa8c734ed894965500eab2fdf59657a63e40e5a53e822ef1e5a12838a02"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00175-of-01024.json.gz": {"num_bytes": 318330467, "checksum": "a3d0d14b28a5a3cc559d6d89e2ec09e49e92aa189e44e68dbb4ea47978e1eca1"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00176-of-01024.json.gz": {"num_bytes": 318584643, "checksum": "dd68b42e5bfc656b71fe5701bacb929edae84055131f1dd65bbf3f3ad734e57d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00177-of-01024.json.gz": {"num_bytes": 319275087, "checksum": "05a8ff159006241cf938ef27b292f65906158ac25ac28919aa6761eaa634052f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00178-of-01024.json.gz": {"num_bytes": 318490550, "checksum": "a3aa38083c85baada29b207240bcca1a0d562a93971b420428d039092e58bd31"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00179-of-01024.json.gz": {"num_bytes": 319083249, "checksum": "12858fecd1dec728eba2c8c4311b17e4f2ac1fdb27c23e9adcd9258c5c4fc777"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00180-of-01024.json.gz": {"num_bytes": 319752094, "checksum": "67e968cb8d3ebec2f68eddfc539ea7402aa72c9274034494a43ea7d207b69a88"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00181-of-01024.json.gz": {"num_bytes": 320476195, "checksum": "c1bd59eb7ca799e31bf037dc7c087c1ad94e4f88a4f12427c454510d97e1c803"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00182-of-01024.json.gz": {"num_bytes": 318538551, "checksum": "dbe7205a1919dca9d6936158d5653a20d239f2e547ec73280956da4f8c609220"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00183-of-01024.json.gz": {"num_bytes": 319620265, "checksum": "46f9e603e04040b59df8da6ee01d1c30588aa7233a00526d6f0fd84c4172ba93"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00184-of-01024.json.gz": {"num_bytes": 318301621, "checksum": "880a02eabae231da388a5782a7194eef0d0211c2d1314db0c56d740647a114c9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00185-of-01024.json.gz": {"num_bytes": 320515340, "checksum": "f522147aed30ebb3ab352c92a9dd24cd2e8b93df1d4c4a6284d89ceaa2858509"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00186-of-01024.json.gz": {"num_bytes": 318374733, "checksum": "5005f1c42038769e225a626a88c10bd4f6af98dcc14deed475954b00c088bc53"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00187-of-01024.json.gz": {"num_bytes": 319116182, "checksum": "cbd7e0f486c6dac13090cd344337da1c336973e7ec75e32b0bd5b18b98f24bf8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00188-of-01024.json.gz": {"num_bytes": 318981305, "checksum": "064ce8c30b7a960b20720c133c3dd3281d27752a66def44d5133ff8f1b8279e9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00189-of-01024.json.gz": {"num_bytes": 317036462, "checksum": "acc052da4501691fdd28f269c633ed826840f2634be49b5e2c5e1273de0cb4a8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00190-of-01024.json.gz": {"num_bytes": 318061662, "checksum": "5a436e97c59b8636ca5081b71ca6fe8f8a3a99dd3f426c79edb2bf53345ee810"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00191-of-01024.json.gz": {"num_bytes": 318556228, "checksum": "2eebc89381ff78ae63f311c98b07853cefcc42fbcc210995095d568a6ff70ead"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00192-of-01024.json.gz": {"num_bytes": 317987733, "checksum": "99de46c4702c06a2303262b185b92fad82e12e189c923d5b76d9d8f96faabfa5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00193-of-01024.json.gz": {"num_bytes": 320294532, "checksum": "bccb7d8fc34d6cd6eb41e2a1c6234596b00a5517fdca7c47562fdee0e675377c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00194-of-01024.json.gz": {"num_bytes": 320852679, "checksum": "bb1e7768a57145fdbca7957ed964648d1deab5edc5dfad4722a81ad411c5e0f9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00195-of-01024.json.gz": {"num_bytes": 319016077, "checksum": "ac520468a5bd933dbac1aa5f7f21ba276bdce15abf99963ef9d73af294e81e70"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00196-of-01024.json.gz": {"num_bytes": 319289881, "checksum": "9eec5740115ab52ce98ac9efbed4fa1c5c06787fe93b4b28f6a1e4df06272870"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00197-of-01024.json.gz": {"num_bytes": 320180232, "checksum": "07a03763b84b4a86b4f71d725927d62c40925823ee454122a00fdb625ddb3a22"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00198-of-01024.json.gz": {"num_bytes": 320004709, "checksum": "a1b250b01289fdaf6dcd997ef31c59c580f81f961aa0fd88ae0d175bd07c02ab"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00199-of-01024.json.gz": {"num_bytes": 321006991, "checksum": "650e57c3dbbf4ed929da8c6c5d78f35fbac4644722a84d98f93342a8d33b2140"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00200-of-01024.json.gz": {"num_bytes": 317913111, "checksum": "42caf6dee42bd73d9e4bf0c7bb16383caa936b2e0a913489b9f0aef57b6004cb"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00201-of-01024.json.gz": {"num_bytes": 317897148, "checksum": "990974a82de2b1c27465f6d097d7a5718c5ff334271e722ab3736e7aa5b89d4b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00202-of-01024.json.gz": {"num_bytes": 319510250, "checksum": "8467066f2417af774363d4984a37968a0189adfe3a581723eab15004930e621a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00203-of-01024.json.gz": {"num_bytes": 319762388, "checksum": "4e7e20980dea2d5e77f380b24580f0df9319a0d1d73ec319e17d8cbe044e53de"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00204-of-01024.json.gz": {"num_bytes": 317418128, "checksum": "2c027c5225ea7ce3c31f5f32dda12b7c892c6fdc9c52da6d0af749171cdce738"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00205-of-01024.json.gz": {"num_bytes": 320157174, "checksum": "d953e79c60be0e2c3b072c2186a845a351392ef395fa95135f47e6b8491c6f88"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00206-of-01024.json.gz": {"num_bytes": 320459080, "checksum": "bc70c34931942ca143f7eb555e86458afcc36110aa9559151f31d781969d4458"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00207-of-01024.json.gz": {"num_bytes": 317361718, "checksum": "fad5ebd7a81bb737e12e9d4c803aea1a9e905d43a3fa87cace32a64eef01e8e3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00208-of-01024.json.gz": {"num_bytes": 319976693, "checksum": "21381c727d945d8d3b4a275e3622bce64b07ed87d7f2371ac28b5d2023359cae"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00209-of-01024.json.gz": {"num_bytes": 319550585, "checksum": "8b74e5f1780c4bf12936ac3a86be7a3d11287866522da8275aa4232c1e3d8898"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00210-of-01024.json.gz": {"num_bytes": 319574289, "checksum": "1594bd49cde9641b49a1ad9373a53e10d65440000363f7532a7d326d17c44236"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00211-of-01024.json.gz": {"num_bytes": 320615302, "checksum": "5b6f7eddfa3a9ffb0d6668d10f398b1d86482b64daa9817ca0af549433071244"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00212-of-01024.json.gz": {"num_bytes": 319395225, "checksum": "db58fa453269c794fedb595c6193dea5a85c72ff8b2d43e77c9bb371b8c86b78"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00213-of-01024.json.gz": {"num_bytes": 320131797, "checksum": "1d21d19b5e36820559590b339c049be29f27505ab4e88572edbdb84b649e0b66"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00214-of-01024.json.gz": {"num_bytes": 320153141, "checksum": "55c9b4ff1cd8cc88738196f867aba620dec3c8b27b9a485c7e75d3129d76e9c7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00215-of-01024.json.gz": {"num_bytes": 320525443, "checksum": "dfe9f44676c1abf0e2875924c094c0d788f8a0172d641d5f810258e948e37feb"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00216-of-01024.json.gz": {"num_bytes": 320100146, "checksum": "57f19f5437b0428d9f40799af14f8bfba8f6c82ebacaea8f6fc7531524a6d4af"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00217-of-01024.json.gz": {"num_bytes": 320688377, "checksum": "fad4f3143aa303c9c35165a15c6d90087c204c586fe20b0c0f45cf4238311b70"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00218-of-01024.json.gz": {"num_bytes": 318896471, "checksum": "aabd471960d6db1e93e1129410d9138d9d9efa3292af7491b3b6844c2bd3f543"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00219-of-01024.json.gz": {"num_bytes": 319298204, "checksum": "f676701589e39802779a0947585638347bb4fe55376a33c6d0afcdc40c5f8938"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00220-of-01024.json.gz": {"num_bytes": 317757045, "checksum": "f3d0994379d244054c5e2db366a081caee28d301aa6b0d9431e7d9eb1cb38c30"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00221-of-01024.json.gz": {"num_bytes": 318568870, "checksum": "8026854c8a8cc1d16b52a898b9dd8a8df7901dd8cdf285f5d937c4d5d45919f3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00222-of-01024.json.gz": {"num_bytes": 319096912, "checksum": "71f76f898864de3ae60f7c0cdbc68d53cbfa04b2f8493c40d55e1cb56727b275"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00223-of-01024.json.gz": {"num_bytes": 319350414, "checksum": "ba01faf3fe41a738c255b5da83daf53a5858144557af6c6f8d6208a049e4245f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00224-of-01024.json.gz": {"num_bytes": 319007151, "checksum": "94200d12c61f7c73a9e3a2bb089a05b017a215348d52018a34e3224578c0da06"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00225-of-01024.json.gz": {"num_bytes": 319502985, "checksum": "0b7ce650e555baa546bb329d7f0567a3dc0a7ec9d49149792032a86321a73d6e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00226-of-01024.json.gz": {"num_bytes": 317983607, "checksum": "40cf6d4b3deb05cd97ebed01405d08ae67be6e896736e4f371d15e5404567599"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00227-of-01024.json.gz": {"num_bytes": 320199564, "checksum": "e65ee475e3b6682b57bfa3f7b9c1cdabf36a7282fc793865df63dbe6a6a3d1fe"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00228-of-01024.json.gz": {"num_bytes": 318852183, "checksum": "8b27f2fbb0233802229fc776cfcb0b6b43af3149d217d0ab00cca0f1286482e4"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00229-of-01024.json.gz": {"num_bytes": 319407418, "checksum": "f2d5199a0022134ae127c88f0ac20d1b2b8a88014a774b5432b41085c83ecb5b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00230-of-01024.json.gz": {"num_bytes": 320787790, "checksum": "e1b040895ac6068dd1aa892ec93d733096afc4adda698379006ef89926491255"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00231-of-01024.json.gz": {"num_bytes": 318220053, "checksum": "648a6349206c50c17d4e3562fd6fcb0a723b4cb40005890173d5de0c7ecc2ade"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00232-of-01024.json.gz": {"num_bytes": 319702777, "checksum": "0a44b7cb4f354e1eede683a697aba4051c1542fd030dd59767065f5f0204554e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00233-of-01024.json.gz": {"num_bytes": 319154465, "checksum": "4070448b7844776db6754bd33791900bf9ac8dbd81e4cd774a3055ada67f6fac"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00234-of-01024.json.gz": {"num_bytes": 319846160, "checksum": "b1e8c73078c347fa062ed408e81bbdcb2f714675bab2c082016e822e91ef63a9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00235-of-01024.json.gz": {"num_bytes": 317722912, "checksum": "d8aa694e870157b2b5411f496db46dc71dfeed01a42973a65499596921198abf"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00236-of-01024.json.gz": {"num_bytes": 318593592, "checksum": "e0c4ff6c8a12128da88777074d0b097664cf2f2395913c4d82b0eecd501946f1"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00237-of-01024.json.gz": {"num_bytes": 318902831, "checksum": "adce772ed699d7e908ae1fe1ddf1d9875305c7875c93cedf1b3ea0bbc21ff922"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00238-of-01024.json.gz": {"num_bytes": 318696723, "checksum": "926f9fc42cd248077afec1f4b88603c646fc5ae47c4ee3e9b8a5f6b8b6ff7f46"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00239-of-01024.json.gz": {"num_bytes": 318321822, "checksum": "439d756b0ffc97ebecc6c48a7dc90da77de7ada05a6eae929db98057ea15bef1"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00240-of-01024.json.gz": {"num_bytes": 318992553, "checksum": "1f57af6ff9477263806c0827c0dd8e494e103b6f54eec2cd5f8f8327b01ee39b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00241-of-01024.json.gz": {"num_bytes": 319345185, "checksum": "493932a44e09f4b311ac5bdb519111fad0982708d4b467688f2b1105316544eb"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00242-of-01024.json.gz": {"num_bytes": 320108156, "checksum": "de5603f1b276f1373011c8884f06af017c71b03c5de3b3bb89cd6d550a0d5902"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00243-of-01024.json.gz": {"num_bytes": 319855563, "checksum": "7c1b74de8ae3699c567edaa6e2d1a1f1ae82f4810e769c710a23cd2dfc536c60"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00244-of-01024.json.gz": {"num_bytes": 318966332, "checksum": "d3ada80bad9fa776374878bc7504138e14c161bc9798ea8114b0d187d4c815f9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00245-of-01024.json.gz": {"num_bytes": 319541864, "checksum": "3fe5f26e32795c49743d1b2497c333be57248c9db2ce12fb93e103d1a9595347"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00246-of-01024.json.gz": {"num_bytes": 318530369, "checksum": "a0bdeb2dcb5dfb46f843c4086230ba918f2d3ec125654cb924ea11e7c75cafbd"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00247-of-01024.json.gz": {"num_bytes": 319496627, "checksum": "0c4099f832ada6b24ef6c1d15267cd3c179f5b3d79e3d813d944e3ebea908c99"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00248-of-01024.json.gz": {"num_bytes": 319132981, "checksum": "608b1cd27ad345f6511fb677c00d56b6e827f288877d68aea1bcad3b02dd040e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00249-of-01024.json.gz": {"num_bytes": 318529093, "checksum": "8fd580be09f913cc3809e3b0e467e2faf657a5db6f71b75aa931043267b9b0f3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00250-of-01024.json.gz": {"num_bytes": 318248903, "checksum": "faeac675c3634b0834939046e60cdfad6a13558d7a6799c5bde25567898d86a0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00251-of-01024.json.gz": {"num_bytes": 319184870, "checksum": "038972e03db75417fc4cb25e54c3aee01e4f022eb0fab202142f539e4d866e28"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00252-of-01024.json.gz": {"num_bytes": 319631399, "checksum": "2fda0c2cec4624c6068556e16630c3551ef3110759bed59628913a9debd547a3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00253-of-01024.json.gz": {"num_bytes": 318275716, "checksum": "b5da4bfa564fcc6c49a573b90e679d60c4e222249858f4e58fdb3727a5f279ec"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00254-of-01024.json.gz": {"num_bytes": 318638865, "checksum": "279eb2978fe94e1570318a247b82487c04d7494ceed74dccb1d7a5734ea84e5c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00255-of-01024.json.gz": {"num_bytes": 319640339, "checksum": "aa0a1ef845d0df7d81d2588d53f29205a4e3858a0888c1b7d9c83eb2fe1d32a7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00256-of-01024.json.gz": {"num_bytes": 320353593, "checksum": "407133ea3b32a9e004b992a1bccade0440a39d0bfbd12993ea78c6526c0864a8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00257-of-01024.json.gz": {"num_bytes": 318165587, "checksum": "72b7a72b8402b22cb51db44c9e7859460366c7c9d33e16a4c038ad07f7ad8f3f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00258-of-01024.json.gz": {"num_bytes": 318003534, "checksum": "e5f9f2f74b7f9958dc9535f04a8965749ca4bd68005a6efa36f480fb487ca930"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00259-of-01024.json.gz": {"num_bytes": 318990454, "checksum": "7cb3c284613537fc6b1a85d7187dfca30b37a7a1a5708094f17486e3184e2d62"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00260-of-01024.json.gz": {"num_bytes": 319514850, "checksum": "0067e36b7156196e2451cdf78dc8832352f2481a4740afbef9046104b6810bdc"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00261-of-01024.json.gz": {"num_bytes": 318747661, "checksum": "b1e4597420035c355abe15efc576751169e2b5e4c38e073c178346a7202d5ab2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00262-of-01024.json.gz": {"num_bytes": 319868329, "checksum": "374f4b951e545968da45b5055af2aa0b128c1d65d6c854f5b8f7e02d22c352e2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00263-of-01024.json.gz": {"num_bytes": 319268788, "checksum": "7168e635a32859a85a152b29bcd1f699257ee4e340517e218ea9b8dac3922210"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00264-of-01024.json.gz": {"num_bytes": 319270640, "checksum": "1da08b65c83e79a0f5b7215e5a4ee58f21383b69f09dd9a3ba95381ba3d56d25"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00265-of-01024.json.gz": {"num_bytes": 318744354, "checksum": "0c908e81d59b2099eda038731b387a0ad86fa3d168eb2955413dde9cf29d947b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00266-of-01024.json.gz": {"num_bytes": 318518406, "checksum": "115e375464931638de4af669b7301b6112d18b23835f2db2b092f47545b1a855"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00267-of-01024.json.gz": {"num_bytes": 318921711, "checksum": "6d66c715137885a46f2472489b21751284ec8ecfde6dca6be3ec1ee75f6cd5af"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00268-of-01024.json.gz": {"num_bytes": 317786222, "checksum": "588865d8f9d3da5a70c958997060ce4792e175c8fc5323f1887787070c8c160f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00269-of-01024.json.gz": {"num_bytes": 319004956, "checksum": "163ec7497602931de2eaffad320704e508e491937a2965e39907a086f640d975"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00270-of-01024.json.gz": {"num_bytes": 319175186, "checksum": "794e0e7ceccf28457a8ed5b0724337545661da16feafd0a53e4823b2cb1c92ae"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00271-of-01024.json.gz": {"num_bytes": 319785821, "checksum": "9c9ec0348f7d4ffc61e5f19f1f60c8382b33ca2fe4b852567cbc3c16024a4627"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00272-of-01024.json.gz": {"num_bytes": 318933435, "checksum": "883d85985237948018b13c20f4d4ee567c6ee36a135b326e8117d73dad4fe37a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00273-of-01024.json.gz": {"num_bytes": 318456664, "checksum": "fdca13067e8e118e538b8de538e164fb5397724045a5b1b02764510c8de90969"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00274-of-01024.json.gz": {"num_bytes": 318418161, "checksum": "27556558fe8a91a4aea4800ba9b7e844336a7638c5b96e652fcdb359f631b04f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00275-of-01024.json.gz": {"num_bytes": 318437784, "checksum": "6ad4e6a3e1cee04aee3051a66531e3f4aa97f7bbb7602c6aa5f46a727b319f2b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00276-of-01024.json.gz": {"num_bytes": 318470946, "checksum": "145a4d85ddf1e72fcdb8477dcd2f70a5554d9cd9349e02e058d3e7837204b6ff"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00277-of-01024.json.gz": {"num_bytes": 319580624, "checksum": "7116de0dbc5c7f6621f7c107dded9d85788937a87f2d56efca32ae9f25fc6865"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00278-of-01024.json.gz": {"num_bytes": 319619699, "checksum": "8dabdf2d26035d30c22204e6f46f292c58f4a4c3b0b77a1826a43341d4282df9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00279-of-01024.json.gz": {"num_bytes": 319344020, "checksum": "c2b7d5bf62be1772c6bb80f597b28d948cf3cdefb10b6df6f777f0ab7d8fb015"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00280-of-01024.json.gz": {"num_bytes": 318997864, "checksum": "025457720b0045e7bf01f9b4b847f28ef94af9ca250675efeee73eeb340a3f36"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00281-of-01024.json.gz": {"num_bytes": 318718146, "checksum": "2979c0ac06570a9ee437521778c514bd8755193b9f1ae6a5a671ef885243f019"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00282-of-01024.json.gz": {"num_bytes": 318434530, "checksum": "a17bca50ec20c364adb899a9073bbe3a1505f81803a58190efc5d4f3f78b58be"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00283-of-01024.json.gz": {"num_bytes": 319317663, "checksum": "9034f524fc5c2e246b22e2dee00b47e0c4da0316bc60d0a11d966c28db917f9b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00284-of-01024.json.gz": {"num_bytes": 318957832, "checksum": "f08b96047e711831dfb8a44d90cb712d3e78c98dd28ec6b937ee83949bbef5b0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00285-of-01024.json.gz": {"num_bytes": 318643283, "checksum": "c5df1f2e2dad46d71f8aadf856a5139020da8afc2ee010d53c0372ea09b2362d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00286-of-01024.json.gz": {"num_bytes": 318064839, "checksum": "16f7fd6abcbc69750b8131bca3e38ddc40bd7c86c48122ad2a9a77cb9cfd552e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00287-of-01024.json.gz": {"num_bytes": 320328448, "checksum": "41e82bd357b47a28f28a4a203d5b54263aadb3c9a08899f78302c727c56d8b38"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00288-of-01024.json.gz": {"num_bytes": 319559271, "checksum": "970b9df224b58ca50b3023d92f6be0c37dbda479155c29c535e457ef6f2bca0e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00289-of-01024.json.gz": {"num_bytes": 318786822, "checksum": "36a6515e7f516335d3fe057bb6ed9890a2aea033e08edd8588b3168b3445b2f1"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00290-of-01024.json.gz": {"num_bytes": 320634782, "checksum": "7d19fc82b9a5aa0e0046cd17cd2c46f356f8a4a7d203d5e03e1f319156f05cb8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00291-of-01024.json.gz": {"num_bytes": 318746713, "checksum": "86d610d4590bca69281348dbfaaec9e704fd6194141c50c71e84aad51ce26b91"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00292-of-01024.json.gz": {"num_bytes": 320049630, "checksum": "d045df646213e29d4e7de4ec8915eb3b65bb962f35b0d74abf00889bd5aae8ab"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00293-of-01024.json.gz": {"num_bytes": 319966146, "checksum": "c66fff1a64b495211bfdcea650ff76115f8c857b9154c1b869062e702714b9ec"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00294-of-01024.json.gz": {"num_bytes": 318805332, "checksum": "ef3d9204ec85a1e65ae48af7924f614403d297a15f232ba41eb0e4fe223e507f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00295-of-01024.json.gz": {"num_bytes": 318898465, "checksum": "2a071fc28b1216f2dc0579528d9b04e597b5cdac9fd14719e312092242da190a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00296-of-01024.json.gz": {"num_bytes": 319406630, "checksum": "ea71e9fd444860d70d3728f7e2213a4bccf3aa31a164c9acfa8df7a0b6619786"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00297-of-01024.json.gz": {"num_bytes": 320312971, "checksum": "ddaeba8aad38b7e9727c579cc44f15b3c82d292e2901b47b785e9c8d3d5cdb9d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00298-of-01024.json.gz": {"num_bytes": 320660744, "checksum": "814460ccfda29b45edaee5f44e3c980889aee2ee52e4e5323931ea489fbe938e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00299-of-01024.json.gz": {"num_bytes": 319848186, "checksum": "3b91fe32d3a731a5be3bf778eedfe13e8a7e26ba9eda51c278c5212aa7925681"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00300-of-01024.json.gz": {"num_bytes": 319647278, "checksum": "1e0424631f7f354bc63b3e71c5c6516c85343dafd3896acb9560eaf93b672799"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00301-of-01024.json.gz": {"num_bytes": 319080252, "checksum": "46c21af013f611729cc06ec033dbae80151987f9098e57fb98e2631f6fe76c8f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00302-of-01024.json.gz": {"num_bytes": 320028246, "checksum": "d1ca8ad6e5bd6cb18db1f1be9154dbc8ba9df7ca02db4c1f8a7df9d40820d8ff"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00303-of-01024.json.gz": {"num_bytes": 319388787, "checksum": "bce87161f77464adfb1fc04fc2993211bcec502d7172b86f726daf7096b04f82"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00304-of-01024.json.gz": {"num_bytes": 318627831, "checksum": "235b8085cbeb7b13f8e1a5f6d2225a9461b7bcd76e21466a189c2411ff4c4107"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00305-of-01024.json.gz": {"num_bytes": 318148428, "checksum": "f13f124e0ea150da13ebeb3390c311b3db54018de0d640579307bbcf2c46068d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00306-of-01024.json.gz": {"num_bytes": 319451712, "checksum": "de5c3fa2cd6a47551ab43268484d017602e2c3e1f66f43f1a1d8f95bac52cad5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00307-of-01024.json.gz": {"num_bytes": 319026244, "checksum": "88769fbf393671db352227a64cb8ba6b4ba60c5bddb4a14294b1ad9a65a750cd"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00308-of-01024.json.gz": {"num_bytes": 318447454, "checksum": "555bcfc0ba4db0551ce5ffb18057027ee695af166856125aeb79f7ce013851cc"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00309-of-01024.json.gz": {"num_bytes": 318147676, "checksum": "bf28e60a7970c548190cf0f4fe56f27ea55a1ad8313fa353a8013f0a0e7919f1"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00310-of-01024.json.gz": {"num_bytes": 318930650, "checksum": "45a68c0ef70ecd10838d604d51fecd26e5199f5372022b9c2af461a71c24c6ef"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00311-of-01024.json.gz": {"num_bytes": 319955339, "checksum": "fb3c4e93166f1cb2ccc8a7b68da0246f0827d3a81bb5614c8c84f1c01c6d53c7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00312-of-01024.json.gz": {"num_bytes": 318554567, "checksum": "0dce2ac88ba7ac5340d551add9fe7b1a30772a6cc082347c536427b48daca598"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00313-of-01024.json.gz": {"num_bytes": 318978931, "checksum": "c5f99dab085fb705769a514626c9af8a26cf846fdaee4b403a3d6f84c892cb66"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00314-of-01024.json.gz": {"num_bytes": 318158197, "checksum": "79de4fa2aed5e3efa71e75d13f08d7c1869aa59f42a819f4429430b3db6c1b27"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00315-of-01024.json.gz": {"num_bytes": 319744521, "checksum": "5a47a89a1537662a91853bbe2a5b3e243f5de74489f820621192cacef192593f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00316-of-01024.json.gz": {"num_bytes": 319861527, "checksum": "1cd34f17f3ae3c8bf8e1636714a9ff600a26799d5ec02ba42abefa5db9d00e5e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00317-of-01024.json.gz": {"num_bytes": 319286030, "checksum": "a3e34af81264a72b523b63fdc0268f450675f7993fa0885eb2b4c747b0d6703c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00318-of-01024.json.gz": {"num_bytes": 319054871, "checksum": "02fa8cf278578108083bc9a3c5cf07b0a9d243f2162397091ede6c85a1df31e7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00319-of-01024.json.gz": {"num_bytes": 319943810, "checksum": "93ef0d7f1610043a6f7634af73e89ee9f3d7e87828ad34558a4d688e6fa6b6dc"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00320-of-01024.json.gz": {"num_bytes": 320037211, "checksum": "06fbd99a3d64df293db2655f321117f1afcf1cda51e421edef9335a25cb1a902"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00321-of-01024.json.gz": {"num_bytes": 318584237, "checksum": "a224e4d902f7368f91d6a72fc9f5730996dc37de576bc2211eb632e3690f1b38"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00322-of-01024.json.gz": {"num_bytes": 319686632, "checksum": "57fba28c7104ff659f8a0f330ae89c68d3a392dd14a78247fa357a3bcc8b94dc"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00323-of-01024.json.gz": {"num_bytes": 319834993, "checksum": "e61c760cd3c42f71a1a7bb6adc4e0bc970bbf864b69e2a4a5d56bf0a14d4e0be"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00324-of-01024.json.gz": {"num_bytes": 319243057, "checksum": "61d21ab1e7729f172ade5ab6c0dcaf07eaeaee6e047ca1c24722c06ddd919678"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00325-of-01024.json.gz": {"num_bytes": 318569583, "checksum": "2192a891ecc2a6aa9f6ea64f1d76ce763e0a3963ae03c95275ccd626171835ce"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00326-of-01024.json.gz": {"num_bytes": 319175980, "checksum": "d35e4d5f8e924ad97520db51a2c361bbc02097721195932b6768e7460df092a6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00327-of-01024.json.gz": {"num_bytes": 319892298, "checksum": "ce967065d3915d466982b5258e07ad2c46b02d7637057e0547586657ea0f53a4"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00328-of-01024.json.gz": {"num_bytes": 318004026, "checksum": "0676d556f46b1f057669d3378c6fc335db6e3ac67a02e11dce3823658730f4c5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00329-of-01024.json.gz": {"num_bytes": 319066225, "checksum": "b00bb4bda957e1287b98c432165448b3899f9155363f7b61bfd0f0181181acfc"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00330-of-01024.json.gz": {"num_bytes": 319268288, "checksum": "d14d1883941966ef3b35203d06e6fa1bb485dd77118bd7b6c811b0d06fa72fae"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00331-of-01024.json.gz": {"num_bytes": 319131311, "checksum": "4d5d41c2b2242b299fb67fa8c9327db8b4f612bdf4ee9af4d4e45aba8cd1e409"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00332-of-01024.json.gz": {"num_bytes": 318827508, "checksum": "68cea08d4805b392bf4c2894a4501ee3fbbe9aac4b1b6533e686ea749ced2dcd"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00333-of-01024.json.gz": {"num_bytes": 320572240, "checksum": "06f211ae2fe1c4eef5e41caceda8ebbc289261057911fcf2583a59c730b7951a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00334-of-01024.json.gz": {"num_bytes": 318121862, "checksum": "46c62769e04ce8acde4562ba24d72e245babacdfb50600da4e6217948ad71d24"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00335-of-01024.json.gz": {"num_bytes": 318692168, "checksum": "dca69a6976e7387a12c8da16b696ed4f604254693a3280be0f90fa694700b595"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00336-of-01024.json.gz": {"num_bytes": 319479902, "checksum": "c52969fad97f1dc0e1e115428e7dad1ac6cb6d804db0cd34f0fc7846b1b50c7f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00337-of-01024.json.gz": {"num_bytes": 319987407, "checksum": "2c570f02aa6a6bac96be1e02663996c87f9a94c160f22101ce8ae1d549ae1de2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00338-of-01024.json.gz": {"num_bytes": 319051086, "checksum": "77132df95b147c471ead74bef16ed4fa11e15209f518dd460110132358816834"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00339-of-01024.json.gz": {"num_bytes": 319473192, "checksum": "7f3ac20a72d395c02ed3cb50052821521dc2d8d97303d00e0d0982e2c29e7659"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00340-of-01024.json.gz": {"num_bytes": 318423485, "checksum": "d1127da89e960d939cfc06cf1985df415b60d4bf02b12b7fab02b796100feaee"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00341-of-01024.json.gz": {"num_bytes": 320087690, "checksum": "f753423f82157e95506566d3653d32af6a181e69ea0e10b4d4eb24b626d3ca49"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00342-of-01024.json.gz": {"num_bytes": 319767100, "checksum": "db7410e6a6ca74163098681038f497faa373e1d81434b45c1a2f273d467c0a2d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00343-of-01024.json.gz": {"num_bytes": 318389429, "checksum": "7ea1e432a1ffbed8f4ad6cb985c5cf1b2584d8eb7d2fa091a2db3f104a3f7210"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00344-of-01024.json.gz": {"num_bytes": 319117212, "checksum": "c7317a81a6224dec9be07b41134ac7a7db4039b7c98b2061b20bb59b82ed0a1e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00345-of-01024.json.gz": {"num_bytes": 318504232, "checksum": "1498efe8280609d9d66c324e332c9433c6351bb7b99c5891a8f27d6841410407"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00346-of-01024.json.gz": {"num_bytes": 316721169, "checksum": "0cbc6b494d653878c9d52a37572064b88356058ed291aa773e5f47259fbfc722"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00347-of-01024.json.gz": {"num_bytes": 319007736, "checksum": "6265505e19a42a01a159297d33b1a91cd0e042a31ba6a1a867404a143ae565a4"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00348-of-01024.json.gz": {"num_bytes": 320167918, "checksum": "cc8b29deb44c8348aa4d05836f89cbae995c946f38d9cb8e7fedbd4762168ba0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00349-of-01024.json.gz": {"num_bytes": 319901226, "checksum": "2a0f2188b43ffedc8b95a8276c7647147587c5e544c9e6475e790f4b5e362992"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00350-of-01024.json.gz": {"num_bytes": 318999223, "checksum": "1fde48c503998872aa71fc524c7408dc84cbc1faa0d885895d5c57708a15fced"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00351-of-01024.json.gz": {"num_bytes": 318935410, "checksum": "72d577eabcd814a7ff61b894b3fe9089f483a793e692d3ab20ce4ee59921f975"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00352-of-01024.json.gz": {"num_bytes": 318655907, "checksum": "8686dc0e4ff7b35cbc4fa6f3abce50c06f8b95378031c132a117e1d458cb4616"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00353-of-01024.json.gz": {"num_bytes": 320619683, "checksum": "cd5816469ef54bfeb0db6b55a78e0d34eb2e1f82448a41f67dfb70061c3ea91e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00354-of-01024.json.gz": {"num_bytes": 319352400, "checksum": "bf082c093423d562da4984b1f0428225d853a05b5f8fb3696273f36ebb5a235d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00355-of-01024.json.gz": {"num_bytes": 318868462, "checksum": "3b8baeca48e55a2cd268d6aef75f7eed96ef10fceca593a5179d52a2b0121f8b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00356-of-01024.json.gz": {"num_bytes": 318903295, "checksum": "4c9a9926a4bad6721807d99cc02a9b6bd28bb0a6254aa1c15527b745c56a06a2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00357-of-01024.json.gz": {"num_bytes": 318881446, "checksum": "84b4c2e05bc162fef4824e97ba7a03b1cecb41eda08a3e0aedd264b66e859a30"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00358-of-01024.json.gz": {"num_bytes": 318521100, "checksum": "aee99528ffd0323fe81e4ed26ed1b9295baa2a3910771dd2a42f4f378fd82569"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00359-of-01024.json.gz": {"num_bytes": 317796778, "checksum": "7b01f2d5ae54f60c2aeb7b96bd366d21e558e2dac48c83a78df9850f37e02f1e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00360-of-01024.json.gz": {"num_bytes": 319502919, "checksum": "5b54f9a050e6f9008a1806101ea553d90eead56c949a5f3f46c8ccb88812081b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00361-of-01024.json.gz": {"num_bytes": 318595505, "checksum": "49f4164d66187d46adff7f9bbac97b232ab7906d812e571c2e0bf028895e7f47"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00362-of-01024.json.gz": {"num_bytes": 318851572, "checksum": "17accad3c0706c54530f128260cacbf986cbbb20427d4ba8d3444a3702a22c55"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00363-of-01024.json.gz": {"num_bytes": 318555337, "checksum": "2327866e541aa6aa73f7289c3ad82a19ff154d39657d98cb78a2f481a8765920"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00364-of-01024.json.gz": {"num_bytes": 318641145, "checksum": "6f52354d804e8d4a1af1f6c2c6b759ae115c4f23a63f1206a73e7e25acfbdd02"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00365-of-01024.json.gz": {"num_bytes": 319212614, "checksum": "8f1834eeacc9bbdee95b1f0a4078eb9488bd1a7c5693489bff7943869674cad3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00366-of-01024.json.gz": {"num_bytes": 319336585, "checksum": "a9cf01b76104eebb4ef8462a924f61c262fa197a7c68a50e48d925cb81586e3f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00367-of-01024.json.gz": {"num_bytes": 319161263, "checksum": "5ac822027d50c3196026fbaffc7d968e1ca702b947688a6f4d268b942b5067b5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00368-of-01024.json.gz": {"num_bytes": 317911640, "checksum": "f9acffbe3c6617e85911ff9dcecec2378b3469ab4546a6973cceb460f9003cea"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00369-of-01024.json.gz": {"num_bytes": 319585031, "checksum": "9234553649cfa5265c5a9ccc88486402f88eb81275067c51d9deef16bbe7211f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00370-of-01024.json.gz": {"num_bytes": 318345879, "checksum": "2fbb410346d31a33e8532602f4e3340fcc75c96be803250e9f0f1a6894ca0052"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00371-of-01024.json.gz": {"num_bytes": 318996184, "checksum": "b069b0c8a830ea841e82077548706f286308ef0420e163ff6d8312c8853af172"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00372-of-01024.json.gz": {"num_bytes": 317989343, "checksum": "bfd62e448d4d9f89353abaa384007b0b72bd860402ade3a9d938051a6446530b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00373-of-01024.json.gz": {"num_bytes": 319770759, "checksum": "e4e176250aceb7362ce38d496556a46409e9872e69f45166afe71aa750de8fcb"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00374-of-01024.json.gz": {"num_bytes": 319212902, "checksum": "28aa4510c3ddb9ee0ac56aab3792bfe5e899531919ccc0214a4b68bbf2ba18a9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00375-of-01024.json.gz": {"num_bytes": 318968029, "checksum": "35326b1f2280e07dd754e89dfa29989d0dfa5c78995d393b36a752d8364bfcd7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00376-of-01024.json.gz": {"num_bytes": 318685188, "checksum": "0060dbaccf7f2f956fb8b57891cb176914ddac1bc485dd86c2fd110c46d174b9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00377-of-01024.json.gz": {"num_bytes": 319291982, "checksum": "99fc38654197e506868e099c15b2cb15b93238dafd33f81a7d069b3e01c3b085"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00378-of-01024.json.gz": {"num_bytes": 319259094, "checksum": "9b8d97f9d57dd97373c4f57eae2b9c01a58e49017ee41d3969e94fb4dbabc260"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00379-of-01024.json.gz": {"num_bytes": 320228224, "checksum": "82913f2d182d2a57f6c93e9b229862cb72feaa6331d04cd4419113e1eb9d52cb"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00380-of-01024.json.gz": {"num_bytes": 319738339, "checksum": "e0de43f754ab97d103a02c708d1cd7e771ba079bd9e1f7c532a80a30bd5182ea"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00381-of-01024.json.gz": {"num_bytes": 319210620, "checksum": "df74823f78564b544677410508e675e2811905c56afe2a60d19d3e049dd65394"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00382-of-01024.json.gz": {"num_bytes": 319810275, "checksum": "f5d5291a695fe2cd228213fa2bf090bf6513c49c6911826aa43ecaefec0622ad"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00383-of-01024.json.gz": {"num_bytes": 319190426, "checksum": "a861ae79a66b72d6cd5e0a030daae52cffb85ba1272c36ae2be04a9b7c0287c4"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00384-of-01024.json.gz": {"num_bytes": 318501845, "checksum": "b8d0f5078ae82980f0f64120530bbeb20f627be0a8629d68885acb867091417f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00385-of-01024.json.gz": {"num_bytes": 319530458, "checksum": "7da119f3f63e25ff63cacd8ba0d77987b2d576be1f4b86e7e45aa3f2d194624b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00386-of-01024.json.gz": {"num_bytes": 318938980, "checksum": "c21f3de56fab26d7fb60bdb47c216b22793f67b8fa6d382520c79b88d1896f05"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00387-of-01024.json.gz": {"num_bytes": 319207426, "checksum": "e28b0884092f75836eed4d73ed24b7403d7b0530fc389386a68887420b0c2603"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00388-of-01024.json.gz": {"num_bytes": 319835376, "checksum": "b4f0db632cc9af66e8aea109c80d73a6281207e29ece131d5bf8b57ff8f81262"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00389-of-01024.json.gz": {"num_bytes": 319346837, "checksum": "413a8d8df1f6cf3094839b57231da5323f33f7115768c65d83f0af1574f71b6c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00390-of-01024.json.gz": {"num_bytes": 318632301, "checksum": "a3e8664fbb3ec2af5a217225dbb7fcf3e93b427e5da1a88e35c04c319d61e4c3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00391-of-01024.json.gz": {"num_bytes": 319066082, "checksum": "e22eed3415c90510e97768be5a685e0a8035e2635ef773c56e9ce2718c278658"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00392-of-01024.json.gz": {"num_bytes": 318356286, "checksum": "ddbf325390648d9d86f1e7901b75c99fe8db538d203de8dfb4c304282f82cd74"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00393-of-01024.json.gz": {"num_bytes": 318048288, "checksum": "974fd05f356c86be2f9109b0272eee69c5b2eaf0b16104cc573846c925d13b4b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00394-of-01024.json.gz": {"num_bytes": 319444683, "checksum": "0d27d6f8c3b935cef23ea60abfa82bd6a4f5e2e061080419dc9c6bc455b9f868"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00395-of-01024.json.gz": {"num_bytes": 318353166, "checksum": "24d9956bd857484ffbabb3ba6f6ac688f48a94b50228238c7c9153a5c6878a7c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00396-of-01024.json.gz": {"num_bytes": 319960396, "checksum": "9425f4f18e1690ded866c4b5313cbac8a6210092dc42f720200b7143b69eabe5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00397-of-01024.json.gz": {"num_bytes": 319030577, "checksum": "dee166674b835b9849d281a87238aa136e14d26edaa72d0ecb6b7e82d556a72e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00398-of-01024.json.gz": {"num_bytes": 317664320, "checksum": "f85e08272f73ce4aa602719d59205db54d230a6b7247830d78f91eac63d753be"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00399-of-01024.json.gz": {"num_bytes": 319623875, "checksum": "85dea0672a0362a08503b70623907c8c92bd105f788fbd7f3816212a9181e7c5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00400-of-01024.json.gz": {"num_bytes": 318840274, "checksum": "a104345698500611cd1a71a6647555300d315490918740a8c6e3b8dcff315407"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00401-of-01024.json.gz": {"num_bytes": 318336377, "checksum": "808327d156e183e102fd75cfbdb7b5a1fbde3740168f59b767ea380608305b67"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00402-of-01024.json.gz": {"num_bytes": 319270185, "checksum": "b6a5f7c1ade628091fe86744a6011147ec32795ad694ccbc82929791b93aa307"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00403-of-01024.json.gz": {"num_bytes": 318038520, "checksum": "108904ab05b3ad23318f8aa0f7ddd00d97aae1872fb157eea73273e011cbec04"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00404-of-01024.json.gz": {"num_bytes": 320933185, "checksum": "cd0c068c0831218849149eaab8f8a98748823911c745ca0ea33ae839bd625e04"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00405-of-01024.json.gz": {"num_bytes": 317694827, "checksum": "d99909ccd59e2ec183b41a7c6d1bd5677798bd7fd784ab681546a7bf8292f353"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00406-of-01024.json.gz": {"num_bytes": 317937468, "checksum": "c7f2bd7a366b8c389e41fdfad4891068c86039e1a5fc3b8a0b993253badf33d2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00407-of-01024.json.gz": {"num_bytes": 320226074, "checksum": "765db6f9f0c8c3d9bbb0499f0010928fe4f90d5915dfdd3b6d09d3dc78ad07a9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00408-of-01024.json.gz": {"num_bytes": 318613788, "checksum": "165e78c858dfaf010307392474d4917846c9d21658558912e5ffc915803bd2fb"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00409-of-01024.json.gz": {"num_bytes": 319212414, "checksum": "5f7d5952aad1ae31413962983971b2b422d77c262ededd2ce1c1e186aeb6d87d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00410-of-01024.json.gz": {"num_bytes": 319023647, "checksum": "24588d41f40e3fe389575b97d41ef761be46bc9a9b3965c5e3f994760f7a4070"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00411-of-01024.json.gz": {"num_bytes": 318408922, "checksum": "b35d4ada5a000f51169557b00e508706d51a7becd33370014ff07c8b8dac1af5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00412-of-01024.json.gz": {"num_bytes": 317166932, "checksum": "d3ed1cae269ebefe4716843bd7954bf7e44ee889f72066afbdcd95f4e1f06703"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00413-of-01024.json.gz": {"num_bytes": 318519121, "checksum": "07fc61a7e164301113201e78c99d40289d88e0b463048e14aa5fe69c7490ccac"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00414-of-01024.json.gz": {"num_bytes": 317417235, "checksum": "c5a7222b2eb8e8fe690f29a0fff7e214ba94e4d9dae62f67281fe25dd385b721"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00415-of-01024.json.gz": {"num_bytes": 319690993, "checksum": "37052fff729bdff124577d5ba041906b2ea7420c5cb28195e6cfca0e41d560c8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00416-of-01024.json.gz": {"num_bytes": 319466518, "checksum": "6e8ce2b9e6e8208ad7e43ce709454cb0b96572d793e0b11c15892f5df18f6137"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00417-of-01024.json.gz": {"num_bytes": 319694381, "checksum": "20892d7a33c31d7967ae0cf595a2108de96a61c0bbd773aebc5d3d083f6ed93b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00418-of-01024.json.gz": {"num_bytes": 319048918, "checksum": "fd795ae8d53e632bb3e89a2becc5b801e10db781b14f2c0ed50b12def5376c8e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00419-of-01024.json.gz": {"num_bytes": 319791424, "checksum": "5a8e56faaa0892249e5694ae01e2e4dcd22d9750a9aeea5ca390117c77b8de2d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00420-of-01024.json.gz": {"num_bytes": 318060925, "checksum": "795ee64f4c9e2e35d9dc0c91ea593c9e41a3924162901fbf782dc7112f8094a8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00421-of-01024.json.gz": {"num_bytes": 319328927, "checksum": "2670b7b6b53e9082c90e4a4e915f72673831ff15e9f55918a1244e0c19c8f963"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00422-of-01024.json.gz": {"num_bytes": 320065363, "checksum": "34df2d1afac2ae4699524492d6b93e4a2a1e551cb4a4ae35fc19353930afab8b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00423-of-01024.json.gz": {"num_bytes": 319349887, "checksum": "a2b19afafb45cf30493ac2a3eb013e136e7213f63bd633374ca0d9fe2780efe9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00424-of-01024.json.gz": {"num_bytes": 317515288, "checksum": "ec2a84fb16dd16f9547f0c3314a91968324f2c537118ca36e982b235e23527ee"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00425-of-01024.json.gz": {"num_bytes": 319092219, "checksum": "1ac0b93c0faae7d446add3af3173637a4b0d638dbd5285b0f4e1bf3abd0d1542"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00426-of-01024.json.gz": {"num_bytes": 318421245, "checksum": "bade501dc71c0b4968a9a7c833751cee5d8f7067a45dabd53aa03534df48886e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00427-of-01024.json.gz": {"num_bytes": 317847935, "checksum": "7aef554aa2b120c4d787395e28aceba743e309f2540fab283e077a1429a2f7ef"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00428-of-01024.json.gz": {"num_bytes": 318822008, "checksum": "cd94547fe1953a1cc074d97558a70d1e55834606379a8f5e6e60e1b15b56fd35"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00429-of-01024.json.gz": {"num_bytes": 318507684, "checksum": "4d3c9245565a808058293558603c657d6e9a0c87b6d2d4b871b856cea2eb3a19"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00430-of-01024.json.gz": {"num_bytes": 319042136, "checksum": "9c5a4fe50db5d0822923fe29a5aa8ca6cb09e3629472b1bf61f670388b6c2076"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00431-of-01024.json.gz": {"num_bytes": 318925124, "checksum": "8f18b35bb952da090ade742753e30861ba39c6c54c8ff2d76b358ca7be475ed6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00432-of-01024.json.gz": {"num_bytes": 318680251, "checksum": "7968c370d0efa4601ab8b5ee68e480b211fb969593608bf7e00a0153f00f99b3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00433-of-01024.json.gz": {"num_bytes": 317822797, "checksum": "f62d7e74434d52c36b22f6a8cd56ed3937ed6aa03f140d0fbdf5e360632d51fe"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00434-of-01024.json.gz": {"num_bytes": 320094364, "checksum": "55d7678c7e197e165b4e09bf3f8ac159853120acbe5801ed6ab3ab0f801c11bb"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00435-of-01024.json.gz": {"num_bytes": 319008936, "checksum": "09b451c8ee06bc06507b3e75a60c544a6b70f27e3d07daa29c59803f785faaf5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00436-of-01024.json.gz": {"num_bytes": 319023456, "checksum": "6fbcb93f9dfe65e12b7efeecc8af7823471787438b1ce90e5f48b68b2dcb1d14"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00437-of-01024.json.gz": {"num_bytes": 319484997, "checksum": "9e70c8c1ccbfe93ec9296811ae496a518dcafbf38c81b7972f885e297da9e726"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00438-of-01024.json.gz": {"num_bytes": 320319141, "checksum": "eaab759d8c603e8a2ad3ebacd99e30338fb904ba307aeaba0d2e0e63679cfadc"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00439-of-01024.json.gz": {"num_bytes": 318410397, "checksum": "7a03a92bf97b6750941c1070f933c68f1b2a3e13fb68b3a21a4726676ea75d34"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00440-of-01024.json.gz": {"num_bytes": 319447470, "checksum": "bc899e436da7b3bf13c1bfa2fd2bbf9d90b42a0c00f2971259a14d858ca3e5ef"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00441-of-01024.json.gz": {"num_bytes": 317582955, "checksum": "4d777860c2750e43038ef709d77bdc403b3b3bcf0f08e3c4562952c9ac70b113"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00442-of-01024.json.gz": {"num_bytes": 319592118, "checksum": "d9e5dc244bb6f0b629b2a929aedf506dadaf5eacc80f0997816b95279552fe8d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00443-of-01024.json.gz": {"num_bytes": 318104403, "checksum": "56133bbd7cf96dbe87d48898b886a024af69ca405d7cea1799bbd30f185e9c1f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00444-of-01024.json.gz": {"num_bytes": 318547808, "checksum": "8be0270c3cc96dd7f7b3aad08bde81ea245feff4a09923277fb0d38a7c095604"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00445-of-01024.json.gz": {"num_bytes": 320463920, "checksum": "e02316fcd355914e4d08ecf37036d4727ae9ebe45bdc5c98279aa3437c2c1eb0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00446-of-01024.json.gz": {"num_bytes": 319583221, "checksum": "80c9b8c47665b2cef6c291b0eefdac5b14be1d7cd4a4c06c2e14cf48b42da92d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00447-of-01024.json.gz": {"num_bytes": 319546881, "checksum": "a18d5aaca1717ec33fb1822a633268003bf88093dd7b48db080503c3d01b6ffb"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00448-of-01024.json.gz": {"num_bytes": 320234711, "checksum": "c41595d2b9cbf0e23fd65df1cb51499ee262d345d79d2625388cf149c3c39f8c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00449-of-01024.json.gz": {"num_bytes": 320043698, "checksum": "3bef99334be9d39f41296f8f134c88f04fe66502da2d2639f0d6d2485338e607"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00450-of-01024.json.gz": {"num_bytes": 318033740, "checksum": "9cd05b1b70ffc3c004b4b4a2f21f91abee1395f3a485efd1aafda550193df9fc"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00451-of-01024.json.gz": {"num_bytes": 318549622, "checksum": "b2ef6cc4ac7c4c69fb1661d7ed9b2ce4da261c72f9e49dc3c934180501ef3a24"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00452-of-01024.json.gz": {"num_bytes": 319317230, "checksum": "89927f1fd79a5b1439988fd37e0377175176d9ed22d14611f67a81e185a336b3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00453-of-01024.json.gz": {"num_bytes": 318952561, "checksum": "427f55bbcfb6c1a0ef12f96cb122f362b975169770ce1d392b763c4b4408cb34"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00454-of-01024.json.gz": {"num_bytes": 317545286, "checksum": "2fc3b172ea721bc92b0f7614e8fea61b0781e6f4f3e6b7263cf0190beef3ec52"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00455-of-01024.json.gz": {"num_bytes": 318975631, "checksum": "c96f688ecb19bdb1592b0124021fb80d48965303442de76751d82fa03ab8f6d5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00456-of-01024.json.gz": {"num_bytes": 320016575, "checksum": "61d2be7a4b9e34cfb994ae2c120ed5a51a6669564046637445a46b9872812416"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00457-of-01024.json.gz": {"num_bytes": 318236935, "checksum": "a74dd51c3c490458ea0e61196d7e0085aff80d50cd149a673f54f661b364a671"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00458-of-01024.json.gz": {"num_bytes": 318495925, "checksum": "adf9cd717f2c79504dace22b5929d4c4064353e869457c20cc81a0b2db390c89"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00459-of-01024.json.gz": {"num_bytes": 318956821, "checksum": "d7be5bcb738a75586125e56a25aa234618528accda620eaac421beab6288b992"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00460-of-01024.json.gz": {"num_bytes": 318968681, "checksum": "6181280df5418fd9ebb52aa26a631100b6c3da0750dc5fbae152a6a44fccb942"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00461-of-01024.json.gz": {"num_bytes": 320810761, "checksum": "5e943c458674371dffb2466274b8f2a9df9902a370901ef97992bdf920cdae0a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00462-of-01024.json.gz": {"num_bytes": 320154899, "checksum": "76b3d1b120cbb7cd71d004440e0c6bd9f9c4395424c568e8362973038017a90c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00463-of-01024.json.gz": {"num_bytes": 319247449, "checksum": "9de2c86d85289113b24c2f7eb4771ec1391511930f5f26a12133d41faf0ce908"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00464-of-01024.json.gz": {"num_bytes": 318150152, "checksum": "85fce3104ef0b247798c1de8d9d616d3de754841fb6c49a01cca5b9da5efa94e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00465-of-01024.json.gz": {"num_bytes": 320342803, "checksum": "ddf312f0b8de8f53ed556483fd998ae308d4829d18195a48869db6bf1866c332"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00466-of-01024.json.gz": {"num_bytes": 318619029, "checksum": "01239a1ff6ffe9032da320c5a7d1a93125d0724851e3e10746821c9452070887"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00467-of-01024.json.gz": {"num_bytes": 317677227, "checksum": "41783d20189a4bcfc33f543597a5473900e692ea13fa522f2724e27e810b4e9c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00468-of-01024.json.gz": {"num_bytes": 320038217, "checksum": "7131b6f4dd423f2efe55c3f598893676300b31651cce7eed32ce633a015f8ca8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00469-of-01024.json.gz": {"num_bytes": 318359701, "checksum": "925bc76c045f25532414f29820adb0cf1a56c54b406333a6f348c29e5efda9fe"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00470-of-01024.json.gz": {"num_bytes": 319329235, "checksum": "9be740483aa7bbaf94dce550f2c20404c89326f6ec4ebe1b7070f85f93507038"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00471-of-01024.json.gz": {"num_bytes": 318792779, "checksum": "0e3d9492f15dc9867bb0dc803bdf45608fbe67255014b4488902d7bf2e2554cc"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00472-of-01024.json.gz": {"num_bytes": 319552622, "checksum": "00484bbc10bace3dfd93b57fc53d6f5fac26b7dd54fd5b5428d75eb9e6dbb0e2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00473-of-01024.json.gz": {"num_bytes": 319466828, "checksum": "5db5d585798e8ed8e4a3bc540871f1185f67125f397a12942d21b24e6b374519"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00474-of-01024.json.gz": {"num_bytes": 320014669, "checksum": "db07fd0e972c1a474806c1b4464ad4cefdd2e8fc15806ba0d259d4f9e594c3f1"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00475-of-01024.json.gz": {"num_bytes": 320379280, "checksum": "e6e36a9eed8be84c928980fffd8177b177182726c9e13b41a47343d431f76a7b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00476-of-01024.json.gz": {"num_bytes": 318820301, "checksum": "0543ed2d0b3aaba0b0fccbf0311836143bd19175c5eed9bf0f024ffb9ce3c50a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00477-of-01024.json.gz": {"num_bytes": 320577830, "checksum": "a62fd62ad771dbcfb7af73841e15a49e9d7239c53dbbbd84de2282131bca9c99"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00478-of-01024.json.gz": {"num_bytes": 319593908, "checksum": "beae9334a8e93e4b036c4a9b3c5b3a75fff17264177184d243d9e6da286dbe2b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00479-of-01024.json.gz": {"num_bytes": 319728825, "checksum": "ae5b475c7be35d98b77d6c4aed5d61cbd1c98544c9a6e73a53ef2911757ab7f0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00480-of-01024.json.gz": {"num_bytes": 319903674, "checksum": "51e0611378455d909e8b0f292eb62038848aa7afaa4f93c9c83061258b211a95"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00481-of-01024.json.gz": {"num_bytes": 319998409, "checksum": "68c640304ac952f544ea88c88d7c994c8d2955b95036f8352a67b57a836fa1bf"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00482-of-01024.json.gz": {"num_bytes": 319047238, "checksum": "74cefa57158d0008a06ae85b2a7a1c04d57a79b7ae3f7b4b3426dbe9918b36ca"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00483-of-01024.json.gz": {"num_bytes": 318775875, "checksum": "e99faa71222017521f1fc9999bbb0832df5c91f8b9f6e2ef501d3f827d3a1e85"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00484-of-01024.json.gz": {"num_bytes": 319190491, "checksum": "4518faae7c9d51a51f0b02cd895cf27e7c87a623b787346c844a8d9f0b52d6ce"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00485-of-01024.json.gz": {"num_bytes": 318974502, "checksum": "1bc8b207583b9f36169e0e9facd258de8eb73dee8bf831051dd1ab04b7726c6f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00486-of-01024.json.gz": {"num_bytes": 318599424, "checksum": "0b1d9900e1921483b85305491f914b6b78fabcd0686a20695e61b89b7380a894"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00487-of-01024.json.gz": {"num_bytes": 318958015, "checksum": "c0c789c5f3b34d170d2aeb72642c70d2fa5eca567e7850d0c89b3d170f3bbf64"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00488-of-01024.json.gz": {"num_bytes": 320205671, "checksum": "6eef7a1ea80be43e84cb0c974215a477c909844899ac694afe1af2e8f4ac171c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00489-of-01024.json.gz": {"num_bytes": 319193967, "checksum": "eccf5d7f682a76e11332f07e7d54a080f76c0be58a98a853a9fe90c815a22087"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00490-of-01024.json.gz": {"num_bytes": 319833603, "checksum": "afe99e32ba36134f23b59a2ee43965bf185432de947740fc19e26eef41027aef"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00491-of-01024.json.gz": {"num_bytes": 318912982, "checksum": "e981151b23b233bd3e5798f78658b5f52a73f69db39c30615f615069cf0c4984"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00492-of-01024.json.gz": {"num_bytes": 320057824, "checksum": "0cc5f7df318e0718fef93d24e7ff904b3e8e2728c4fc0b1d13893c81d8e6e2c7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00493-of-01024.json.gz": {"num_bytes": 317967559, "checksum": "93749543b04a5a7093177d2a03acfc0bf6f26d5b53864ae35839a9421fb48169"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00494-of-01024.json.gz": {"num_bytes": 320426917, "checksum": "e461f56b461a4d5ce353c60889dcb99e10818985d3788440c6119bb145876277"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00495-of-01024.json.gz": {"num_bytes": 319528392, "checksum": "e530f3030ddbf7191bc4082e8209f63eb48733d7085d79a8469ce3611ccb79b9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00496-of-01024.json.gz": {"num_bytes": 317570766, "checksum": "ddec34b528bd5314019d12089e600df27e781d78f43b6722b9c0202ccf385755"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00497-of-01024.json.gz": {"num_bytes": 319154838, "checksum": "e7438a08000fc7a158f887755cc496edcf51c8bdf2bc4a888ddd2c829bf8fa3b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00498-of-01024.json.gz": {"num_bytes": 317955368, "checksum": "ad133d808ca5b6181bae1921ab1261d79630c09bf9d6c904db036f22e6f32e6c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00499-of-01024.json.gz": {"num_bytes": 318286671, "checksum": "cb40879ea08db5a9eb6f2c23756574bda34deb9acf039b992f0ab90fdbb01594"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00500-of-01024.json.gz": {"num_bytes": 318510936, "checksum": "21e5f7468a907f38c3dc0a5c19f09921476f9186beff967e829329f191dad6b0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00501-of-01024.json.gz": {"num_bytes": 319611074, "checksum": "38829434c8539bb9fa9ea32bfba3c6732c5021ffb60c16fc502fe61de83906ce"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00502-of-01024.json.gz": {"num_bytes": 318630954, "checksum": "22d1ca1edae179d2587495fcdf1d3e515c6f547cebafc54996c93a121731fd8d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00503-of-01024.json.gz": {"num_bytes": 318253198, "checksum": "e95689993390086880e630ec4540e0629551076c0cad2c70f5aedd3aebfec181"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00504-of-01024.json.gz": {"num_bytes": 319497151, "checksum": "0cd7b986d247e010fd76fa2ab2b62d5f9eec292b28c1e7bd3e4c577042b598af"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00505-of-01024.json.gz": {"num_bytes": 317498965, "checksum": "f1504912fc53cc3690e26ec3babf736ddbeb8f7d9196dac83f757699310b30ad"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00506-of-01024.json.gz": {"num_bytes": 319684193, "checksum": "9f6defbac132e097cbf7cb7d181cb154bace6af48964fe09d111bc610fdcd2bc"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00507-of-01024.json.gz": {"num_bytes": 318394726, "checksum": "a58f39d0bef19abefc089342d8bb6d75dbb2c663f67127673ec395404bcf15ae"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00508-of-01024.json.gz": {"num_bytes": 319013108, "checksum": "176443b39840826bfb1db2cef2541449a6fd0c465ff9bbf0cb2479f07fb8baa8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00509-of-01024.json.gz": {"num_bytes": 319832758, "checksum": "cce5a142cd7a121eba8c182d499442f4b0a397ea1484c33ccd79b1acbae832fb"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00510-of-01024.json.gz": {"num_bytes": 318762241, "checksum": "bfc910625f0fd6074955906bb86e789b0d0adcd1f8956cb8da276933dceac256"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00511-of-01024.json.gz": {"num_bytes": 319240643, "checksum": "ce53021b90d1c86e2d46293e7053aa174387d7408bf0cf907898be69b1a7befc"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00512-of-01024.json.gz": {"num_bytes": 318353376, "checksum": "e9333c6f73c30c9cb7f31794025eb9129455fac2edd64f8b3f22f879124c6a85"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00513-of-01024.json.gz": {"num_bytes": 317653011, "checksum": "d9450c6f541e82922b37d3b7cc25611707b44884f27825db4dbd65466b59e8b5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00514-of-01024.json.gz": {"num_bytes": 319391160, "checksum": "20b77f5fc2a939fc291f901e8774acfbf04ffaacb08192b724673eadc9f83c12"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00515-of-01024.json.gz": {"num_bytes": 317994258, "checksum": "32ca1f60d0deb395538a93ce5044a48fde05864f2c26af42dc53405b6dc05031"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00516-of-01024.json.gz": {"num_bytes": 318786801, "checksum": "eba4f34749eef4da2b0729abbdfa2ada77bd65383c01213d4f86625670430a65"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00517-of-01024.json.gz": {"num_bytes": 320010732, "checksum": "617765f971b879182db7debf879025f8dad4fd8846b11728ee1230767c031c04"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00518-of-01024.json.gz": {"num_bytes": 318681019, "checksum": "6987893764c56b84fca014532824a05d4187db5c313be4f7bdcb363b7e8cc8db"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00519-of-01024.json.gz": {"num_bytes": 319951543, "checksum": "ba151c4734db52e7c220dbefe380825ac6d66a9c6abb901b8096a87d97a2deb5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00520-of-01024.json.gz": {"num_bytes": 317948056, "checksum": "7e53ed26c3c068b0dedd026219b7cdab79775545ebbf31b5dadadb45364c9985"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00521-of-01024.json.gz": {"num_bytes": 317993802, "checksum": "4d1d4a5583430e373bd2cfd191e59cd8911953fbd73fa924e0c15be76499b54b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00522-of-01024.json.gz": {"num_bytes": 320189449, "checksum": "71d851498785e312acf93861a43169794d4d576f5fe8b960303419316c8c898a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00523-of-01024.json.gz": {"num_bytes": 320443871, "checksum": "587867d619115c2accb69322b197239b79f12de41ae80427fd369813ad8d81af"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00524-of-01024.json.gz": {"num_bytes": 318192840, "checksum": "7324c02db00b06d0f41d6e5ebfa4e4dd6554f5f4849d6de187ebb84162d0446d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00525-of-01024.json.gz": {"num_bytes": 319294602, "checksum": "24ae3495e5b59883967c62b8fb3a4fa7525d33c40957fd5fa3be413d66c24eb5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00526-of-01024.json.gz": {"num_bytes": 319783465, "checksum": "27cd95e7bc6a3f156f1f8f26dc5e490818fc4810562e3964a19fad401cceacd2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00527-of-01024.json.gz": {"num_bytes": 317240081, "checksum": "6b84920fe7e28c01a03800512915c7a9e47816267ac652f9ee0314e3428bca72"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00528-of-01024.json.gz": {"num_bytes": 318320694, "checksum": "fec06589f714ffe1343cb6781898e29e5d0cb789deba3aa4a4ccf86514d3f690"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00529-of-01024.json.gz": {"num_bytes": 318391515, "checksum": "a98c34c04c1b6f0ca3acc9e10fdf4bd0ead2ea7271832ce4972df8677590918b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00530-of-01024.json.gz": {"num_bytes": 318473966, "checksum": "1677d541c7bc10971c711f1eb030faa2e85e0967112ba57d7f04712908e4f040"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00531-of-01024.json.gz": {"num_bytes": 319463272, "checksum": "92b5d82a058554d3396a2b54504f45fa88581cb2951140c0f0bde67ed11bed0c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00532-of-01024.json.gz": {"num_bytes": 318228175, "checksum": "291bb3d7613f7f00b6910a0de78dbab0d87602243c9c83014de341c131200853"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00533-of-01024.json.gz": {"num_bytes": 318966937, "checksum": "a0ce39eac6d6ecad3478373c264e88b2ea20b77fb2049537c229ad3da2769c85"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00534-of-01024.json.gz": {"num_bytes": 318968162, "checksum": "387db79d4aacf8fa4c512fb78023ff94a43d5d597d5a8c2ec6198e62e4b8c98b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00535-of-01024.json.gz": {"num_bytes": 319253588, "checksum": "3ff8f4a926fdfb6201a94d75c17ec5afe662a339a65019eb5e1193c1238bd388"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00536-of-01024.json.gz": {"num_bytes": 319662526, "checksum": "0c805e83d8cfd979701df5714713d062e14853d7e2b0f77c0b414a626686cd33"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00537-of-01024.json.gz": {"num_bytes": 319177095, "checksum": "f9a0ac216e316075e5c2219449a954f989eb160ead2ca07ac9f3813274e18f2e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00538-of-01024.json.gz": {"num_bytes": 320109104, "checksum": "a425ef4dddefb40bac5a8cd3191161a41737aea5088a614410d10d83bbab5e37"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00539-of-01024.json.gz": {"num_bytes": 320600564, "checksum": "3580ea8da9c4aff1296e89136c5d7f1a37d021e0b10f3ebd1e05612c092faebb"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00540-of-01024.json.gz": {"num_bytes": 319993281, "checksum": "ad8dc83bfbe7c8976f08708c5f0229cd4e1a2d80e272b225a8d208133b129dfc"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00541-of-01024.json.gz": {"num_bytes": 318256020, "checksum": "c7452669237323fdd09ce97624791a0261f3ec07d8a5f98e71a4b1252a2805e1"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00542-of-01024.json.gz": {"num_bytes": 318843744, "checksum": "1e5a11c25f82ce717302dbcd9acc1f8b916d83eca88d345d8434b1f88768137b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00543-of-01024.json.gz": {"num_bytes": 320482002, "checksum": "bbf96edf50c913d5162ee154423242e7c8faf490ba229f325bac98a5e3eb9477"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00544-of-01024.json.gz": {"num_bytes": 319059260, "checksum": "22c04506b5744df8c71727fc6527fa2bc495a10a237c71762c66d09625d34097"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00545-of-01024.json.gz": {"num_bytes": 317874034, "checksum": "84a78bb62eb6f72de7a75325870d9ecd419f77c4f6728d29609b2f7ab1b8bcf7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00546-of-01024.json.gz": {"num_bytes": 319891407, "checksum": "28631c527dc398c9626fc60b39ad94ed880b41c71f55b9c7c670f6a1837f98d8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00547-of-01024.json.gz": {"num_bytes": 319361268, "checksum": "273b8598405def0165ceaf9723d1425c9b74368fc22a414616c7ac9327930225"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00548-of-01024.json.gz": {"num_bytes": 318360761, "checksum": "59990568c0ea055fab27f2b9cd028e1c7177df0479712d1e2d8372e9b017ccad"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00549-of-01024.json.gz": {"num_bytes": 317320452, "checksum": "fd1e361f28cf099df6088e26d06d79f7f62bd8bd89b4524b9baa80ea49a1a4a6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00550-of-01024.json.gz": {"num_bytes": 319017444, "checksum": "4424833afcb143f6fdbfc2f5fa2508d6226a4a1df391969b2a751d2d0070158d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00551-of-01024.json.gz": {"num_bytes": 319118159, "checksum": "77b78f94a8bc8f905cf8b1997df1fc3b8c6d77ce65fc28bef68c6083275a832b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00552-of-01024.json.gz": {"num_bytes": 320058125, "checksum": "e7b71167c4ad947232b6acba26e4d3cc9214c25b50b853b5745333bba942f50f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00553-of-01024.json.gz": {"num_bytes": 319220671, "checksum": "ce7891f3820ce065e3bd7afa006e90889428c80bd8e771d66fbbf023bb2a9eba"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00554-of-01024.json.gz": {"num_bytes": 318858928, "checksum": "015a707235f46f179a08d3f6674b6d368dc9612841e2bf39f700f11fef8e64c7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00555-of-01024.json.gz": {"num_bytes": 320490725, "checksum": "041dd2e902ed04dfa143476da03d5fd00c30ce1259c0658150af5b77a5a092c0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00556-of-01024.json.gz": {"num_bytes": 319863694, "checksum": "22e3d9e4dbdf2b1b822a7bc8c889f4747aa16c71f4c91436d028a228bffe4b87"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00557-of-01024.json.gz": {"num_bytes": 318940362, "checksum": "4cb8b113ad9687b7dee590242c5f50fb3ea3a8775c67492a8ce0cb5c15fc26d7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00558-of-01024.json.gz": {"num_bytes": 319797786, "checksum": "ad157a34c6a8d496859f55b00c79fcedf7305d8502ca86a511026f39cdcaca59"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00559-of-01024.json.gz": {"num_bytes": 320156705, "checksum": "816d84753b71fae446428587f41de5b3490e88321f1fa0cfa2ef1fd5eef851e5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00560-of-01024.json.gz": {"num_bytes": 318346216, "checksum": "0b1b3d26316f2c0e973ff19820793bcfffa957c3869f74f62fb40cb6839227e4"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00561-of-01024.json.gz": {"num_bytes": 319571572, "checksum": "4f92594382c897bf94211f1446dbb38c2cc1fff3647acba731dfe0ad89ba4061"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00562-of-01024.json.gz": {"num_bytes": 319453711, "checksum": "2a6ba0c64806add776081f417c8d1afdb324dd8b9aebb603372afd7fc2c4cd6e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00563-of-01024.json.gz": {"num_bytes": 318990092, "checksum": "e3032365b9b86883c24bfe387d810c2d9fd1d0a55ff88acd1f5b5357246b13ba"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00564-of-01024.json.gz": {"num_bytes": 319491917, "checksum": "da6196ab8650fc9f8fa391b821ff070070946412277bd423c40d9fa1de325f93"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00565-of-01024.json.gz": {"num_bytes": 318756269, "checksum": "edeb5b13aa0d65354d78a5ca5d1698732e95f1fcba249c42825a0351d4a34f79"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00566-of-01024.json.gz": {"num_bytes": 318461036, "checksum": "f179addbca50d8612612b0e09138d7ecc89ba7ef2d6e857d7ef0b10223dc71d4"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00567-of-01024.json.gz": {"num_bytes": 319625728, "checksum": "eaa1d0ee28eb17c6ebe3d85c8af8b7adac28a720b2975f86ac83f3f4d2bffbcd"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00568-of-01024.json.gz": {"num_bytes": 318428567, "checksum": "3677e88545f2d76b601995cc3e2b6b12fcf65e350ed7eb4137ab4beef3d475c4"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00569-of-01024.json.gz": {"num_bytes": 320114923, "checksum": "2d8810d8bcfc0fc19d82313be6516b2fef4cf68f56b0448af48b512c98e1ae8c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00570-of-01024.json.gz": {"num_bytes": 319148416, "checksum": "8e5356dc0fa2b4e5fa16b36a1586f16920306af1227c765e5d2f0818e74d30d2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00571-of-01024.json.gz": {"num_bytes": 318223973, "checksum": "c87cf8b88e8e4fc0a664f4b3a381b78b317680253a83a672cb86e02adb43f2aa"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00572-of-01024.json.gz": {"num_bytes": 318322508, "checksum": "2bdc857dfeab99c8f83f0267ed5ed7529bca8ee086fce268534bc0264ff738f6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00573-of-01024.json.gz": {"num_bytes": 319203246, "checksum": "564fc77dec25ce0d47f4e3d8d04bf114dc06119b28b3ab00d6092a799d496e51"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00574-of-01024.json.gz": {"num_bytes": 318397937, "checksum": "dc3f206e1b5da963184da72e47959844bb164335c76e3261f3a189a4b7b022cb"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00575-of-01024.json.gz": {"num_bytes": 319183651, "checksum": "7f0c46955e37d5d52b305f71b4ce4fca5368d72e8698e8b832ac0177f868e145"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00576-of-01024.json.gz": {"num_bytes": 318690625, "checksum": "b37d0fbd439bdc05021a71c192ce5e61ebce27448a17819bb53156d9d5f27e17"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00577-of-01024.json.gz": {"num_bytes": 317926085, "checksum": "3092d1ad70fb2d262ecb33f3fb6ea554af3ddd26498ba42b644c383f6d4bd1a4"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00578-of-01024.json.gz": {"num_bytes": 319190472, "checksum": "d9833fd591a618a167b31b7aaca420f3e719ded98987dbc0f46fd4bfd12564c5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00579-of-01024.json.gz": {"num_bytes": 318958744, "checksum": "a11217af10c85ad828de38847eeddcde6af6899563585d581c20adaed3c9e7dd"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00580-of-01024.json.gz": {"num_bytes": 319893900, "checksum": "71e8be705bfa8563e33392d1c14decd84f52d6a0139b98344f1a0ed9bdc94198"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00581-of-01024.json.gz": {"num_bytes": 320109861, "checksum": "c5f13ba973803ef069762d22bc37ee02a4348af379c75848d93b2685fc4280cf"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00582-of-01024.json.gz": {"num_bytes": 319238177, "checksum": "da815527ca68b5c2ed604d00ccbcc7c631c60f33e3132f79212634a82c266844"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00583-of-01024.json.gz": {"num_bytes": 319375634, "checksum": "a332b791df0801f0b7227117f0ea3971563e8e420ae24dd94b38d532c1ab0573"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00584-of-01024.json.gz": {"num_bytes": 318596018, "checksum": "e6496d31f42921eaf9f85047e7c2eeb5fef46e01e99760fa676da96481d7d5bd"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00585-of-01024.json.gz": {"num_bytes": 320156294, "checksum": "08b978ec05d65edd22c301ddc6ab44174eeb7bef5c5997a84342b6faaa47a79b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00586-of-01024.json.gz": {"num_bytes": 318716838, "checksum": "567ce600ad99e543507fdf27b9009fe1782bc867f44f3dabbeb93fab1208f337"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00587-of-01024.json.gz": {"num_bytes": 320247814, "checksum": "8f5c82f5eaac4a315d8615c9700cd81f3b9c2e1a17376d3b2482f8694dfe2492"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00588-of-01024.json.gz": {"num_bytes": 319546079, "checksum": "bae91422f87091b3974ca92781a14fae8f10c5c41de9c9132f745b3dcb8bc468"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00589-of-01024.json.gz": {"num_bytes": 319771959, "checksum": "babb615d77f80e5ef99aeed3889a26cef5c9918a7fe68b70a503815e69b0b189"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00590-of-01024.json.gz": {"num_bytes": 318926571, "checksum": "61f2ed732f3b2b5e24882f47b4eb84fea28bf89d112f6f173cbb50523a43c4b8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00591-of-01024.json.gz": {"num_bytes": 319669791, "checksum": "3aa2e792ec775a52ee78447b81204867e58b0a46727bab4b7974977aaec2889d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00592-of-01024.json.gz": {"num_bytes": 320393142, "checksum": "1419c263fb74409cb0e39ebd87b1c020ee6863a3a6f2f427be27d3c76b84043a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00593-of-01024.json.gz": {"num_bytes": 320977171, "checksum": "4f16f33217c35a2b155d5b6fe8014c2e52014e63c419e7d3aaf71a35246c1323"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00594-of-01024.json.gz": {"num_bytes": 318211092, "checksum": "c9301ddcafea22d085ae48f551f486e73089a76c7990871f787064c61e4e60b4"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00595-of-01024.json.gz": {"num_bytes": 318978629, "checksum": "349e104763320eaae96ac3bc53c5fa7a73e7dec93b8cc3afaad108a97e7c170d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00596-of-01024.json.gz": {"num_bytes": 318573003, "checksum": "0eb6c25cf57764ec3aa7f74d6d967c52003f872f2f3b140fe6d5ac6360241a8a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00597-of-01024.json.gz": {"num_bytes": 318931514, "checksum": "b42b7b984aad729185ca9b3a6ffa856b2a79165ce2feebe519b10f8ff42c4ab9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00598-of-01024.json.gz": {"num_bytes": 319002677, "checksum": "8306c5971408767b3735288fd0ee7ee7d01d9af4ef4cbec2e57c97b1f78e6d63"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00599-of-01024.json.gz": {"num_bytes": 319637870, "checksum": "844df34f2a263011f9d1d85eaad5a1d95243769e9cec5a104807dd55e1fe431c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00600-of-01024.json.gz": {"num_bytes": 318099852, "checksum": "b05e66568a4472feee31f20918e9813aeae2d881f47b5281ff29fbcfedf4d5b2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00601-of-01024.json.gz": {"num_bytes": 319136069, "checksum": "8dff2d56c9915d73e6154533e5de0ca9d867c5fdedcfeceb3e0ab22f3ba509cb"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00602-of-01024.json.gz": {"num_bytes": 319369121, "checksum": "45b2c1757260395afeb168b545892b315fa0bf14b3d144bfcab1fdaa6d79086f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00603-of-01024.json.gz": {"num_bytes": 319499076, "checksum": "46edc9f556ccae692900b222b8e4843360dd5dbe0798a8ad9cb51c07a451dbb2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00604-of-01024.json.gz": {"num_bytes": 319132921, "checksum": "0cba8c8738ea7ff9a08bd1bab215010b03c6c83fe35206d83344d78005bdee6b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00605-of-01024.json.gz": {"num_bytes": 319315562, "checksum": "0dc0d37658fd672c8d72775bd8855dce9037cf9715feda35a76afb1f0e87bebb"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00606-of-01024.json.gz": {"num_bytes": 319223528, "checksum": "f679e437a3acda1a81013dc0f3fa93fde6c3309905e8142f8699a76bc04b7114"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00607-of-01024.json.gz": {"num_bytes": 319326218, "checksum": "7fe91f86f751b9aa3abf1c5ed0fdab89a76c7fa4eb7ab8b809ef29b0cf4a78d9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00608-of-01024.json.gz": {"num_bytes": 319393715, "checksum": "a5daf706100eb797b5b0770fe0c790856637b22dc849aeda5b445ae5fa63cb3b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00609-of-01024.json.gz": {"num_bytes": 319554192, "checksum": "4434338fe97d398d9565ae940c62539e868fa261be361ede1b5b0feb004160f8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00610-of-01024.json.gz": {"num_bytes": 319786301, "checksum": "6b0d0e0457a721af6c67a31f5016432011e717302cfdc7ee39feb253fbae4754"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00611-of-01024.json.gz": {"num_bytes": 319356910, "checksum": "bfe201b1775270afef3a09fcfc074920cbb01093eef90d46f26b6b813d603994"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00612-of-01024.json.gz": {"num_bytes": 318780229, "checksum": "29248c4732fdfda2ba97ed38192ab391457e20fd70f713ef4a7cf084f9865846"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00613-of-01024.json.gz": {"num_bytes": 320190496, "checksum": "f5cb9be2442797d967b9041e48771196a6c0595933ef2102840b704e355f4d62"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00614-of-01024.json.gz": {"num_bytes": 320245862, "checksum": "89b74d0daea02fb69289ad259bbd0ddb1a64c5d6380848f7d51669be952f8a0b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00615-of-01024.json.gz": {"num_bytes": 316874605, "checksum": "78600c8703d5ebf80c99c089bb7a7c1cde843a66d706fd219eeac304f80e8525"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00616-of-01024.json.gz": {"num_bytes": 320237707, "checksum": "630ee29d4dc4cd5062eeca7877e5c1b204b36eb0b3aeacadf036cdb75c1ce840"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00617-of-01024.json.gz": {"num_bytes": 319739365, "checksum": "d418fd284d06b1d2d9daebea3047ed06286640ac75d23893f1effc2ee9d7aa14"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00618-of-01024.json.gz": {"num_bytes": 318634299, "checksum": "f5d75d129ab6c0f052028cf0139c3cf20eed3a9c5cdb151cd88ae42d5d1a32d2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00619-of-01024.json.gz": {"num_bytes": 319086471, "checksum": "c558908f6e08b0d02f377c9aed1655d80106f4cfe26e955774bb420d19b2f74f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00620-of-01024.json.gz": {"num_bytes": 320665446, "checksum": "977f959e5b5eaa24081ce025d137647fffd65f1a54d2c45db9805a232e0c0364"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00621-of-01024.json.gz": {"num_bytes": 318576410, "checksum": "d07f3c31d7ec1c71b5ab9539a2ed49f6d5f46b48ee2e51800b9e28cee588a163"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00622-of-01024.json.gz": {"num_bytes": 320053075, "checksum": "58b897603eb83f789a1cfc6bf40a091093cbd8a0c20702018c411adc7b07a437"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00623-of-01024.json.gz": {"num_bytes": 320045187, "checksum": "3665d7579b3c57eb21ec9e55850e39307cc6f4ef8aa8b9937076ad6f142063a3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00624-of-01024.json.gz": {"num_bytes": 320136842, "checksum": "35db069ae090e95c5a4d3db44eae73bcb29463c120584d7f6ccbe235983c5fef"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00625-of-01024.json.gz": {"num_bytes": 317314201, "checksum": "7f6ddbbc8815e8bd10c99361fd8113cbbd84ebd92799eb6958cf98af825d2aa3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00626-of-01024.json.gz": {"num_bytes": 320219970, "checksum": "4e2c46d1e3a94957717bbbf1e1e4300bd27ac17e588d426e0ba688983e83f4e6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00627-of-01024.json.gz": {"num_bytes": 320083102, "checksum": "851ce6dfa6a4d1a4e3b8bf439e36db9ceb59eefc60558d429e2fec80655e1775"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00628-of-01024.json.gz": {"num_bytes": 320386844, "checksum": "86d8927f16d0790a07d6c68e745501188d13887df4a137e937ae00497d07c055"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00629-of-01024.json.gz": {"num_bytes": 319476643, "checksum": "c48cff721137b641fe9d5bcf30462c7e4e3a3ae631b7b4e39979c8c77f0890ae"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00630-of-01024.json.gz": {"num_bytes": 317961579, "checksum": "cde626b34c6c8455227fbb18a577877b518f529b6c8e16881cfdf334f2875cd9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00631-of-01024.json.gz": {"num_bytes": 318952266, "checksum": "0401582821f7b15f0b406f7ce00c56351b8e86a3c3282bdf4dd45b2f6146ea22"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00632-of-01024.json.gz": {"num_bytes": 318261820, "checksum": "be48396ef18ce0f3650eca86eb36039f90b51737f9848086494f34fa28d60e70"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00633-of-01024.json.gz": {"num_bytes": 319748854, "checksum": "9d5c342d82fcace21de2900202c3f2af47229aeae9d487a8b77b7f5b86c05f74"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00634-of-01024.json.gz": {"num_bytes": 317806530, "checksum": "00a70705afb91f6570d17257057c15b45386597b917061686f131bd41ddce421"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00635-of-01024.json.gz": {"num_bytes": 320313573, "checksum": "22a1286582d65975ed94f0ba25bf87e94d52a55214d0a51979a3e0fd9f95e3cb"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00636-of-01024.json.gz": {"num_bytes": 318151690, "checksum": "026c699ac6fa30f9e156a957026d8fa8df72daee3407c8fdc5e0bd7d6a3b50fe"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00637-of-01024.json.gz": {"num_bytes": 318665365, "checksum": "9bd931dfc074bc99df31d7fd31a5ac1dc8c8bc75f8e87b763545cd824edcdcbe"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00638-of-01024.json.gz": {"num_bytes": 318521250, "checksum": "4b30ad531f7502ef7bc6398ab286e5c6c63d340c22792da9258ea95b496d1c0d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00639-of-01024.json.gz": {"num_bytes": 319997068, "checksum": "2bfdf36396e49ff625138d29925f54eb12b18d35f6d0bf5ca9e79194977cfb43"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00640-of-01024.json.gz": {"num_bytes": 319355927, "checksum": "d0d0ed7304b5d79318b5230a1ab48d3ed03183f1eb11d96070604a7008cd7b30"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00641-of-01024.json.gz": {"num_bytes": 319002081, "checksum": "1461ecb6b92819bfdc12808a5442d70f94538931f856c91dea602a23ba86ab98"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00642-of-01024.json.gz": {"num_bytes": 317689465, "checksum": "aa0af0169cf13db1f8133e8d76afeeae5f71d63d179794377a55b6c2eb938dc8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00643-of-01024.json.gz": {"num_bytes": 317523344, "checksum": "5c060166e776f8efda48882c118dc0fd5e058d9ef40be578bad31e477114a16e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00644-of-01024.json.gz": {"num_bytes": 318876813, "checksum": "ad98ee119742cb8a6efa1be46e9670969397c7bde10049886d7d6fceb82387ca"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00645-of-01024.json.gz": {"num_bytes": 319981258, "checksum": "8930ae8e14c124218793d2fd1bbfb1b624e918cb092b21c6ca74347abd9dea4c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00646-of-01024.json.gz": {"num_bytes": 319624889, "checksum": "a40705c4f9a4db4d2d698cf96e43b99fa0790b886506300eb4986a26de7063e2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00647-of-01024.json.gz": {"num_bytes": 319240920, "checksum": "7129182faeac82b47127458e92903a209acf8272166024e8313c167d6f358456"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00648-of-01024.json.gz": {"num_bytes": 317305623, "checksum": "3124091a6c438fecbfc948b1a35ffb1462287ae06866b02a6dbb1a6651ccf1e4"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00649-of-01024.json.gz": {"num_bytes": 318998755, "checksum": "fdb286cfe9e9091a57b31be61a56a425fae07d6b44f0b45f8743d7aab0e980dc"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00650-of-01024.json.gz": {"num_bytes": 319612451, "checksum": "ff88c4310f049344b8a3f701bce12d08ef5f9b037e82fef7f1f670b3d51e59c2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00651-of-01024.json.gz": {"num_bytes": 319098081, "checksum": "9c3b1843082aae39b057bbc7364e69cbc39bbdf91d5bff4f52b12cf1a264adf2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00652-of-01024.json.gz": {"num_bytes": 317107981, "checksum": "e6199d12a893ae5d05c5388ae7a679df419ef6a050c8e3ce3c15fe534943a774"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00653-of-01024.json.gz": {"num_bytes": 319623884, "checksum": "333ac93cf1f1f4da0f72c5e57b675052453b42dffe1e4d45ec680f4e3e075d97"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00654-of-01024.json.gz": {"num_bytes": 319055728, "checksum": "1efe352f2f2eba826231a5bff6c79390630b44039b226a5041a087e116b60f5e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00655-of-01024.json.gz": {"num_bytes": 318539829, "checksum": "613c741cfb738017b3fa233512296d9127d661738721d3fccd806aad54d19d84"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00656-of-01024.json.gz": {"num_bytes": 319970377, "checksum": "51fa9b217b6bcf664c472cc2b258813e1f1d7a0f501c29b822221bccafa4e201"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00657-of-01024.json.gz": {"num_bytes": 318548629, "checksum": "c542c6fd2f3284d64f8d53b71ab8308bbba59f7f13e9d9eb20bbbaf13ad4782b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00658-of-01024.json.gz": {"num_bytes": 319845984, "checksum": "b3d8fb6ed2258c463367108e2942742e88eac657c859cc8d128035110fc87e7e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00659-of-01024.json.gz": {"num_bytes": 318887872, "checksum": "02feb4e03020d767a4468251786d4857d5dc833969626bee616c7882bfda9ce5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00660-of-01024.json.gz": {"num_bytes": 319854892, "checksum": "a997d9187a185a29fb3bbeb1e696d32898efba8f5e9d6ed816493669f0c5ec02"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00661-of-01024.json.gz": {"num_bytes": 317599289, "checksum": "86d9189ebc534c99da5a4407624a623561b159f758fb04373a270887d0b45709"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00662-of-01024.json.gz": {"num_bytes": 318138720, "checksum": "9c626f7aebcc4fc9afd533b6c8a372d884d01f508ce49c01ddd830e4e9e8b2d0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00663-of-01024.json.gz": {"num_bytes": 318110835, "checksum": "441d4dd0d5d2ea7b6098a3fe006b9d7afd526188824a3325d44538fc5655942c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00664-of-01024.json.gz": {"num_bytes": 318996945, "checksum": "08ab0739c3565643b6a83d7091936f5d75a4d8418c956146114aa0315f205dd0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00665-of-01024.json.gz": {"num_bytes": 320612903, "checksum": "1ab7bc2d0f7c6704c97848a9325015f06228339bc52cc1fb593d9c56145e7c48"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00666-of-01024.json.gz": {"num_bytes": 319241006, "checksum": "8b1213325ceb2a2c89dffb891a31317e903d08fff911e4ba1ae66fc3bcce9973"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00667-of-01024.json.gz": {"num_bytes": 319650665, "checksum": "14676f97937eb3d0734e5f121c5f63002ba2d2c62b6c41b4b46d2fcab9ea9614"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00668-of-01024.json.gz": {"num_bytes": 319198651, "checksum": "a406fceed5b7d17ff6d5773679c3df50e747215e39926228ddc9a60c6bf9d152"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00669-of-01024.json.gz": {"num_bytes": 319363200, "checksum": "1d3267d77f43d3d720dcd79c40bc3e8c0cd777d421b1b7d0e69e140199e34552"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00670-of-01024.json.gz": {"num_bytes": 320079826, "checksum": "85111c229b8fcc8428b3c13676bde8268f027fe06e1f576a3adcd82bce1603bb"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00671-of-01024.json.gz": {"num_bytes": 319494773, "checksum": "eeeed8d9f63a5c16ab9d62454fae5bef1896973cfa69cedfcfaac4565a793b27"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00672-of-01024.json.gz": {"num_bytes": 318304853, "checksum": "6793ec3ffbc147c36e471e1c06a664ac2143408c9ee46305694708eee0fb38cb"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00673-of-01024.json.gz": {"num_bytes": 319031236, "checksum": "3c886ff71973805a59312d8d43ee9e616bcfafd76c03a64d53ab548036b1fa90"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00674-of-01024.json.gz": {"num_bytes": 318647345, "checksum": "fd7f4efc0c8af611e7e137680342843d0471ca072421ab3c172a169ba2f5d217"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00675-of-01024.json.gz": {"num_bytes": 318313871, "checksum": "3b797b2ad717749a24866a97acb95aace0dd4e91ee7d51dcf1fdd46a9232b794"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00676-of-01024.json.gz": {"num_bytes": 318858652, "checksum": "2ccdf652fd413dc624643d35a76223e8a44e6241997841ec2d13ae11b56400fe"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00677-of-01024.json.gz": {"num_bytes": 319236091, "checksum": "bbf069c696f09e5467b17ba98479948a85101efa776094084e37581e72c01123"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00678-of-01024.json.gz": {"num_bytes": 318996096, "checksum": "3e3dd21861c713bd38d1803c32da1c0bc2496899648b4cffe1fa2e61b35ca056"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00679-of-01024.json.gz": {"num_bytes": 319915466, "checksum": "6ed56468a31564cb25668ceb5df325ff7138dd231afa85f676ac7af5e81e0642"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00680-of-01024.json.gz": {"num_bytes": 318537417, "checksum": "959ce407e7a892495c477b9e0071dff496fd20db9cfb04dd035ac59dd5b2f309"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00681-of-01024.json.gz": {"num_bytes": 320181225, "checksum": "0aa77d778f24bfdc8566b390a7a1ef1d7880a42b98b3e82e9b37ee3ed821a8e5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00682-of-01024.json.gz": {"num_bytes": 319087756, "checksum": "a4da802570ee7bc27e752069612b633edf226078f48d5f55280f73a6dc934127"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00683-of-01024.json.gz": {"num_bytes": 320019766, "checksum": "587497efb7bcd4ca85ec0559e372ea285c1b95e3889d406f142cfe454d8e0e2f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00684-of-01024.json.gz": {"num_bytes": 318814245, "checksum": "6e904f73976ca18aed3375d1c1b308d749b9a4405a333dd0a2cf85360822e205"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00685-of-01024.json.gz": {"num_bytes": 318586686, "checksum": "c51012772c5bae73821b67f72c035f22a40725d42bcf51e439bbdfcd84393ef2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00686-of-01024.json.gz": {"num_bytes": 319648436, "checksum": "890b7408abd0cc04a84be3a3992d05714dbd30a9d33a8a9b05316a980fe51313"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00687-of-01024.json.gz": {"num_bytes": 318909835, "checksum": "b54b20c21ae9834b630a8aac057d47069cf137577d30b91fd1475f5824b61561"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00688-of-01024.json.gz": {"num_bytes": 319381735, "checksum": "422091d5ba0d44c64bb0c84ab4757318414bc01455a97f53190eddda89c2f3f4"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00689-of-01024.json.gz": {"num_bytes": 318995026, "checksum": "ad5080fbddc914c649027d5e2214f1d75e0cf0617eb3ca0b1fdb8ed9129f99cb"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00690-of-01024.json.gz": {"num_bytes": 320745318, "checksum": "d45492346bb4bf519e657356ecf1805b6b592683b98c20c93da2f07c50b06092"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00691-of-01024.json.gz": {"num_bytes": 318575084, "checksum": "43a07e8a98bc99f381558c938fc83acd4a37d565459c0f3f83aaadda816f66c8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00692-of-01024.json.gz": {"num_bytes": 320651368, "checksum": "21a790ef1dcc9c6ffa071d1a2e21e330d6afcb45368dde9cfae8933c6d029742"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00693-of-01024.json.gz": {"num_bytes": 318429145, "checksum": "85558018ee61e33c4f3e05acc2029e69447a5717be880e9a0aa8fa715dbd0c05"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00694-of-01024.json.gz": {"num_bytes": 319562061, "checksum": "894f4c906a33c644ea80c3a00155ced807a62e1bcd9f6e254cb6c88efeedd142"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00695-of-01024.json.gz": {"num_bytes": 318298964, "checksum": "06eb05f651f1d2fff495c48475894420334070df10c051c7253b7afb0bc38291"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00696-of-01024.json.gz": {"num_bytes": 317473664, "checksum": "59ea4f951335553945a644f7628403ba1a99a27e0d93fcfe5db18cbc3dd48ce9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00697-of-01024.json.gz": {"num_bytes": 318839008, "checksum": "f0203b0f2caa3287b8f7a64288af52bafbf033bcdf31dae54e501e4da47b9935"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00698-of-01024.json.gz": {"num_bytes": 318288032, "checksum": "fe2a581cd174429a81424e407aceb1d81b61d9796d74db4590327778fbd5016b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00699-of-01024.json.gz": {"num_bytes": 318696527, "checksum": "edf3aabcdb28fa2feb532b3bd55cd167c2200a6d8e19f05152be194e48acf87b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00700-of-01024.json.gz": {"num_bytes": 318900366, "checksum": "67d89417d1440afeeefd59a0993e4d12fb5731e917ec7f4e65d9319541b4b9e9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00701-of-01024.json.gz": {"num_bytes": 318901212, "checksum": "64d302459e6871325282fd890d2922cb1fb25b47d677ce793bc065acc8d1bd07"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00702-of-01024.json.gz": {"num_bytes": 318913325, "checksum": "f0bb360189166a0bd717bad85edf06943333b1854687839864aef3ee02814795"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00703-of-01024.json.gz": {"num_bytes": 318730274, "checksum": "c4e027079b9cf9b1adae3e285c5cc5dafeee5c74cf3621c424b6df9801d508f5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00704-of-01024.json.gz": {"num_bytes": 320112232, "checksum": "37540f6a00523cbf429764893aa15aae6a57e53c89cf51d82a815feef02b1210"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00705-of-01024.json.gz": {"num_bytes": 319643559, "checksum": "9dae018569fa4bf33674f67ba03732a2f85cfceb53ec2cbb9457eaea607b8dfa"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00706-of-01024.json.gz": {"num_bytes": 319941519, "checksum": "03926405dc629f0664a3d27c700a4fa2f606496f0b52a9bbf2fd2d75faae2f46"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00707-of-01024.json.gz": {"num_bytes": 317628508, "checksum": "fac92295e4c85f087d27e0a6f231d782be7b2448e99cfc42c09c0e1e20964c3f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00708-of-01024.json.gz": {"num_bytes": 318863059, "checksum": "39d4880d3e47e65ab6351e94b015810d66295a86a9f08534260ccbef41fdaf04"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00709-of-01024.json.gz": {"num_bytes": 318412651, "checksum": "044fc99a1307737bc8d6d8a9b67997010309fc695eda6e8dd42e5b6bab2256d1"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00710-of-01024.json.gz": {"num_bytes": 318631334, "checksum": "0b2c93cf298051864b8660e57182b38408ad738cf930afc09afdde26d952f819"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00711-of-01024.json.gz": {"num_bytes": 320587866, "checksum": "f1f6bb9770b76742d0131495879fa38ed8aebe8a0b38463e7834f0697f174ede"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00712-of-01024.json.gz": {"num_bytes": 318191204, "checksum": "b6873a7d375aa29ff39ca17c3bbc7e328292b1671b59a35e7b01c0e992da90f6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00713-of-01024.json.gz": {"num_bytes": 319472539, "checksum": "3bb12a0a806ecb8a5eeaa00188c655f399460609b8a19005a7141bbcb3a7a694"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00714-of-01024.json.gz": {"num_bytes": 320196397, "checksum": "ca6e1fa6f27c9dbadbbaa767fd21dddee7c84ca96bbb6735640ba2631668ad0e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00715-of-01024.json.gz": {"num_bytes": 320075706, "checksum": "1a773eec7d738c0e1e253bfd4533f0c43c0d133e564c3458159e0c47d767689c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00716-of-01024.json.gz": {"num_bytes": 318736413, "checksum": "c17a6b2115e56cc3d6bbbd94e8565fb14287057f80199528e6cba20adf557bf7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00717-of-01024.json.gz": {"num_bytes": 317351537, "checksum": "cdba391e16c3bcb5569d978a8d11518103e7687714710ef4eba4f7c0821d67d5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00718-of-01024.json.gz": {"num_bytes": 318017965, "checksum": "a25c494e4baead0af0afe6eabaa054bc15f80b6ca0ac8dadb1b354d72ffbe63b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00719-of-01024.json.gz": {"num_bytes": 318124432, "checksum": "94f5dfbec85a8c5b22ff1368a16ec2eb7fb4be25c0c8f004096156ae40bfa2bd"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00720-of-01024.json.gz": {"num_bytes": 318235852, "checksum": "c0248326e698599dcad01eca25d747c138881c61b5636ba765b21f9cd0df996a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00721-of-01024.json.gz": {"num_bytes": 318817834, "checksum": "c11df487a966e748cec522fae4ed76abf3e8cc9bcd28c301117fa52ddb83dc6d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00722-of-01024.json.gz": {"num_bytes": 318553851, "checksum": "63d3d0c3f5dcdff29a0a6ef41e3a9df3fb505c73c8554839e3032293a78bae2e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00723-of-01024.json.gz": {"num_bytes": 320174720, "checksum": "29c97bb8ff301080547255af29bb5019a2c1fbc74f0a2711e626461d5a5f0b54"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00724-of-01024.json.gz": {"num_bytes": 317805413, "checksum": "65f8932f3c77b0fee5f2224643a71ff95246720368fe66d45c22df25ea4b9c2d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00725-of-01024.json.gz": {"num_bytes": 319460597, "checksum": "dc785a8aa3a1f4ed77512d51a9139dfb24b356b5499ae67dd5b860101b1e0e4b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00726-of-01024.json.gz": {"num_bytes": 320934004, "checksum": "45d857536d3535d08cddb6cf50d08d89cc28138a5be082465c3a8c27c02ae2bd"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00727-of-01024.json.gz": {"num_bytes": 318393879, "checksum": "e4a02e43eeabbecb81b971f4201212104b6214078cafd9500d5b5f323595f060"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00728-of-01024.json.gz": {"num_bytes": 318826577, "checksum": "cfaa0d0c8dfb333899c73e0c2aa00dfdadd00e5b4a3d477e7518c4141899c8a7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00729-of-01024.json.gz": {"num_bytes": 320390067, "checksum": "528fe99b0c8dc917ac0f02a555603f9ae81e690b4ce1040f65ebbad3390c0426"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00730-of-01024.json.gz": {"num_bytes": 318156386, "checksum": "786e6913b4417a87cd4cb1882e181d8b2e1eb4b4db5b4b9ad2120b5efdf3e2ba"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00731-of-01024.json.gz": {"num_bytes": 320013543, "checksum": "f28fc2794c280fc1de263b9b2a81e42423f8dac3af7c4fbd3b3aff888821ca9f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00732-of-01024.json.gz": {"num_bytes": 318753697, "checksum": "69491eb25dbaef78235f769422e773de7a2578e678ecde29dcaa663f4ebfa78d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00733-of-01024.json.gz": {"num_bytes": 318640706, "checksum": "dfde8960d738b873bcb75abe1661fcaa096d70c76aef21846b173b8adf049bbc"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00734-of-01024.json.gz": {"num_bytes": 319447398, "checksum": "145add76dcd73916b548e7e3b161757c1bdc1f22a0f127019f24827afd6f85e2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00735-of-01024.json.gz": {"num_bytes": 319868149, "checksum": "dcd4ba95672630f89e75b70dc08cb918bbe896f5d32ffeba7d3e4921b27c1f4d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00736-of-01024.json.gz": {"num_bytes": 318404586, "checksum": "4710b1569342b7aa7ca610d8b8cbb2248a1c5fcd8c6ab3b7f875657dff4779cd"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00737-of-01024.json.gz": {"num_bytes": 319915151, "checksum": "7091dc758fd14c206514663eed0ae446178ff38e76c4cb7e711c63d419506e49"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00738-of-01024.json.gz": {"num_bytes": 319709793, "checksum": "afe1a96ced49662b14bc60b4ff8fc1f610bbc6f3c515bb73f2fade7a0ba67678"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00739-of-01024.json.gz": {"num_bytes": 319789716, "checksum": "9e2332cfc994483d4b913c6556ca9c1698b95e81033b7bbc5a4f5271e5cce708"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00740-of-01024.json.gz": {"num_bytes": 319102226, "checksum": "61ddcc3af919b753638dd46f18f790d7783cdc3090dfddbbeb40faa93bed340e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00741-of-01024.json.gz": {"num_bytes": 318717589, "checksum": "aa3038c23a37561f2ba92e95ffeaa3e3641c1a69f8688b724116edd128e9ba52"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00742-of-01024.json.gz": {"num_bytes": 319456536, "checksum": "ea9d23abfed6e3e8ab900291a3bc1faa27751ff94e35378f8c4eb07207036a9c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00743-of-01024.json.gz": {"num_bytes": 318641730, "checksum": "6efcec6cd087be4eaa98491e463d0fb9c1253aca275971de08c56a20be9aa579"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00744-of-01024.json.gz": {"num_bytes": 320264992, "checksum": "71653351253c8f7fa18673a3f956bddebd158978708c5a4c9e9b5318f598e1f4"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00745-of-01024.json.gz": {"num_bytes": 318665967, "checksum": "347dfd824d6f4afe58c6f418ab5d332909038c880f4dcda7f774d3d7a588c3f3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00746-of-01024.json.gz": {"num_bytes": 320005833, "checksum": "812bc3c082e3a65c8c77fc7767bb435f9be9a999961d84eadc9e0c602e5ce168"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00747-of-01024.json.gz": {"num_bytes": 318575441, "checksum": "a4414d376c69ae8dd5e60b206315cf920d5a797c6ef7c08fe0c4b4e28b4eb4ef"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00748-of-01024.json.gz": {"num_bytes": 319266882, "checksum": "f08aee694b85d5e7120652350bfafaa05495e609aa6d2fb0b913ed8a718d7dcf"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00749-of-01024.json.gz": {"num_bytes": 320205042, "checksum": "b3402b16a5cc817d89a19fd3456a50b5b6d5f3f555eea725167558cc85366d12"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00750-of-01024.json.gz": {"num_bytes": 319198252, "checksum": "6b95232f6d53cff8045bd5ebaa87d6e6c511a74dc646d2a960eb87e801ff4f2a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00751-of-01024.json.gz": {"num_bytes": 317855407, "checksum": "badc9d82efdbc8db5dc328e8aa5e80155c52f00b105b136d8c5c948fe237d61d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00752-of-01024.json.gz": {"num_bytes": 320283992, "checksum": "67c32eb497533d6fd20b206c38483d171275029ff525bba3da13b0c62e1ef073"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00753-of-01024.json.gz": {"num_bytes": 321030653, "checksum": "5e95b1cb54d7d7f12bec1559ababcab0c364a0af99e10a42a08357647ef5d3cc"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00754-of-01024.json.gz": {"num_bytes": 319059779, "checksum": "32cb59ad16dfda8a5b52615498fe2e6d85753fa44ab667af2f525a2467508da5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00755-of-01024.json.gz": {"num_bytes": 317737268, "checksum": "0ad2fef2fe37d59b163e29c2287938a768ee87acc34752394809295d0710c602"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00756-of-01024.json.gz": {"num_bytes": 317293218, "checksum": "db737ceace329fb1f8fe1aca38db048a1dedcb5226a4132485f26afecdc6c3c8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00757-of-01024.json.gz": {"num_bytes": 319529375, "checksum": "8b823e97964894189a13df393e1b3978342fb24bd81f07af6e54b7bfa2992796"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00758-of-01024.json.gz": {"num_bytes": 319297548, "checksum": "3f31d7ad99d88dde757a651b12db909a30cfcae5796fe3f85722598d92344ba5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00759-of-01024.json.gz": {"num_bytes": 318154496, "checksum": "a4b780127d6f22aed49d155e234e21a847a60626143a8e7dc6e31a5f204e79f8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00760-of-01024.json.gz": {"num_bytes": 319386997, "checksum": "020e68dc60004d0661de8a22fe2b9fa7f481fcecaef8fb06efa43093a2a9cc52"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00761-of-01024.json.gz": {"num_bytes": 320035555, "checksum": "8d7b5a97770a062276ca909a3bd20365cbaf3931fcbeb8b7e479f5ee03b47053"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00762-of-01024.json.gz": {"num_bytes": 318099583, "checksum": "b8fcbbf9b55cde2ff66ca046884870e1e5f2d2a729a8eedb253c16fe0d7658e0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00763-of-01024.json.gz": {"num_bytes": 318354409, "checksum": "ce2d9e44161b13f6226cfb9f93ad42fa0edd18eeaee923c8ab31c25aec1fc976"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00764-of-01024.json.gz": {"num_bytes": 319181291, "checksum": "53ed1ef77f24bdd7c189aae0905d63be97f48aa3233fda139e59af53baab242a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00765-of-01024.json.gz": {"num_bytes": 318147738, "checksum": "26b9b9ea2f94b322c03d1b83b25ab4e9a1a203fe9923728c5dd91f22d5f8fef5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00766-of-01024.json.gz": {"num_bytes": 317964368, "checksum": "e59fec52abde3fb4cea58a5a4e511f4cc61e21062bfdd1e3ffd60131a847e0ea"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00767-of-01024.json.gz": {"num_bytes": 318750919, "checksum": "0e5eff983e793a3d7cdd1ec85a45d58e5e6ecf7a12cf83a01888e148ab08acf9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00768-of-01024.json.gz": {"num_bytes": 318978892, "checksum": "171509b0bed8854b6de92fe146993be80ab31e0aa56953c7b0a66eeb738ff70a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00769-of-01024.json.gz": {"num_bytes": 319386097, "checksum": "704e7daa85c0e3ac974d51a6e2cf6df2ee053613fd2b77b5fe16d10b29a50a4c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00770-of-01024.json.gz": {"num_bytes": 319623528, "checksum": "e787064473427fe17ba95d9326d009e9723148fb314a7a9605dcb6698854dad5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00771-of-01024.json.gz": {"num_bytes": 318911381, "checksum": "c54aaffd8162b30280e974e81e9d0669357b74394e0da2d1ca2ce613f5715e4a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00772-of-01024.json.gz": {"num_bytes": 319386949, "checksum": "2f9c83681632482df6c65e4c70718c83f500305ee1d061626cdef35bd794a412"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00773-of-01024.json.gz": {"num_bytes": 319962599, "checksum": "f47c487ba09051c9a4bf320d69db9546e98948e3de68050ae2ba025c71e09146"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00774-of-01024.json.gz": {"num_bytes": 320370991, "checksum": "69a1eacfdb6f6fd49ea2b729a7ab291b96fd5bd42f993e2306d044871b069aa7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00775-of-01024.json.gz": {"num_bytes": 320433220, "checksum": "d35934fb537d1283d40897d05c1486f629776fe9e4ef127694ecfd0221f860c5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00776-of-01024.json.gz": {"num_bytes": 318809986, "checksum": "9079970aa1618b6be51caeab7a2cab26e61c30aa53af361a6184ef6249bf65a1"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00777-of-01024.json.gz": {"num_bytes": 319617796, "checksum": "5e200e354ece1713a32a3e1ebcea33412de814dd5843df3523afa1ec9a4d5275"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00778-of-01024.json.gz": {"num_bytes": 318039278, "checksum": "b79309eb335c0c860c85d2b724df52c3613f61b92ab6cd6276c2be8c25a7b01e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00779-of-01024.json.gz": {"num_bytes": 319078058, "checksum": "fc6053d53255e4d4a4c22c42049ce3eabc224320a51c94c1116f3201f87b377b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00780-of-01024.json.gz": {"num_bytes": 317637428, "checksum": "e38c933003910b02beef64af2d330f32af6e6f3b7346fa121e89045c136c13af"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00781-of-01024.json.gz": {"num_bytes": 318792407, "checksum": "b6795b4db199f7a7a92ef195aee3753e5e00df05fad2d8401b2b9feb56d71a76"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00782-of-01024.json.gz": {"num_bytes": 319081289, "checksum": "dc20640bded03596eeec689f1293be55e72d138cf0c576df9768c7631931ceb9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00783-of-01024.json.gz": {"num_bytes": 318663257, "checksum": "ac2b4ee9ab8f25ec010a17358d2f3f1fb9d8d50c9f4b73357429277710e6564f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00784-of-01024.json.gz": {"num_bytes": 319687102, "checksum": "fb93dee8a974f2ea204c240ed4c24e1b64f91ccb421070be305487e4e53ca083"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00785-of-01024.json.gz": {"num_bytes": 318909034, "checksum": "2f298b358cc619fa72097e3dbd9ac91e7dc3f7c5f9c4f2ff6881c988921d2a6c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00786-of-01024.json.gz": {"num_bytes": 319213094, "checksum": "60ebe35e0f23ccc61fc0eedc891ea9deb43001beb8205d31360a05b5d58e31f0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00787-of-01024.json.gz": {"num_bytes": 318335621, "checksum": "a7b0aa4dafdda2f3dc3c1832b71d4a92af08f99a70a315b4cf9f60c1768bf2c8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00788-of-01024.json.gz": {"num_bytes": 319444037, "checksum": "874dda510a01a2f78e51d917d309bcf1a0f21e7e1ca46661f93931a6200b3d01"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00789-of-01024.json.gz": {"num_bytes": 317955670, "checksum": "ec949a05ec7750dacfdf692c1ba118a33454097fdcaa56626fb042eb93933811"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00790-of-01024.json.gz": {"num_bytes": 319033823, "checksum": "0939164a602d7c7140c619130977b6814639122d0038aff7bb840093def5172d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00791-of-01024.json.gz": {"num_bytes": 319366402, "checksum": "fd6ea942b3402b5da4acb1a03bf59b17df402e90c47dbb66fb198ca2f4b5e1cc"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00792-of-01024.json.gz": {"num_bytes": 319218667, "checksum": "9e8af5aaa6d5ed915eae334c6101948fbcc7bcf6c8c6beaf80fd1adecd67b078"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00793-of-01024.json.gz": {"num_bytes": 318865241, "checksum": "675330d6736a677760d854dcdd9a174eb7c1d426f94e34836a048c2139befac0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00794-of-01024.json.gz": {"num_bytes": 319384084, "checksum": "fd4c2623d9cbaed3fefd6bb88c2d88b58fe8f08e9e8ef0cea6bb22cac68dabd2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00795-of-01024.json.gz": {"num_bytes": 317654308, "checksum": "157533ddb56290662e25cb60842327daec23e377e116496338c9313cbf6991b3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00796-of-01024.json.gz": {"num_bytes": 319298258, "checksum": "fd90f055499095efa9cb848dee62406d25820f929554b0e07674d4c95db574b3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00797-of-01024.json.gz": {"num_bytes": 320048871, "checksum": "e089a95e96a081dd76e38acf9506bfc7b86c682892d3a8774e9784019db39306"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00798-of-01024.json.gz": {"num_bytes": 319291246, "checksum": "e29133ab6f83c84a69752a451053dfe20887ea884e09cc373afd89bba7458664"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00799-of-01024.json.gz": {"num_bytes": 319175282, "checksum": "8f3f3a67946615bdf499d64341d200477280947e5be8538748e28db768115947"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00800-of-01024.json.gz": {"num_bytes": 316687275, "checksum": "c9a17dc92658ce5d062af25e5c8610a7fbae501627cfc7324ace7ca6a8d75d8d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00801-of-01024.json.gz": {"num_bytes": 318710698, "checksum": "4b7d1e130fd8ba536da073069221f68d567492b2bff27d8769fb4ef124cec3a1"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00802-of-01024.json.gz": {"num_bytes": 318914381, "checksum": "9f186b8d08f5d3090b7c9eb8a6954cf3202caec7cbf5c308221333cd115af561"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00803-of-01024.json.gz": {"num_bytes": 319111424, "checksum": "117b0590a976805001a879c49c42db55579e5bb9a5d4db9ce20e42746f59d574"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00804-of-01024.json.gz": {"num_bytes": 318186018, "checksum": "ea376d6cc1043dee9a00e1eca1c431aa59755d8966162701817f9cf274a758c2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00805-of-01024.json.gz": {"num_bytes": 320382848, "checksum": "1e69e7896202206f9f804b2497c4d99cca5c1d139efc782b8ede2cb88f68b48b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00806-of-01024.json.gz": {"num_bytes": 319508172, "checksum": "9da7e230c7abed9beaed9d6090efa8ae1029a418dbbf6d04bb4386aafde3dbce"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00807-of-01024.json.gz": {"num_bytes": 319995091, "checksum": "2e3ba0dbe85c004c6a23b4caf340282e0d0004ab574a14bedc9c83c67cc2c0c9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00808-of-01024.json.gz": {"num_bytes": 319880961, "checksum": "f53fd08fea0f874d727422357521176c6810a54abf4fcc7019357b50f1928daa"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00809-of-01024.json.gz": {"num_bytes": 317100774, "checksum": "dbeed220f330b489cc262fbd7cbe84f04ba8a5118ebbd8f48bc7a4f5f63ae7b8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00810-of-01024.json.gz": {"num_bytes": 319625750, "checksum": "fe5dced88ccd54b258c6740d8988e10b128a869ecf28e7096e689c59fa147d4b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00811-of-01024.json.gz": {"num_bytes": 318375975, "checksum": "e4bcc5571fdc4f51b733d975e78ff02939d3463264a02d7e651271ab91c81df8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00812-of-01024.json.gz": {"num_bytes": 319663092, "checksum": "b1e41c198bc69d026ab997fdeaa4e687f7a8ddfca751add9bc85f00481708a63"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00813-of-01024.json.gz": {"num_bytes": 319094357, "checksum": "c07287aedf6854f581aaf83b75c4939aa4b10181977d4c4be97c20989ab8f992"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00814-of-01024.json.gz": {"num_bytes": 319521327, "checksum": "c96203ba5461ef92a7a2b0d4e598efda943b5b3adf42a7268c26f1c224410c01"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00815-of-01024.json.gz": {"num_bytes": 319098749, "checksum": "72f2e65c5b482be0d9e3a3d8f5cdb703cec7a515e927bc4411e2f6ff5085ed5d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00816-of-01024.json.gz": {"num_bytes": 320377295, "checksum": "df95ac17a25cebb854088cca345f60c2634d07f088e45e251d7f9afdb334c0c7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00817-of-01024.json.gz": {"num_bytes": 319007451, "checksum": "bad1cc25de4f66ff36c69284e6b615f68bdc25e45f08e04e33ee463a0c6ef0b5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00818-of-01024.json.gz": {"num_bytes": 319609737, "checksum": "acf1b390f1c492d97bf027f06898f1dd5cf8cc6def41f4d43b38a0c99f4a85e7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00819-of-01024.json.gz": {"num_bytes": 319164157, "checksum": "3d973eb401876c57e9cd1420fc938da9dd7b08f97d4596c66a8c159e2b56b1b3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00820-of-01024.json.gz": {"num_bytes": 320181073, "checksum": "101d5f0079caa840b934c14800ba5cbb7fca22e9e6915b98b4dc5f37c57f5b4d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00821-of-01024.json.gz": {"num_bytes": 320949305, "checksum": "34ba423c93c4262234e6e2005aba0436daa99b05570cff0a58e9d27b65d76896"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00822-of-01024.json.gz": {"num_bytes": 318392521, "checksum": "4a586e220fe34f544dd068f4e1c310459cabd5dbea9a991c21c09f70079eb4c9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00823-of-01024.json.gz": {"num_bytes": 318526893, "checksum": "3b10a8e32a3a8f6541400d697516fcd3fffba3554e8d8a96451f01fc6b729d8b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00824-of-01024.json.gz": {"num_bytes": 318640792, "checksum": "c921270db8004d309f91e3209340c476191793d47b3cfa9d19fdc602d43dfe65"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00825-of-01024.json.gz": {"num_bytes": 319524026, "checksum": "a6eb347db464976ba5d1aaa4fa64e103ba36520dd1e9c103644caf187be471a5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00826-of-01024.json.gz": {"num_bytes": 318469810, "checksum": "dc5f88e6161ac06165f3cd4cb91a00cdff75d2f900e8f53d62bacfd833e352b0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00827-of-01024.json.gz": {"num_bytes": 319391185, "checksum": "66a240be851d6622adf7801d9634a456e83e9edfd135601c0dc1aab48902d7cf"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00828-of-01024.json.gz": {"num_bytes": 319625277, "checksum": "2e989beeeb2a63bfb87a5a401619a8e4155a961b44441cb5f627c29f25962dd4"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00829-of-01024.json.gz": {"num_bytes": 320001237, "checksum": "0653e4052fb7a4ef503bdfbbee332d650492e99c130a85c04250e18d91cfd30c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00830-of-01024.json.gz": {"num_bytes": 319240468, "checksum": "bd56e55e75a8237b5292fa65e5ecb0dfbabef6ef0dec6695b13522803210f40c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00831-of-01024.json.gz": {"num_bytes": 319174603, "checksum": "ca9d6c643127a390823655256a45462ee6e75aa2485141f6530a3bdf6ce4f572"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00832-of-01024.json.gz": {"num_bytes": 318909883, "checksum": "e91c35d94e183515e660cd8c874c12bbf22e1fd683312446f02287b0d032fb68"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00833-of-01024.json.gz": {"num_bytes": 319095835, "checksum": "971d9a4f8bfce564d42dc0a80009acfa7d2f47557ac19836ab426defe1877714"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00834-of-01024.json.gz": {"num_bytes": 318319786, "checksum": "159412a58fb8deb59e039fa0102bdb746065cbc6b4d1d3da892930fbf8b0f178"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00835-of-01024.json.gz": {"num_bytes": 319959334, "checksum": "814518d53b3023e3b8ac22dad9d65dd50d455a4c7db1490022f447f793f4d24f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00836-of-01024.json.gz": {"num_bytes": 317642779, "checksum": "19ad4fbaa3ff5c638b77980300b8c162c21a8237b87d054a30c46aee67d0ad94"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00837-of-01024.json.gz": {"num_bytes": 320687986, "checksum": "190de7948a4b163047ecdfc856e5f78bbff52ca883edfad26b32fbc0b57ffe36"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00838-of-01024.json.gz": {"num_bytes": 319802866, "checksum": "ccb4d342791a187f3bde225e008ff8cf70465f7fd3eacaa8bbce1ec4e52c2622"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00839-of-01024.json.gz": {"num_bytes": 318621894, "checksum": "3ff5cf5b33996a663df5783f3f41a5b5b2f6e08a2cf91e74cad3bf82291192fa"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00840-of-01024.json.gz": {"num_bytes": 319757379, "checksum": "8292e0854c01ca79ef03dcc1752ddc1f0df747ad67551b7c0fa5208b6aa3f822"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00841-of-01024.json.gz": {"num_bytes": 318779722, "checksum": "9eee9e089bd396adf5a276eddca9f6352e07f8c33877f85c1f65968aa0c06128"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00842-of-01024.json.gz": {"num_bytes": 318692591, "checksum": "caf3f40a144b43af08687e41a1eb7d08da1b78cd1600574566e11f29fde9cd34"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00843-of-01024.json.gz": {"num_bytes": 318944616, "checksum": "e74d624534091173546755ca236e5912cc8acf8cfef5f9c197b541ebe76f0818"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00844-of-01024.json.gz": {"num_bytes": 319392887, "checksum": "e47d3f44f996398b54f18729f4e81d88d04b19bc529847e86277a6a91ae74e6c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00845-of-01024.json.gz": {"num_bytes": 319215311, "checksum": "de7cffe64f422b02668137272943537946c15539954b564345d6722c4eb06345"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00846-of-01024.json.gz": {"num_bytes": 318129297, "checksum": "1d5ea0ab8fcb3975735aa421d646cea4544087f60a79ec209b63c93b6318523f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00847-of-01024.json.gz": {"num_bytes": 318134095, "checksum": "6fa4c50808df2aa8efebae3bbf832ba2b0be2f7113633fef720cffb3c50143a0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00848-of-01024.json.gz": {"num_bytes": 318521356, "checksum": "3aeb657aa448af82551c653802c669c985c00b7daa593de07f80733ae5dee84d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00849-of-01024.json.gz": {"num_bytes": 319541694, "checksum": "1cc016f58a4a2c54625214f028df05247ed319b8c1868c96c2efe8147a73d08a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00850-of-01024.json.gz": {"num_bytes": 318861613, "checksum": "eb5fbe6eeb4b0281604df264a5b04a3a0db96ff0d04f252375a788a0d3345c67"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00851-of-01024.json.gz": {"num_bytes": 319356648, "checksum": "ffe1397f1d412979cc66820555ef27345f3a2a48b8bcfe682d48301135e8c12a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00852-of-01024.json.gz": {"num_bytes": 319662372, "checksum": "fa78ed98d602276520e823e17adc7f796320d95e27e08d84d06e66e415b79161"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00853-of-01024.json.gz": {"num_bytes": 317625507, "checksum": "b10cff62fac5191b9cb5e2025227adb838088773e79bfec0937a34bb857e1b1f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00854-of-01024.json.gz": {"num_bytes": 319665550, "checksum": "15441b2a7c09a477389a8fbd7401c549dc8281f2bd44251b1546077301e24624"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00855-of-01024.json.gz": {"num_bytes": 319059897, "checksum": "f6127845b162181dd7157dd316021a4e6b5d41393c66d3e577491cdb74657f2e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00856-of-01024.json.gz": {"num_bytes": 319243991, "checksum": "ec9f0884c5ddf82550105f969222d3ee8b0d4907a0a2540ea6c8c67c2d2e9179"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00857-of-01024.json.gz": {"num_bytes": 318546680, "checksum": "840205fa73336ff51d75008ce8c530164ebcef3b50f1ad8deab879a67acf8d5e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00858-of-01024.json.gz": {"num_bytes": 318306547, "checksum": "e9b3819e9dc98d66a61f8f4e8f6ecb03099c79ae87a175fe1ae484174b173b44"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00859-of-01024.json.gz": {"num_bytes": 319088302, "checksum": "eced8de72f8755fa0dfb690c626cefcacf5fbbce97029d4589058913c31b9339"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00860-of-01024.json.gz": {"num_bytes": 319704792, "checksum": "90a169718609f16abe120c4b63a20adc0bbedba51de14b004d34dabe530339f0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00861-of-01024.json.gz": {"num_bytes": 318444445, "checksum": "d020840f09fa426ee15d19f05e5afd9cf674048e0dc4438dae0b6f02c7227d9f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00862-of-01024.json.gz": {"num_bytes": 318606300, "checksum": "e02bf9d3f1a398972f7d78b9b1aaff9a92146554a1358ea1b16ce7873a9f8fd8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00863-of-01024.json.gz": {"num_bytes": 319273730, "checksum": "c977f143cbb5e61160ce76f1cabf7bea6c158abb7e159ec3362aad1cc7af0ade"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00864-of-01024.json.gz": {"num_bytes": 318143165, "checksum": "bdf20dbde61f0663feb70be419c39c60acdc7ecbbe1430d47bf79ae2e114f168"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00865-of-01024.json.gz": {"num_bytes": 319041356, "checksum": "11c9c068ec5c1b612494c1473b7cace67a55ee66155559b19035df180ee260a1"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00866-of-01024.json.gz": {"num_bytes": 319758401, "checksum": "ab4436f283af0ef2d33b93cf026907cf68255beee9d9dc1d6c542dee9c3f48a3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00867-of-01024.json.gz": {"num_bytes": 318991336, "checksum": "56beb5edbca3b66981f5f8e65f2a13a0f6e99e68ff50cc263cc529a4d8ebf371"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00868-of-01024.json.gz": {"num_bytes": 319984390, "checksum": "b9368d2ae0eff869c70c1a1214126c1d084f56887102d3d46e450b2c934102be"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00869-of-01024.json.gz": {"num_bytes": 319462888, "checksum": "68ab404e0ca2247686eb264a0d7feeb9d2460162434f5babb2b1da82d865343e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00870-of-01024.json.gz": {"num_bytes": 318426018, "checksum": "2d60208a558f6ba92d6c6307e1ab626acd7ff3b7bc25963b09e87e464751c42b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00871-of-01024.json.gz": {"num_bytes": 320233396, "checksum": "ee2517922079c713605dafffe6bc0db0a947abf64ff92c409aa1015b92cdb099"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00872-of-01024.json.gz": {"num_bytes": 319570251, "checksum": "83ca4f125bd628cb28210fb874db717635009e36c60b42237bda48fcb611a53f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00873-of-01024.json.gz": {"num_bytes": 318755978, "checksum": "d94ce49fd17da5f70d1a89bc9e5323daa54f0b8417e1ee5d991467c80c068ec7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00874-of-01024.json.gz": {"num_bytes": 318986904, "checksum": "f634915d1b529d9d728fd96993bb151dc07016767cd44ceeedddec73eaf37074"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00875-of-01024.json.gz": {"num_bytes": 319116193, "checksum": "6367b1216e1c6ab18af66471d866f39caeb9a538209134a9e6bbbcb81bc51db7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00876-of-01024.json.gz": {"num_bytes": 320829257, "checksum": "c9ad4ab8c6e5995aaacd72ebc6654b43b4756804bf3cea808610f9b618f98fac"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00877-of-01024.json.gz": {"num_bytes": 320082625, "checksum": "835ae7d54732c309bc9aff231268474af66653b06ad6ca17b54dab6f4a7d30c5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00878-of-01024.json.gz": {"num_bytes": 318964554, "checksum": "49c761449d5052dd6c408268c77196bffc5125eb5189390f73ba0ce8550f0175"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00879-of-01024.json.gz": {"num_bytes": 318699617, "checksum": "521e1c5fa967a6f29641e7c4c2b210acda0736b32f318e24aef0e587895ed492"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00880-of-01024.json.gz": {"num_bytes": 318723630, "checksum": "dee1814b24f9bbc3aa3430cd80302b08b863eb1b92698158960b6be216845843"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00881-of-01024.json.gz": {"num_bytes": 319839271, "checksum": "9e57ea6a0e3d8a7798a0cb3e6344e1711e8fd879e2e396294718ff360fc7c4df"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00882-of-01024.json.gz": {"num_bytes": 317773196, "checksum": "2e5e5749618e53668222c7d310929e2177772dd7c14592e61dc86f163e353c8a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00883-of-01024.json.gz": {"num_bytes": 320262049, "checksum": "f80afaa4495a2d41ad4d7380b79040569179b24ef5c2df17f75ce8e135d786b1"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00884-of-01024.json.gz": {"num_bytes": 319146213, "checksum": "77338479b420dab9316a4737fc243de84b5e88392cbbb46fa0619045a42432cc"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00885-of-01024.json.gz": {"num_bytes": 319022605, "checksum": "3a67fee2fb77e64aa13fd595d7786b432203f36712ff723ec5999a341834b38c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00886-of-01024.json.gz": {"num_bytes": 318624429, "checksum": "2afe387f2500c57294acf1403a8c27f27f6c7c2d228dee0f1ed70a02c438f838"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00887-of-01024.json.gz": {"num_bytes": 318733911, "checksum": "3fe087b3441f74730ab137ba9486650cfedfe2d724573c3d166565d7d1e40938"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00888-of-01024.json.gz": {"num_bytes": 319926754, "checksum": "dd2df1977458cac34ef1e52059bbc28738e541761d7ad11c0ffc8ef3ca061190"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00889-of-01024.json.gz": {"num_bytes": 319085344, "checksum": "4172244cc3fc4a4e9e09f04f8097cbc678aebaedb9d1fb97b1daae16b0b8ef45"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00890-of-01024.json.gz": {"num_bytes": 319838671, "checksum": "8ffaf34eb8209e7ec250303298f9eebd2833fedcf80414c20331e8dbed42251c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00891-of-01024.json.gz": {"num_bytes": 318169092, "checksum": "daaf74ba5d12a7415da94be0f4454336aa3d86ad5cd300dbe30cef596835ac8e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00892-of-01024.json.gz": {"num_bytes": 319662776, "checksum": "6d99c0419a6c9633620fb0aa7b7610cc5d06696e839a1a52953fd7db7a18e053"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00893-of-01024.json.gz": {"num_bytes": 319541919, "checksum": "5f246aeacef0dc8d40a036bb1eeecf278f66d7215a134fb746d30f3420d18c18"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00894-of-01024.json.gz": {"num_bytes": 319528897, "checksum": "9975fd5d23d25938f00de3fc9240d77c27b4784c2f443b1914652a06d3b59fcf"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00895-of-01024.json.gz": {"num_bytes": 317548307, "checksum": "7af9e2abfaebd4afe05a0e28d3e6e3126800a8b9b7ad49de360e42f2eb2c8506"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00896-of-01024.json.gz": {"num_bytes": 320278601, "checksum": "1941689d6a0e449423faad6e41714f33d5b23cdb1bb73961a888a87678fc74b0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00897-of-01024.json.gz": {"num_bytes": 320161831, "checksum": "3d951cb1ae4a9b3c6ff70555139435febda83d24bb04ea27b229a05424b470c2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00898-of-01024.json.gz": {"num_bytes": 319341305, "checksum": "3227b97aa9ff57b62be2a26fd8131e9ea45f7731673acb43432e529ea4978a25"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00899-of-01024.json.gz": {"num_bytes": 319658969, "checksum": "c746f8bd5fffac933640ff39db0b9d7b022edb28d7a4b3237d8c69fd919b7b48"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00900-of-01024.json.gz": {"num_bytes": 317494627, "checksum": "0327f0c57a668b2b34e72f4c53d4cfaeed787d879843d0bba27b5be58d1ee5fe"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00901-of-01024.json.gz": {"num_bytes": 319683481, "checksum": "886449092779ee26fccd11e0c89c36e449346dc6b1f0a7cb15b6b53c897790a3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00902-of-01024.json.gz": {"num_bytes": 320228529, "checksum": "6960d8539df78e98858ba8cebb2e637b6c2ef20890b5f2af1cbf4621b52c364e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00903-of-01024.json.gz": {"num_bytes": 318961279, "checksum": "4ddb3c9e9276d220f1d4dfc32bb61a090e895e9e3c9f53c169db99a024e7cd95"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00904-of-01024.json.gz": {"num_bytes": 319926290, "checksum": "69a941cbbcb673efdb254c162854fcfff6fe1132182210235b91d1d21ed4d2ed"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00905-of-01024.json.gz": {"num_bytes": 317982280, "checksum": "1d9613f366b91102d018e57894df520aaf1910aa98e06cf369d9676e498610c5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00906-of-01024.json.gz": {"num_bytes": 319012210, "checksum": "4855989c814582f5cc0a5e9b8f9d1f642ae33de81625d4bbafaafb709c1cd260"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00907-of-01024.json.gz": {"num_bytes": 318515420, "checksum": "8f34dbaa454215922a29fea975357e4e705381a65e4dcaf8b0d8c200f9a277bd"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00908-of-01024.json.gz": {"num_bytes": 319286320, "checksum": "536bf0610a2c14d1d59aea0b52fdc29cec19cd7eaa4c3a5e5fec04dee103b29e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00909-of-01024.json.gz": {"num_bytes": 319938295, "checksum": "3bb3943183f579c15d0d30440f6c82d0c9c64d6ded398dfc7c67502d73868781"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00910-of-01024.json.gz": {"num_bytes": 318423425, "checksum": "adbdcf170531c725b54c1e5713676b789589b2fb77310f3e64a0cc30b83602ee"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00911-of-01024.json.gz": {"num_bytes": 319578185, "checksum": "a1342a95ce77013820c36e7d038ed47ca4d40cdf3584a66abc310132435b25fd"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00912-of-01024.json.gz": {"num_bytes": 319154715, "checksum": "4973afcb1d7b4816e3a3df1b9ce1e48a0eea4fe8ead5f83ea753e46a934e5ddc"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00913-of-01024.json.gz": {"num_bytes": 319011218, "checksum": "c9a158f69a123859569e1cdd475355afda32d7e5c48001591f0b6c20dc17d572"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00914-of-01024.json.gz": {"num_bytes": 320027387, "checksum": "61f6c0f839908e7d3105a6926c501bcacd293d1ba50c3b8639ee227c9a8270b1"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00915-of-01024.json.gz": {"num_bytes": 320280632, "checksum": "a74fb91d8f7d79b09017a7f996b6ca5d59e4ecad9fec354ac977c0076d53fc66"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00916-of-01024.json.gz": {"num_bytes": 319278877, "checksum": "cbbb8dc274fabb4435db5fef5da1d91671e1a4c7f3f652742324f9632b01c5dd"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00917-of-01024.json.gz": {"num_bytes": 319616831, "checksum": "31e62cbd6209fb7831078e4a262d1b25c0590f9425c62b2b208d4030ed5722d4"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00918-of-01024.json.gz": {"num_bytes": 318635363, "checksum": "95e5c2f51abc9ef4c0422e91b77f79ff83c8cc38e585df621fbc0dfef48a84c7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00919-of-01024.json.gz": {"num_bytes": 318885096, "checksum": "ea5960d4fbc7d5e7097edbf2c9c706e6b7c7e9d3e36633be9bd68c4038955f10"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00920-of-01024.json.gz": {"num_bytes": 319228627, "checksum": "73b721ae576dcfa83bd963e49530f73d76b788a669e3abc1c02189900c80cf02"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00921-of-01024.json.gz": {"num_bytes": 319557114, "checksum": "710c65cd504e87b5019c01f658e669d1e023473d879913a9522760d33546cf24"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00922-of-01024.json.gz": {"num_bytes": 319356053, "checksum": "f0b54b3c6b51a356debc9414df0438ee525ae5114cbb7c8176634b7493095022"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00923-of-01024.json.gz": {"num_bytes": 319766600, "checksum": "d5b80091c8113c283d91ff5826b46068b96c423c0dc74a646e2c8d1c5d815cea"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00924-of-01024.json.gz": {"num_bytes": 319733540, "checksum": "56a54c7d4114c21c1657df0d295839c2bd4904cd1b651104e2a155c2bf1b5aca"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00925-of-01024.json.gz": {"num_bytes": 318944357, "checksum": "4d396c29cd1d9ba16016fac37c333c0a872f6cb0e9faae7966e53f6e5c879d67"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00926-of-01024.json.gz": {"num_bytes": 320276135, "checksum": "39a64c261a76d5e13f187f12c886b22e2db08fba968bc9d0c1cb0d3c241abda7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00927-of-01024.json.gz": {"num_bytes": 319181837, "checksum": "86db529dd52fb67173588fcbc9f0e52c99ad6dd34e44865150bc6c962de5b3c1"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00928-of-01024.json.gz": {"num_bytes": 318966114, "checksum": "d232df8033ddaa7397dbcfa8ba4ded9421ee9bfc091c725b311fd963b29f13eb"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00929-of-01024.json.gz": {"num_bytes": 320087917, "checksum": "fca6bfe8fe17c867681c58df081f2186dcc6bf22e46ce3783f85b918644c0b6a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00930-of-01024.json.gz": {"num_bytes": 318921677, "checksum": "b8031359e758cd835c44e81303e04ef7b2137d2e1a9472d7e04552c353d883c7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00931-of-01024.json.gz": {"num_bytes": 318978028, "checksum": "bb5f2ea8a2e56c69813bdc08cb243c0763126e7b5f6c5cb57e7f4767d2126f89"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00932-of-01024.json.gz": {"num_bytes": 318627424, "checksum": "f6fd2065ce202d5347243a2b396707bb606be20c1829989bd7dff6d9fb7adec9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00933-of-01024.json.gz": {"num_bytes": 320226802, "checksum": "b303d2ece81c1f7b882703b915765212796518010aea6a108a441dd0a84a6128"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00934-of-01024.json.gz": {"num_bytes": 319908526, "checksum": "e5b05714922d132073122e83933853f52f0046c9f51f985cfbdbd310e8d677de"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00935-of-01024.json.gz": {"num_bytes": 318941663, "checksum": "4296055a31409a778c516afe25a8108f23dfffaf13cac33e5ed834a37c46b37c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00936-of-01024.json.gz": {"num_bytes": 318430860, "checksum": "4634630c012ed184b264ea01c97f7bb3f1af030f2466f1d99d20bb0472f74511"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00937-of-01024.json.gz": {"num_bytes": 318008229, "checksum": "131cc9a2fef4ebe81749f1844b7c4b194b97de7db4f5253ce59207e68d8b4df8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00938-of-01024.json.gz": {"num_bytes": 319099506, "checksum": "fff55e3b2ff8b53e56ab99def626a7334ce67d2414351b2e83d84298052dd9b6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00939-of-01024.json.gz": {"num_bytes": 320457851, "checksum": "8431e38c86516ed88d5c028f4a1dad32b02bcccdc03f9687d18f8312e493bcb7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00940-of-01024.json.gz": {"num_bytes": 320607829, "checksum": "a68c577555781adc777c09c68f623431469d67e9b66af7b0813f09a512b7d777"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00941-of-01024.json.gz": {"num_bytes": 318923471, "checksum": "807ffde4034b6b95a5eacb71f093686586ca11e417517894cca99dfe7b12563d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00942-of-01024.json.gz": {"num_bytes": 319880902, "checksum": "d03d04f619a8f3afbefa6d67986f50d5ee264c45de36c0ba67b069e343e002ad"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00943-of-01024.json.gz": {"num_bytes": 319079341, "checksum": "e482c4dee03a34a1a5756e6def26134c9a3f18ee386f5569d6cbf16d3875a429"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00944-of-01024.json.gz": {"num_bytes": 319436318, "checksum": "6241f9f35640598c05bc5cd00d8cc024dde59c0065c8935da229a8a583de32fd"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00945-of-01024.json.gz": {"num_bytes": 318998098, "checksum": "85f192c1ee9734da0f1dcad31c2b8111076977582e139ecc1ba959bf2df6b262"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00946-of-01024.json.gz": {"num_bytes": 321951470, "checksum": "44bccedf6a8db115bb6563d6775ff03c67511ce4e23a2de77e79edcb568c9fa1"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00947-of-01024.json.gz": {"num_bytes": 318689631, "checksum": "36f0bfa191ad7d51452d51249c724150f8c3774142df3720f176f2772f42f3fc"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00948-of-01024.json.gz": {"num_bytes": 320347661, "checksum": "f4a7afa90b6d81a4cdc99100b75b4d3174c4d5d670042766c3e0418b7a97ef80"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00949-of-01024.json.gz": {"num_bytes": 318054841, "checksum": "f39d0c9bfc0a562ede67b8cfc57e6974a8a999e2bbc1b6940f107169b4f06e4a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00950-of-01024.json.gz": {"num_bytes": 319722042, "checksum": "bf376260e5a838b3b901ceb22f922829619be710718446ee95c24400cbc73495"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00951-of-01024.json.gz": {"num_bytes": 318315382, "checksum": "987cd895f63bb74c9d4ce229ee853c7bce53c75c324366a0d06377c36030e39f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00952-of-01024.json.gz": {"num_bytes": 319247792, "checksum": "d218dda02748a22821c2ecccf1cbb136dc8772a25ddfacc7ab354fc089470e87"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00953-of-01024.json.gz": {"num_bytes": 318411551, "checksum": "698768f3d7959b33fa74a3827e995b0c184bb3b4c46eba667d7dc3365fdd07f3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00954-of-01024.json.gz": {"num_bytes": 318809810, "checksum": "651d9ff43d5a3f7f5945ccf26b9410018248bf64956f3485c50b0df9034fb2ee"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00955-of-01024.json.gz": {"num_bytes": 319761211, "checksum": "29fa5c68fb8d3719e5f5f17568ce888522de64499554b5f0f4dafafb4ee5b40b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00956-of-01024.json.gz": {"num_bytes": 319255736, "checksum": "333a90a9c13f71e41a7cdd4784684bc142c79ef99155b9d62d062db318798b93"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00957-of-01024.json.gz": {"num_bytes": 319504417, "checksum": "730c90615fca09c81d9644cfae40d325851bb9bbc1af696caaadd67d8282ab5b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00958-of-01024.json.gz": {"num_bytes": 319066016, "checksum": "bb565af6529720ba2a3e989769b33d978ef49cb2aae49c60f2ff98a981414280"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00959-of-01024.json.gz": {"num_bytes": 319887940, "checksum": "8992783693dd0ad5ce07427f6b5739c818f13952d90bb61312ec98f9c813f313"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00960-of-01024.json.gz": {"num_bytes": 318051437, "checksum": "4773edbc822ff8d51ec13af6c371214aea7545047d9babeeac0b29180d52fa0b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00961-of-01024.json.gz": {"num_bytes": 318373291, "checksum": "ff33854746566f7d3b4ba9eadd1329ece48c034345fda000d9af73cb26d197af"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00962-of-01024.json.gz": {"num_bytes": 318572513, "checksum": "a6d07f7caf55fda0df74a22b454d196fb2e29312d433bc5506b00448c22b579c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00963-of-01024.json.gz": {"num_bytes": 319488084, "checksum": "453f666c6578376508b1fe8bd3fb8ea5bf030aca5cfedf383cd23b27de15228f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00964-of-01024.json.gz": {"num_bytes": 318905670, "checksum": "74f64ed6583e6a4df4b3c3f8a76263a2d63905d51d5680d9683d86f5039d5b56"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00965-of-01024.json.gz": {"num_bytes": 319452844, "checksum": "88016c1a0663b89dc3d76689c827c82a6d128401ae05f7b70c8727d75302cd47"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00966-of-01024.json.gz": {"num_bytes": 319334588, "checksum": "dd9300bdc27513dd62578e1cf3c8302647b49c61185c282a684011d788c43d17"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00967-of-01024.json.gz": {"num_bytes": 317872396, "checksum": "90747ee63ac7d8176fde1f2afce8deb7e39bf19e682e17d0fcc1711d09d5f1d8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00968-of-01024.json.gz": {"num_bytes": 318988069, "checksum": "2cc785d650013d35d5d31b1e85c5530b197687c69117881362bf6b98f47c22fa"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00969-of-01024.json.gz": {"num_bytes": 318324244, "checksum": "83750d93c788ad32a256862b8173db3549eedf52ac131f09f662f1fe0f46bd13"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00970-of-01024.json.gz": {"num_bytes": 319494164, "checksum": "e0e46e185851ec569dc13a18519988ad926bdcd9bf448eff00aebf6df141f5cf"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00971-of-01024.json.gz": {"num_bytes": 318714665, "checksum": "941c9bf116353230417950d292c38b12b00935184162227eaec01870ab7f4510"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00972-of-01024.json.gz": {"num_bytes": 319518275, "checksum": "de30e19a155a6f4303afb0311416aa84cc3baf5a09cef55b8e2adc2a4f478f6e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00973-of-01024.json.gz": {"num_bytes": 318092574, "checksum": "f70bf6727f1f308d93684ca41e9c2c68dfbd737a90da6375b58f162e8470fdea"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00974-of-01024.json.gz": {"num_bytes": 318555677, "checksum": "109fe184ac9498ac571cd9c6cb38ae5ed566b0e98e8b7718984656a70cc6b224"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00975-of-01024.json.gz": {"num_bytes": 319045215, "checksum": "03c4257851857450f7397ac3d627a60ffc98708ad5aac6e1f73e6ce818fe7be8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00976-of-01024.json.gz": {"num_bytes": 319172031, "checksum": "7d98fa662aa9d0ff7ed50cc72195bdda2147212b34a3d22f0f757a4eb158d5b7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00977-of-01024.json.gz": {"num_bytes": 318650530, "checksum": "bb8ccc07ecc6fd39ae97136418efc543efe5541e85910a7f333ee5cebaa3b595"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00978-of-01024.json.gz": {"num_bytes": 318609909, "checksum": "40b49f3fbb2fce73bb1851304b290fc7fb400d13c2448ac7e5e559dccfda7ce5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00979-of-01024.json.gz": {"num_bytes": 318881197, "checksum": "b29f96cfba574428cb66f54b20c4a848bc83438256167afdaed576a3931117a0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00980-of-01024.json.gz": {"num_bytes": 318506081, "checksum": "a15996adaaf41e5615cb5c7fa2ef1b4e3003836542d0851d1c6907522f534fee"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00981-of-01024.json.gz": {"num_bytes": 320000305, "checksum": "38e282b433c4e3dcc9fc2b056f6ddbe4eb857c5137f7c51301d53ca259d6bdc2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00982-of-01024.json.gz": {"num_bytes": 319959158, "checksum": "97d5e58088a87a15b71db975d5e09b69daf497b7dff3ef809e1b8292caa27905"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00983-of-01024.json.gz": {"num_bytes": 318921242, "checksum": "f062e04f89132576ac1969fdaa43db761a0ff7e4269a6f173d87fa011a4c289b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00984-of-01024.json.gz": {"num_bytes": 319577980, "checksum": "e52a6c08d5243717f21120b4c3ebc8fcf77168928945adf68bc665392a6e8d11"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00985-of-01024.json.gz": {"num_bytes": 319812101, "checksum": "8b4f5645ae0e0b190af4ca5335c57735ae919d3c6402438af506c7907f1d1494"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00986-of-01024.json.gz": {"num_bytes": 319582409, "checksum": "3654109968d918aa4d8db17cb7057111c42894cfc7eee093df13036cfb3ac6fa"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00987-of-01024.json.gz": {"num_bytes": 319957581, "checksum": "4b9e6febb461940b993c50945a2ed06736c6786aa8f758565ff545814ebfddcd"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00988-of-01024.json.gz": {"num_bytes": 320346479, "checksum": "2891565dd75fd4354777b4f4f393983180584ee9c64b5d9b4557dbf26a3c4cfd"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00989-of-01024.json.gz": {"num_bytes": 318546717, "checksum": "929d0236c9fb77d638e0a18aa97b00004316bbb0ef3c4323e39f61aaf7c0af53"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00990-of-01024.json.gz": {"num_bytes": 319606761, "checksum": "6ebd2552ecdcce7b194d4f6d5b5e66ede9d65da4e4999ee8ec4705d847e473ac"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00991-of-01024.json.gz": {"num_bytes": 319117521, "checksum": "1b3496964d0a895b347529ddb7b712d211c9419317fb41cdd6e20bba43f39f05"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00992-of-01024.json.gz": {"num_bytes": 317781551, "checksum": "9f9cfb5f9152b9a60121b03c24d944129c1ee43e862112fe3896e2772fef99a2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00993-of-01024.json.gz": {"num_bytes": 319341839, "checksum": "fb329b7470ae127efe1be4adc960b06eec4f55bbcbe1f3f0f0b794d70a8aca14"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00994-of-01024.json.gz": {"num_bytes": 320357337, "checksum": "bbe9a60c3c2b3b5b11a5d531d1d85f0a90ebe3dbc79189b3825e169ae302932f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00995-of-01024.json.gz": {"num_bytes": 317824612, "checksum": "26643091ae3425b63036453ffca7ed82c85c24b6a24264197e6516b68a39a4c4"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00996-of-01024.json.gz": {"num_bytes": 320453890, "checksum": "db33809437e62bf1f086f40e4d66ad0133db7c7d406b2ce52ce5d9c9b0809961"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00997-of-01024.json.gz": {"num_bytes": 319469732, "checksum": "3447b74f09dc4d63dd04d6bbd4382147071504338e6ea428b37c3a5174877537"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00998-of-01024.json.gz": {"num_bytes": 319562604, "checksum": "270a1c19e6321541398836d3d982c2e396db99abf94317912714251d1f68e8ac"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00999-of-01024.json.gz": {"num_bytes": 318895764, "checksum": "d68f8f4d85d91679c20e972b2b1955d41a8f6601873bb311a2621f4b3f3152a2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.01000-of-01024.json.gz": {"num_bytes": 317697031, "checksum": "68b47464ca3e97e9d3f4075b656f804c1bab667f231701db9cce1f0b0a921088"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.01001-of-01024.json.gz": {"num_bytes": 318915840, "checksum": "582216879b058ccd4d0ca2edccaa2db49b64459371f8798a1d9c66c06a0cf908"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.01002-of-01024.json.gz": {"num_bytes": 317811256, "checksum": "6864299a7d0174f92abc696dc293524291623891b86cd69132348fdf78760a4e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.01003-of-01024.json.gz": {"num_bytes": 318605529, "checksum": "4ef35b7546266f99eae5f332cbe3e284801c5d7b39f840297d67e71c036edf62"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.01004-of-01024.json.gz": {"num_bytes": 319379897, "checksum": "040dfa80eaf8355370d8a50692bc3ad03a1d57272af340d70031a4398f37b9ee"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.01005-of-01024.json.gz": {"num_bytes": 319515177, "checksum": "012ac70ef2715181ec1fb578a2366d68e786d3a9ea41c59c08d7c494b89b429c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.01006-of-01024.json.gz": {"num_bytes": 320078217, "checksum": "46030d85d8333ae224320fa54e487f3770de7de280cd0001344136b0bd87c431"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.01007-of-01024.json.gz": {"num_bytes": 318526753, "checksum": "dd432d865ef3dba4b5af30e42b11ace96900bd7b97af053ea892292e75bd142c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.01008-of-01024.json.gz": {"num_bytes": 319407137, "checksum": "165cd3a688be6f9f5a4cedde198a9dda4f9d3dbc1d275d1e99411f3ee96a0d62"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.01009-of-01024.json.gz": {"num_bytes": 319763066, "checksum": "e44e86d497f8471e53531374b0e6ee61aac54996b6af64a4af0f5620673f9f7d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.01010-of-01024.json.gz": {"num_bytes": 318653930, "checksum": "61115f16e718d3a2b66574cc17841aa5d02739762138abe3c9a7f325cf9f2e31"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.01011-of-01024.json.gz": {"num_bytes": 320037079, "checksum": "65e18df845f1e6cce1bb92a45f71274dca94d3f0ece1d556116085b5c0e6338f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.01012-of-01024.json.gz": {"num_bytes": 319753418, "checksum": "cd5a8ee1bc7d9ad58e98aa6fe56d60501115592519a19efcf9fa370668c6327b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.01013-of-01024.json.gz": {"num_bytes": 318657671, "checksum": "986ead2c1b37f4094aa6f7a7882824ff013e6393323d5290d7f3e9215589d07b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.01014-of-01024.json.gz": {"num_bytes": 318028602, "checksum": "3c82c0611fb1fb0f635eaedd2bbe7cfc9d53d1ae967a9cbd0416def046e4b104"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.01015-of-01024.json.gz": {"num_bytes": 319164504, "checksum": "5eb5cf76022b12d8751a2fce5c4d4831066785a68edd7b3cd3dfc10017f91621"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.01016-of-01024.json.gz": {"num_bytes": 318474894, "checksum": "a99d827be814e27d948264d6ae55c6a032a664f3ff0ef6ae94bda90f7faf29bc"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.01017-of-01024.json.gz": {"num_bytes": 319516762, "checksum": "7eac25ebb9383a4592023634b852d88a128604c494972a8fd9e2b183fbb303a2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.01018-of-01024.json.gz": {"num_bytes": 319433935, "checksum": "35adb751748043a36f22b412d3ea0e01166037cd96216f516abc547e9d2609ea"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.01019-of-01024.json.gz": {"num_bytes": 320305440, "checksum": "54c4d52564221e48dc5354cb51d447658707ab8edaa3d6d8fec5ec379a29d462"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.01020-of-01024.json.gz": {"num_bytes": 317445661, "checksum": "edf1c6ab9900d75b91738fc7e9e3db8cdde3f9ef2234ff249833b5cdb04c65a2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.01021-of-01024.json.gz": {"num_bytes": 318134525, "checksum": "1c5e670ec9d815637e9bdbd75289c7ef7f3ecf384e32f403ae8a9fe2595cc983"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.01022-of-01024.json.gz": {"num_bytes": 319809162, "checksum": "9def881764ca614c88ceabb41032d3e145f06c843a7ceebd87dba6b93c974a6e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.01023-of-01024.json.gz": {"num_bytes": 318155801, "checksum": "552a6a2be423c0ecbb767611074200c5b85c1cf76c8640c79e3be5e967b293b5"}}, "download_size": 326778635540, "post_processing_size": null, "dataset_size": 1657178361414, "size_in_bytes": 1983956996954}, "en.noblocklist": {"description": "A colossal, cleaned version of Common Crawl's web crawl corpus.\n\nBased on Common Crawl dataset: \"https://commoncrawl.org\".\n\nThis is the processed version of Google's C4 dataset by AllenAI.\n\n", "citation": "\n@article{2019t5,\n author = {Colin Raffel and Noam Shazeer and Adam Roberts and Katherine Lee and Sharan Narang and Michael Matena and Yanqi Zhou and Wei Li and Peter J. Liu},\n title = {Exploring the Limits of Transfer Learning with a Unified Text-to-Text Transformer},\n journal = {arXiv e-prints},\n year = {2019},\n archivePrefix = {arXiv},\n eprint = {1910.10683},\n}\n", "homepage": "https://github.com/allenai/allennlp/discussions/5056", "license": "", "features": {"text": {"dtype": "string", "id": null, "_type": "Value"}, "timestamp": {"dtype": "string", "id": null, "_type": "Value"}, "url": {"dtype": "string", "id": null, "_type": "Value"}}, "post_processed": null, "supervised_keys": null, "task_templates": null, "builder_name": "c4", "config_name": "en.noblocklist", "version": {"version_str": "0.0.0", "description": null, "major": 0, "minor": 0, "patch": 0}, "splits": {"train": {"name": "train", "num_bytes": 1029628201361, "num_examples": 393391519, "dataset_name": "c4"}, "validation": {"name": "validation", "num_bytes": 1029628201361, "num_examples": 393391519, "dataset_name": "c4"}}, "download_checksums": {"https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00000-of-01024.json.gz": {"num_bytes": 396728190, "checksum": "06fcf4d9bf6ae45fac94245952f000c924d2a0b5cc8841c916b3ee949333410d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00001-of-01024.json.gz": {"num_bytes": 395686133, "checksum": "8a0b64c5efb1db1ebcc0a664c801221049f5812652dc1a727a0e9f8d0df0cd0e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00002-of-01024.json.gz": {"num_bytes": 397762165, "checksum": "087fabf9563297a6eab8bc39b68c0c6d15169032001d3a17c9bd964080759f2c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00003-of-01024.json.gz": {"num_bytes": 395307518, "checksum": "1e5b89200528320e354f60be0868a3ab6dbbe667a6b16b48e4739b988a6360e8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00004-of-01024.json.gz": {"num_bytes": 396280504, "checksum": "8291badbe84854960c0ddac3d6c226cb519268d1b3fd267bd72cfb4f10800de1"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00005-of-01024.json.gz": {"num_bytes": 396636600, "checksum": "c74226ceada7d78e3e7a2ad931d0a99df93f4cc4377ec69d4f1fab4164c3d845"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00006-of-01024.json.gz": {"num_bytes": 395364336, "checksum": "4e52e99dfc4e55c41226978b4dbf48fac2f886b9b0446bc3bd576f32bdd7cfea"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00007-of-01024.json.gz": {"num_bytes": 396428805, "checksum": "283ae93ecc3f8daefa9c47651ded763dc5f339ddc619c8cb5e32dce9cb9cfe4c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00008-of-01024.json.gz": {"num_bytes": 395030041, "checksum": "d3fc7fffdf9c2172d233bea3bb7dc485d753319e6196672d0186b8ba04a1d903"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00009-of-01024.json.gz": {"num_bytes": 398255693, "checksum": "61e10cef5c2cab162fb1d26f97fd9d76b30c9ee989c01ef8597d2a4e35b303da"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00010-of-01024.json.gz": {"num_bytes": 397825333, "checksum": "f72040887c2a2c17564c2c6a9a4b5ff95fce6a0eed4f0800cdeff8277af651ff"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00011-of-01024.json.gz": {"num_bytes": 397877458, "checksum": "ee34ff11164e10a86f76593205cb13986c70ea3d3a8849174a6dfb5b4ec91262"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00012-of-01024.json.gz": {"num_bytes": 398317059, "checksum": "7a3ef558efaca3e5d19e9ad02b47dd61f9639dd806130b62d66e9c3341c0edce"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00013-of-01024.json.gz": {"num_bytes": 398518794, "checksum": "f5a6c18992ab2b59a9c02469d20768bf5757624e03bcaf92957ce736a3a9edb5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00014-of-01024.json.gz": {"num_bytes": 397026214, "checksum": "c174b625c1534c69814f8e4879169b58af96f801dbb433113740af0d78535abd"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00015-of-01024.json.gz": {"num_bytes": 395621683, "checksum": "4e8e52a602d4eb4b27104780f4a36617505505fb66a82f36e90631a4e668f5b9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00016-of-01024.json.gz": {"num_bytes": 398138551, "checksum": "a3e7a95b16f09e09e45f1c3bed3524415581e21b065d8efcc66cece705dee4d2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00017-of-01024.json.gz": {"num_bytes": 398720813, "checksum": "79cdb89052e8dcecd1f1319e47f4c4ae1d350ab81777a9ba8077cebdb558e795"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00018-of-01024.json.gz": {"num_bytes": 398538940, "checksum": "8da6aac3a794ce326b5a3971fb75a2ee848f008940d4f1bedd724ce7c5874278"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00019-of-01024.json.gz": {"num_bytes": 396834319, "checksum": "b57c93502949dad9001e89847947f6c65943927eb519e16de4eaf5590b235faa"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00020-of-01024.json.gz": {"num_bytes": 396402861, "checksum": "05e14c7e21df3d4af7be7a597fa22463868464d6475282376536e12e82367401"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00021-of-01024.json.gz": {"num_bytes": 397560852, "checksum": "756d15d8b07414dffd7cff3efde606aa62cf8f73b85d8e1cd17408d6a339414b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00022-of-01024.json.gz": {"num_bytes": 397210987, "checksum": "60aa08d9c5d813d5f2448d910bc23a705cdd0828a9403c18ec223e53623889cb"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00023-of-01024.json.gz": {"num_bytes": 397563062, "checksum": "bd865213ffb2b40c2cd3eb16724b68c0f37e29f68215990dc84d91852c7c0d72"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00024-of-01024.json.gz": {"num_bytes": 395799120, "checksum": "08ff3615ecea3eb5b55703e123475c95afbecfe7107eedf05750147c9ffd12ef"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00025-of-01024.json.gz": {"num_bytes": 398336372, "checksum": "e3e30b97e585fd881b3a1b006775854a11a2b967d992e7eea886338d8beefb13"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00026-of-01024.json.gz": {"num_bytes": 396819084, "checksum": "fddc9e1a8405c5e05e63ce98b19c7833c0fd46392b4b55532b317e7f81426590"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00027-of-01024.json.gz": {"num_bytes": 397912380, "checksum": "d3e597b3a96b993840e47adb761cce2f2ae1c96aefcbd6c250198dedaecde15a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00028-of-01024.json.gz": {"num_bytes": 399078461, "checksum": "abd6d2341b6c61cdb89b80a8b9bfd938bb6d8a423a89e6a9f997c22c6479d537"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00029-of-01024.json.gz": {"num_bytes": 397303107, "checksum": "ee35a3af1056cdab79b644f6352150aeb6fb19a630cd6bc893a072e35fbfbad2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00030-of-01024.json.gz": {"num_bytes": 396602401, "checksum": "1d04d4bc295aee2ab80b24f587f8c483599db7d5a8157acc99a1d8b001f8353e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00031-of-01024.json.gz": {"num_bytes": 395941329, "checksum": "cf1dd244555511245c0e6a5b1dc9c24f747b8377674aa3690677ce08ebb8c26f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00032-of-01024.json.gz": {"num_bytes": 398049663, "checksum": "c83e5572647eba5ab14fdc4dcba8efb6981740b99b8f634e2c6b1942a051c249"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00033-of-01024.json.gz": {"num_bytes": 398044404, "checksum": "b76815aadcf4ad802071428864ce0b406cabd73dfc2be5e20b44885ec6a85419"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00034-of-01024.json.gz": {"num_bytes": 396885224, "checksum": "da00d92418fbdb9799d8f16977b3a33f67cb98a31808544cb68cf3b42ea9adf1"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00035-of-01024.json.gz": {"num_bytes": 396185021, "checksum": "265ad43ce00666c83fd441d35ff29ba1ebf7d62442cc3e3c176091b4c725ea9d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00036-of-01024.json.gz": {"num_bytes": 396702503, "checksum": "4733156df48f2dd0f2e859fef28f56d12a84e8012085ca9318073ae647b0fcdc"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00037-of-01024.json.gz": {"num_bytes": 397582277, "checksum": "7d62d03c3496ee2e17ab6b9635710efef9e4cefb88ddccdc16ed720a414c38c2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00038-of-01024.json.gz": {"num_bytes": 396186761, "checksum": "670affddf8fcca6933af3f5b30efd1bf490c3e38c3e90f2e8e9a464994d613f1"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00039-of-01024.json.gz": {"num_bytes": 397056953, "checksum": "4acbd97f9c8fd9a930a6f4284a11cfe37f6cca3b5858ae3c2cde747dae35e0d2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00040-of-01024.json.gz": {"num_bytes": 397809786, "checksum": "d350e48a36bb1ba3125f72a07ed8024d26eae6d89ecac686ac0bdf3d5d89e1a7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00041-of-01024.json.gz": {"num_bytes": 396944358, "checksum": "817a58dc40440b8b1f54d129db08ae9124e0293e5a0e45f034fbffb2140d90c0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00042-of-01024.json.gz": {"num_bytes": 394327995, "checksum": "6bd6bc1269c2dd81db466ae9c41f76b8b8cf71cc7bd6e131452fa1a1318ff459"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00043-of-01024.json.gz": {"num_bytes": 396476043, "checksum": "f3525d9c861d984ea0cdacba7fddffaef058d8f95aa99ef1f09f9f0792fde5e3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00044-of-01024.json.gz": {"num_bytes": 396893614, "checksum": "292ca2b6b9ba41567fe7cc60e5424aa1f3e431ac874d06ae8eb98794563a7d35"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00045-of-01024.json.gz": {"num_bytes": 395885483, "checksum": "ea2c8fac41ededba7da8bf2bb48463d83f148e5c0970a689876d4932ab18a3c7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00046-of-01024.json.gz": {"num_bytes": 396963386, "checksum": "97672d9bca357cd2721f51301aa37d37a271dd3ca7487244c057570b995da66d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00047-of-01024.json.gz": {"num_bytes": 395856712, "checksum": "52c517670ba4eefb262cb71373d6370f86ddeb0aea7391a47a22d52a55bff7a8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00048-of-01024.json.gz": {"num_bytes": 396091027, "checksum": "49f5b68e29c55eb50da941eab1cf446c7d8c9d0b30290318977edb39ef0b887f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00049-of-01024.json.gz": {"num_bytes": 396892998, "checksum": "82a51eb6f301c00d927ca7920338247038cf4e9e0072d74c02bac897701f5859"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00050-of-01024.json.gz": {"num_bytes": 396308050, "checksum": "d72f92ecd27b716cd90cc4abe562d25fe6d49740b4a3d1fb9beac2526a61988e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00051-of-01024.json.gz": {"num_bytes": 396137777, "checksum": "a956e4d086077f7ab309ff10b0eaf4833e4d3ed74435293e96588f4361e1536d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00052-of-01024.json.gz": {"num_bytes": 398302544, "checksum": "5a54f7faa07661ea6a5f0585ca49ad66c8f7025fd9627b3af832dc886d50f78e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00053-of-01024.json.gz": {"num_bytes": 399616791, "checksum": "7f8fa496d50a0b7c399faff4c1864e24717b3f9c86b2552536c8f91e3e0cf9d6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00054-of-01024.json.gz": {"num_bytes": 397332881, "checksum": "ab862f26b4fa38b6c16d8cfd0d63a9f0973827e45915e85aefb95d4e182b7b9c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00055-of-01024.json.gz": {"num_bytes": 397075146, "checksum": "cb67aa9229bec8b88e496829aa0a60ca1c3ff4a2293632cf7782b69aa71aebfd"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00056-of-01024.json.gz": {"num_bytes": 397827600, "checksum": "2f63e3ec40d32237d4a50c873b966d7fc2c16ef5c04a2bcfc33328b128654e7c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00057-of-01024.json.gz": {"num_bytes": 397533583, "checksum": "7c90bf39bddf8ad0c6a8bb3dff02caea8bbc2abbd76047c5d523930d2a00dbc9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00058-of-01024.json.gz": {"num_bytes": 396411363, "checksum": "ee6059f3c8a2df34858a0110a06ec4e9673555fa56c1a2b40930337ba5b1b39c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00059-of-01024.json.gz": {"num_bytes": 396735510, "checksum": "d9dbe2421edba1820294e757d88aa25455db42ce8992f8933b51cd84cfc35a36"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00060-of-01024.json.gz": {"num_bytes": 395694553, "checksum": "b05d6502fc95587fa7047fac64978d6be13761dcc6954629332812e5937c2731"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00061-of-01024.json.gz": {"num_bytes": 397740757, "checksum": "39303faa5dc33995dfec683b44fc24066ecccdf6b5001b9c0644d8e9899d45f5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00062-of-01024.json.gz": {"num_bytes": 397358263, "checksum": "fe27dd467cc2c34abe5b0bb34473ee68859f2198eeb78304e1d2e54460a67383"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00063-of-01024.json.gz": {"num_bytes": 396826654, "checksum": "1da2c414bd03e5547d8c9c7447e42b8dcff5f6ca8ba35c53076f2895e8ea63f6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00064-of-01024.json.gz": {"num_bytes": 395781869, "checksum": "af96de4d6b5bc1ab0527efa33a73d7eb788dca15829acbb7291ce72ad05e6c66"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00065-of-01024.json.gz": {"num_bytes": 398192274, "checksum": "7f46ccfc1703fee106e932bc9a1bc5dedf7de944172cfa34ec9b31413bf0bbda"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00066-of-01024.json.gz": {"num_bytes": 397133438, "checksum": "dd3b67d8578927d7474dae76bdca35f35a2aa125fc50873e4a9f6e73d7a81831"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00067-of-01024.json.gz": {"num_bytes": 397204214, "checksum": "4cdc87a7c9fea33e15d638e5c921f45149212769bfba5f59f0a5943398ca0d55"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00068-of-01024.json.gz": {"num_bytes": 396489592, "checksum": "64d175c23574998f8c5d28ce3d3f3934144b1fd4f6527ede1aa3420c28bb90d0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00069-of-01024.json.gz": {"num_bytes": 397697351, "checksum": "3329857f531c9fa22d98bd567638f0564f73062da1478ca84385246f71baabff"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00070-of-01024.json.gz": {"num_bytes": 398449973, "checksum": "bd13494aa03a95d943a01f3436f62c46ee3390b30f6ff0fec0636f3c0b09fa1b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00071-of-01024.json.gz": {"num_bytes": 395498960, "checksum": "5e69529ae82c305acbf1f58a7021b4e3fc67285a871dcbcaaff0781d0e721070"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00072-of-01024.json.gz": {"num_bytes": 396170387, "checksum": "9b9c7e11b9bb2cf6ea0fcdfd58754f522a95070feae74c29559522e12e1b41f4"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00073-of-01024.json.gz": {"num_bytes": 395915819, "checksum": "87a2069589fee8de23730b8b994ba59d63d5128175b5326ba0a8c8ac9e01a3dd"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00074-of-01024.json.gz": {"num_bytes": 396986018, "checksum": "e073efb3f00db65c1ee14e8bfa6e8c807f7827d0f3dd4d4026f823bc6f61b1cc"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00075-of-01024.json.gz": {"num_bytes": 398555103, "checksum": "a1793748c7979e241ca34291c843ca3cc90dd7643f04810b6cd324220efbd6e7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00076-of-01024.json.gz": {"num_bytes": 396357420, "checksum": "7b1cd69788ca9a7e614de70a8b908183f41f316eaadf3b0236a7c4e126db9844"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00077-of-01024.json.gz": {"num_bytes": 396666167, "checksum": "aec828d3c2a1f7fa970de328a8fd1a85a90493dbcbec4f50816ccbc2275a1fac"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00078-of-01024.json.gz": {"num_bytes": 398167446, "checksum": "e14bdf5af810574aca7c6f3daa67e503f24ab1705435a62129c66c248667ee97"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00079-of-01024.json.gz": {"num_bytes": 399696096, "checksum": "b63756f81b8b19ecdc9bf227045df10840cbf973b60bd8ffdf28f58a53cdb028"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00080-of-01024.json.gz": {"num_bytes": 398755610, "checksum": "dfc118f680b79260e7ece75f27c0459484eb8458f2422df9f1918f726b54ccb6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00081-of-01024.json.gz": {"num_bytes": 396606787, "checksum": "17d6a503947f5132728f53ea62fd093f55bf2dc6a32316a5c0413353cf13eff3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00082-of-01024.json.gz": {"num_bytes": 395714484, "checksum": "8ca41818ee6a0ffd5b00714779289c18cd97d620258c5d3d741c482b72344300"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00083-of-01024.json.gz": {"num_bytes": 396807173, "checksum": "12d87c0a948f32f788497858751c3ef22f289136e6ae58518a97a2e976f5cdc8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00084-of-01024.json.gz": {"num_bytes": 397241529, "checksum": "7c3da4ca4d2b2077f0ab7be511038255732fc88d954f2f17cb0f3ab144216206"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00085-of-01024.json.gz": {"num_bytes": 398357369, "checksum": "26df55183e78f8d69fb16e21d07edf98659b69bcb3c48f340da6a5bc44007f4d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00086-of-01024.json.gz": {"num_bytes": 396997317, "checksum": "09f0641e9075cb88800d0eaae3f7b99b047552edbc71d1fd2d8594f645d22c2a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00087-of-01024.json.gz": {"num_bytes": 397978000, "checksum": "c9437ef5f58a46b8a6d8efcae37fa658da3f2c4f1cad0f9cf47fbcd09bb82f8c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00088-of-01024.json.gz": {"num_bytes": 398468913, "checksum": "be187fc14017f666b84ed7049c169c1a28654441c2f523eee8b655b3b9d9ba8e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00089-of-01024.json.gz": {"num_bytes": 397071121, "checksum": "637c3f964ee2c750a0a175f2e5d24b786a37d37701f10616b448804d68b72f4e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00090-of-01024.json.gz": {"num_bytes": 395753807, "checksum": "8eef7ff1a8080aebe5226cc3539baac46ab64d93f8e3ffb6e8b7ab3346e151dc"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00091-of-01024.json.gz": {"num_bytes": 397039764, "checksum": "a2904ae5bf69b393a697afd62ae9b8a560c1f076e8a141e6f3feef29cb5d1352"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00092-of-01024.json.gz": {"num_bytes": 397058578, "checksum": "eb4d7e2712a9983bc1581133fa8eaa2e1d28b314861833bd8d810d615ec1ed81"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00093-of-01024.json.gz": {"num_bytes": 395855981, "checksum": "5c9a7573a5644d89d46666306d333ff1e4af3213f287cb9adb48ef87a023d479"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00094-of-01024.json.gz": {"num_bytes": 399516118, "checksum": "de7ae1508815e48ba031762c084cf6946b084871463821407090d23c197c6474"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00095-of-01024.json.gz": {"num_bytes": 398236235, "checksum": "616cef1f21ef078ffb9fc2b4148735668debdd15a8bc1be281183ba3659e9fcd"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00096-of-01024.json.gz": {"num_bytes": 399526010, "checksum": "eb754381b8a6f3c74dda5ee5852958f7b69c707a3908cbaa9410c972e002a0cb"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00097-of-01024.json.gz": {"num_bytes": 397935028, "checksum": "6d6d2ca80708b7c6ad4240a042dddc2170060e8976c2e7b4ace446d2f2395076"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00098-of-01024.json.gz": {"num_bytes": 398645934, "checksum": "568db6971230fb42df8973ecb5a2a6d77204aa8cf0bdf47b386c04370da8dfd1"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00099-of-01024.json.gz": {"num_bytes": 398110916, "checksum": "9bacb381e3b06976619e816e40ac2ccd3bcf3cb9ecd30c294b388cfb75c8bf77"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00100-of-01024.json.gz": {"num_bytes": 397631228, "checksum": "7d515ac0f767736600a216ebe7280b9751f16e70df969ba601d1aaae15f201e5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00101-of-01024.json.gz": {"num_bytes": 395102356, "checksum": "87c5c81e154e136f3e090ba91682ad54fe678653f86f6f32002ae5ec3c9aa743"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00102-of-01024.json.gz": {"num_bytes": 398926159, "checksum": "2df85a9ac13812c3870180901dbba99b52e53fc045da019160a3f06d0dfa5e95"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00103-of-01024.json.gz": {"num_bytes": 398383820, "checksum": "8134d12e84ed4a58a5f8f6eff8a4349f7d6ded6a1d7539b5c23193571569d6c7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00104-of-01024.json.gz": {"num_bytes": 396628542, "checksum": "208f0cb3365b0243d70e7b4e52ff977e9b11d8e451adea521a5bf6e10cd40ee0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00105-of-01024.json.gz": {"num_bytes": 398737797, "checksum": "855ac7b8cb621a240319ef00197d2f20338d17db71a1aec68fb66930bc17c59c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00106-of-01024.json.gz": {"num_bytes": 397281064, "checksum": "544d5d91d066f2450bfe622ce55bdfe16a300aee9c05aaffae8a645966bc695e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00107-of-01024.json.gz": {"num_bytes": 397919761, "checksum": "f4af405c0f19c9139d93b3073f3fe328be998c9dc6f74afc7e21ad068964b92c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00108-of-01024.json.gz": {"num_bytes": 398810219, "checksum": "bdfce29353c6caa33b178bdebbf7e48526c391bc6c71180e3fa378b723879563"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00109-of-01024.json.gz": {"num_bytes": 396605124, "checksum": "ed6acc172bc9af0e31170f5533001a8fcd344e6732a4b3a714b7ad43740f25f4"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00110-of-01024.json.gz": {"num_bytes": 397491755, "checksum": "428b6c91f12c4f7032fa692bbe887f1a4c02635eb88b91d876da4c71f3da5e4e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00111-of-01024.json.gz": {"num_bytes": 395754897, "checksum": "a723863559edf291fd8a6c2736cc1cefed70dd3c8625b967df049ce0d373f68a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00112-of-01024.json.gz": {"num_bytes": 398567649, "checksum": "a90ddc9ccfbca20b9c75bd2b7d63ee6abd03236a0f0dd2827eb9f7350d9c3931"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00113-of-01024.json.gz": {"num_bytes": 396706569, "checksum": "479052b6b9edcc2bbda40b982976e7e28d84fad7b2dce46b017f4e3d1f61e0d2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00114-of-01024.json.gz": {"num_bytes": 397384355, "checksum": "a95984e4c261a3057d1bc51939aefd9413853111e19030b19c5d26f778be00ba"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00115-of-01024.json.gz": {"num_bytes": 397702826, "checksum": "5eaf7fc2c9d4b2ee3e216c215da7f4fc7558e89d6993033b95a940a78061ab05"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00116-of-01024.json.gz": {"num_bytes": 397252590, "checksum": "268033cbbdf3be9790cb6010791693f1b490af06f9fef91b0b307420a4e30a08"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00117-of-01024.json.gz": {"num_bytes": 395506730, "checksum": "cb80908eee1054ddaf7e2e5d66c9a41505025c2b6dc7fe6aa287db0a9f3829ff"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00118-of-01024.json.gz": {"num_bytes": 396452136, "checksum": "d75bf895c88ff2e9c4031c1f65b067222cfbb1a937d685ab4dd33369f5f5ff7b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00119-of-01024.json.gz": {"num_bytes": 396777389, "checksum": "2c00362f4d99cef2bae2f13f17b79ec56a5ef8aca18ffd56a12fea2308e5017b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00120-of-01024.json.gz": {"num_bytes": 397730478, "checksum": "e31296949f7ce2e2a74fd2443552cb64b9f3cddcca691097a56992f51033fd11"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00121-of-01024.json.gz": {"num_bytes": 396593647, "checksum": "c2f0f81e3c835848a47532d8fd1c215a624f47740196a7bb45b5099916853014"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00122-of-01024.json.gz": {"num_bytes": 396576172, "checksum": "72edb7581a623e20f26cae4885f3b9d7f329581921253ca4d7ceedfbca17b7b9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00123-of-01024.json.gz": {"num_bytes": 397378329, "checksum": "4f045ce7bd077b7f878012aead8c51073022448de66d2e35a755d4c8c4a6f59d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00124-of-01024.json.gz": {"num_bytes": 396545003, "checksum": "dc7949657328520d31a27d8e267c2ab07cd4e8639036d4b1bb59454c309f862d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00125-of-01024.json.gz": {"num_bytes": 397630505, "checksum": "530bd95e5ef9a1d5989c595e60e0ab11583e0f42d16b2bd37c49ed09a67af207"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00126-of-01024.json.gz": {"num_bytes": 395483747, "checksum": "d9df071edec6959ba842509f72ad43be3ea3f529b60d48f3dfbf390908887a5f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00127-of-01024.json.gz": {"num_bytes": 397295159, "checksum": "02b61f5bc7d1d241484c4f04fd517960ae755a69f35192bdd5bb471baeba5614"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00128-of-01024.json.gz": {"num_bytes": 396276865, "checksum": "0c7d618df232c36ba018269ddf3b2863cd6d63bb7fabeaae33fd508715bd8ce2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00129-of-01024.json.gz": {"num_bytes": 395314703, "checksum": "03443afda032187d2dc2e696ce6eaecbf2219e6dabbdd593379e97c0e00e3112"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00130-of-01024.json.gz": {"num_bytes": 397411481, "checksum": "8969873d5efd3df0cef1742e4bc67f2df7a5b5d9e641f7a12e77c7e8e96a1bf1"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00131-of-01024.json.gz": {"num_bytes": 396925311, "checksum": "31adc39ea4eda8667662608bdad6bb32bbc82b1ee1ad53ceb4df50924a933bdf"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00132-of-01024.json.gz": {"num_bytes": 395826124, "checksum": "d2f035ba2c388fec2d847bd43449c885eadd0bcab5fb8afdf031a53e72c4ec32"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00133-of-01024.json.gz": {"num_bytes": 398892794, "checksum": "b7ed60983058a5f9f0ef72602789f50359f415ecbe60dc967e7a869866d833b6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00134-of-01024.json.gz": {"num_bytes": 398206890, "checksum": "9ba78624879aabb72bae0b4119fa2625793915382031ed897a0b4c3f2863b8aa"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00135-of-01024.json.gz": {"num_bytes": 397161888, "checksum": "9fa6fee55f5e8f887dcc64d94cc65ada6f283a580edc7926cb159b80d0084ea8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00136-of-01024.json.gz": {"num_bytes": 396185585, "checksum": "81a1fcafcedfdd9bcb32d2467d9c963cc7d8b2f32e13e52ee04db41b0d3f5483"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00137-of-01024.json.gz": {"num_bytes": 396933735, "checksum": "c7558304b614e1cff13b0f6e967fc5ef77e4953a1eea1f39ed925c33076d7723"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00138-of-01024.json.gz": {"num_bytes": 396371698, "checksum": "3e896da8bf296403f7b4061ba0b24d3c3978993de4854fabd688cfce9fbf7bba"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00139-of-01024.json.gz": {"num_bytes": 397289537, "checksum": "1a5ffa3aaf565ccf4db7444983643ad06e386938a0a2d313aecdb972c36111e4"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00140-of-01024.json.gz": {"num_bytes": 396983259, "checksum": "4047916916fd9dd7b76a8cbc595d52803344467135f744b23bd10296004a47d7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00141-of-01024.json.gz": {"num_bytes": 394947050, "checksum": "7edfc9e5870d80d470e3797e8bef5183e9d170eab410ab50957e946dde2e8199"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00142-of-01024.json.gz": {"num_bytes": 396852755, "checksum": "4affc3a24616858fab84211e3825e90a1ea7d9c8f2cfabbe9a5c9b24c21a116b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00143-of-01024.json.gz": {"num_bytes": 397579248, "checksum": "d5aa9ba68e9b30576bd640f647d4069b6c56db276cc5229573440e4a38a7f1e9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00144-of-01024.json.gz": {"num_bytes": 398800367, "checksum": "fa104e63eb7a8a6b066a5f00bf05b3ea095bad35a902bc728251f096173f1417"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00145-of-01024.json.gz": {"num_bytes": 396709510, "checksum": "b615ecd58821b1697c82094cb3435375924263827c342ab1b87e53907d4aa63b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00146-of-01024.json.gz": {"num_bytes": 396042389, "checksum": "6004c782f3235490865b6634b2c4840a989745b70ef2da674e75c62aeedf8a6f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00147-of-01024.json.gz": {"num_bytes": 399840661, "checksum": "5e8b46726f7ff2c3dfd381fb252f1b4bddf9436fd9ffd10fa300cb0fbe76998c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00148-of-01024.json.gz": {"num_bytes": 397098215, "checksum": "0851cb274aff2ec4f781c82af11c94f8938a797aca5097fb0089299cb4c75aff"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00149-of-01024.json.gz": {"num_bytes": 397540697, "checksum": "7cadf4ef9b0e29d9e8f68474464dc072b78e909a0f03c74e61b67912ff9b551d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00150-of-01024.json.gz": {"num_bytes": 396347701, "checksum": "521e4f67d12ae47b8f2a02b6f77e0c85cdf9a0efbcb45602d09ae116110ebe66"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00151-of-01024.json.gz": {"num_bytes": 394890490, "checksum": "2255bf3e1940ea28da9656028dee26865a9ee682cbaab4d5aeb34c081062f8fe"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00152-of-01024.json.gz": {"num_bytes": 399584675, "checksum": "f8ca4aaf5706ffb0f5518c7461d9045d18c645df068aa436137299e5ca77df82"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00153-of-01024.json.gz": {"num_bytes": 395606567, "checksum": "24f0e81dc3140f063ac89173fc262b01f2420133025b114f29632262cdd2e7fa"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00154-of-01024.json.gz": {"num_bytes": 397925578, "checksum": "5f40a87b15b0acebbd324e7c5cd2c0f31f911558d57f774f278634db94f2d5f7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00155-of-01024.json.gz": {"num_bytes": 395428741, "checksum": "36281c154f187a09a83822878da815cd9b7f659a41cd90ac64653b437e798c72"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00156-of-01024.json.gz": {"num_bytes": 396799274, "checksum": "0fb66965107e54c9fed0013962763e874b940b0e174d775b21fa5e688fa53b33"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00157-of-01024.json.gz": {"num_bytes": 397321211, "checksum": "014d1443a4940fe95089bf87e245817d3a90c50e3e371a703098f5b9c3f6c759"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00158-of-01024.json.gz": {"num_bytes": 398736992, "checksum": "f912d27d68318fc0089fbaf8e0481ebe8dc5d2963cb89ed315f3bec637460bfc"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00159-of-01024.json.gz": {"num_bytes": 397250687, "checksum": "1bfd02a301b09bfd53058522d0613e1fbecb788d3173eb30b58115cd1cbdb477"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00160-of-01024.json.gz": {"num_bytes": 397492158, "checksum": "149a7bd76e9ea41185d99d21df870ddd4f32857fdd628cee927d6bee7d6a527d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00161-of-01024.json.gz": {"num_bytes": 398383574, "checksum": "0c385b4c9b33574cdc75070309a0aed46aa7b2e3b8754a7692035a3c5a04f916"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00162-of-01024.json.gz": {"num_bytes": 397126197, "checksum": "5c012b2a6bbc9413914ed1420b6150a5549cd74185bf2788d8809005034d433f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00163-of-01024.json.gz": {"num_bytes": 398201223, "checksum": "79448c338e86cea2609399705268fc6011cb21c4f0aff82e3fb7660391ce85c4"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00164-of-01024.json.gz": {"num_bytes": 397914908, "checksum": "dfb89631dce146ab4713a03f184e864472eb133b2cd04db8b4bccab688e9e287"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00165-of-01024.json.gz": {"num_bytes": 398142696, "checksum": "74acc88d6612aae7bdf5187d3b9eddcdb04cf60f1cc350661ffa50219a747f9f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00166-of-01024.json.gz": {"num_bytes": 397533050, "checksum": "757d23402b3a155cfcb6b30bdc305c8014c9b64ba4e067753664670c2c5e9534"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00167-of-01024.json.gz": {"num_bytes": 396241119, "checksum": "521bd7a9dcfa0390c35e50a3d0cde3ea627ca538dfc419a97ed83b251d8a3005"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00168-of-01024.json.gz": {"num_bytes": 396041761, "checksum": "dc540ec27d5999f6a4c71f075ae1ec64ea84415c720cd2b6ef3fdac925e576da"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00169-of-01024.json.gz": {"num_bytes": 396350882, "checksum": "36d5d35075a82038dfdd5abd29a839f4e9ab79d51f0bbc635d3dcf3f5f1e2732"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00170-of-01024.json.gz": {"num_bytes": 396885157, "checksum": "db9a3f6a7e085007eee381357ea9e4d5d6f702580d38220860967ec441ba3525"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00171-of-01024.json.gz": {"num_bytes": 397266368, "checksum": "7f8098cb6532bc888d3c1f0ea5072cf8419ce1689b9ffe1c370ca20071e7e1c2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00172-of-01024.json.gz": {"num_bytes": 397140430, "checksum": "90ae7e2551b1f3bf2e5ccf4fb3fac8fa3512add5e299ba7c90319611baf8c840"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00173-of-01024.json.gz": {"num_bytes": 397069631, "checksum": "a86f5ab72e1a9b1d491988154fd6400e6ee8c74378a9e64276df438a3c4edf9f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00174-of-01024.json.gz": {"num_bytes": 396743897, "checksum": "451cfe8e14c17113a2f6673ece27e01f8d54bed1b57d1b20cb84f125879939ec"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00175-of-01024.json.gz": {"num_bytes": 395780705, "checksum": "3252e9781545bc3f9f19ac6e8fdb87d81cdc5a94838798daf6037c9f4f473db4"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00176-of-01024.json.gz": {"num_bytes": 396205053, "checksum": "49d1648d37150b90632a6459828eedd82deb2fce7f108bf4e1b050f2f9ad1668"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00177-of-01024.json.gz": {"num_bytes": 396248718, "checksum": "99346ccda762ae85038a10baba937ef8ef668a0beab483c4005dce77e331768b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00178-of-01024.json.gz": {"num_bytes": 396634813, "checksum": "8d3bb1610ce79cf359d75f32e7624b6203140ed3eb276362b040615e9ffd4b54"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00179-of-01024.json.gz": {"num_bytes": 396524113, "checksum": "971e5c9499425294cf5945436b2ee419379a75bdd72d4cd6a33b1d17c17de298"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00180-of-01024.json.gz": {"num_bytes": 397938782, "checksum": "dd6b3e60219788b82ab3fc63a9e65f38f64aa2f7b294135ec2d16b36350f1f40"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00181-of-01024.json.gz": {"num_bytes": 399155769, "checksum": "c6a806d627a9d197789bfc6257a92b0223ca51e724c3c2ad10fe2397dbe30848"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00182-of-01024.json.gz": {"num_bytes": 396136228, "checksum": "2c48e3237253eaad9afc121e6946a9e1856bbe82c5a7cb287b05cff3e6ea8e8d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00183-of-01024.json.gz": {"num_bytes": 397083292, "checksum": "52645e03ab47da01bb40226eb90042be914f1170688ae940314871e16cbb1037"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00184-of-01024.json.gz": {"num_bytes": 397402964, "checksum": "1edbdb41edeabc108f0147e18b439a75e390e0a843ed915f1cbf73a7c7f7867d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00185-of-01024.json.gz": {"num_bytes": 398411052, "checksum": "ef071e52174a19597e567696262470906275c2cd1cbbb0b1e98864999ea2d463"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00186-of-01024.json.gz": {"num_bytes": 397122443, "checksum": "0d87080bc08f7f8a1952a7df57ce2bdbf61e40c05b61937c8c19ae0ecd952b1b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00187-of-01024.json.gz": {"num_bytes": 397244868, "checksum": "4aed75ea9f885fc3dab599c19c7bb98f7d57ce2b2ec11ac8ab3258fa479fc0db"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00188-of-01024.json.gz": {"num_bytes": 395677432, "checksum": "342882e436ea826cda9fd38c0caca68bb35444a2a07596f8de0e53a3e2169f59"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00189-of-01024.json.gz": {"num_bytes": 393653750, "checksum": "22ed9e389f6c8410c9bde898d97ad798c236c2da4d0b2c76b86d013f8686da03"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00190-of-01024.json.gz": {"num_bytes": 395437920, "checksum": "b3f9ba5834d4f0280d6defd3bd50fdf961bee6be4c71ed47046cf4e115acab01"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00191-of-01024.json.gz": {"num_bytes": 396944861, "checksum": "4e7ed636a60edc44b5ba709dcd83bf4263ad8d5a06a02827d3d27191bf3731a3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00192-of-01024.json.gz": {"num_bytes": 396611165, "checksum": "4fea34466d9b470bf0bc44455183b2c61994c4e71e4bfb684dff3b5e3870d1e4"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00193-of-01024.json.gz": {"num_bytes": 398283211, "checksum": "4c4e6d31f455831330971ed1e0c33221203401b817adbda5b53de16f8299a9ba"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00194-of-01024.json.gz": {"num_bytes": 398915952, "checksum": "dfd0b1ceb2a437da8cd38c9c791af809e94f2e36ab4399b2a45a5b916f4ccaa9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00195-of-01024.json.gz": {"num_bytes": 396352694, "checksum": "0ccd90ced34b3ff28c21d015a87eca3f31eae2bf31f11f25ac073139f9d50c22"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00196-of-01024.json.gz": {"num_bytes": 398582922, "checksum": "f22e59765cec074a0c687c500f4e6348250d0e418d12dcba211e39c133aaf290"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00197-of-01024.json.gz": {"num_bytes": 398839554, "checksum": "95fa68cd75d77a1b5bb526dd5ef16a2f04a3520604f734baeb6e2d95608b5973"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00198-of-01024.json.gz": {"num_bytes": 396202192, "checksum": "f0e6343e8105178b38f75eade6774aa6e85b62a271622fcfcbe2745f1cae11ec"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00199-of-01024.json.gz": {"num_bytes": 398029364, "checksum": "4c58736410c8d3c7174ce011e2f281cb16e4949d756ff4ace86b4a9d4795c04e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00200-of-01024.json.gz": {"num_bytes": 395867629, "checksum": "1cb798ee6609e670053987d881d130d5b73db19d9f37fecff7a6da41152aba05"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00201-of-01024.json.gz": {"num_bytes": 396858169, "checksum": "7357eb22b2aa75c55885252c62d12e08cf8f7ef285c0052cf1d706c3f0f74fef"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00202-of-01024.json.gz": {"num_bytes": 397955766, "checksum": "8901d0f27c4c11916cda7cf806cd00000771b6351954c8503bc312cca5ad3a10"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00203-of-01024.json.gz": {"num_bytes": 397737882, "checksum": "ed51917fc8936701b681cfc49ef95b2dab451ca597e76b34ba90be9405a1a0b8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00204-of-01024.json.gz": {"num_bytes": 396094006, "checksum": "88692bb8da78347cb97c0e0849d1a10a97b1686cde1f75626236b89bd507e2b0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00205-of-01024.json.gz": {"num_bytes": 399027636, "checksum": "fb17fe19d1f0fcaa43fb31a3ad9b105b3d93fa287351c7f93fb599edb7f40bc3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00206-of-01024.json.gz": {"num_bytes": 399406254, "checksum": "668d2a9927080b686a4d728236e4cfc780b262f9045dfe9575cfc48cb69d6adb"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00207-of-01024.json.gz": {"num_bytes": 396291803, "checksum": "928f451dddfe42bb2ca791dbc61c36ddc618006ef709eaccbc2beb665c8427e4"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00208-of-01024.json.gz": {"num_bytes": 397807368, "checksum": "11e8627b758588056b61d31de07c50092222013a38ba802b7a9ae34b6b8b84a6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00209-of-01024.json.gz": {"num_bytes": 398085408, "checksum": "d49d31d1719698ab7a2b9ee91d887f3192c8fc1b6108152a75b39de2a0ad25a6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00210-of-01024.json.gz": {"num_bytes": 397670254, "checksum": "049b3294c3e22e6db6c115979a4a55f0650966c600ca17250e91b241cc97bbd4"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00211-of-01024.json.gz": {"num_bytes": 399643598, "checksum": "7772f26fd90f47033670e7f1d3f6fe092116486bb9a991577f9560b54ed3832c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00212-of-01024.json.gz": {"num_bytes": 397390768, "checksum": "7a24e4a70f43f6227fe6491fcc7bb6b2a19cae203521c803bedf8882c995d7e6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00213-of-01024.json.gz": {"num_bytes": 398657925, "checksum": "21d0ee8d1a01957b56ac503aa88c6f3269b4e4692762a3f929fe0e7069be8c0a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00214-of-01024.json.gz": {"num_bytes": 398282324, "checksum": "ede2d9824d8f99dd578a36ea82caae942ebcafd99f308cf5d0ff8aa4a56f0a05"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00215-of-01024.json.gz": {"num_bytes": 399178235, "checksum": "82516fa361dec02c7ed59ea2d0510d9ee4187609b449dca649a04141b12bc037"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00216-of-01024.json.gz": {"num_bytes": 397630870, "checksum": "4a6d5e60354b7b93f005010c6fc55c0a81596e98a116cdeec99e1ab4e58fd03e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00217-of-01024.json.gz": {"num_bytes": 398628848, "checksum": "02dffb623b628a3a3ea38084fe6bb840aafab8419feed3d1f2bd3598cfa80aab"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00218-of-01024.json.gz": {"num_bytes": 395087998, "checksum": "e1e9a7ac7a922d6a9bb90f82cb48dff11ab7208dac08511e9613cd2726ca67ec"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00219-of-01024.json.gz": {"num_bytes": 397622792, "checksum": "955afc7d45a080ae137e9dc25ba3d85629a6a14c3d9bbe4065aa37d710345b7a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00220-of-01024.json.gz": {"num_bytes": 395112655, "checksum": "a3560918bec20087e9908009a362957ecb06401924789e20b36c26e363db5ae7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00221-of-01024.json.gz": {"num_bytes": 397132000, "checksum": "d8459bb5b6fb6b341b24fe517cfc5dc099765ad70c3383bae913229e06cf99e0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00222-of-01024.json.gz": {"num_bytes": 397138513, "checksum": "20d3c6219921dc9c2928d637000e488635fd9a12b5636de5a6a7e52c1b67d781"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00223-of-01024.json.gz": {"num_bytes": 397167661, "checksum": "43a18accd194646893324537991e0162f6f98a9cec5ff59fe8fb510d81d707bc"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00224-of-01024.json.gz": {"num_bytes": 397905941, "checksum": "a516485cbefdef2e31a493cd8827a5f936f10674ff3525b71d414e17f48241c3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00225-of-01024.json.gz": {"num_bytes": 397218123, "checksum": "791c85c78c5e7f3557855a1fc71acd860521710515b89f92e54e02960549f46e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00226-of-01024.json.gz": {"num_bytes": 396619135, "checksum": "52a36037696e6245efad80e00d1f123c36dbd79e7ff52b1fb99f579e712d2b30"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00227-of-01024.json.gz": {"num_bytes": 396654998, "checksum": "e31123ab579fe95bd50afa10d52a51e9c15a4af28c06583fb5aeac4e3418f129"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00228-of-01024.json.gz": {"num_bytes": 396899165, "checksum": "86481361fff334dee3183fac8ab3f346e44ab3e6e7b35bbd7e6e062b2d2fa0d7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00229-of-01024.json.gz": {"num_bytes": 397489378, "checksum": "bbb717711fb4c78ebe8a0476296a21a50285ec41d9fb9f08d5d66d899577e04a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00230-of-01024.json.gz": {"num_bytes": 397462301, "checksum": "054414aac29b5c8faee71a918f2586ad3fce8ee44c71e7a2e2af4b91e0169523"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00231-of-01024.json.gz": {"num_bytes": 396097584, "checksum": "8136e320fccba75a493954fefbb560f92532be44a6e0990404edae659d48ce1e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00232-of-01024.json.gz": {"num_bytes": 398984795, "checksum": "3d9362aab157beef3b5fcd4a0a0236d59de635a565b1c86423f45b26e8b437b5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00233-of-01024.json.gz": {"num_bytes": 397258012, "checksum": "e1a532922477d17f7cbea7db72c2391d26b4db580e526ebd5a90be23607a8d31"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00234-of-01024.json.gz": {"num_bytes": 398350453, "checksum": "c464829565bcaafdba165b2d886be4580f3c0a516b5417853ffc4fe30049cffe"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00235-of-01024.json.gz": {"num_bytes": 397147353, "checksum": "573a6a1d33ccc6c5b605d381f04d73989504bb6d24514b938e92c3d4f61501e8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00236-of-01024.json.gz": {"num_bytes": 396963006, "checksum": "21318462014bc185d0da7cbd342fddd07521401ca2b73e47eb5cb4bd42a82bbe"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00237-of-01024.json.gz": {"num_bytes": 397087111, "checksum": "49459c97b078726bf8377748d4bb2066bdfa47e2717315a9b3c8075cfc4b9b10"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00238-of-01024.json.gz": {"num_bytes": 396984031, "checksum": "befb46e9f928876edc580c60ea4242f63cf6df77c6c107fec6e4280d279e348d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00239-of-01024.json.gz": {"num_bytes": 395915197, "checksum": "dc5ab17e04e4f2678771094af67909dcaa8be36a6cb047cfa66e75f986c91312"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00240-of-01024.json.gz": {"num_bytes": 398321096, "checksum": "25b92f7a499e9aaf0496a57f6292a7f65941b34dd6c78f14b08358d180070029"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00241-of-01024.json.gz": {"num_bytes": 396626980, "checksum": "1ae21ee5585ec718763a3c7bd70d9338aaf77d0e02f92a41f6ed213d1eefa5b4"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00242-of-01024.json.gz": {"num_bytes": 398220596, "checksum": "c29f98174a0c02a817d5cfa3ebb2a92d5f49df8a34fa40abd360f1b39b4bde05"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00243-of-01024.json.gz": {"num_bytes": 398250083, "checksum": "819387c95ea7183b1f9e1e78d077de65023c4809198ef3a0c946f46f8b6c19b4"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00244-of-01024.json.gz": {"num_bytes": 396943969, "checksum": "7a0b0b984d7afc4181827705212f917cf4ac12412f640a2c8120513763cdb390"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00245-of-01024.json.gz": {"num_bytes": 398365865, "checksum": "a424157137a5eeca89819d600deea2a1619ea8f5ae1ed395c88ac600a85e3afa"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00246-of-01024.json.gz": {"num_bytes": 397285385, "checksum": "73029f721bdaccd9d126e871973e70a551f48f077f5903656b305ea9885c4798"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00247-of-01024.json.gz": {"num_bytes": 397132841, "checksum": "b223cf1270d2c728592ec65b09599bbdef8d64f7df2eb525e114f86268500daa"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00248-of-01024.json.gz": {"num_bytes": 396316645, "checksum": "94102d9bcc086ed5b203bc0c6b830dd245c9bf6c695b23b19922b2a98eeb6a52"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00249-of-01024.json.gz": {"num_bytes": 396644237, "checksum": "36be793f4d76070ba1c696b3274e6dbab43f415c8fbaf752145cc99af6558680"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00250-of-01024.json.gz": {"num_bytes": 395860541, "checksum": "313febcf026d2cd1495fdd3d5ba3b492ce5d5749153e189672b6d9dff3e26a61"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00251-of-01024.json.gz": {"num_bytes": 396709140, "checksum": "7e2480b3d5869ba35007c40e18585f3fa208cdf8e004078cc8de4fac36773507"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00252-of-01024.json.gz": {"num_bytes": 396508847, "checksum": "25df46ae56c0d4a6f945922e31fc697d12e0b7c525be9bc2b8eced802641488d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00253-of-01024.json.gz": {"num_bytes": 396364816, "checksum": "6b2125b9eab9bf893e7f8913a6beedbeeef5de53893fbd6172f706e33bab5177"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00254-of-01024.json.gz": {"num_bytes": 396122930, "checksum": "7947e5152c5305863e2d664622e3de49f9386b4384eb09630c5bfcad21fb458e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00255-of-01024.json.gz": {"num_bytes": 396929803, "checksum": "a1ec8c609ac969c24e2524f0f3dc31ef43ca0147ffe66569d3135e4f28394325"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00256-of-01024.json.gz": {"num_bytes": 398432943, "checksum": "3fd0373f5a8974a3499c436d96ea73be95f5619b8388dc316f51aff01e9ecad7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00257-of-01024.json.gz": {"num_bytes": 396003748, "checksum": "516cf3626076f083962983b2d6c596ef355609492f2e81c6c3cdec01acf8c5d7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00258-of-01024.json.gz": {"num_bytes": 393890690, "checksum": "700760a7764f890c8aae337e7ee458c8467eb9048347edd237e341dd2bd5d236"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00259-of-01024.json.gz": {"num_bytes": 398130606, "checksum": "d868f8ef5e1cc971ffd00908bdc7eace32ec151d7405d7cac5fac22df9ea10c0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00260-of-01024.json.gz": {"num_bytes": 399765969, "checksum": "7d5eb3b88eb8a0291ae70c1997458cf5aecac645397e50a67fab3d1193064353"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00261-of-01024.json.gz": {"num_bytes": 397418895, "checksum": "ca607c9e13d7cfb73a29ee3131f77e6bef3130d8627037cef9f57ed459185f0a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00262-of-01024.json.gz": {"num_bytes": 397925991, "checksum": "ca789394ab4398c41490ec6147a41ffc8847155ea9ff74d7ff8b3402ed0634e8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00263-of-01024.json.gz": {"num_bytes": 397082336, "checksum": "aac81d1bf0ade80758c14d01842b9b06c89ebf2fcdb9a06b1472bf2f70bbc348"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00264-of-01024.json.gz": {"num_bytes": 398101079, "checksum": "3cf56a2989b5c3f26ba94124cc534f5c9ae9770bdc6a3431dd745603b480ab19"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00265-of-01024.json.gz": {"num_bytes": 396949669, "checksum": "d4f252a6c2f43833d6d89bf69337449b4cae5dc88fd08fb20b35fe7194a50ddb"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00266-of-01024.json.gz": {"num_bytes": 396242007, "checksum": "71c745968d8ee4a0d64f38930a76e65d68ea094ba3e0b963d5d6878f65f51b34"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00267-of-01024.json.gz": {"num_bytes": 398342031, "checksum": "706a560c862979594265925c3200d4bd0981a9eaa279841f2cba673634f7074b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00268-of-01024.json.gz": {"num_bytes": 396399468, "checksum": "eb3dea553c37f220b3b9b5f377d5a4ef94243b3c0b6b46981e3e5b7ba5b4a935"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00269-of-01024.json.gz": {"num_bytes": 397181296, "checksum": "4f0feae035dacaeb720ca3b6ea17685144895a0d78cfa358e30983f8d6c4ec76"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00270-of-01024.json.gz": {"num_bytes": 395712883, "checksum": "6e0f6de1e5a5c6d4bf23d0539ee72ecc2b4285da2b0f1ec2cdcc443d2e22aa88"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00271-of-01024.json.gz": {"num_bytes": 398066980, "checksum": "4c5cd1ef1917ed762d7d8c5c54e1da05db74e45721697df8b0626e0aeac96966"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00272-of-01024.json.gz": {"num_bytes": 396667308, "checksum": "77a33c37a5d88e419e2b31cf560d53f129a38e5bc2306b5baccc187b7e94e589"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00273-of-01024.json.gz": {"num_bytes": 396020214, "checksum": "b18e40c00b8e0e02dfac40ea0519964e231c8a2f28bc1294b044fb090f41a9fb"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00274-of-01024.json.gz": {"num_bytes": 396300833, "checksum": "34c8945a6ebac564fe87881d6968d05363a89985f297692a3df7104128b9c26c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00275-of-01024.json.gz": {"num_bytes": 395206463, "checksum": "1e41d7e2a6117224dc23fbaae8e9d20df9d7744adb4687d2b0e570bf8d9e47f2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00276-of-01024.json.gz": {"num_bytes": 396667995, "checksum": "45973b91c2f1140f79265a24f484fc6d6653f43f83d5bd2d18954892dfa4dfae"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00277-of-01024.json.gz": {"num_bytes": 398134029, "checksum": "b7da91889b6695cf01bceddfc139b23f9465bda5cad54088b84a1f5a4d7a4f9a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00278-of-01024.json.gz": {"num_bytes": 397422615, "checksum": "e794a2903bda1f3c082e8f590383c714a518c202ecb99eda5513d6b320f70e86"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00279-of-01024.json.gz": {"num_bytes": 398776175, "checksum": "a5528d3e33151138ef9bdc2433744f1797de2b20673a570de5bd4d81b306354a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00280-of-01024.json.gz": {"num_bytes": 396208086, "checksum": "1be2d8c3d0eca510fac7b06a5401b2b8873bc6dfbf85a3c736301756f9681309"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00281-of-01024.json.gz": {"num_bytes": 396893734, "checksum": "1db3e9017561d38a91c417ffef875b7a948c4f64c51b90b0983c71bc9d950903"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00282-of-01024.json.gz": {"num_bytes": 397411883, "checksum": "4e23d39fcec2c310cbde3fdc5d9c185046086877ac03bbf9d772b092614f93da"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00283-of-01024.json.gz": {"num_bytes": 397906911, "checksum": "850eb5e60b84bca4d2f10b2e511fdb2661e3d08444a07db1782ad85c754fe808"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00284-of-01024.json.gz": {"num_bytes": 396043261, "checksum": "fea24050c6aec13eb706a6f3854b4debde62b1b842f2992fc027820c66218b0f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00285-of-01024.json.gz": {"num_bytes": 396961329, "checksum": "6052f82887cd2362320f72f6545d2e5b5a775e9bef95783c9b9995ecb7a5ecc4"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00286-of-01024.json.gz": {"num_bytes": 395697481, "checksum": "f4361838b5b679c8306447364166c1c3083af392b4c8793399c122af09c7312a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00287-of-01024.json.gz": {"num_bytes": 398773520, "checksum": "9add91f23f31ff8c5d8d84e6a0af75fc6fa08ceef8ccd9b633d8c49aa1d0104d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00288-of-01024.json.gz": {"num_bytes": 397684645, "checksum": "64dc94555a122353c3a3c9999e67d17b0e4b682096ba80be2258c791ce1c2b9d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00289-of-01024.json.gz": {"num_bytes": 396655864, "checksum": "2472c76b1cbcfc3cb82126795673126e8f532119a03722a304396ceee9b7db3a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00290-of-01024.json.gz": {"num_bytes": 397415313, "checksum": "960b71edbdc6a6a62a0d3cc1069bbbfb11893cc017aba543e10c9a23cb759d1b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00291-of-01024.json.gz": {"num_bytes": 395617977, "checksum": "96e582d7a750bee597331f373ec2e16d3a9686f48a49d39765d39550c8cbbad8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00292-of-01024.json.gz": {"num_bytes": 399332500, "checksum": "cd6ec4941aa5babbe274684945bf899447ec2459b8f7076ec8c74d2b3fe794c5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00293-of-01024.json.gz": {"num_bytes": 397021546, "checksum": "d0d0c4d80e75c5d02103b49027d9e2e6f7db74c12f8b53f600d7fe420b2d0a7a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00294-of-01024.json.gz": {"num_bytes": 396272726, "checksum": "caf5708a6989f867ec6c4c56f338aca9f3a43a1806a27ef473d9b0f219001cb4"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00295-of-01024.json.gz": {"num_bytes": 395233811, "checksum": "a7b5f904e34c0b370238e6beb19149d4bb96d0cce43a1eca3bfaf181952ede53"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00296-of-01024.json.gz": {"num_bytes": 396480926, "checksum": "4fcf284d98c2f7b63e47573e9d084eeec2516fbfa62be42c3ff94e1cf518e313"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00297-of-01024.json.gz": {"num_bytes": 398883718, "checksum": "c1cb458076497e7dee645f50281d1af2fe5dad556d28a2cbbd73abe6537c8a9d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00298-of-01024.json.gz": {"num_bytes": 398733629, "checksum": "4a612c715025292e62860fb0018e9fa2d3fade692342746d044be6297e25a034"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00299-of-01024.json.gz": {"num_bytes": 398155026, "checksum": "d33f4043fad9551f92084a45b7f54d920ded9d6fec271cbbf85f71b021f9ee4f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00300-of-01024.json.gz": {"num_bytes": 398612975, "checksum": "61b1181b796a2f40db3cb6954f2890397c3722c486dccd4075d74679cf61a70c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00301-of-01024.json.gz": {"num_bytes": 395385748, "checksum": "95a78e9d3cece0620430c85822fedf4021ebd88ece57d6714933c268d3b6af6c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00302-of-01024.json.gz": {"num_bytes": 397620059, "checksum": "321aed402a5e779febe9766294ad040a3f8dcf57bae68648c03d3c59023aafa3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00303-of-01024.json.gz": {"num_bytes": 396549027, "checksum": "4198f6a2b5bdaf90ac4251f013908123a5964429870ccd6b245a9069278c4e17"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00304-of-01024.json.gz": {"num_bytes": 396596460, "checksum": "74a6440e93d18d0d6d0622ab7d8832d7ccc91c03297faf20c8090d16f7c042d6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00305-of-01024.json.gz": {"num_bytes": 394881271, "checksum": "654deec494bba4eece19c27140426049574cf529c93ccb422fcc09fe4496af15"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00306-of-01024.json.gz": {"num_bytes": 397760377, "checksum": "e0840cbc94db6cfc35df66d413a11261756392dd59b0fdf89d9ff166ec76f3e5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00307-of-01024.json.gz": {"num_bytes": 396671816, "checksum": "31ceb8cfcd09fda621a9a483b09dfb43f5436e867363f6736ea3f710a6af10fa"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00308-of-01024.json.gz": {"num_bytes": 395961013, "checksum": "8c1e5acc3f964eaa5aff300731a74dde84ed0671cd764b121ea638fb08c3dd0b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00309-of-01024.json.gz": {"num_bytes": 396035179, "checksum": "7d555942b1bcb2518aa5ff9c0549d98fabe7bb563cdc6c73d3f11e6a0bc502b4"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00310-of-01024.json.gz": {"num_bytes": 397140669, "checksum": "859eeb7a9d2ed03d5299bbf7f1c3e719236477950d7601112a458ea5a2adf7c9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00311-of-01024.json.gz": {"num_bytes": 398170419, "checksum": "1e7661637b0a4445119ba403e4f8ede129c829fb7d1907ca7660870b536b8b29"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00312-of-01024.json.gz": {"num_bytes": 395605627, "checksum": "87a3ccd2ac9deff1ac4a5dd02bba269a48692d4598c5899630e8d2e4136dbb99"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00313-of-01024.json.gz": {"num_bytes": 397081206, "checksum": "c6952116cf573a6e20c849cf1b7d8d0edf3b9d00fc7e717e7bacde915c4c52a8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00314-of-01024.json.gz": {"num_bytes": 395555727, "checksum": "762066fd85c596ee01b3b8070708517cc5759bb1e3c4bb65f4645fd62b550d13"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00315-of-01024.json.gz": {"num_bytes": 397871218, "checksum": "814f19cc5e81144f5bfd7037f5f522dd5c44faf150c10337c675174a5965a5b9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00316-of-01024.json.gz": {"num_bytes": 398577523, "checksum": "27643c7c3c0a1a78c9003b936ea27785709a2df80d09817278a179eecaedc352"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00317-of-01024.json.gz": {"num_bytes": 396388623, "checksum": "5f840180e2017c41c6b1c865784788dc3b002478a9ecb43c3859174af788ba5b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00318-of-01024.json.gz": {"num_bytes": 396173471, "checksum": "2aeab99fbc84a2640a05081e2c7438451e75f76cbece3cbe5d82e85463a61966"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00319-of-01024.json.gz": {"num_bytes": 397912127, "checksum": "fda805ed19f4b996b048386f4bd73924dc965a069e85b8b4452a54a1372375fb"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00320-of-01024.json.gz": {"num_bytes": 398765416, "checksum": "bce244d024c076911c1c6dbd35609be5442c8b0440690e2cbb342ac64bdc494b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00321-of-01024.json.gz": {"num_bytes": 396005962, "checksum": "763584ee096223b8aeffb1576ec6e4f3bea674ec4de40fa163c2f2221b3701d9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00322-of-01024.json.gz": {"num_bytes": 398615672, "checksum": "5c12ec1d0c450fb7515c586f24311bad145050dfc64180d65bacbd346c2ce9c4"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00323-of-01024.json.gz": {"num_bytes": 397861187, "checksum": "93326f43273fb963593e0b1caab1e9588387291c23d5c14b5ae40b46b199998c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00324-of-01024.json.gz": {"num_bytes": 396679008, "checksum": "6ebfe6e28851e6d79cfdbf370602373fc2136e88936eece302ecaa8ef8251827"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00325-of-01024.json.gz": {"num_bytes": 396358086, "checksum": "51190fbfd48479842ec3c7d910b5519e01ff797ca0143c39be142c1650c5e893"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00326-of-01024.json.gz": {"num_bytes": 396490692, "checksum": "f4d9bbfd1bbc6e939fce9a2df26e45c79be73dbe2650fe79af395bdaa39cd121"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00327-of-01024.json.gz": {"num_bytes": 398354656, "checksum": "c70c824b6c16e5fad922ec9b8d363d97bed90501522b641b0eb0f66b8c086325"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00328-of-01024.json.gz": {"num_bytes": 397326336, "checksum": "7e6008433a0e5bc6eed28a13b9dba17246e7d65ca96c31092086c3546a3a397b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00329-of-01024.json.gz": {"num_bytes": 396390524, "checksum": "f379d844a35172424554bb82a65c790c354b76c0e7abfd868225d1968017d1a5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00330-of-01024.json.gz": {"num_bytes": 398259199, "checksum": "ea15be4a83c3de66c42410e13e5ef9c93baf86099a8eded1c1d10b0cd5ad0f29"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00331-of-01024.json.gz": {"num_bytes": 397618860, "checksum": "7b6aad6224ead9ee3a0c860cfd991301ef5e97093b23c76d713e73f4911d0e44"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00332-of-01024.json.gz": {"num_bytes": 396743573, "checksum": "bc5333d383020d2296aa0f6ec940ab586a367efe50d1c597f9db55ca72fa66e0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00333-of-01024.json.gz": {"num_bytes": 397460128, "checksum": "095b3a85a9598009638622ca21cb00142efa0d68196c8c3a8bb922cccb465e8c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00334-of-01024.json.gz": {"num_bytes": 396900262, "checksum": "6f005575f4843b84f4512e1b7c1b748edf497e4e9f55eaae47f9b4637161ccab"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00335-of-01024.json.gz": {"num_bytes": 396106895, "checksum": "66bfe399d0859f71c20db01de53ca7bf997b33afcd3d181f181d9f265a2c2fa2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00336-of-01024.json.gz": {"num_bytes": 397732616, "checksum": "1f1e0435de870b98b119e91edd4a0d32d078dbb810f919a70b85360cd860f0cc"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00337-of-01024.json.gz": {"num_bytes": 397834763, "checksum": "1db4bcdaa6fca612c3f1b38dad6d5402679ca21aa6a545850d61bcda10103697"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00338-of-01024.json.gz": {"num_bytes": 396712179, "checksum": "810c104a8862699c490fc8625a7be4115872fe2de4d8c061e095dc5a81eb4d19"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00339-of-01024.json.gz": {"num_bytes": 396838831, "checksum": "9bbc616d5c4aba46475957a22544dbdb0557f8de31cdf919718fbfe55bc70ac8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00340-of-01024.json.gz": {"num_bytes": 395587861, "checksum": "48c8411ee2b5fc8cffe1589ed204d0ac8a12b5b3bb1857373f84bae984d49e8b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00341-of-01024.json.gz": {"num_bytes": 398093153, "checksum": "4ff8ba83e489580da2401aaa23ca3329befe8fc08b6f299b612950c358688604"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00342-of-01024.json.gz": {"num_bytes": 397248009, "checksum": "c72e063f95d10ce661b4bc97538eccf6da6ad493b7e54da555a46e4a47aabbed"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00343-of-01024.json.gz": {"num_bytes": 395939409, "checksum": "249eb2080c55402aab34a31a442b06bcaa25d2df3f4319ea1a5f50dc6bb709b0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00344-of-01024.json.gz": {"num_bytes": 397608807, "checksum": "8cc57604fcc5fa920b0d16df6e8d8b7f4ca88c0c76c86f9ac81f42a615b330e7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00345-of-01024.json.gz": {"num_bytes": 395751274, "checksum": "13fbc76e49a8b856f7563b945bef10d786a86caff63b4cebea50416ca34932ad"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00346-of-01024.json.gz": {"num_bytes": 395516794, "checksum": "61d43da2e3e7770016ba7235eaa74a1e6a180e64cd2cfacefed5c34e8b72eca7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00347-of-01024.json.gz": {"num_bytes": 396180000, "checksum": "4a0ca2103de168d05d0090c8800d47f216cc167a9cfe9e736403aedf040c5e46"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00348-of-01024.json.gz": {"num_bytes": 398461180, "checksum": "a56396961496499ac289a85d126b916132e787d0dc4fbd9961aca7dbbc7cfcff"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00349-of-01024.json.gz": {"num_bytes": 398049366, "checksum": "ca012572c575f6a8e6ad6453296ff93f22118995c17928e76b655da44ce5810b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00350-of-01024.json.gz": {"num_bytes": 396532962, "checksum": "bb35d17862201063b46d8745dc182756d1bb09e809c4c355452ab1967e655491"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00351-of-01024.json.gz": {"num_bytes": 396576223, "checksum": "19ea45ab2fe5487d2a69cca7c9a1db7a09c8d5dfdf130412bbcd241cc60a61c5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00352-of-01024.json.gz": {"num_bytes": 395956381, "checksum": "bb5869b8649fffadd5f1945ca9a79588e84081a8fc45b7e4cb5507149b5be2d9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00353-of-01024.json.gz": {"num_bytes": 398903623, "checksum": "cb16a7ecadd28a8b5622c4e581f463f0ae2fe20a3e6582fa6885d76e7523715a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00354-of-01024.json.gz": {"num_bytes": 397316693, "checksum": "42aea18548695c458ddc229d8c837356845609aca3bb64ce6e07b185443b9468"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00355-of-01024.json.gz": {"num_bytes": 396240550, "checksum": "1577d76807548d83427293b9f534a3261fb72a345569f0491a1fd2691047bd92"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00356-of-01024.json.gz": {"num_bytes": 396132315, "checksum": "b6e17a39292e082e517082b23b381305ebe889c2530fb5eb74a2683d36d07a86"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00357-of-01024.json.gz": {"num_bytes": 395948117, "checksum": "524ebed10c881f52f155db5d6690806f5a97aa8f811deadae916323b50427ed5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00358-of-01024.json.gz": {"num_bytes": 397397242, "checksum": "8e23d852bc3a0dda4684d5fd511003ad6f18232e5f54e32638c8db62e9d18c6b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00359-of-01024.json.gz": {"num_bytes": 396141321, "checksum": "345c34dafbc59f5e93355c8b2e6fcde6bf59bc9e1ebbf5cb962d54228e6d3204"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00360-of-01024.json.gz": {"num_bytes": 397258644, "checksum": "51db06055d95e2b43fddebf8c2b7d76b7572745f129d89fe005f8e5d3f12b758"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00361-of-01024.json.gz": {"num_bytes": 397913411, "checksum": "2c0f6054fef084d3e7cd10e2de0b1d3a48dc716af1e9146548195df128bdaba9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00362-of-01024.json.gz": {"num_bytes": 397722576, "checksum": "664b390b20498eb6e78fc09604b3a947fc1847a01e3eaae4c7861d1dde3b90fb"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00363-of-01024.json.gz": {"num_bytes": 395416894, "checksum": "c57529884c6d4977a279a097c0dfbcc31d52048cdcf64950182c743583d7989a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00364-of-01024.json.gz": {"num_bytes": 397028679, "checksum": "ed4f252d63c679f6e3f35847e0871c3360e072b0d6963f662d7e808b6615457f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00365-of-01024.json.gz": {"num_bytes": 397574891, "checksum": "68e8e44a531d98897245fee90ad349f4fdee891b2f68dfda78a1dedcc9474326"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00366-of-01024.json.gz": {"num_bytes": 396905692, "checksum": "9e88b888d85633671e009ed7093763b934a42054ed6a1252222dc64781a20e22"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00367-of-01024.json.gz": {"num_bytes": 396802011, "checksum": "2abaf3f3946788258b8543fa2ccccc0c20e6980b9d26a38decd356e67f575fa1"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00368-of-01024.json.gz": {"num_bytes": 395630737, "checksum": "b4960e3395d8a1bf8350f57e5f6280b00443a4c6b85e6fd47478fbbfc1733caf"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00369-of-01024.json.gz": {"num_bytes": 396228047, "checksum": "08e8210426e6c6ef9746675592a3eea4a92eff9aa4bb7ffc6bf6ba54bc411f72"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00370-of-01024.json.gz": {"num_bytes": 396548482, "checksum": "10e0305ac4d1e410d749637e0c03386d969563f8eb73bbbc376fc1d21025e4ee"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00371-of-01024.json.gz": {"num_bytes": 397344482, "checksum": "03df0f4aa5c377f6b45db3c3b863240bfb1211ddb226bc055433fbcd9ee8e873"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00372-of-01024.json.gz": {"num_bytes": 395872223, "checksum": "9b70549213cb01595179928cdb020daaf7bcd2085c5e947d111f3cc66e406d2c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00373-of-01024.json.gz": {"num_bytes": 397399096, "checksum": "945c204cdb107669a8d1252a91323eb300c902bdd6c6a8167a90805ec02cba9b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00374-of-01024.json.gz": {"num_bytes": 397755002, "checksum": "8353d4383f73caceb5d112f260b37d1349dc7898af2d05b98ffe17d22aea97ca"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00375-of-01024.json.gz": {"num_bytes": 396534763, "checksum": "a3de41388a6d8ce3b605c6586e47b74a565dd2f54175551987bda0a0ff95036f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00376-of-01024.json.gz": {"num_bytes": 395594630, "checksum": "7cadf813f2b31a1bfe44fdfc84aef4eb65e889c2616c56b189890734c22b731f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00377-of-01024.json.gz": {"num_bytes": 398241040, "checksum": "15df154b52cb4d9314dbc4ac26ca4b4df7125b12131d538fd480f8a6b3fbdfc8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00378-of-01024.json.gz": {"num_bytes": 397217224, "checksum": "208ce680427f62d78dad857bee91122a79f968589b4e44f2f89919e91f4dea30"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00379-of-01024.json.gz": {"num_bytes": 398504097, "checksum": "0052fe7f27e720423b6143f401b8618428d913b22fc2af2950874785e2ef7528"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00380-of-01024.json.gz": {"num_bytes": 397494149, "checksum": "15c4f07a2629c7bd79b243c97367e3e18de02b5ab09eccc0f85b1eba0e0b071a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00381-of-01024.json.gz": {"num_bytes": 397190859, "checksum": "77c71b4a79ac2f462040ea0e8408fdb8f719fac0f09fadb760ed00b709e9dea5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00382-of-01024.json.gz": {"num_bytes": 398126420, "checksum": "aa44d029398c33f733065c489ab3ded9395f6e53263407173b6e9c27b6fb9c45"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00383-of-01024.json.gz": {"num_bytes": 399108296, "checksum": "f507161fbe96f8abe9dedccba2458448719e6b153bcc1256ecee6b4b9c82256e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00384-of-01024.json.gz": {"num_bytes": 396156787, "checksum": "83c236bbc8508fb81992c837751a4d8ad4b9bc138dd1f4bb5c1fcc68203e12da"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00385-of-01024.json.gz": {"num_bytes": 396878483, "checksum": "df45b4749951a46695f88789fc536617ee3470083e55562292f606e09185e4a6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00386-of-01024.json.gz": {"num_bytes": 397495799, "checksum": "a8240c9e7266e47bda8880e38ac8a5afa8541aed4b989d6642b31497716a51ac"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00387-of-01024.json.gz": {"num_bytes": 397062301, "checksum": "e6fd54ea6f17d5570fa4cc97554813a7a33bd4e44cbc456b27b0c87c1af22c60"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00388-of-01024.json.gz": {"num_bytes": 397074091, "checksum": "fdc2a134df4a669deb839f26947c86b7e7a4bc7596a6a1c25562cb97fbb6b089"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00389-of-01024.json.gz": {"num_bytes": 397056868, "checksum": "e7390f0007582a3460fa67375b2628c85a1aa85954796d8e6584fadcb35761cc"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00390-of-01024.json.gz": {"num_bytes": 396404332, "checksum": "820a97060abd3172852f38e1636706c8389adad8495de56f4c3a2c3ba6008235"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00391-of-01024.json.gz": {"num_bytes": 397125489, "checksum": "68732c5ab9f4b6945e79ce2a1b45b97a97822d6a107aa79aa9135f29d91173ab"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00392-of-01024.json.gz": {"num_bytes": 394992472, "checksum": "c9d1e8cfd481631a76544e5880ceee9990e7553c88c5978a91b48ec8aa47717d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00393-of-01024.json.gz": {"num_bytes": 394778146, "checksum": "7a5ec4f0878f676a3ac2c417f512186066d793f28d611f97135c3626b3b60fdd"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00394-of-01024.json.gz": {"num_bytes": 397024190, "checksum": "44e32db5a39684ab1789cfe97b6e9cbd3c539390e7a4c8ec9298e7177945452b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00395-of-01024.json.gz": {"num_bytes": 396537190, "checksum": "601ec281240753ac5793ec7cb83802a788c4d88e56dfd83e6c875cf2ef9bd8f1"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00396-of-01024.json.gz": {"num_bytes": 398049705, "checksum": "b1024b69e191b2c7073f5f4f3ea51e8710be54db8603ce8aaabbfb919ea6694d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00397-of-01024.json.gz": {"num_bytes": 396670567, "checksum": "11357bc600f9b0c443f124c7fa4046d10cf03e19016e5ba8cdde884d2ff76c9b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00398-of-01024.json.gz": {"num_bytes": 394706629, "checksum": "778eca6d845b9a7d49e22941b959a95e5e4d2d9714720f27b810230d136acfde"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00399-of-01024.json.gz": {"num_bytes": 398257272, "checksum": "27c2a30af83975d32469e85fb2e27953a3aa9f97514f621063325cb9af1829fa"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00400-of-01024.json.gz": {"num_bytes": 398732278, "checksum": "aff9a39748526a03d3476288cdbce122c3683baf113362e9085895609d03c3c8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00401-of-01024.json.gz": {"num_bytes": 396372632, "checksum": "a6af262bb962eb1c45d2003ee1bb2be1a3a12cb3e53d4ffe58b4b68dd852957f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00402-of-01024.json.gz": {"num_bytes": 396783625, "checksum": "db9aca12012da21fc5a0619a47e9c3075959786d6d6d74f6a244af1cb33c402d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00403-of-01024.json.gz": {"num_bytes": 396950960, "checksum": "b3566f7b9251f6aea9343d1344151f10fc104464f92e8f10a97742defffc2244"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00404-of-01024.json.gz": {"num_bytes": 398481154, "checksum": "897904040b5887620b9996cf89656f5bff329a430a8c3dfd6802d0c879675376"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00405-of-01024.json.gz": {"num_bytes": 396065216, "checksum": "45e0108549ab06d9a8ad5c45dc53250798d0e58f7e940080a754106801250009"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00406-of-01024.json.gz": {"num_bytes": 395637879, "checksum": "bda70f3a19b19e2ffdd1c3a26b959945b447acd450cab49e72ce727d2218af5f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00407-of-01024.json.gz": {"num_bytes": 398356109, "checksum": "1df9e8b4715d9a3f02a0b06aef6095f81d38acd1be0b4fa402acaac0258c3116"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00408-of-01024.json.gz": {"num_bytes": 396041456, "checksum": "e89ebf354280543204e78f4308a8f8751cc26094524628cd8e9cb691d9911b82"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00409-of-01024.json.gz": {"num_bytes": 396254329, "checksum": "15729474174d6a5adb5935f25afa6de2f03a8dd2f73b780e23795ede92f5762d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00410-of-01024.json.gz": {"num_bytes": 397850848, "checksum": "98f1b8fc845e0005b76d7eac70a430ce98e6989569344ea92266f8391b1396fe"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00411-of-01024.json.gz": {"num_bytes": 395527322, "checksum": "52b2e31f2adb61c8e703c6758016cbfc650f8104dcd5f78867c81434be155ea6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00412-of-01024.json.gz": {"num_bytes": 396155992, "checksum": "7b6b4192f9bec4fdeaf9d6dcabd9cbba6b4c8ebb42d26730fea21bad139823c0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00413-of-01024.json.gz": {"num_bytes": 395766377, "checksum": "775d1fac6b1708ba0384d922640b2f372b3ee146fc79fbe692ff69a7c6c699b1"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00414-of-01024.json.gz": {"num_bytes": 394860848, "checksum": "0386d8a8e0cc9d5d613b1f84085791de57ad05751d94d25681d86dff5cec1afb"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00415-of-01024.json.gz": {"num_bytes": 397566065, "checksum": "1957b0d185943b1952dc66e78f0a7d449f49f8f55fc0978bf77e8dde10f4714d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00416-of-01024.json.gz": {"num_bytes": 396297306, "checksum": "3f8796934edb79d172e682511a5ed7666aa09ff541ce55e2c66406bdb6eeda9d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00417-of-01024.json.gz": {"num_bytes": 398314475, "checksum": "8da08075b966c04aa7859275eefd34c78cd2b9edc366684733d027ad6d619ba7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00418-of-01024.json.gz": {"num_bytes": 396296110, "checksum": "efe43733ebfc7b65c646aee68b883cf40124c1446a28e70ff2bfa9e1bb1377cc"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00419-of-01024.json.gz": {"num_bytes": 397614415, "checksum": "c0f02d78715de9c3ea0c684dad36a506386081fed2011ec298ca0ee623c7792e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00420-of-01024.json.gz": {"num_bytes": 395133656, "checksum": "6237f5797a35dcdd89a0b70cac4dedcfb3fe418560f8dbbf6cad685f11c870b2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00421-of-01024.json.gz": {"num_bytes": 397061849, "checksum": "ee37899a6a49269026633ec79577491ff4b11e219e0236dcba68eb168279067b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00422-of-01024.json.gz": {"num_bytes": 396539584, "checksum": "e5914a4b97c27da82eaee2f4f67a165de946bb38a00d6126b1527f5eb1200417"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00423-of-01024.json.gz": {"num_bytes": 397715346, "checksum": "b99e628f8790a7baa8ee7828e31f2ec72374f9a8390c1d64c9b8092b10d9c7fe"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00424-of-01024.json.gz": {"num_bytes": 396335469, "checksum": "9cb3b9eb00760bb68f3df4b66b96f1e5798c338231500472fd64c49cd87c6599"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00425-of-01024.json.gz": {"num_bytes": 396714466, "checksum": "f28d4901ccde8eb7afcede9732ab94fd18c49e0e3731659ef587058d6ea2ab28"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00426-of-01024.json.gz": {"num_bytes": 395566563, "checksum": "9ab75a89a425ce974fd36e936476a30db913c2d7c9ca6e5522b91ffbcbbe30cf"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00427-of-01024.json.gz": {"num_bytes": 395379035, "checksum": "5e1ca658bea5ba5506afbb9ae5a5da4d35cdc3a215478c68e11652a7d5d918f5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00428-of-01024.json.gz": {"num_bytes": 396419259, "checksum": "d740b37b576bcde0e1c8eee27c3bfb3b58c1a0d3c5b471001804b2a37f277ac9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00429-of-01024.json.gz": {"num_bytes": 397116774, "checksum": "d1c10b0ba72aa2d4cb4640d1263c32868190942b1e93b4bb4e9798e25f10ba67"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00430-of-01024.json.gz": {"num_bytes": 396634586, "checksum": "11dec038b4c1c35d32d000915812b6ec8da9abbbec2e15f7493551198b6a1ef3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00431-of-01024.json.gz": {"num_bytes": 396704705, "checksum": "efdfdef444cf68fc05090107033ffe2ac906b6efe2fc138e90f47cd4bd0b6204"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00432-of-01024.json.gz": {"num_bytes": 396264701, "checksum": "fa649c2e2dbc992408c3a60327e5d5ace4697c84010446bb286e544eb6c604be"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00433-of-01024.json.gz": {"num_bytes": 396887722, "checksum": "3d5fd3fbf209dfff2057143a3dcf7eceeccb1e85967a9a85a992f465e3522335"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00434-of-01024.json.gz": {"num_bytes": 398856291, "checksum": "ab6dc5343b052da901f4671c1cb3173850fbc6bbfac2623ca14936b2b83d9667"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00435-of-01024.json.gz": {"num_bytes": 395888569, "checksum": "26abd1e2263af02f998705501bd02ead2edc3d7f68fadc7b198e7fcf4dffc454"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00436-of-01024.json.gz": {"num_bytes": 396976077, "checksum": "a5dadf6ec93e8dcd62b0e1de3cb03c866147bafe0da8e631341663ccc03bb801"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00437-of-01024.json.gz": {"num_bytes": 395809168, "checksum": "7f98e98270f9b88570b5e498511ee65d07428db604af349ef9107dbcf65ac4e5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00438-of-01024.json.gz": {"num_bytes": 399136723, "checksum": "0e03ec507b90b38d5b6d7dfe27d40e127efdc9a0bae349bea2e743375ea29b9d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00439-of-01024.json.gz": {"num_bytes": 396435416, "checksum": "5f868ba66ea32a23be4a926fda0a86d0d2ab4948326e1ebac615fa16a2a6864d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00440-of-01024.json.gz": {"num_bytes": 397487165, "checksum": "d30005787e7472313982cf2860e0a0764900b82a7bf616da27e6c1c3298eb215"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00441-of-01024.json.gz": {"num_bytes": 395968030, "checksum": "181461b447d88040130c3348ae7d22f220e0f97ace030d6f54301a9a3d483fc7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00442-of-01024.json.gz": {"num_bytes": 396909150, "checksum": "0854cd3454047e0c6a0746ef21e0cbbb22fbdf4349c2e668f4fa1e49add183c1"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00443-of-01024.json.gz": {"num_bytes": 396271897, "checksum": "2493db29dd3cadef3719576c34213496eff807df5ae8cf538f13e84d403fec77"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00444-of-01024.json.gz": {"num_bytes": 395540084, "checksum": "5e717d9e0c1b6f728df0f206e422a0958a537dddf31fffa4d699e5bf4b3c2b16"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00445-of-01024.json.gz": {"num_bytes": 398750991, "checksum": "b8af9d413da48fb5f9a9174b12ad253b2eb2c1ed7709cab710d66710841568e3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00446-of-01024.json.gz": {"num_bytes": 397575547, "checksum": "2bad5a914cb9f2e5e99d76afbf85eef66c18e7c1cf2e11c5d455792ae86ab441"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00447-of-01024.json.gz": {"num_bytes": 398035036, "checksum": "d834925674a33ed5eb8fcb335fd81b95e4ab882010e434e3fb9323e0f23be2bc"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00448-of-01024.json.gz": {"num_bytes": 398658613, "checksum": "16f3ac40180e47b9b97998f5d1d7c0e9336e2fee5612a3397fd161937f7a2b07"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00449-of-01024.json.gz": {"num_bytes": 397934476, "checksum": "09dd3d5a529f62b10d1ec97f37ed142315190fb437be3f50987ee955b11f7672"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00450-of-01024.json.gz": {"num_bytes": 396444119, "checksum": "8a25c11e0adc5fdf50944767fbfbf01a9c35b3c0e07205c7c06288d1f68b4c10"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00451-of-01024.json.gz": {"num_bytes": 395963541, "checksum": "f3ac2e295ca4b3ca1f55c8b500ea2588f1519163cec381297ad4bef390fbbe1c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00452-of-01024.json.gz": {"num_bytes": 396594911, "checksum": "25a57709e934077c2972f0f8a1a9db7afe9b7558ab023bd6ee5224b2f8cd770a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00453-of-01024.json.gz": {"num_bytes": 396745507, "checksum": "75c1a4803bb58efe5df885bccd13596d46dd1f3ea30899a7e83812167b990bde"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00454-of-01024.json.gz": {"num_bytes": 396193342, "checksum": "c151679573ea5f5b52e26e8b50da7e14760d1ec15c63a5b864b648190efd48f4"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00455-of-01024.json.gz": {"num_bytes": 398096160, "checksum": "7f86270b13ee4133adaa06de809f26ef581229407813fca05db521d9d36880dd"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00456-of-01024.json.gz": {"num_bytes": 398965570, "checksum": "d5b292189c5d318e0ad622eec1e764993084d0477147f51f29acd637935fec5c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00457-of-01024.json.gz": {"num_bytes": 396672892, "checksum": "8b490f615b3ed701390ed671d5645dec4aa3fc576a032da8f9d434087c1eb8c0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00458-of-01024.json.gz": {"num_bytes": 396911580, "checksum": "8bcadc16baaa4e36fe17ffc0862c264230385e18bbd861671ad5fd8cbb86404d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00459-of-01024.json.gz": {"num_bytes": 395969213, "checksum": "b8ff8371a01d7bd1782044058ee0f53d4d1275ebca0870ba16104c1c4b12f07c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00460-of-01024.json.gz": {"num_bytes": 396928338, "checksum": "23dde1fe55277467d6d2385684b71e90e9066e6a3c349a1da30a1487e87c8539"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00461-of-01024.json.gz": {"num_bytes": 400009637, "checksum": "34b98d46d207c5b6ea7416fab6f3cfcb1444cdc19376464ae9abb9296fd14c3b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00462-of-01024.json.gz": {"num_bytes": 398107677, "checksum": "2031735c0f38ce43e37a5bb1b9728fc37c758fc4af71758c3d3b9535716a3253"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00463-of-01024.json.gz": {"num_bytes": 395503017, "checksum": "7820184904183fad9a61b6c638df9de11d4624bb3aca08885b842255172cecee"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00464-of-01024.json.gz": {"num_bytes": 397493281, "checksum": "b39b1b1e6686014a3c62e74912ec3b915dfc161b62e2d1108410354e6dec760a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00465-of-01024.json.gz": {"num_bytes": 397080149, "checksum": "a65cc7f590cc498da334d5a8653e818421e09e5e6ce2e8bc2a29ac67a02c3d43"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00466-of-01024.json.gz": {"num_bytes": 396633690, "checksum": "15d891873ba02923893cbc8c42adc0468bb39161f898a810037cc2e9f82e0796"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00467-of-01024.json.gz": {"num_bytes": 395045117, "checksum": "711686ff5478ec35ccaaf1549b7a33b941e322585f702257dfe2d31630245ba9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00468-of-01024.json.gz": {"num_bytes": 399486439, "checksum": "59c4599c8610f4c54778daedbb358f5e26fa527f8f94c3364b70565ebc90571e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00469-of-01024.json.gz": {"num_bytes": 396170105, "checksum": "4263dbb03135c2d8b16fb323208f98fe1a1ff1223e76a7ba085f881411a0ab95"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00470-of-01024.json.gz": {"num_bytes": 397479432, "checksum": "2db90de8f4d2bde9af453478ed4667166f636af701bb487095311f99b28e59bd"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00471-of-01024.json.gz": {"num_bytes": 396679096, "checksum": "caea3c4744adb89f006d9b0d9ef93241a55c1fc165cb0cd62b6d07fa3a40cdc0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00472-of-01024.json.gz": {"num_bytes": 397080237, "checksum": "34995676d953f4c95f8bd4f54fba8f92b86189cd73298ab77ee2702611b86e5e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00473-of-01024.json.gz": {"num_bytes": 397881706, "checksum": "c0fc6c68ae509d8273e7ca0efbe24f1452a57dcb000f44f550fe9600fd305e62"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00474-of-01024.json.gz": {"num_bytes": 397705270, "checksum": "50aeb620f8c03a2e4f2346a0c79a4509adfae084ffbeff0b86d8892b858a821d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00475-of-01024.json.gz": {"num_bytes": 397201717, "checksum": "4fa508d23abd417bdb0b0e7a61f9aedfb770609214cd85b10b4bde7ced7f12b4"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00476-of-01024.json.gz": {"num_bytes": 397522775, "checksum": "27da6164865687041e4f53d9ecec2edc877b147da5b424acbac2c69480132a08"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00477-of-01024.json.gz": {"num_bytes": 397323156, "checksum": "e40115fc4901a3930494652ce9ee7abb0c3f41abc6d6c58c81fa75a0ee752db8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00478-of-01024.json.gz": {"num_bytes": 397380721, "checksum": "79a16b7016aed0eec375ca383eb316765687f12421f786b2e133faa5690ef197"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00479-of-01024.json.gz": {"num_bytes": 396828680, "checksum": "08185ce3c3e5b01552be7d8f08ed5b27a6b1b121bb2d7d70a78b7074fee02fa3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00480-of-01024.json.gz": {"num_bytes": 398678311, "checksum": "37a5804dafb2f4aff9e393af5b127c3577ab8a5dd23f1e41f2304b25a4c428a6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00481-of-01024.json.gz": {"num_bytes": 397654112, "checksum": "47ce12535b753d8936ce3b569675e76cb6f638bfb74a93caf201f3ffc409d71a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00482-of-01024.json.gz": {"num_bytes": 396387301, "checksum": "1d07828a199bb1e1c0c8342ba99e484093557188370d1ced90803c2615d24b7b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00483-of-01024.json.gz": {"num_bytes": 397178863, "checksum": "b6499612fac654798010e11c27ee8a25fc05d1dbed8aaf2338fd0ea377dc4732"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00484-of-01024.json.gz": {"num_bytes": 395826769, "checksum": "ce197ad5a226249bbba53c34b9f3c83508b542853748c3094a5b98befb537f2d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00485-of-01024.json.gz": {"num_bytes": 397100006, "checksum": "f483044a4a0418b695e0b989f0fd03bfa79df01b649991f2356443bcb29d0820"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00486-of-01024.json.gz": {"num_bytes": 397658615, "checksum": "297beef7b85dc128a6a58d834c5fd1b24bd7fe84c7a317500461720c742235f1"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00487-of-01024.json.gz": {"num_bytes": 396904673, "checksum": "06751938694fad1645ed575208e8e2c1efebb7165b4feb2d0ea871dc348741f8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00488-of-01024.json.gz": {"num_bytes": 398019631, "checksum": "eb58bf8b011fedf15835841317e445e9e757c9939b4453a013233f020f98a697"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00489-of-01024.json.gz": {"num_bytes": 395822836, "checksum": "b339e33e7affbdaf691852d3668ff79adf8476a3c33eb86ad9f4ad4a6ebbf3dc"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00490-of-01024.json.gz": {"num_bytes": 398410737, "checksum": "4d8356cf804474538772c5520e77e75ac750dce3e6b103c9feab49ccd46a58ff"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00491-of-01024.json.gz": {"num_bytes": 396607853, "checksum": "1757097fb884d03aa288a05870016b1c2b9f1700ac5913d85c9821cf2e367702"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00492-of-01024.json.gz": {"num_bytes": 397612443, "checksum": "92e98e431a378e0402d81299c49209c66d39b0ba7ae63711f8d6ecf542f5fdf7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00493-of-01024.json.gz": {"num_bytes": 395595466, "checksum": "d839e1763aa6ebc7cbcf1b870d947ba45b0b4ac95b0adbe4941a0b121690a311"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00494-of-01024.json.gz": {"num_bytes": 400397068, "checksum": "31caeb5f0ef694c06ce434df44c01f4a91fcd48e4acb4f1bf167eae6e59a02de"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00495-of-01024.json.gz": {"num_bytes": 396458630, "checksum": "26291dfcae5145cdc306317ecf95851a3f693b4a7c6e132e55384ec69d85ef3c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00496-of-01024.json.gz": {"num_bytes": 395037560, "checksum": "b32344b92f81006ad9e2e471f5ef8133e87924c5150145b13d51c3d7a0f68c46"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00497-of-01024.json.gz": {"num_bytes": 396247929, "checksum": "0396f0bb16b06ff130e955f260233ec868ada1daef6e8cbd480ce388628d49b9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00498-of-01024.json.gz": {"num_bytes": 394798084, "checksum": "28d43d4e7bbce4e20167741ea2bbc3f17981aa51f9c040cfc41c522e732c6d32"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00499-of-01024.json.gz": {"num_bytes": 396699883, "checksum": "c6f6deff919b375fb08c74e159c25aa66362e4cddb0700f9b1e0e2701293ae70"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00500-of-01024.json.gz": {"num_bytes": 397014521, "checksum": "7ee22957fdfad0880f132f47860612331afce7a48975b9312233ba8ddf537bed"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00501-of-01024.json.gz": {"num_bytes": 399063718, "checksum": "ec94186b620037002819cd40347e6aaf67cb847848483790cd687222c9addbbf"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00502-of-01024.json.gz": {"num_bytes": 396938850, "checksum": "a218de10cee75c4bb5a7102fbe208e6e65142ba5f960ecdc2b56b6f85fa30840"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00503-of-01024.json.gz": {"num_bytes": 394631309, "checksum": "8189de9454986f63253fa1ad44c63d5c2f692ff4bc3a848c7c2fd02e08f4e1b9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00504-of-01024.json.gz": {"num_bytes": 397884411, "checksum": "b7b268545c27573840bf8a6abb7361c209f92f9b5f0f8028fffd49b0c773854b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00505-of-01024.json.gz": {"num_bytes": 395784113, "checksum": "b9f1610be9f045c15e43a7343bd2918743a71585a7122a4e781533dd39a73132"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00506-of-01024.json.gz": {"num_bytes": 397939195, "checksum": "f07b77d1be71c5922321e8683140f9a63a90903f1fbd1515d908807e12fc4597"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00507-of-01024.json.gz": {"num_bytes": 395925741, "checksum": "23e9927e9e83fd03e9d99c3fac05f1bf63d6c296a2b02d1aa208798d27d8dc1c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00508-of-01024.json.gz": {"num_bytes": 397426015, "checksum": "f4b8a74c610cea50a6b144337f65fcfed11fff21df6683503f25d4b82e29a4e4"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00509-of-01024.json.gz": {"num_bytes": 399072341, "checksum": "c3069ae9658273cbaeaed1730f171837c8d3042e31d1093cf0f519f601309a41"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00510-of-01024.json.gz": {"num_bytes": 395859781, "checksum": "e5863648f64423397ca1a7838df18aeddbb3d5d3a2551321fd99a480508fa86f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00511-of-01024.json.gz": {"num_bytes": 396948832, "checksum": "a2209ec05a794f083cf163c102c6ddd8d5e5627674686950e17e586128a81e60"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00512-of-01024.json.gz": {"num_bytes": 396585426, "checksum": "1c6fdb002dab490e6ddd7fe6023b2124bb944b7ebe95ee3b7faca9a92f4b5de3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00513-of-01024.json.gz": {"num_bytes": 396789970, "checksum": "83b02c0cf9ffea9d021adc102269c30a33ab3a803d331ba8d39aaa9b3b7acb43"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00514-of-01024.json.gz": {"num_bytes": 397131474, "checksum": "783f25460641cd3532c3bb3920c7d3f0c68b5e674d44cba33b1ed755608cf8ba"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00515-of-01024.json.gz": {"num_bytes": 396127068, "checksum": "61e5b9947f77d929442f23fe84465d88044631aa1eb6438a0b86372cba7286fa"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00516-of-01024.json.gz": {"num_bytes": 397526020, "checksum": "539b032f528d1ec3a8e8420514ef2118f05482297b052f6d28876a8bf776a080"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00517-of-01024.json.gz": {"num_bytes": 397748661, "checksum": "03b85a51aa7bcde672cc017fcbb0f11976cbd1447fc0ccb4f4bc822b2b04b27b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00518-of-01024.json.gz": {"num_bytes": 397915751, "checksum": "80dec6dc7d15459c113c16f23978c38cdc1157ca18468d8a00e0d2192bb2ffd9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00519-of-01024.json.gz": {"num_bytes": 397847480, "checksum": "7125e7915fd03c6312cfe448e4e7a8629249765c13d8558b17c240c2aef713b4"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00520-of-01024.json.gz": {"num_bytes": 396232144, "checksum": "27974f9766c18fd0b652c94eafa3493243c8e1b25b6e850e857ab6246b193b48"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00521-of-01024.json.gz": {"num_bytes": 395111538, "checksum": "61406e92a8f9a6ab800b3dd25cbac842e3487a4c7db7b1bb2070a41d627367a0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00522-of-01024.json.gz": {"num_bytes": 397690206, "checksum": "b2e29801d120132a5fbbd3662a54290e46ff5e178b3146ebfc2169facf72e7e4"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00523-of-01024.json.gz": {"num_bytes": 398274007, "checksum": "79905dbc45756c9f1c225120709d39cbf3caf435e322a531a4add690a1d0440c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00524-of-01024.json.gz": {"num_bytes": 395689218, "checksum": "1dc3086cb869abb13862970186f6a77cb29b687cd49518173f639c148d937f6b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00525-of-01024.json.gz": {"num_bytes": 397979085, "checksum": "6958bbc6029c00229fb0059d016a6b7a2bd21cfdc69392893423d2657c35c7c5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00526-of-01024.json.gz": {"num_bytes": 398473877, "checksum": "895f42c4e7569f0db3832af13e56499f65fff74e93fc0cdf60c1c4b4b08881c9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00527-of-01024.json.gz": {"num_bytes": 395879939, "checksum": "e84e72048b56878b1ff904ee83d92c208e15b16663b99a9d763edc23c2e0e55f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00528-of-01024.json.gz": {"num_bytes": 396472889, "checksum": "badcc3cda339c61936591e9333787ea032c42d7ff2288fdaff791bdc8504ce96"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00529-of-01024.json.gz": {"num_bytes": 396983038, "checksum": "ad20643f9d50c7c508fa136ceed0039ce39708e0e7a5e743c1981f1000bc3c4e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00530-of-01024.json.gz": {"num_bytes": 395774249, "checksum": "9453fa3fd296150b436f0146171ea8317512c6735ee9434622a83765a5d9e310"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00531-of-01024.json.gz": {"num_bytes": 396171120, "checksum": "3e3c230ab6beda13e4dd4747c7c6291e57b1ccb4a96ac2edb46ffdb4c3cb05b5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00532-of-01024.json.gz": {"num_bytes": 396200411, "checksum": "e9b52c3dad233fd1c4310cf5f76c2e6d0788ed084abcf931f99ab7002976d75b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00533-of-01024.json.gz": {"num_bytes": 395580851, "checksum": "e135cc4420d9f4d17ab523f7db8c559021a46a9a6bcdd21a6c4075047465906e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00534-of-01024.json.gz": {"num_bytes": 397459281, "checksum": "bb4f32ee1c1bedf4582b0f4f9ec7644be73fa25bf18cca7506e3c26e98818bad"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00535-of-01024.json.gz": {"num_bytes": 397344480, "checksum": "3766ddf8313c5cee08a575fa96bdde06a5b293f1964e58293ea583d72bd18e20"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00536-of-01024.json.gz": {"num_bytes": 396588089, "checksum": "56d236a4250f9488d80b93c0c005962d018da256ea5632c7e16ae26c54188749"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00537-of-01024.json.gz": {"num_bytes": 397606873, "checksum": "d7ec24ef99de2769937b89e0ca7e291eca2bd0438d501d9228d5ab035f49d83e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00538-of-01024.json.gz": {"num_bytes": 397608864, "checksum": "1a60378a0f1a200b11f85577bbd0f373ae47022eab16fad53da492ca1ed35bfd"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00539-of-01024.json.gz": {"num_bytes": 398377669, "checksum": "787d263107eb09e852b015c17d1d0f54d8b93e78292c0c1e60cf99f27535c608"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00540-of-01024.json.gz": {"num_bytes": 398516980, "checksum": "dce03ef0813ef66e27df8730da7e341b49bf7e684bffd3a9cf700905501d1d72"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00541-of-01024.json.gz": {"num_bytes": 395557685, "checksum": "e4035222d65124bd3e33372b76b65c2dad9e696701607ceeb5968d483595645c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00542-of-01024.json.gz": {"num_bytes": 395725875, "checksum": "4e7ae0b1c0c4d514e0208e21336d095fea5970475077d6690a917faadb2b72b4"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00543-of-01024.json.gz": {"num_bytes": 397625187, "checksum": "a96ac467b6ace74a08f7dbc4bb8e3fc57fae36abc8975d6b60a7b7353ca9ca88"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00544-of-01024.json.gz": {"num_bytes": 397078230, "checksum": "337470c84cde5d02bc6a89003a6796de9e63db269e7800637ef2d220d75bd3ae"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00545-of-01024.json.gz": {"num_bytes": 396145060, "checksum": "da65d66aa4cfff77c754f8017eedd92cb82494b9425c2d5c5491d64603b2231e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00546-of-01024.json.gz": {"num_bytes": 396093007, "checksum": "399f7b70d1c1b45ce315f396d5fa0db2c69e41c522b0514e19bcc6802b953b1f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00547-of-01024.json.gz": {"num_bytes": 397457696, "checksum": "47fc8fd82271e6b1fb074512da45dc005e22cb7f0aca3b7b621ea87613aeff9b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00548-of-01024.json.gz": {"num_bytes": 396246097, "checksum": "3108770b39746852d7c048d9a8777722480505bbf4592732c7d1f231e2505c55"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00549-of-01024.json.gz": {"num_bytes": 393096516, "checksum": "9bb2b88775593afe4060349985ff4417a37f1ba9b4ef33399c58644c01a92b89"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00550-of-01024.json.gz": {"num_bytes": 396631619, "checksum": "cbb55d645d145ecc2ff9b96524463f82d5548c0bdf42381fc6faaad256e7ead7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00551-of-01024.json.gz": {"num_bytes": 396806780, "checksum": "ece03d7f12daa39473b6b8d5faed08a3f751efb9b1ee99f69c5188633d4a0f43"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00552-of-01024.json.gz": {"num_bytes": 398608968, "checksum": "7fbbde9c39d67d8d7f9f16c0848188b743c6ff5bc44e6339d5fd88c32e1aafef"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00553-of-01024.json.gz": {"num_bytes": 397696672, "checksum": "85f9c5c5fbcfd06f715b520a1a3a63a014b1831d2f65de5f02cfea49a18ddf63"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00554-of-01024.json.gz": {"num_bytes": 397122204, "checksum": "78e3d43c3d2b71d8483788a085cd5706648767de7a2fc4aab707d6a05257ff00"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00555-of-01024.json.gz": {"num_bytes": 398704893, "checksum": "113e5fd99ada6ca96c086487b6e4012bad711d1d482d580e22d3af5b9d118572"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00556-of-01024.json.gz": {"num_bytes": 398099675, "checksum": "c7a816f8f2f74b4554ac17ffc41e67ebbcabb7c8b0c94292b4569bea372bea3d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00557-of-01024.json.gz": {"num_bytes": 396538561, "checksum": "7af6d2c9886481a0d393e026739b5ad7d0fc358ecc216d2fc124160402d4b50a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00558-of-01024.json.gz": {"num_bytes": 397660839, "checksum": "c1033428189671d4e1ba55c822040f307748c6ec31b80be3e4ed8e7a4325066b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00559-of-01024.json.gz": {"num_bytes": 398754128, "checksum": "69c9f88840166363f2b7ddaef05ac9d10441fd184d8451abfde76eb105572342"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00560-of-01024.json.gz": {"num_bytes": 394988981, "checksum": "a2dc4fc315a0db8f1a868d631d2941ab2806f44c2ae698e94bb7e8308bd67c70"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00561-of-01024.json.gz": {"num_bytes": 395801300, "checksum": "dc1b2b4594e3fc7f8795f7649d1c524405edce56d617f1e214692565de8c8937"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00562-of-01024.json.gz": {"num_bytes": 398322250, "checksum": "c23404fef6a6b5b887cc2dddfe341e983939ae36078d62842919a3739c96b43a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00563-of-01024.json.gz": {"num_bytes": 397584845, "checksum": "c909fe429772c8198f904496ea6cf239d669c6c787889cefcb7623e08a988db0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00564-of-01024.json.gz": {"num_bytes": 396436964, "checksum": "8e7cb1863057a3b9929af4da29b4e1cca1f71c254f5eba91a657d9e8c1fd6dea"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00565-of-01024.json.gz": {"num_bytes": 396486039, "checksum": "23ba56e78c4edc4d58fd7fbfcf784b29037204a641e43a9894c95c68bdb982fc"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00566-of-01024.json.gz": {"num_bytes": 395358745, "checksum": "71259a300ff096b49e3461c91824a8185037ca85ef2018dff2617f335ab304b6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00567-of-01024.json.gz": {"num_bytes": 396405726, "checksum": "d9b56ed523376681dd81cb9831727467461bdfb87c80d3932937338370093033"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00568-of-01024.json.gz": {"num_bytes": 397509797, "checksum": "c650aad13a48d5b0c51162ad19c9eb3135559d0a3318dba701a90e8138a8cd24"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00569-of-01024.json.gz": {"num_bytes": 396514261, "checksum": "d71e4126c2deffae8ee55077cee9dd2b70ce27adec767bce06e02afb23b42416"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00570-of-01024.json.gz": {"num_bytes": 397072833, "checksum": "519a32e1bdf7f5b97e1a438242a79218317e04e44021dc61aa65c526d35ce8ed"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00571-of-01024.json.gz": {"num_bytes": 397170114, "checksum": "919a9659156cafb26b87190fc00b9d33c4fd536dd35544cbef8e5ddc018ae365"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00572-of-01024.json.gz": {"num_bytes": 396475017, "checksum": "3d7e4e548f01c9ad5fc99b4342cbf9a9004737058dd93aae8b7d95b2c00856bf"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00573-of-01024.json.gz": {"num_bytes": 396749955, "checksum": "032f8e37328c9f0fc046e5a6ff5a79cbb744f3100c4cbea78e397c449471bb10"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00574-of-01024.json.gz": {"num_bytes": 396036505, "checksum": "8e795341527712be32a69307ce8cbd2d6195c6b2fea596d326a279734505198e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00575-of-01024.json.gz": {"num_bytes": 396722381, "checksum": "45a43576cfc61842bde146eaa566b4f22a128c3c2eb8f30c59a6b6cae4bcd4e7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00576-of-01024.json.gz": {"num_bytes": 396163377, "checksum": "38429d2d6176ee42ddd495e052c01735a9a7f0076cde107d24a0a9c7a26bf2a1"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00577-of-01024.json.gz": {"num_bytes": 396813305, "checksum": "eae77c319bba236feaffc9f74eaa38e911fa48eb06f4794c9b1a6d17edab91a7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00578-of-01024.json.gz": {"num_bytes": 397797226, "checksum": "1dd2b3d7e99fde8903bc12625568ec4fc6fe653737b3af5e9c71432e311cf5f0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00579-of-01024.json.gz": {"num_bytes": 396012631, "checksum": "d9322e66701b4ada3788b91a07e87b03af6c91eb4cfaaefee23c0330987a1840"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00580-of-01024.json.gz": {"num_bytes": 397943129, "checksum": "23deb32e1b0f07a55a5cf1572cb8e313ce716c748a07f58bd90cbae97290d0a0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00581-of-01024.json.gz": {"num_bytes": 397614648, "checksum": "6193f8b848c7930fc04b9f2429dbccf36f1b291271b3eaf646c655433bf3ff9f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00582-of-01024.json.gz": {"num_bytes": 396659280, "checksum": "40997ef02c7040356cd1c5acd8e6a5121e00b31253713cad4f529ab2922affc9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00583-of-01024.json.gz": {"num_bytes": 397686445, "checksum": "5cd21271e4ae036f8d1e0c320330a6c93a8b1ffbb9293a80c56c2d7f123f9ee7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00584-of-01024.json.gz": {"num_bytes": 395500815, "checksum": "c25befb7c735b2340b092a04375d2109c1b876d2b0057dd8d4ed4beac87118ad"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00585-of-01024.json.gz": {"num_bytes": 398413461, "checksum": "073f632e95c218fdf17274fc21915c94f56bdfbb58a6b1a0550de249ce4d2129"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00586-of-01024.json.gz": {"num_bytes": 396849745, "checksum": "647cbe9bd7709c0d8a01485096fd88ad0fc09b27de324eae141a8d841536b71b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00587-of-01024.json.gz": {"num_bytes": 398567154, "checksum": "557af97a8d2b2656149bc25ee5b362116d173e6a48911b860ec10d512b4b763d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00588-of-01024.json.gz": {"num_bytes": 398086388, "checksum": "9e9afa15ee3534e497c9fc7c8cd967388183193dade3d1ec82a8e2b0e82c5118"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00589-of-01024.json.gz": {"num_bytes": 397335823, "checksum": "ed8a1d0b9c55f465b5d4a4e5ea022f6d17aaa8b82569be7cfec55629c1bf26c6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00590-of-01024.json.gz": {"num_bytes": 394931693, "checksum": "3fbe539fcf64f0d914c19b383de9953b0605d4a69f48801145f0db1972f9c6b6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00591-of-01024.json.gz": {"num_bytes": 397828770, "checksum": "9165de8866384d3d03c3876c39c96706e33a24b9f95acc09999c2dbfb85cd9cf"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00592-of-01024.json.gz": {"num_bytes": 398782493, "checksum": "433a9cb730d7ab024b56ad662a3ea53633f7ff26c625051c4c02f252beeb87a6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00593-of-01024.json.gz": {"num_bytes": 399264489, "checksum": "4a7e5f40aa8b692cfa0519d33a868e9a05e579ad430204bc13c48b533eadc5ce"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00594-of-01024.json.gz": {"num_bytes": 396629833, "checksum": "521d5e90550dbc97ab26a18a0b75da81e38ce2083ff5fd93340fded2e54e1ca1"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00595-of-01024.json.gz": {"num_bytes": 396916313, "checksum": "30c9be1d99ce0a41b214fdbd5115988c82ca317d4aceb30c19fbca05e0a409e0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00596-of-01024.json.gz": {"num_bytes": 397013253, "checksum": "b16bd9d7d893b4a71056575fa0799bef96120c03cfc6e2a88c292469a67f2614"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00597-of-01024.json.gz": {"num_bytes": 395980036, "checksum": "3bd15089b6fff342df2b3109d7ebadca35cead4f44ca5b1b55e55d8892aab82f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00598-of-01024.json.gz": {"num_bytes": 396295935, "checksum": "6252d951a9570baea9767cf3350a6d09ac5a5fc34ba80eae3b5c40adb8361ab9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00599-of-01024.json.gz": {"num_bytes": 398608239, "checksum": "b265a385cdd5e64d1fb2ffce739e72f2fe2cc8944621f20e2084dc52b91cdd9d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00600-of-01024.json.gz": {"num_bytes": 396563743, "checksum": "43d12028cbe738e8f450911f6a55dcb00f8742cefc2a2c4da5f9e9220b0572c1"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00601-of-01024.json.gz": {"num_bytes": 398256993, "checksum": "9368dcfc581e6d572d899ef25b129bc0268901a2fa009500174a0985bcf330df"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00602-of-01024.json.gz": {"num_bytes": 396202546, "checksum": "3cc57d7afd161fcd411f73da8369d98db4c6d8e30643ee01450adef21e8ea3ea"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00603-of-01024.json.gz": {"num_bytes": 396338425, "checksum": "cc21fc5b8ed6e5115bd8924954d685ed52cd5b773ab63d37188343443c95851a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00604-of-01024.json.gz": {"num_bytes": 397597307, "checksum": "d24f6d807ae35037e695e19917ed446f74448166fa464c862e31fe7ba2bea196"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00605-of-01024.json.gz": {"num_bytes": 398278313, "checksum": "99166183c752aed8d0f2cc9c010f1ebdd4fb93d40e936fd6c082eb3542baa956"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00606-of-01024.json.gz": {"num_bytes": 396590468, "checksum": "657ce79340c15524a5897459a6cf712fa4127def2445f7eb3de21c9b46db3794"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00607-of-01024.json.gz": {"num_bytes": 396603228, "checksum": "3705441435f18d1e4aeea9e794e1216fcd29b48213763a554808e3d3697951a6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00608-of-01024.json.gz": {"num_bytes": 397280580, "checksum": "be0bef2c16e9bdd0387276402dc99fe5a9a0a7a105a44e88bdb783139f2de474"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00609-of-01024.json.gz": {"num_bytes": 398284528, "checksum": "3a7c7a8cb01f6d7589152a1483682a5fa99e119490f3e70d8a02f582f2e2b19c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00610-of-01024.json.gz": {"num_bytes": 398872039, "checksum": "c349aac5b64227397ec2870992ac9e4fac9fe39f1fd4e0a7b8c727e171655e14"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00611-of-01024.json.gz": {"num_bytes": 398736440, "checksum": "63ca5eb2d27632b3b4dde8e40f9925e71e21ef737262bcda7a99324a67e0fab5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00612-of-01024.json.gz": {"num_bytes": 395170895, "checksum": "3b4bb3e14ee981a9edb9828ce40b86b5d83dfafcc1a5e0e02642cb40924bd6ed"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00613-of-01024.json.gz": {"num_bytes": 398443337, "checksum": "e95adbd7d55024b7e62145860f217a6f04f5fcef79ac23e92dd9e14f9a0b2a30"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00614-of-01024.json.gz": {"num_bytes": 398854661, "checksum": "def8cb789f8f79fa169e855816c5e4bc7d5c253e565502691a9abb826d7436d4"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00615-of-01024.json.gz": {"num_bytes": 395505189, "checksum": "6775ca6aa4f834289396a438906b90936ed0ff6390213dac2b0861f40d7761e7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00616-of-01024.json.gz": {"num_bytes": 398999454, "checksum": "6cd5efddacb09cc80ec1eb79f93b562044787903b3cb1c879be2acec64a9dbdb"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00617-of-01024.json.gz": {"num_bytes": 398570431, "checksum": "26d1f587377446e8b1499be7a3b6776d437baa40353fb04c591203a420eb0cc2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00618-of-01024.json.gz": {"num_bytes": 397064982, "checksum": "e59a87fd1cd3d87fff4b15c3a9331521d7587ac7f4a7fd51ec3906b484ef9ad0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00619-of-01024.json.gz": {"num_bytes": 396676338, "checksum": "8077c3a15d93579d0fbf00bd9d117bf4f50092c5be3acf46c7d4433ef7be9dfc"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00620-of-01024.json.gz": {"num_bytes": 398186471, "checksum": "ee3fb91d7797ebf1daf8dcb81563b7dae7b161d97732efd35e3eb6ebea732ee2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00621-of-01024.json.gz": {"num_bytes": 396467968, "checksum": "386adb83129a7306ef4da37c1cbedc39b3971e7633d516d406a982f307577e67"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00622-of-01024.json.gz": {"num_bytes": 398293882, "checksum": "b708cad0e04c56174d0feec84d7224a4490cb8db023d38e57398cad89b78568f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00623-of-01024.json.gz": {"num_bytes": 397396780, "checksum": "c50c4568c6f103b3e6a3702cbd915ecb530df954df808156bc38a98f36a0b944"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00624-of-01024.json.gz": {"num_bytes": 396971282, "checksum": "11351ef83c9fb883d6c0f484af5c10f0d686b7ac4a2f08fae9ac3d9837df0a0b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00625-of-01024.json.gz": {"num_bytes": 395882440, "checksum": "dfa97ea7949c9bbf7af43d43ac5c8d0034bdbd1ad572895159b7c7846ab89676"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00626-of-01024.json.gz": {"num_bytes": 398292846, "checksum": "fbc9c23dc286ad6fd7f01f344de97ef5789733af581de278488869bd36f3b246"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00627-of-01024.json.gz": {"num_bytes": 399890427, "checksum": "f43bbde36b8bd34ed9998b99b42c85434b8bbc8bbaa1cf5b38cec6393099c23f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00628-of-01024.json.gz": {"num_bytes": 399589466, "checksum": "c50058a4937912b678d33d34ff91e2287e8701365f4f71fce61f9002652556cf"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00629-of-01024.json.gz": {"num_bytes": 397355095, "checksum": "051c4631d0587b6f65827410ad2f2121c05c849a009274415bc5e7f72db42d44"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00630-of-01024.json.gz": {"num_bytes": 397860559, "checksum": "07b48a86a8a3245fe5b78f6943c8970c839942b8d86abf173507225b0d1520d0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00631-of-01024.json.gz": {"num_bytes": 396161304, "checksum": "70a03f0308105de5266c4a40803b51f99888b362b71409719b7f71f73761b590"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00632-of-01024.json.gz": {"num_bytes": 395620184, "checksum": "c6923984c419f08bb4e6effc27dd25dd986513034338debc9b238592dad9f607"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00633-of-01024.json.gz": {"num_bytes": 397572527, "checksum": "900fc701703234031e825a1eb2d11b364f1dda97eb0c7943e17ef278695f7bea"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00634-of-01024.json.gz": {"num_bytes": 396215174, "checksum": "0cc838e395581933123fc57c6690afbdd2be1b67d213336d9b8c08b3876f8458"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00635-of-01024.json.gz": {"num_bytes": 399176005, "checksum": "5a3daa1bd0be8c997da56257f063a7d1c7b2b271648a46615b26ca4beeb42863"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00636-of-01024.json.gz": {"num_bytes": 396035356, "checksum": "9d21ce1c8b5a7c1330cc95b1f45286fb8578d5dcec0686724ff6e25a97f38a7e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00637-of-01024.json.gz": {"num_bytes": 397214839, "checksum": "83cd34e1ba09c268b515fda7699e12bfa2531fb7e60e2f861946ffdc01e54a04"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00638-of-01024.json.gz": {"num_bytes": 396292535, "checksum": "82a7bae9a7d35fa707bcb6d90f7b244f1509e112dfdbd604c9be1f8b8ce7150b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00639-of-01024.json.gz": {"num_bytes": 398009954, "checksum": "b6d7ebd102c67960413caf5fcdc5b4aea728b6d3d6369ab8dd3cd6bee6c769de"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00640-of-01024.json.gz": {"num_bytes": 397558496, "checksum": "151c55d019fd84fdc0eab73d24984e5d88ac964c86f89a361a03dc776a22b5b4"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00641-of-01024.json.gz": {"num_bytes": 398031508, "checksum": "e0e87304a8ac408adca2badf2564ec52caf155295ea303a121c30f3b1ce797b7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00642-of-01024.json.gz": {"num_bytes": 396594124, "checksum": "73d08c99b6b96d96b82d88267b2a392a7dda2084ba5142b8eefd0d23212702d5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00643-of-01024.json.gz": {"num_bytes": 394552252, "checksum": "ebccf3b935d63c30f626d317af250b6bd0f04ef5e1cced829287ba64fbb0d25f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00644-of-01024.json.gz": {"num_bytes": 397586341, "checksum": "674c0965a9a880c057b6f2dbb785a4a6ae048954d44ba4f5266dd5e65095d06e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00645-of-01024.json.gz": {"num_bytes": 397950976, "checksum": "7ac8d4dacd682a2977818f01d860c3dfa5a5e5a78f7d2d95be0353a675452e93"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00646-of-01024.json.gz": {"num_bytes": 397511840, "checksum": "452a9cc03facf9151552f914f9a8a3507a96fd8ea40f7d04951a29ecbf6aa1e5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00647-of-01024.json.gz": {"num_bytes": 396692070, "checksum": "5a795a238203444596c711bcedc634e653e5240c9a800a9884c51f878340b494"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00648-of-01024.json.gz": {"num_bytes": 392707626, "checksum": "9cc366c37950624df6af318ee52a97d32a40e278fcb519cbe8545b04bee3204e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00649-of-01024.json.gz": {"num_bytes": 396283284, "checksum": "4ddeec31a30b5c563838b17e1115ad30041e08c70a94f299ea324ee4b71fd82b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00650-of-01024.json.gz": {"num_bytes": 396349662, "checksum": "f5bc63114ec9d73d6cea7f8e38a95031ae2bcde849b27440afd840a3e72aac13"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00651-of-01024.json.gz": {"num_bytes": 397187042, "checksum": "7199c0242b2654509af187c9c8bbfc22cc5067aafa1ff69949b1f0e5b718425b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00652-of-01024.json.gz": {"num_bytes": 396263026, "checksum": "c9e62b6df7213ea5b71913fbf736403f33c51e5a868bf1035cebcc39d80635bb"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00653-of-01024.json.gz": {"num_bytes": 398689010, "checksum": "f3bcc9eca4d71043e920db6399a032f916c23b1da329d2ef86434a74f8e7b318"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00654-of-01024.json.gz": {"num_bytes": 396938678, "checksum": "fb41df26e1f68e1e9d12ae8740535ca66e80910320be2270d680fec40d6fe9a7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00655-of-01024.json.gz": {"num_bytes": 395995226, "checksum": "018b40ddf6d88c4c346c8018439d16f6ca66ee0720970e84ddc34b1010ae35d7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00656-of-01024.json.gz": {"num_bytes": 397860049, "checksum": "8f3847e9bb5a8145e2959b340f86cc06f85e6646f32d5d785c5c90ec11a9f404"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00657-of-01024.json.gz": {"num_bytes": 397142407, "checksum": "a1ae8735a39bd099dac2e50c22e312f1a010f2644774ef53c995f3437c0a5524"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00658-of-01024.json.gz": {"num_bytes": 397827609, "checksum": "f6154377cfff2453392fb899f81514a7c0ffd40dbc35d8842d61a115d0aeef35"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00659-of-01024.json.gz": {"num_bytes": 396861858, "checksum": "4299633524667921549573c469a73e33abae89d107375d5ccc6a6d987c2a2a26"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00660-of-01024.json.gz": {"num_bytes": 397773823, "checksum": "44eaf6c1739d8a9c13c54750c473ac04aaf9d2223d8893cd8094f1769b1f6f8c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00661-of-01024.json.gz": {"num_bytes": 396311257, "checksum": "18edb60444b660c7cc68dbe59ac71989be0e20ff13639725a5f05e4d4d512514"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00662-of-01024.json.gz": {"num_bytes": 396176936, "checksum": "7b60541181fbb92f361fbdf0bee80d086c75279610aab792a7b3877d49a3e1bb"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00663-of-01024.json.gz": {"num_bytes": 396274985, "checksum": "59e057ee5f5e8c7267138c18c5c88f3ca24d30f86c484e4bb0c0a4eb5169c4a4"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00664-of-01024.json.gz": {"num_bytes": 397483935, "checksum": "585f45d3ac3f88c3bf1c86e01daa46537f8f5c5165521412de0e67393cb6da33"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00665-of-01024.json.gz": {"num_bytes": 398831104, "checksum": "e403d2f4ff6e74abc9639749f93f77cc868453908c10821fea7fafdbcc981a06"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00666-of-01024.json.gz": {"num_bytes": 397668116, "checksum": "f9bbafa396a466b24630a259a01804b2857c1dde2fa3cec60b2967a88ad9f528"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00667-of-01024.json.gz": {"num_bytes": 398123165, "checksum": "ed693d5ecb9dfcaf545e831b5769b877e927125794cae61a0ec7821c3c85dfe6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00668-of-01024.json.gz": {"num_bytes": 398152096, "checksum": "51c33c07d503743704f564bc6a372c2f6f8f13a1ddd00b0b9a2c44c94cc57444"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00669-of-01024.json.gz": {"num_bytes": 397927981, "checksum": "d356b5268ba39e38ffccd20e95803f3218407e0a1ca3b4d1165ff82796ec1bae"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00670-of-01024.json.gz": {"num_bytes": 399074605, "checksum": "bb96ea8154ae01275a9197709820e670c4e6212c740e92a7f1cfb7c618a49bea"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00671-of-01024.json.gz": {"num_bytes": 397864381, "checksum": "afca3dbcaefdc368e996259fd595b77fd98a885ec005a93069a01b83227c827b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00672-of-01024.json.gz": {"num_bytes": 396077133, "checksum": "3da96ebd1b28b55b03bbab8e85f78295cffdad9020f869cb456da27058ffa090"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00673-of-01024.json.gz": {"num_bytes": 396943842, "checksum": "6a4c344a8af68a95e20d58b64fff8fe616c2a406cf26f642cdfea65fce5883d1"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00674-of-01024.json.gz": {"num_bytes": 396975969, "checksum": "e6b0f7727d78143fa180abb76e617b37660b35f6323f19bf1dcbc78fb9374508"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00675-of-01024.json.gz": {"num_bytes": 396692800, "checksum": "e4ed97b19c6d83e618a3fcaff75460d828ca419b1e62842a1493b0ec4c9703e5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00676-of-01024.json.gz": {"num_bytes": 396514400, "checksum": "a5672f1561ab85f071395de43e702791aaacff77a9f67f6ec9e14b12aba675b2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00677-of-01024.json.gz": {"num_bytes": 395939125, "checksum": "3dacd3bb90b5e645d1b9a962d8df87f571b0fcf227996068535bb98a68f9191d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00678-of-01024.json.gz": {"num_bytes": 397022852, "checksum": "c1a0ef31342161369b7fb709be17e3c86191c1a52cb04b704fc58190818302c3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00679-of-01024.json.gz": {"num_bytes": 398325372, "checksum": "47ddd1056ad977407f61b2eac3ff803d17b1aa8fa0719279bf911caf49bbb7c8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00680-of-01024.json.gz": {"num_bytes": 395502228, "checksum": "cbb93f322d684ed558cbf8d92b9f83958ba772fe4177093a334b4596343f3cd4"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00681-of-01024.json.gz": {"num_bytes": 397981781, "checksum": "9ec2dec493733846a1ec9f68ff5130cd461d7ab9c07b22d4aae94463bcf03146"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00682-of-01024.json.gz": {"num_bytes": 395265758, "checksum": "7731cb9a2898c730a650e5d1b358886ed562228928aefe55d991cfaaa61a9a99"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00683-of-01024.json.gz": {"num_bytes": 398783283, "checksum": "6f2bb48070e809ac17fc90e1117d63bd8c7cd0079d9e44c9f262c4ce60f5d373"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00684-of-01024.json.gz": {"num_bytes": 396160769, "checksum": "fd07413637b97b68cb3a7a6cb86c4656017b7841728e806485ae196294e79f8c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00685-of-01024.json.gz": {"num_bytes": 395594461, "checksum": "939925a9169da729891fbeef926f420b80bcc60e0f170bcf9a2095449a22d424"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00686-of-01024.json.gz": {"num_bytes": 398275260, "checksum": "13836c45719ba10f2d581cf17cdab1daa4cc207a49db2b4786b451605842ac4b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00687-of-01024.json.gz": {"num_bytes": 395256765, "checksum": "0c0d0e6c1e3cb9a024c184a8510066a005c031a15af74d117d0e736a358a91d0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00688-of-01024.json.gz": {"num_bytes": 396635904, "checksum": "2462e084563f8b8de68c6e826289949ff8ebf8cfaf323344c07ab93e56373539"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00689-of-01024.json.gz": {"num_bytes": 397749444, "checksum": "d03746220f3374c80102ed39d8f6ae0daec40fc1b23312c08ecdee82a65ac6df"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00690-of-01024.json.gz": {"num_bytes": 399380060, "checksum": "217d032ecce8d0b7e448befe83aa051a3bfab8cb0e167d043b6abc833f5e9b4a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00691-of-01024.json.gz": {"num_bytes": 396975651, "checksum": "354fe9bc07aefc55cbbf8752f53ad69d45761da928bc8deb6fee1de9e244e93e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00692-of-01024.json.gz": {"num_bytes": 399720848, "checksum": "21f88940b6cbceefd66ea5e8d466467806370ae24a5833ca308cd840daf5ff8d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00693-of-01024.json.gz": {"num_bytes": 396787846, "checksum": "c8d28980ffa1eff4459d2fbf0043a1f8eeaf840a3b1d1ea4989b2192c7a82041"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00694-of-01024.json.gz": {"num_bytes": 397945967, "checksum": "1936570da24c4bab9fe0559826f1cc509c4ab6eb3679e26d697efa6e7e5c8a81"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00695-of-01024.json.gz": {"num_bytes": 396349049, "checksum": "8e497506f84513272a8a0694e7d4efb004b1e3b515887e3b5762f59b6c659dc3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00696-of-01024.json.gz": {"num_bytes": 394901418, "checksum": "9e1d6cc187ff67ee734bbadc6cbd57eae05634a448edfde184fa8d6fc3259836"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00697-of-01024.json.gz": {"num_bytes": 399142528, "checksum": "9584496113a8612620748aaba35e185b8f47b7c96b4ff0dc7bfdd6024a3faa14"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00698-of-01024.json.gz": {"num_bytes": 395923784, "checksum": "83a3c57b3870ed9beeaf3ec8ab694e0be458106f3128b14b2a44a036e89d32b1"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00699-of-01024.json.gz": {"num_bytes": 397137494, "checksum": "0befea64fe749d79592e337bc359bcef70ca8816d0126ebf89d4b8fbfbdcbec6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00700-of-01024.json.gz": {"num_bytes": 396554785, "checksum": "34739b543636aeadb6dcce3e7c97ca49026cc9897c13add6b592fe60e5c40338"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00701-of-01024.json.gz": {"num_bytes": 398091188, "checksum": "c9bcc7c9e91de707ee548e67452d6970af2e19bef91f966b19fa71504e5305fc"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00702-of-01024.json.gz": {"num_bytes": 396039798, "checksum": "fcda5f8ddc5ed163db84aa70c565f8181731af9a29918a2ece0436d3146d7125"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00703-of-01024.json.gz": {"num_bytes": 396889704, "checksum": "c80445d442a766d2e87ecf5804e87bf7f8b23c2238476fc2b51f657400739306"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00704-of-01024.json.gz": {"num_bytes": 399465260, "checksum": "0bb73674d579523fcbe079fbea7190138911711f023404ae46ea7b685fc09c73"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00705-of-01024.json.gz": {"num_bytes": 398579507, "checksum": "97d6fd9cea2a47913c6ee9d1e34c3440858f25f3d670cc81c8f83f2346fce6e2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00706-of-01024.json.gz": {"num_bytes": 398761590, "checksum": "2f4836001b8b80066ae09b6e385ed0048770c13ba2410e0f0309ab4b9200e37d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00707-of-01024.json.gz": {"num_bytes": 395576626, "checksum": "8e0c0c635a7a7c32d4fdb1a7906ee95a9f334a55b2ff3881cdc7d5e816a9c817"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00708-of-01024.json.gz": {"num_bytes": 395930921, "checksum": "e6978b92f333230972e2b4c31cb86b5286fb899948c7680c7a9cbe75a9d60296"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00709-of-01024.json.gz": {"num_bytes": 395734676, "checksum": "13071a3527071f06570c6cfa485073f2f3980c83cac782db6bf66a75dd865df3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00710-of-01024.json.gz": {"num_bytes": 396501107, "checksum": "6562cb3675a42a58b8c8b2a232043adf532fe49420e30c3c237a6d8889a8de30"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00711-of-01024.json.gz": {"num_bytes": 398422179, "checksum": "f38b59c4739d3c15e5bf5dbc0965d1a5dcc0f49a3c89eb7a6822003aaa1ae7c3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00712-of-01024.json.gz": {"num_bytes": 395905103, "checksum": "500b4914f3c42d5e24ced7d36dbd3143c49e4fd5dfc3d53a172d1a55ae738889"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00713-of-01024.json.gz": {"num_bytes": 396009909, "checksum": "4f50bfa762db1435a89195fd180615e9f569c1668e128d343c87c40ac5cf60ef"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00714-of-01024.json.gz": {"num_bytes": 396963447, "checksum": "fd9eea7dfb93916a3798a8b69d29fb5d4bf0fec448b8a24427f729e7a41205e8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00715-of-01024.json.gz": {"num_bytes": 397474378, "checksum": "3c61bcf6f24e21d2584bb4ae008230540d9a375e35f3c4ba1668621b80d85c5d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00716-of-01024.json.gz": {"num_bytes": 396285471, "checksum": "c554e562a369d9696219ea8b0e363907c50f626d7c410a26515e07de801da74a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00717-of-01024.json.gz": {"num_bytes": 394827995, "checksum": "f8b4678c21d93c19d50cb576f0910050d24dfd606238bbf8013c45f98defda12"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00718-of-01024.json.gz": {"num_bytes": 395517823, "checksum": "1bf63affd6914d98e197b6e1ce526cae7754ecdc750184154d3cb8e3bdd21a9d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00719-of-01024.json.gz": {"num_bytes": 395561934, "checksum": "c04b162d984ff2ada9f39aa6c0fac04a1531fbde05175f856d2e3ca2797a448a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00720-of-01024.json.gz": {"num_bytes": 396227762, "checksum": "25da2ac7c1f3cbc361807f67e8826ffa95f4caa25f81f66832cbd0a08f1a51f5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00721-of-01024.json.gz": {"num_bytes": 397716450, "checksum": "28180c6396deaf34e2a197f5cad1b53ba1c9532db8b5c21dd7d81332b2793181"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00722-of-01024.json.gz": {"num_bytes": 398022279, "checksum": "9c3a8038a7f9431b90f67ea0d3b77353d0508b09865f49af575b6aaf5e32d6b7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00723-of-01024.json.gz": {"num_bytes": 398064523, "checksum": "4b18959f604bd5f379a73b52947261cb8d63f2243f5afeb5807a13669ef4a800"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00724-of-01024.json.gz": {"num_bytes": 394747045, "checksum": "615f13a1b2a6942931519b7a7f6aba286f6045aad65b041c2c6643ce906de1a6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00725-of-01024.json.gz": {"num_bytes": 396726374, "checksum": "4099a416eccbb56818efda68bd027c993c1a5fa1a8e722bc268041fd3f804cfb"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00726-of-01024.json.gz": {"num_bytes": 397361407, "checksum": "152d5e2bad0de3b6b48fb26066891b160ea79c4c382ce6aec6047196e3b08ef6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00727-of-01024.json.gz": {"num_bytes": 395542925, "checksum": "ce1d46b0cd7d9e4075db3feab71d2f72939817ebf45819e73ec277c9cc07307b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00728-of-01024.json.gz": {"num_bytes": 396647931, "checksum": "c859626b14584c1bab396c867ad5eb11ff3af39628206b03612ee2d2b3058497"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00729-of-01024.json.gz": {"num_bytes": 398272080, "checksum": "758fbdc5bf6d66a36d69d31141742b2a917bf0341494b844f22ab82cd54e7ead"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00730-of-01024.json.gz": {"num_bytes": 395977662, "checksum": "56a7fcb59ece26d4b19be0bd5e6c2d0f05e4b1b23e8ce7b4fab064a29b229c02"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00731-of-01024.json.gz": {"num_bytes": 397530948, "checksum": "bf0f4dc8796a737daf80b977a6e3656cb1e244fc40d6df92852da45e53e6cfdd"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00732-of-01024.json.gz": {"num_bytes": 398314575, "checksum": "1862bcc85d48f59283eae56836e5598f20287ce36a185252abb24bcfbd1377cc"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00733-of-01024.json.gz": {"num_bytes": 398547748, "checksum": "476389cb582df3c214f3f5a45268bdb47b581a432c08723bd811daa5f5990083"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00734-of-01024.json.gz": {"num_bytes": 397380175, "checksum": "2b6fd36a8f8bc3edfcd8a486de44d2f3132f7b8f4bb2d4c93453dbf1a1b6667a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00735-of-01024.json.gz": {"num_bytes": 399584382, "checksum": "3e0a067fef0b40edcd23ce6680efc07253660b8c00699630bb7629b9d803a198"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00736-of-01024.json.gz": {"num_bytes": 395312038, "checksum": "e4f92413c837d269481ecc0b5d0fc87548bd2ae718ef7f9bff18674ece289bc7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00737-of-01024.json.gz": {"num_bytes": 396820243, "checksum": "e61680c57505f027ef8cbd28a45e706936befa2ab40a24a63e638019a1717b63"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00738-of-01024.json.gz": {"num_bytes": 397691872, "checksum": "d3acc0c9c76ef2df89f49896744dac53f488f830d3d42f0c481f2321ed60fa67"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00739-of-01024.json.gz": {"num_bytes": 397912166, "checksum": "18d281ed9831f28c4c54256a844ab2cff7a5b681da1b7c8eab2565b106381aa9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00740-of-01024.json.gz": {"num_bytes": 397093867, "checksum": "6a65230910384587f5e7f34b52c2a6d9a86a8b1f7a23d26f890b6e810c051815"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00741-of-01024.json.gz": {"num_bytes": 396371058, "checksum": "26eb40e98075ab716b4edec76d1723a679e648258d6812119b46f7522dfa9b07"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00742-of-01024.json.gz": {"num_bytes": 398346941, "checksum": "466043ec98eb806916806cff7495f0bae89cfeb2835204ea34328030b92a27f2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00743-of-01024.json.gz": {"num_bytes": 397366055, "checksum": "d98d31aaadf95dd0d1cf0548db515c8e77c95bbc4b611ae9ab5650429c171889"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00744-of-01024.json.gz": {"num_bytes": 398722902, "checksum": "a43c80ab3bd8d12d12b4ea41d9054b90214fd3ea2ef957f317d6ed6fa7b60e34"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00745-of-01024.json.gz": {"num_bytes": 397562514, "checksum": "1e6dad94e0f90bfa0fdc5557c58873aaa95fa9ce1c7b70a1fe76817289cff78b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00746-of-01024.json.gz": {"num_bytes": 397731351, "checksum": "21fefd6cffa9032c9ca7cec91cd775c83bbd37419ae236eeec9589f8bc4be0dc"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00747-of-01024.json.gz": {"num_bytes": 397781450, "checksum": "b84c74bf1caecf92777fb85129bb009eb3a27fbab1b97af567f36a8bf100e704"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00748-of-01024.json.gz": {"num_bytes": 397425031, "checksum": "fe9bb225f6d03b44e552ec985c844e5012e90c4ad99f699ec4ed4297db91349d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00749-of-01024.json.gz": {"num_bytes": 397925850, "checksum": "3913b2955fee02e2ba716d843559bc4bf4e85a2884ae4495446a379f857a30e1"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00750-of-01024.json.gz": {"num_bytes": 397089489, "checksum": "773486144d3008cb3207c3c8b65fe6081c9e64dda09728d3586bc82e6bb73fca"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00751-of-01024.json.gz": {"num_bytes": 394819424, "checksum": "d728b117a7b74150b03ed7d562514c2e45ccc03b0bceb120eddfa8333166a923"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00752-of-01024.json.gz": {"num_bytes": 397199683, "checksum": "6c10c3f4e3737db6a70375bd605139de61ae8b09a1aa91dd1cfdb82c183f0cb3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00753-of-01024.json.gz": {"num_bytes": 399197199, "checksum": "101c4ed5426b586a4aeeb7dbd377306eae9eec2eaf934e79d25583abff70b15b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00754-of-01024.json.gz": {"num_bytes": 396415619, "checksum": "732f4dedcf1266bcabf15a6a1cdead617ea37d428d8cfbccb5a9dd7521133075"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00755-of-01024.json.gz": {"num_bytes": 394564662, "checksum": "a23f1bb1de23554efff68e730d85802a6491936fb54e256744af641f97ec155b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00756-of-01024.json.gz": {"num_bytes": 395577258, "checksum": "2f4275994a103dca517d4eb3656009c8138930079e00303c7b8746ab6094fd19"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00757-of-01024.json.gz": {"num_bytes": 397161772, "checksum": "ab16360173283b22a7e19d181fbf55a6a8d07f0d9007b51aa159c1e81661f5e1"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00758-of-01024.json.gz": {"num_bytes": 397545456, "checksum": "ff5a6292bc557aa9895de39697e8aea5843fa5a00c83c7983eaa36640d446ecf"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00759-of-01024.json.gz": {"num_bytes": 395470957, "checksum": "66a64accfa6c281d2bdfa7b6846397f56c2d4f8a22ae8925a07af853e42f5521"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00760-of-01024.json.gz": {"num_bytes": 397328304, "checksum": "46778c90bcc6da96cf02e66956a1bcabcb9a95bad538cfc0d5190db473a278a9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00761-of-01024.json.gz": {"num_bytes": 397706141, "checksum": "4825f25d6e1d13c70e6e65ce13ccd7b1922344c48ee2806952f3ba1b6e26d3ae"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00762-of-01024.json.gz": {"num_bytes": 396983663, "checksum": "25e1645f05d342b5f872ca809b36d516c7336c22035bfa86cf295d0865e08789"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00763-of-01024.json.gz": {"num_bytes": 396355038, "checksum": "d4c3a92808f0bfb042423cd4166abc57d20603ef07a0f0912058a718a38f26d0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00764-of-01024.json.gz": {"num_bytes": 395434042, "checksum": "aa4384f587fd64c24fad9a27defb0345eb44cc536b3d45c710017d225c191ded"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00765-of-01024.json.gz": {"num_bytes": 397204482, "checksum": "cf419554f6c4f6201ebe92e7a232013e5949910f3d54f5cf3d1d65845685c7ca"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00766-of-01024.json.gz": {"num_bytes": 396420917, "checksum": "32076dd8004ebe35f46d6e790fd6330ad1d7df2b7ae3c4ede325b0da73a673ad"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00767-of-01024.json.gz": {"num_bytes": 396840905, "checksum": "08e5fd0fc1578a337f3dafdb3c718ade437256119e1968e9f958a8ea9d052c81"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00768-of-01024.json.gz": {"num_bytes": 398085225, "checksum": "3579e0756bb6cbf1eddfca27de5cf067a212d683134bc6f8c26a79b7d802bfce"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00769-of-01024.json.gz": {"num_bytes": 396879117, "checksum": "0913c93203a084521212e473d08c1d11e8136a8e37f1891330fbce0397bd431b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00770-of-01024.json.gz": {"num_bytes": 396386647, "checksum": "6c12ab51c92b9c92336a6142a1a4e2f7c3725beb7e61dcb004551d13e8d5488e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00771-of-01024.json.gz": {"num_bytes": 396279989, "checksum": "752deaefbf22dd1b1adb36561e8524c1dc555fd105bf3acb78611be9bce72318"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00772-of-01024.json.gz": {"num_bytes": 397850815, "checksum": "4f1969284d1f448caf0bff5d05eeb995cf2339801f6a71e01286f4f7f387c564"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00773-of-01024.json.gz": {"num_bytes": 399466666, "checksum": "20ba552cd30349bc8a2c0b6a8701d4587a005e7ebdf6e3f2a3bf95462c304447"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00774-of-01024.json.gz": {"num_bytes": 398051538, "checksum": "1f66196e8fbf0ebef977f235d2aacb7245f4033b53ecf75ada2f8007465a629d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00775-of-01024.json.gz": {"num_bytes": 399284061, "checksum": "97df92baa605c34ce857d380f1ca42f9e2a0de499ccaa9bab26a5c449451d1ef"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00776-of-01024.json.gz": {"num_bytes": 396710162, "checksum": "4b1ec54b82c8e5d969d3000ce547f4c20df16d9cc0b889b2b58c8839e9d8e27f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00777-of-01024.json.gz": {"num_bytes": 397265441, "checksum": "03827ccc3c5bebbd12a04019e9797945c55becabf7f9c1f3fe5353513f5c5a38"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00778-of-01024.json.gz": {"num_bytes": 396050013, "checksum": "54aeadf4fe16949b2ee9438feabe979570e7587bb07b3c57e47422f662191936"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00779-of-01024.json.gz": {"num_bytes": 397124991, "checksum": "913e268b5474a8b4cf1426f5a0a06c7f437eeabbc35f0126481328b419f85bf6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00780-of-01024.json.gz": {"num_bytes": 395196367, "checksum": "4c1a4f296916c30103a5dacacf8a167e43bb424d085ed3491b19f0ec1985d9f9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00781-of-01024.json.gz": {"num_bytes": 396578403, "checksum": "a54f26c233662299ec8f0ae1bd266879e93cf4676707b0955114a1a80e2fcf61"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00782-of-01024.json.gz": {"num_bytes": 396142106, "checksum": "3713c6b725afd833063402e6577bc0ed003a87720f700f9272864c2360bfd260"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00783-of-01024.json.gz": {"num_bytes": 396470511, "checksum": "fe9d904a07ffb2581b6734c8dd847435b867d3043ce4b4840b1c54374919d757"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00784-of-01024.json.gz": {"num_bytes": 398156228, "checksum": "af762a9ff3eeb7ed4a56f54702911f0c190b97f8efaa02cb89b1626a1c44c9f4"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00785-of-01024.json.gz": {"num_bytes": 397185035, "checksum": "6629e1827aab88f55d53de24625f8362daccf910663db8584d959aa44f8043a8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00786-of-01024.json.gz": {"num_bytes": 396556703, "checksum": "ce51603900ea0aad8981fbfa8d05d684bfef5360413dadc6933246c2dc81c413"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00787-of-01024.json.gz": {"num_bytes": 396214799, "checksum": "6eed5802b89d63eea115cbfd9e00f6d1b4970bb3600a887b904b548181a4acef"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00788-of-01024.json.gz": {"num_bytes": 397965162, "checksum": "eaa948fdaa744576f006bd70d54f129968772a479fb0bd8e946d7605857545d2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00789-of-01024.json.gz": {"num_bytes": 396280999, "checksum": "e0b80ec73507f96310abf070e5cd17d5a67ffb4a337820a8b79a02afe81a0b99"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00790-of-01024.json.gz": {"num_bytes": 396224660, "checksum": "2b4a06fb6f68c773da34f8d4c33d7746b6a3206bb242042841e5e007fe3cb6ea"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00791-of-01024.json.gz": {"num_bytes": 397681975, "checksum": "1b167c20d0414d970cda74cd357cf07d69abd1d3fb0f57222028b369551d513b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00792-of-01024.json.gz": {"num_bytes": 396210611, "checksum": "ab55128753a1e58d1032b8fd747c48158a721b12e85990627478f22b78e156ff"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00793-of-01024.json.gz": {"num_bytes": 397534599, "checksum": "e7476bde08e0065c523d09932cf2cf6ffe8ba023ae0ee435238efb5dd6f93d7c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00794-of-01024.json.gz": {"num_bytes": 396536137, "checksum": "6228922504b2d3ebeef4735abdff06cc786d6533a6c150d50f34042aeeae1544"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00795-of-01024.json.gz": {"num_bytes": 395235406, "checksum": "9dae151c15898d7991417596a364e30f00e0ff6280f1505953e6de40c2e228e2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00796-of-01024.json.gz": {"num_bytes": 396226178, "checksum": "1dc8decde490324087fcd06e4b1e17117606f2d61a80d506d89a12cce11ba291"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00797-of-01024.json.gz": {"num_bytes": 398556774, "checksum": "a454758e8cffccc88f83517a241f2457e683647949cde6aaf1e217de42f6a52b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00798-of-01024.json.gz": {"num_bytes": 396109677, "checksum": "3daa6b8602517b9873db96522a2852d940d52cdf0fa86f259ac41a9cd688751f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00799-of-01024.json.gz": {"num_bytes": 397930210, "checksum": "09dec669699a437d6fb78b3f2705028fb380b2eaa20ee73b77270216a48b8a95"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00800-of-01024.json.gz": {"num_bytes": 394545441, "checksum": "726f99301047519de253e3edbaef5f4a4f95e3850b1b98e01c7864499dad7833"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00801-of-01024.json.gz": {"num_bytes": 395867151, "checksum": "a97ef657bd8ea718427ffc686f55fc1786f0834755fce3ea3ae8402d9f75c11b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00802-of-01024.json.gz": {"num_bytes": 398573429, "checksum": "20ee1f30272a0d5db74e8589be12c17173580cc9f14b039b3d33f3197816ef95"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00803-of-01024.json.gz": {"num_bytes": 398084513, "checksum": "31d1a8f6965d3a8cb7e28fa8bf2cb9a5609d4a129dbc630a8e2a939f475b2003"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00804-of-01024.json.gz": {"num_bytes": 397815811, "checksum": "edb758146d462848bdb113df90fa4b9f451eca6658cbd2cab147c8b0eaf88a70"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00805-of-01024.json.gz": {"num_bytes": 398641802, "checksum": "b916bafa7269ad4ed09c58c74dc3f098b529444609dafc57e6e4056aa6496ee9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00806-of-01024.json.gz": {"num_bytes": 397993720, "checksum": "92fcc5881ca81b808c14f8c9960d873be70f857f95fd1e777b1ae1d4c62bbbaa"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00807-of-01024.json.gz": {"num_bytes": 397743279, "checksum": "79aca62194176964b66a90dda7631d01acc2a6abea1ba19a90076139e390170a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00808-of-01024.json.gz": {"num_bytes": 397076817, "checksum": "a469391e432dac6967e841d46eaeabe9429849492a3df5e91431777fe9b9f164"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00809-of-01024.json.gz": {"num_bytes": 395533122, "checksum": "1278d928e105ea7d9c397ef1da79dcc8791dfad9177727aba098bd451734ce45"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00810-of-01024.json.gz": {"num_bytes": 397468683, "checksum": "5c6f3e7550827de9d7028decd82320a55722785394ea4951ee78f3ffadb2d4e0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00811-of-01024.json.gz": {"num_bytes": 397348260, "checksum": "8c1ece72814dd82bf1bb663b76a40c58129c08540195f9b2134eff5837faa366"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00812-of-01024.json.gz": {"num_bytes": 396753479, "checksum": "b3770924d0576f7cd1706771c411f0f288277c6c6c922dc7af4017b665109a88"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00813-of-01024.json.gz": {"num_bytes": 397977743, "checksum": "864040da6f03f4d2ed2a9eae4daedf304e0d27196f0b522cee4e8fee55f9ea71"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00814-of-01024.json.gz": {"num_bytes": 396168620, "checksum": "542986bb3b75ffcfc853af11a80edb6a31e12527d2588f1c5b2119fe35d3f150"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00815-of-01024.json.gz": {"num_bytes": 397639162, "checksum": "a617c2f27306ce5de74ab756cbf74707fddeb0aa92277b66d0cd65be230f386a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00816-of-01024.json.gz": {"num_bytes": 398296204, "checksum": "174a2e77e6562384cc4e7459ebf536db5cf4b530e4f1d7714e60d082ac7a19c6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00817-of-01024.json.gz": {"num_bytes": 396112543, "checksum": "95af2c4f32efb4ed2a41cfa38dd2be09d51d4b0dc53ca8763309503f0276d56b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00818-of-01024.json.gz": {"num_bytes": 398371592, "checksum": "67789e3525f2daf6af2551df12a50341c3ef51c89a9c714a8def76209b5b7460"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00819-of-01024.json.gz": {"num_bytes": 396751420, "checksum": "07431a263e2bb92c048fadbab74ce1399f76fc57a04d7f9e90cb33aa60a4c5e9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00820-of-01024.json.gz": {"num_bytes": 399213859, "checksum": "83c03df95869973c2ed46c909c0e92e7ecd75317c06b09e447a62b592421d1c7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00821-of-01024.json.gz": {"num_bytes": 398408628, "checksum": "b5cb8c52a8713c5291ccf29c171e9bd9b57a54211392a19e8f31182d1053a032"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00822-of-01024.json.gz": {"num_bytes": 395429180, "checksum": "8c47bf7a0d2b9c84d255df0e7da058fba2b4ca6da3c20cbdfe5a686e01cf5c45"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00823-of-01024.json.gz": {"num_bytes": 395437149, "checksum": "62818e45f34e70728494c74daa583e30c70aebf91c2f057470039f6d35059691"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00824-of-01024.json.gz": {"num_bytes": 394503147, "checksum": "e9fd88994b23531ba26e6859ec1985798a2ab9b300c2fdb1e202ac553ab305b0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00825-of-01024.json.gz": {"num_bytes": 398841091, "checksum": "77ad5a9ac5e3c1d1180981bffbbdbf8a429854001d990258c615e0e16c8a9f6a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00826-of-01024.json.gz": {"num_bytes": 397404278, "checksum": "06a39374c1cda19cc4b034c4877e1fd3bdc84290fdb621fdcdc77f3c5eea9a47"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00827-of-01024.json.gz": {"num_bytes": 399316947, "checksum": "fd27a73b130c1cf8256f22212e23799d0dd31281cd29bcf9bb658bcda457b66e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00828-of-01024.json.gz": {"num_bytes": 397514415, "checksum": "3e7d199d05f885e8bba769d21a55a3f2ef2114b66ed738428ceb506fdf272ff2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00829-of-01024.json.gz": {"num_bytes": 397251538, "checksum": "91650563e9520b2d1ec2cd726304b781b4156ffb68bc172635a53f425fa6bb0a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00830-of-01024.json.gz": {"num_bytes": 397653118, "checksum": "893ef017cbf7d46c99d9c69ba74344cfc2800bb23faf93e7400c0c282422945f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00831-of-01024.json.gz": {"num_bytes": 397299276, "checksum": "4eb3c91e52547f3b4af586f5bbdb0cdaf6a345b202a09c6aabff5c5f628b2948"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00832-of-01024.json.gz": {"num_bytes": 396915924, "checksum": "9fffd46fc1f1bce010484f2850102e2e153c5695c277efb67f65811630c2493d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00833-of-01024.json.gz": {"num_bytes": 397652261, "checksum": "3b89df9375a906c96eb1e21a6572a07de2f5d875996c01c744933984edb1af1a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00834-of-01024.json.gz": {"num_bytes": 396070735, "checksum": "b758b4cbfdfb799a8615ec9c3678b27dcd9b1d63af4f272879e0dae84cac9d63"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00835-of-01024.json.gz": {"num_bytes": 398028152, "checksum": "6e07f1e6a099aa496fef3015514fe5f3cc665c742f8a783389c7da4ce0e0e72d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00836-of-01024.json.gz": {"num_bytes": 395941604, "checksum": "6bef1291a741ea5976749456185a3e3a03c3fcc9ac00370f28672ab39c552db8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00837-of-01024.json.gz": {"num_bytes": 398655070, "checksum": "b0b7e1c826302417630c3e1b1877bf106beefb5a7a11feb9bbf1ac3712714fed"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00838-of-01024.json.gz": {"num_bytes": 396374435, "checksum": "3e9bdde8b73397a5fce143e91c92f9e66f46b45edfb30da1cac400b9aa7b2ecc"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00839-of-01024.json.gz": {"num_bytes": 396388725, "checksum": "4154322b97c600742660125e6458787e603cf1a44b49267f4d1c569387fd132e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00840-of-01024.json.gz": {"num_bytes": 397564603, "checksum": "f9560028196fc934378389e355101e5e7f8fde9e5c921722704a18b24ebc5804"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00841-of-01024.json.gz": {"num_bytes": 397001678, "checksum": "0dad99ac959765280e6bf6d9d1a1468ef9dc9cc781e8f5bb832f7295e4e79f69"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00842-of-01024.json.gz": {"num_bytes": 397139167, "checksum": "e81fd683da081349629a0a7ae8ff7813351ed23caf4ef87041b64524034abc83"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00843-of-01024.json.gz": {"num_bytes": 396044889, "checksum": "d8e3a5b4148c7e86dea50ee5ba89ef55629d3550fd926c41754e5a26e7e52c36"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00844-of-01024.json.gz": {"num_bytes": 397365441, "checksum": "c4d2ffe853b55464961b707b6d0264d6852817077204a0380c906184c077012c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00845-of-01024.json.gz": {"num_bytes": 396477802, "checksum": "7b3c4d435eca57a0fad05c106ec5928750aa01d95047618a3bc84e5342e912c4"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00846-of-01024.json.gz": {"num_bytes": 395983616, "checksum": "bdad2ba411291435ac0cdd083e46aa8369499f014a788fa85ed8c419fe9cb2de"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00847-of-01024.json.gz": {"num_bytes": 397646062, "checksum": "3f6bddcefcceaa4184161432e4f0b9292ae4fe7dac3079d4191a31a38f48c7bf"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00848-of-01024.json.gz": {"num_bytes": 395958111, "checksum": "5ed10d926e5fd1dcbc777df82391eb3ba57276c7303d488d6f3591022d20cc4a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00849-of-01024.json.gz": {"num_bytes": 396960036, "checksum": "ab82adc6f66ab0403cbbb38859009a460e6c8c38c789bc2b2420da8b87096a9d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00850-of-01024.json.gz": {"num_bytes": 396603592, "checksum": "5a6aa59a01504f5655d429dd5cb3ebc39e3994b22cbaeb5b09ceb29a26b94031"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00851-of-01024.json.gz": {"num_bytes": 396511886, "checksum": "f1954da7e217d893a0237a0f431dd2a9071723e543bf0f4943ce38fab048a44e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00852-of-01024.json.gz": {"num_bytes": 397626831, "checksum": "f5cdcd7ec4f3c855a1006f9278ed4df50574a3fa7aa1c5a2e255ea5fa1a770cd"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00853-of-01024.json.gz": {"num_bytes": 395811873, "checksum": "24b1033da877ebddc09cfe2d3325868448dab9083b5147d6cfc4fa63ab402a94"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00854-of-01024.json.gz": {"num_bytes": 396513614, "checksum": "419952e0bc38cce474190c0b9ea581ccbce77da5e045dd60f5ff1fa1d2833d19"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00855-of-01024.json.gz": {"num_bytes": 396493352, "checksum": "3d2b529871c625fc9c1c59b9d5cede2a77e609041f1ea044d68ac16e9fa6a30c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00856-of-01024.json.gz": {"num_bytes": 396852729, "checksum": "a3b56e6171fc2b14ebe67f6a71af688ea6135597bb8f8cf83e2fb460727aa5eb"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00857-of-01024.json.gz": {"num_bytes": 396428653, "checksum": "de550a5d608bffde45c149bc0d4c1165cbd3b5baab3d3529f006a02aba6d53e7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00858-of-01024.json.gz": {"num_bytes": 397039613, "checksum": "11374c2685676ac2eb3dd0d281b44b512ff1d2968ab320d9c857b44304eb8ab8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00859-of-01024.json.gz": {"num_bytes": 396515194, "checksum": "64879e565e5c467e630566ab75524bb300d58798c814637ffebd15646544cd5e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00860-of-01024.json.gz": {"num_bytes": 397764125, "checksum": "7e22be61b3413c8fca2414087655b7ef7bef2ab5ee373fee74d13c8fb991675b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00861-of-01024.json.gz": {"num_bytes": 395314420, "checksum": "29c451c69c8c05f6eee2741b9ef6c241f551257a45da8342a1d6bb341f80314a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00862-of-01024.json.gz": {"num_bytes": 397763845, "checksum": "679668616899f548fb35da32c3e5f121002670cc3296c0c90f5bf45eb3ea1d79"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00863-of-01024.json.gz": {"num_bytes": 397356206, "checksum": "43c5b3af2173d4293396f336ec363aa2f31580b65128f44ca8bb891f2022859c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00864-of-01024.json.gz": {"num_bytes": 395463092, "checksum": "77b7b6299955f4869e5db994fa6b20fe3007cf8cf2b6609442fb1ed49284cee6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00865-of-01024.json.gz": {"num_bytes": 396909291, "checksum": "7eca0e82842b52f99640ab574e4b2446309aba6ac262f980fc6d249a337d06a4"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00866-of-01024.json.gz": {"num_bytes": 397587651, "checksum": "931014d99ab2a765ebf90e876694647c265ca5e6bf2b459eb027d6b06643a8ac"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00867-of-01024.json.gz": {"num_bytes": 395992645, "checksum": "0976a5389aed40e4bca89cf22382cf121390c75bd755437be474c097c8fee0ed"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00868-of-01024.json.gz": {"num_bytes": 397789857, "checksum": "6ffd848d165290a746a21767e79a9f046b70534aaf7b14fc01f9365e4e3f7d93"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00869-of-01024.json.gz": {"num_bytes": 398124116, "checksum": "5fb85058bdf40c0ee6cf748cda7483b1b3cfad18c26a90c2150c2a3f30ceeeca"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00870-of-01024.json.gz": {"num_bytes": 396432487, "checksum": "89d50aaa3620eac4ad593a403ea637b2ff090361ead05c3aa8c7a3351c66ad65"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00871-of-01024.json.gz": {"num_bytes": 397484772, "checksum": "490f4104981a9ab3ef04600a4865b9a2a18239e335d7fb7fff79ec1b7a225318"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00872-of-01024.json.gz": {"num_bytes": 397240896, "checksum": "d344994866bc49475f66e9937636afa787e1ff560e3f62dc1a0e4d0220d6ed39"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00873-of-01024.json.gz": {"num_bytes": 395450398, "checksum": "5d3b320aab1f7f09450531649666ded1aba8a9bbcf0f47992c43cb40a6d7a929"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00874-of-01024.json.gz": {"num_bytes": 396365056, "checksum": "346aae20204537ba2f4a865ca80b5d1c6da1e3a3b78d306d7570a69f185cc4fb"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00875-of-01024.json.gz": {"num_bytes": 396679348, "checksum": "ba81f9c1650d30853edbb9886dde84658c254dee5a3ac1062484f7194cd413f6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00876-of-01024.json.gz": {"num_bytes": 398278881, "checksum": "88fb38aad7cadd76c818dbe7a372144dfe17d110f7d2123a80d14686fb43a6dd"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00877-of-01024.json.gz": {"num_bytes": 397051868, "checksum": "049e4a62056c98284b35d10a74ad5ef7014265a6dccb99a71f93a409933a685f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00878-of-01024.json.gz": {"num_bytes": 396132123, "checksum": "bb7b97a82bd6d31612de66a03af35d404b15808b925e7fd94bd0a8e9e928b927"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00879-of-01024.json.gz": {"num_bytes": 396520374, "checksum": "2a56fed53aa022e6a7956f604d54d99af89a15b6c7fc6b037f94d347f1d15f51"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00880-of-01024.json.gz": {"num_bytes": 397004524, "checksum": "1cadef434909d4508a9a6bf40d6a9323256f3089615a5d2963c83040d5f549f8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00881-of-01024.json.gz": {"num_bytes": 397336334, "checksum": "0e36dcd0eb1773eec15ffd0fbbe8951343bb6961dd1838b51e74da2e055db176"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00882-of-01024.json.gz": {"num_bytes": 394949798, "checksum": "78c99406cb921c2b8f5b86e4e7eeed24c799678732e5a5450db6b12b7ceeef61"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00883-of-01024.json.gz": {"num_bytes": 398647721, "checksum": "f0e7a0a9970c7fdb5f629771e76bb06bf62b79e9cbf5008e866f954dd436401b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00884-of-01024.json.gz": {"num_bytes": 396040500, "checksum": "05272a55eb2840f94a7dcc30a8d09b957511b983b0fc3fa618a8995bc594d055"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00885-of-01024.json.gz": {"num_bytes": 396460591, "checksum": "27511aa50410260d261866dc970b897b10a95dd4dfd92b0bc3a5fc41e6c75335"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00886-of-01024.json.gz": {"num_bytes": 396149133, "checksum": "e66ba9c7ceca631a4b43ecff1e151524a209368f298ca83624476ee9144cc3cd"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00887-of-01024.json.gz": {"num_bytes": 397164216, "checksum": "95e341054bd8a21e7f49e4a5aaa5fbe51517ff631e66e67ff1cdaea6e3178002"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00888-of-01024.json.gz": {"num_bytes": 398216402, "checksum": "6fef57de31fa1692d8a4021b317554688657fad3f55dc144e2971d63083e7879"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00889-of-01024.json.gz": {"num_bytes": 396976936, "checksum": "36da1bd0eaa27ca6e8510a3c005695fbbd7b0fedf63f077e3787590d4b1af625"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00890-of-01024.json.gz": {"num_bytes": 396903125, "checksum": "6bbbe5db2c0938efe5f8afe7b30765f45cedc9fd4209bb7826c489381175bc5e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00891-of-01024.json.gz": {"num_bytes": 396404354, "checksum": "47601b1b1a0a725c32ae0c32364f7ac188b7e8c68d29a2dffbe1a4dbe39393f4"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00892-of-01024.json.gz": {"num_bytes": 398144052, "checksum": "a7b6bdafa5a226c22ccdf97c873e4915ed8dd8b59e2820a4dc62f600b4710175"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00893-of-01024.json.gz": {"num_bytes": 397990484, "checksum": "12f08cfa1fb4f94a3d7d9584cc3f5ae9fa518cc095e4cb07939d02ecfb7ffd9b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00894-of-01024.json.gz": {"num_bytes": 398271782, "checksum": "004bf46ac7c8d7770b458ec341322f5cef643926aff9255954f08faa1dd43d53"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00895-of-01024.json.gz": {"num_bytes": 395489909, "checksum": "3ea14b3dbd7a4c9cb7aad83d1311d335714aaea5b2dd0374debd63c56d02dcbb"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00896-of-01024.json.gz": {"num_bytes": 397589097, "checksum": "c0f1c7e54bf7a808f66d2acc9aec79f1ce936ba480f5d1e379c6853714413175"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00897-of-01024.json.gz": {"num_bytes": 399215096, "checksum": "20958123acf2d578448a5166f1209b0452db33ed395cfe512015106bf99ad31d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00898-of-01024.json.gz": {"num_bytes": 397044516, "checksum": "46c5145069d861c04b2ac1afe80c4c4453f91869f6cb6a1d9f7b648f1b08942e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00899-of-01024.json.gz": {"num_bytes": 397687759, "checksum": "2a3923d8ff2ce0eab5978a8e0198bc2d1512cfa19c69e673e048b8eaa72f82b6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00900-of-01024.json.gz": {"num_bytes": 395192267, "checksum": "9cc72deeea7fbc0fa3782c41938d66315923dd9f53d89f47c00f85f93e454ce5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00901-of-01024.json.gz": {"num_bytes": 397806320, "checksum": "8cfff74f280636416f523c271f75e5704a570db4cddb8a70d033158868c21347"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00902-of-01024.json.gz": {"num_bytes": 398450537, "checksum": "7df8804eb5ecb79177001f9ce3c66f0ad20cccd8151e817816e9342d07c392be"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00903-of-01024.json.gz": {"num_bytes": 396733151, "checksum": "89551a52d1e97b4ec3007f8c43191c1ae1475d0ba5b48d20818a12c85b0add74"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00904-of-01024.json.gz": {"num_bytes": 397497719, "checksum": "2bcde59dfaa642722969d1401a4ce43a35c57930bb1d664371efece1e2e91c32"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00905-of-01024.json.gz": {"num_bytes": 395760696, "checksum": "ec844272b0666a455dfe0cab065e00df44e8da2156a03797100418307c96830c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00906-of-01024.json.gz": {"num_bytes": 398496346, "checksum": "ff68909d470edef08929a91068e1de02841c16a000fbbd17ef042cb76f1fff37"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00907-of-01024.json.gz": {"num_bytes": 397085405, "checksum": "a9b26676af61a6a1355225bce5bbcd67aeaf0fb7dc2209f30235b275536baa85"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00908-of-01024.json.gz": {"num_bytes": 397037103, "checksum": "e86688677a46103b0b224333faf1b4f89da062e4ec0ee35752c91ff9772697c7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00909-of-01024.json.gz": {"num_bytes": 397394775, "checksum": "93082177607900bfce7fc53f1665a831093bb50caea33e014f327181579c0012"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00910-of-01024.json.gz": {"num_bytes": 396668466, "checksum": "dcfe639607c18a309e2c91864a6912dce3851abd62bbed3ba16390899e637327"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00911-of-01024.json.gz": {"num_bytes": 397926997, "checksum": "aa995c38d953237b1d6d53be7237958a00ca2dbab4a753c7c4404849fb416d5d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00912-of-01024.json.gz": {"num_bytes": 397810240, "checksum": "e3f17ac285e8c9b04713713a957602a63e176f476d4a67018012e9cf2a3e5a84"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00913-of-01024.json.gz": {"num_bytes": 397143597, "checksum": "4082ab833be47cf881693ea4442e3940625e0d2c1117e15234886fdfa779bce3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00914-of-01024.json.gz": {"num_bytes": 396398347, "checksum": "7c62dfd17b21ff64af640e4aca8fea0240998596d11ca551a3ab045d5041fcac"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00915-of-01024.json.gz": {"num_bytes": 398622100, "checksum": "69abe67cda4b1613d5f741804ccdb294cd5f457027818d9366db8cf2f5f40871"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00916-of-01024.json.gz": {"num_bytes": 397387266, "checksum": "6effa83cbf3345fd7e41e432ef82156bb1334f2cf17589bce313aebee9727131"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00917-of-01024.json.gz": {"num_bytes": 399730979, "checksum": "f0d0ff1ae76a84c07647fa1517410533862f1927fa85dbf38017dabf4607bc1f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00918-of-01024.json.gz": {"num_bytes": 396895902, "checksum": "84cc56e725be31047d0b6a025cfacefc462f4a1a546feaa34af95a6f25a4e1a7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00919-of-01024.json.gz": {"num_bytes": 395247578, "checksum": "daa3156989ddaa9a7eba228848697ccf6a385679359ab765881d2293bef107aa"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00920-of-01024.json.gz": {"num_bytes": 398305242, "checksum": "2a9e02ef643962f6009e42304b983c87bae7b74c1edcbf8e6808b320ea7ea776"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00921-of-01024.json.gz": {"num_bytes": 396446011, "checksum": "f83526ad11d81820fce4231e3303d613dbbe56a8fae878d9442c8d7e98023437"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00922-of-01024.json.gz": {"num_bytes": 398010331, "checksum": "e47cb9d7550644ef807c3ea9e19ca4aa1df54eb908b54651bf0e17f0ded9157d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00923-of-01024.json.gz": {"num_bytes": 399160018, "checksum": "470401e5b0777096806113a36dcb92b8d453d6e8f5f4f0b15df2788e382ca03f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00924-of-01024.json.gz": {"num_bytes": 396880756, "checksum": "c86e546c68bf8458951fa723c086d6efa5b210f53cd4fcb2de4b9efc7a71a275"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00925-of-01024.json.gz": {"num_bytes": 396806561, "checksum": "5d9b1105c0053dc9530c911046f4da458f41d92c771282d0df8a3a22838feaec"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00926-of-01024.json.gz": {"num_bytes": 397479994, "checksum": "c3253305ac4ef226501e4fd4a6acfc6067a76c084ad852eb2a9f5916aa3d51a2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00927-of-01024.json.gz": {"num_bytes": 397083225, "checksum": "8931df0ee597f72ea3592d0a4d236ce655a92cf4e7eb9298145f496246c18c21"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00928-of-01024.json.gz": {"num_bytes": 398000839, "checksum": "5e29e75231bdb413dedd1211bd87e9fc3f4ab8bba41999afc1ddcddc16f4599a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00929-of-01024.json.gz": {"num_bytes": 397731309, "checksum": "03f7a9199b7927a6d78a8aa4eed32c250d32dc409e3bb2847d7db948ee63d46c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00930-of-01024.json.gz": {"num_bytes": 398133003, "checksum": "b22a79dc228697394d0ce25b7d31112f9e1a6508cdc4b57af35e84e65167bfeb"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00931-of-01024.json.gz": {"num_bytes": 396694508, "checksum": "dbbc65db3d442f9ace85498a3b27bb598c20cea171b3de17d409f9b989c262d5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00932-of-01024.json.gz": {"num_bytes": 396255463, "checksum": "02af4162b084004e99dc6862c88749545593e342a83523597cada140e57a0ab7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00933-of-01024.json.gz": {"num_bytes": 399013035, "checksum": "dc4d3b4f03c36a8f1393ba15195c3f64b128862b812839689fa387e708ffabaa"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00934-of-01024.json.gz": {"num_bytes": 396593138, "checksum": "02a5a8e02b2636c9e912a9ef8a79ececde4f4fc92bea74e59791d181bec104cd"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00935-of-01024.json.gz": {"num_bytes": 396748502, "checksum": "05d1d6290580d5c74b906ab03fe6773ecaaa1ff3be84dfdef48d1a2e7f5e1120"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00936-of-01024.json.gz": {"num_bytes": 397737673, "checksum": "351d3543b1457da9719061948a1b4bdd79be8a0b786ecd6a9a8cc0db49cd2181"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00937-of-01024.json.gz": {"num_bytes": 395377872, "checksum": "d431b01bddcf911d7da5bad74a78d0d1527d60d9720f77868ef08e1a65850986"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00938-of-01024.json.gz": {"num_bytes": 397193715, "checksum": "bff5e755b174e3608ba72b39898a2bb5e9ca6d3362b70bd66143566aeff52690"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00939-of-01024.json.gz": {"num_bytes": 398044482, "checksum": "03facf22c376f03a8078e99d1dcc1c22ed5d7e179de472019cae894f40c7a4ad"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00940-of-01024.json.gz": {"num_bytes": 398894204, "checksum": "3d3a2125262ee8ca498cd54db52fe626d010a2a93c000ea2b45f931e491ea9e5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00941-of-01024.json.gz": {"num_bytes": 396758197, "checksum": "b3957de08e7779d8ec23af02a6d709189796314c70a99f46c90d0bfbd14ad561"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00942-of-01024.json.gz": {"num_bytes": 398181993, "checksum": "74aec8dec794c79683dfe43d8aece4c1c47c5389aa6d4bea847ac461cb5ba21f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00943-of-01024.json.gz": {"num_bytes": 396271547, "checksum": "231f63d05f81d249f618768c9f712cc31314dacf55a6004902a0e7d0bfb13724"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00944-of-01024.json.gz": {"num_bytes": 396603419, "checksum": "d5661730f3ed6cc5bbc5d935a6f1ac7d241b40c52dc83775a421e7a1a672f518"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00945-of-01024.json.gz": {"num_bytes": 396596660, "checksum": "3b5aeb0786dddf0b9cabe2ca071283b276822e2861d8688e38f927595c159b02"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00946-of-01024.json.gz": {"num_bytes": 399900563, "checksum": "6d5549970af2c6987583477991552e1944b411642782c07d17eb52f91e714a1b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00947-of-01024.json.gz": {"num_bytes": 395391489, "checksum": "f5544ecb42c385cd5d5120c82140e4a36051f6a401d89ce30c8f2fc08cd69804"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00948-of-01024.json.gz": {"num_bytes": 399257562, "checksum": "1448cca7f1b9824adcf8437a33d14a7e95b705396611f82e7aba9a69e0a25118"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00949-of-01024.json.gz": {"num_bytes": 396371965, "checksum": "a7eb228f1d1ff2744af3d1a1358a94611cd92c25d81edac0e209b9f81c8a0a60"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00950-of-01024.json.gz": {"num_bytes": 398022110, "checksum": "8651693d2180e518039da487f638c532c53f6d79a33356922b2d8706aa6a83cc"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00951-of-01024.json.gz": {"num_bytes": 396224338, "checksum": "c46bc8aa1621153fbd913b5d0b23a82352a28b36ec997c4df4b92dcc6ef26895"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00952-of-01024.json.gz": {"num_bytes": 397581207, "checksum": "02775930e3c420978a9d2785ee0137c3963dba7bc34538b2155eb38dd6ee89a0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00953-of-01024.json.gz": {"num_bytes": 397045599, "checksum": "9d54940cb594de6e0f8593f64293e96375f0a5c56f3569c72720476bcef1f1a5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00954-of-01024.json.gz": {"num_bytes": 395457873, "checksum": "3c12a1c3061164f345d9e402bed28be9af84ef56d5df1b22a3cf9f818ed47ae8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00955-of-01024.json.gz": {"num_bytes": 396450938, "checksum": "45db78bea4fae6cd69d900c581fccda873d2aa9f24ac5e9dfc18b486c15c3788"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00956-of-01024.json.gz": {"num_bytes": 397120474, "checksum": "7db7ea23446bd8a66737546c5daa0c2dec7bd5c4743f52eb53685ccbf54d9b17"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00957-of-01024.json.gz": {"num_bytes": 397403279, "checksum": "89de2950bc3f7dd4f95d8a0b7cba19e9678bfbc23175bc22d9f9599ec1ad9cd0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00958-of-01024.json.gz": {"num_bytes": 396861933, "checksum": "f325478647cbec9d79bff2266672144147276a82f665d3014c5d2fa9c112c387"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00959-of-01024.json.gz": {"num_bytes": 398439950, "checksum": "70d786bb337c012269caf6aeea3bf9604d279d3e4335294c72ca6cb5a9fbd951"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00960-of-01024.json.gz": {"num_bytes": 395684257, "checksum": "e1d170b0a4d6954a920ef3923688a7dbf40398609ed2ae04b2635df9ceb07821"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00961-of-01024.json.gz": {"num_bytes": 397526287, "checksum": "47b90e3747f35bf67c872d65d843f6dd9bfca15dcb769b31bf3586c6645858bd"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00962-of-01024.json.gz": {"num_bytes": 397473683, "checksum": "d0ddb2c104f515144265bd3eed526a65ada46f848183688b420694751b113272"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00963-of-01024.json.gz": {"num_bytes": 397964876, "checksum": "74725b631c1699b1166589eaebb66374c031b170eab3ab359230cd4a23a8ae79"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00964-of-01024.json.gz": {"num_bytes": 396523661, "checksum": "fa0d49a2cc726628d9a1b5ae2ace52ee90401af8ae15add27c3f4566dd99a79b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00965-of-01024.json.gz": {"num_bytes": 399289514, "checksum": "11fb1878a8b204181f7f776a764f5e9e577d0fe62d4b2e4ce2164ce9fcc30b8f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00966-of-01024.json.gz": {"num_bytes": 397411408, "checksum": "5646014ca3c99f53bd13183187b1e6e8f84cb6c846d6f1f3a3c82edb4accc47e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00967-of-01024.json.gz": {"num_bytes": 395095282, "checksum": "b799b17f36d85235eaf1bed9f4f760a22b75fca736744218e44fae5917a2286c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00968-of-01024.json.gz": {"num_bytes": 397189410, "checksum": "8d9748f5a92a9e0b836fe74b962bd2da04b62a0a2943ea5e440cef19166a5479"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00969-of-01024.json.gz": {"num_bytes": 395651742, "checksum": "f42c71219641fa302692698b4944864f27b7f87d4477a86babe23745dad72715"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00970-of-01024.json.gz": {"num_bytes": 396180197, "checksum": "383d9586f27579b4a97c5901013b3e025f10dc813047d65158d6621430803aec"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00971-of-01024.json.gz": {"num_bytes": 396574555, "checksum": "d2c9700fbac454d3b3a42b2a3c4eb0111eb7cca7cab3d545b0912aba60415c91"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00972-of-01024.json.gz": {"num_bytes": 399639122, "checksum": "5d59e643bf20156a28e5e9dfcd811c5a6c3779e1875f375db09a0fa1871dcc90"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00973-of-01024.json.gz": {"num_bytes": 395456709, "checksum": "8b22e82588e30f30f664895b9716cbb0cf38d5ff4331d3be31ab25663c634a00"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00974-of-01024.json.gz": {"num_bytes": 396693438, "checksum": "5fba4f9d634d968f15d5d4fb29d253646494e3e125aaf1c2f8fab38a7e60180b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00975-of-01024.json.gz": {"num_bytes": 395697641, "checksum": "b4c5fceb9fa2397a9b7c75249bd3386b8dbf999d5b52521051a86e067d698448"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00976-of-01024.json.gz": {"num_bytes": 397172005, "checksum": "093aa01a944a222828656d31dacd8ecd57a24a51d361a8742514bb6af009dce9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00977-of-01024.json.gz": {"num_bytes": 396182407, "checksum": "1beef6e248c00abee5f8952641b12d3f5b12d58adc05c8d461c0a073a6ca9b39"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00978-of-01024.json.gz": {"num_bytes": 396180428, "checksum": "0f2bb125af300de2c9fe347899673a4bd2842ba8298146bfe94c9eddc41893cf"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00979-of-01024.json.gz": {"num_bytes": 396479117, "checksum": "1fe9d0e54b9be79722e6483e386801263ca51d6e9ad925dabbb58a38c4df877e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00980-of-01024.json.gz": {"num_bytes": 395119279, "checksum": "0f262ff2d4701497f6fd6d4f9d3cb1aa3a730ad6bef1961d890a3b0cb4747ee8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00981-of-01024.json.gz": {"num_bytes": 398285798, "checksum": "a295b85e63c176cecd9f5222ba417eeda307e41847eb38c61dec9b83101a8256"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00982-of-01024.json.gz": {"num_bytes": 397811687, "checksum": "2a3a0e0f454dd72a68ed1dd71c508a9b24fb2349ffdfc588cbfcef728cbaff05"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00983-of-01024.json.gz": {"num_bytes": 397069906, "checksum": "5b4256392755c4dd79cd37cd6ede645a9a549c4436acd27495e974ebe1d80bc7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00984-of-01024.json.gz": {"num_bytes": 397670152, "checksum": "68d4f5dbb3fa349a6811edce8056eb297e771cb9c9939c3a84d30c6ba3ad9dc2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00985-of-01024.json.gz": {"num_bytes": 397949975, "checksum": "6ba478b8a1ebf3b1dd67ed7b4a055cc9cc3c01bc90c1852aea8f5a99f6c07e69"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00986-of-01024.json.gz": {"num_bytes": 397730984, "checksum": "a39a23589cc434e573613e3ead44f33adb005c2c13cea8b33601647c97300fce"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00987-of-01024.json.gz": {"num_bytes": 399173506, "checksum": "eab46d9d0a0cf05dc5ba475017d98f02f1cfd756c8e707d9823a0463713ebf23"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00988-of-01024.json.gz": {"num_bytes": 398674037, "checksum": "88749d380aac85314df66448542b696e9ae6f61f1b27dc395556737f59ad9024"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00989-of-01024.json.gz": {"num_bytes": 395313344, "checksum": "bc565b662396e3ab4e108635e01873014515663bd5216926a59ae80f6cd4273b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00990-of-01024.json.gz": {"num_bytes": 398567254, "checksum": "e9b9bd97a30ccac353a2386babbd01c3a3bbede8c07bc28d17aecc7ef5af6330"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00991-of-01024.json.gz": {"num_bytes": 396958611, "checksum": "505ab5458d5e52d656048284fd22cc0fcd16e49ba19331669239be37645cb04e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00992-of-01024.json.gz": {"num_bytes": 396102263, "checksum": "59ac5b2b04f224be04a4ceac6a16e29a33681f19cd40cbce3d3e8eb961b9f33f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00993-of-01024.json.gz": {"num_bytes": 396935362, "checksum": "c804f2311de9f7ae5691280e16261b9f8385ef9a71929b2111dfade532b6bdd7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00994-of-01024.json.gz": {"num_bytes": 398832432, "checksum": "594727bdc3756e678bd4d156216712ed6c8fc98d3f8e9594cfbed10b2e414554"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00995-of-01024.json.gz": {"num_bytes": 396699737, "checksum": "bb3c73c6d48aebf9c60cde56944faa5bb6727db4cc48ae23d67650742462c42d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00996-of-01024.json.gz": {"num_bytes": 398059244, "checksum": "ac1a7e6e2c2a5468c704f5a2318b5617dd4ce140b98271e2034e00015db6cd76"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00997-of-01024.json.gz": {"num_bytes": 397439167, "checksum": "ce9664b29c86c05d3541aee377acdca7a32ef8f0220e0b4b6bf18276b692529f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00998-of-01024.json.gz": {"num_bytes": 397383159, "checksum": "1b4db1b59255f106dd2af7510112eef6d6b611d9f9e000a0e585b623fdb8ae98"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00999-of-01024.json.gz": {"num_bytes": 396339114, "checksum": "ee5e1508704b03f0a9cb3c4bfb578c08fb83a4d20760e3b40f101c58cbbb3ec7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.01000-of-01024.json.gz": {"num_bytes": 395172166, "checksum": "f8cbf0bd9c2b90e588942048848fbfa1a20cf775364cb9c84b4d5dd7cf19e603"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.01001-of-01024.json.gz": {"num_bytes": 396629363, "checksum": "7cad3f9a28e5988ef91073c48e9d85ea7030289690f817545cfa9f1165dd33d9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.01002-of-01024.json.gz": {"num_bytes": 396507390, "checksum": "b4ae1017913509855d6d8d4413ff3de4a8d519d91f354b6e5b5267219d20658b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.01003-of-01024.json.gz": {"num_bytes": 397652598, "checksum": "0c115446c159d27e6e1354173ebec29e6dff5f38c4d2ddb46c07c450523309c9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.01004-of-01024.json.gz": {"num_bytes": 397408971, "checksum": "f0b559a832a9ee50225fe1417d936d6b898026d80a105b976deaeae75f9e30a0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.01005-of-01024.json.gz": {"num_bytes": 397753911, "checksum": "e001c9285ade7de6ac23716b596ddcc733f05bd6abd7e1a67874894c93fbd43a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.01006-of-01024.json.gz": {"num_bytes": 397962701, "checksum": "acf13433824104e4bfc3a8aaf8805eb16712cd97b2dc1d48e7d771bee4bd41c0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.01007-of-01024.json.gz": {"num_bytes": 395966285, "checksum": "4c6069f6a95d036fd3e05a4246db932ad5ab89b9470274f23a17df0b77b9b717"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.01008-of-01024.json.gz": {"num_bytes": 397075505, "checksum": "9b3b9c0cd4ee02e18a5d22142183874586da8fd23b4f97033e354f9681d150a2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.01009-of-01024.json.gz": {"num_bytes": 396881470, "checksum": "14d2d7cf2ebf3b2c73bad4a6099fa1d2b1cb341b100976b03232fb664a7d020e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.01010-of-01024.json.gz": {"num_bytes": 397471393, "checksum": "01e6f56bebe0c874d82135f551a6b917759c41af48d127df181267dc9b8f6486"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.01011-of-01024.json.gz": {"num_bytes": 398092801, "checksum": "ead5b6b13bd09136fccd9548c224398401bda0ca7ff62ca4db852760760f13d3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.01012-of-01024.json.gz": {"num_bytes": 397831436, "checksum": "daa2d1507f9b56de0c4aa9d86d93259c1e6f73f0cdfd553ce075a16807dbcb56"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.01013-of-01024.json.gz": {"num_bytes": 395098326, "checksum": "c2b21a1a56e9879335c72008919e8f7998dcc1e8df2258fdf2196ea86194e3cc"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.01014-of-01024.json.gz": {"num_bytes": 396164077, "checksum": "0df125946c83c66c6961eae2aa45ad7eea7038d808281d633ce30686a8245e01"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.01015-of-01024.json.gz": {"num_bytes": 397895284, "checksum": "f6f6eee8fc113b7e717654b9305cc5129c3ee1ce9f263b91f0202762f078a526"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.01016-of-01024.json.gz": {"num_bytes": 397723033, "checksum": "48426df1f4665d3179251904c96a0e73c041ed5b57885b4dd852809e632685b6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.01017-of-01024.json.gz": {"num_bytes": 396761053, "checksum": "f33cf2d744585e0338b29a5a5638752123b7b59f9ae3b723cf7e7b536f9f80ed"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.01018-of-01024.json.gz": {"num_bytes": 396562520, "checksum": "72adb0869cac573282c4bd938cdff556f659540dd4a0a6663711974cb2dc147a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.01019-of-01024.json.gz": {"num_bytes": 397564701, "checksum": "3b64235effaf41ad61698b2c28f4d73ced1b6ec6b6d79e0f52314176fa0feb12"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.01020-of-01024.json.gz": {"num_bytes": 396053080, "checksum": "b16b9f815823d176f94388d4c482652ac656aa763ec738ccd8c8a2a3bdefc1e9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.01021-of-01024.json.gz": {"num_bytes": 394731398, "checksum": "f4c0044abadd339055bf13843938eef4c066856757250fc15f77060fc0881ba6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.01022-of-01024.json.gz": {"num_bytes": 396548645, "checksum": "5ecd8432526eda57065e6161f0618a19cd5993c7dfe86575775f1bf01836f750"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.01023-of-01024.json.gz": {"num_bytes": 396863581, "checksum": "c6cd29b8f6067152ccd584ded81df1f9cb905515d48815b8a546d104ec7a3565"}}, "download_size": 406611392434, "post_processing_size": null, "dataset_size": 2059256402722, "size_in_bytes": 2465867795156}, "realnewslike": {"description": "A colossal, cleaned version of Common Crawl's web crawl corpus.\n\nBased on Common Crawl dataset: \"https://commoncrawl.org\".\n\nThis is the processed version of Google's C4 dataset by AllenAI.\n\n", "citation": "\n@article{2019t5,\n author = {Colin Raffel and Noam Shazeer and Adam Roberts and Katherine Lee and Sharan Narang and Michael Matena and Yanqi Zhou and Wei Li and Peter J. Liu},\n title = {Exploring the Limits of Transfer Learning with a Unified Text-to-Text Transformer},\n journal = {arXiv e-prints},\n year = {2019},\n archivePrefix = {arXiv},\n eprint = {1910.10683},\n}\n", "homepage": "https://github.com/allenai/allennlp/discussions/5056", "license": "", "features": {"text": {"dtype": "string", "id": null, "_type": "Value"}, "timestamp": {"dtype": "string", "id": null, "_type": "Value"}, "url": {"dtype": "string", "id": null, "_type": "Value"}}, "post_processed": null, "supervised_keys": null, "task_templates": null, "builder_name": "c4", "config_name": "realnewslike", "version": "0.0.0", "splits": {"train": {"name": "train", "num_bytes": 38165657946, "num_examples": 13799838, "dataset_name": "c4"}, "validation": {"name": "validation", "num_bytes": 38165657946, "num_examples": 13799838, "dataset_name": "c4"}}, "download_checksums": {"https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00000-of-00512.json.gz": {"num_bytes": 30085821, "checksum": "6666a680b0a34eb8756dcb5fd2b12f0078237f3502e8a513bd3e5b71bb92be00"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00001-of-00512.json.gz": {"num_bytes": 30065900, "checksum": "61c3f9ab763067f76d9bea349d86efb97af7539d481b5d2807f362204971c327"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00002-of-00512.json.gz": {"num_bytes": 30028880, "checksum": "3aa4405d957ed42d10d643efe7c0f51b05e8f29cf4ad8783448083c1cd3f2a24"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00003-of-00512.json.gz": {"num_bytes": 30136880, "checksum": "f6eb49e4c0d691e67fe96ddeb3f8370c5e63a7297a31a8da0c58f5cb3a9f6061"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00004-of-00512.json.gz": {"num_bytes": 30110499, "checksum": "6e0908780f555f4b74c6a5055e2c9708333a8466f0b8723a8ea38cc04828ce44"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00005-of-00512.json.gz": {"num_bytes": 30097927, "checksum": "a333562df3fcd4c5ccf51b4c00e11f6619ac4a28a878383aefad277bd30131a6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00006-of-00512.json.gz": {"num_bytes": 30013820, "checksum": "7c436cd0993077187988239cf74c3e64de440dacad62ba4b02bd4ac0a8d219b6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00007-of-00512.json.gz": {"num_bytes": 30557005, "checksum": "dc9e43681c404fef1741e9608295b8dfae0953473993f3fc44fb83af07a6b82b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00008-of-00512.json.gz": {"num_bytes": 30369535, "checksum": "8de7a4005acdb60436b4e5d7274084e28df3aee31a5457c6837452094544c541"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00009-of-00512.json.gz": {"num_bytes": 30033048, "checksum": "32310a6c74cbee1dbb8b196e0cfad41f79e88e48d8f04c88692d42506113b903"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00010-of-00512.json.gz": {"num_bytes": 29948345, "checksum": "b7df217de849e26ecce5ed7a35b6e6238fcc1c08e969023f209307842dd496c0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00011-of-00512.json.gz": {"num_bytes": 30558885, "checksum": "82e5428aaeecf27141a7105e48b78dc02516ae6ebc3d6cd4ef13963316279e1f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00012-of-00512.json.gz": {"num_bytes": 29888513, "checksum": "f3d7e496b7c85ed7d020c8f8a24a0b27f9b2535abdb22b45c08441a29398c44c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00013-of-00512.json.gz": {"num_bytes": 29936292, "checksum": "bf04d82f0cdddc09ce4aecd9f71910b9858badaf6456253d43d89e6a8c56cba7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00014-of-00512.json.gz": {"num_bytes": 30169338, "checksum": "15b4611513154de0dfc1c9d470326fd053adf70de814ecfe8ba7ccee66de947e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00015-of-00512.json.gz": {"num_bytes": 30071363, "checksum": "887bdea83bdefc50786c93e8014d1d49999f8090ff15168598c884cd0724fec2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00016-of-00512.json.gz": {"num_bytes": 30451660, "checksum": "288ad0d553d54052354be506f87878fa7c54b0fa65811c6e456b3262e1d117e1"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00017-of-00512.json.gz": {"num_bytes": 29940254, "checksum": "b13ad58ae9f38598cb9d560e3ab34c1d0200db73fe86da12230e50086b532463"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00018-of-00512.json.gz": {"num_bytes": 30282186, "checksum": "5a67e71955ab2d8f6531bd3949cd8ab71f4ff91863ea5a6ec3e7b33c31a05dd6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00019-of-00512.json.gz": {"num_bytes": 30373907, "checksum": "a70682315a0cfe0af815c7b2abbcd63310fabbc33ad6e19daad19f1f51506955"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00020-of-00512.json.gz": {"num_bytes": 30104199, "checksum": "980e544ce130a06e9e99ec906342eb0ab8aeaa96ac26eca01c56ebb463f5d688"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00021-of-00512.json.gz": {"num_bytes": 29733696, "checksum": "a69729b8f3ccb9db12476a31917783c1c6e036e7bbbb4089f430362aef71f467"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00022-of-00512.json.gz": {"num_bytes": 30012894, "checksum": "589e698fe450e22cba47813a5a28da5393e79702a528f6a8469f72f6d630caad"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00023-of-00512.json.gz": {"num_bytes": 30024851, "checksum": "2a7b036c38fb4d2df6535631018c23d001931e5bf8d8a815fd5b2f9343ec4529"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00024-of-00512.json.gz": {"num_bytes": 29906809, "checksum": "7e512306cb6ebb0b0c3e96ceb16dade9e1e1f484e754bebd0078e7f545fc5b6a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00025-of-00512.json.gz": {"num_bytes": 30332268, "checksum": "b636b91fcd9a91ce05b8cbeea6f591a0e916175ab23b0cfaf688171c8a98ae8c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00026-of-00512.json.gz": {"num_bytes": 30288490, "checksum": "9e2f8e2a37dcfe66873cc5355740448ef75a1de2deeb2d8c047c3c3a7ee485c0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00027-of-00512.json.gz": {"num_bytes": 29897688, "checksum": "882616d1e8ca66c0b6e7aa2ccb18d9239021603ab1b9486638a9a3447ddebe0b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00028-of-00512.json.gz": {"num_bytes": 30201690, "checksum": "0312b12f50c64fbe7b894a28e0940089ad57af95df8116cd7d43c0435ec2e79b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00029-of-00512.json.gz": {"num_bytes": 30237920, "checksum": "1e8677140186b219d32e764889dcc344ccac9db51685363324d1bc13ddef2bb7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00030-of-00512.json.gz": {"num_bytes": 30048903, "checksum": "43558e81c291cbf53a5b6a016aecb0e07e26a98b8fb32f4a000037b281afa363"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00031-of-00512.json.gz": {"num_bytes": 30294528, "checksum": "c33ae8a2fad7e5264d093fbe89ed1611357110a4f0f26dd5a93a4dc15560f205"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00032-of-00512.json.gz": {"num_bytes": 29868168, "checksum": "5dc2a8f96db8da87607efc0b708e6a2172530f0c9b43665dc01286109b5c55bc"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00033-of-00512.json.gz": {"num_bytes": 30105916, "checksum": "c4cdc2b39a86eff251f903d7f3d39605b721615aeffa6a2753f3588b7dbef6c4"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00034-of-00512.json.gz": {"num_bytes": 30126174, "checksum": "6d874182112b0881dc929c0182a30ec4f9f1633372a2b822200a7b1faaf4f1bf"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00035-of-00512.json.gz": {"num_bytes": 30084101, "checksum": "5bea17f0cd4dd888f5d8a2d4092138e4777d80493a1f410d618d4cedf353b914"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00036-of-00512.json.gz": {"num_bytes": 30095974, "checksum": "6e7f42f3012d8ca7500c7e2ec82d27c26b3cd8bb5b8b66a7fc8355d77284f433"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00037-of-00512.json.gz": {"num_bytes": 30239345, "checksum": "54ee45bf25152060679bab3e5fc6f5cb5a3add6acd2664cb152f88c223f83239"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00038-of-00512.json.gz": {"num_bytes": 30247683, "checksum": "f738a2f0f156f7bd897d9d822748d4192a5fe46b566c7288ed5b840c4ffeda64"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00039-of-00512.json.gz": {"num_bytes": 30057005, "checksum": "60235900d69579334660c153c4fe384c08f14f4e729a06a1e8247e8b4ab8a213"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00040-of-00512.json.gz": {"num_bytes": 30185136, "checksum": "5a059d64fd6a1b42a2faeb4088db327c47f9e8328737ab74a0e0457f84433374"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00041-of-00512.json.gz": {"num_bytes": 30314653, "checksum": "2cfdc460c8dd0fb4766191ef2aec0af856af7c95d11eb3f1d731f63b71db4daa"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00042-of-00512.json.gz": {"num_bytes": 30123256, "checksum": "64e59b8ebde3c12b0a1d218a302252b96aeb5bb4976927463101a9509579ec22"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00043-of-00512.json.gz": {"num_bytes": 30057043, "checksum": "edd200b97394f15f9cf0a6289406a83b42c3d6f961456f031f5814db4f6d482a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00044-of-00512.json.gz": {"num_bytes": 30029900, "checksum": "1b2980f21ee5cffb271591adc8eaa414438841426442f194b5f4b703356f4e5e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00045-of-00512.json.gz": {"num_bytes": 30367170, "checksum": "83967210891345b831956722e8dcd29cf55fb17b786c85c2dd2778528ab4d1c2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00046-of-00512.json.gz": {"num_bytes": 30105866, "checksum": "6921ac4854e2eacaeb4be07669faab85f2bab33f744c7efae1ce17be25176bb5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00047-of-00512.json.gz": {"num_bytes": 29957618, "checksum": "e8eba2ba9f51e76a06a2df43b6b120c47b6e41f61e46a2e3331518ebb2d0c84b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00048-of-00512.json.gz": {"num_bytes": 30329887, "checksum": "6af9c44a53d7eb9df9d86ee4d895fb9f7f2b9b3863fd30aae325e79fb792a10c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00049-of-00512.json.gz": {"num_bytes": 30116207, "checksum": "57dc1e94f73b55e0be5690b01d61188a62186ea9f5f85b556ecef3bcaa36fb92"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00050-of-00512.json.gz": {"num_bytes": 30236341, "checksum": "eb75bdf0e63e798838b3d7abfc6a3bfab5de2ba39af833c38048dfe39c1175b1"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00051-of-00512.json.gz": {"num_bytes": 30357091, "checksum": "f48b1f5e07311ca9d69787019a56ad849932e6868d1f7778681cf7e4cc9fc562"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00052-of-00512.json.gz": {"num_bytes": 29944959, "checksum": "debf9490c057f11e404898b4a57cb424c1eb523fa90bb7899b1317f970481638"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00053-of-00512.json.gz": {"num_bytes": 30240416, "checksum": "9e847a5c6eb80e5c045fbb405729c695911674bd8d29b1d0be0791303d02f41d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00054-of-00512.json.gz": {"num_bytes": 30174556, "checksum": "65a80db1cdde9153e08277ad2d9074dfba1682c0f771fbb9f4aa8f88ca557f43"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00055-of-00512.json.gz": {"num_bytes": 30134394, "checksum": "beb8d280d322520ded21aec92ae087867d0bce64aac4e243a127a88f143ff578"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00056-of-00512.json.gz": {"num_bytes": 29891026, "checksum": "82fceaec35a2456487a59ae652d72f41a940d2d6bafdc4f05a6e02bcd7ed4dc9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00057-of-00512.json.gz": {"num_bytes": 29920525, "checksum": "e4fd55ba5fb2825ef4209aec87706ecdd3db040242c6aacfc82f350765fbeff8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00058-of-00512.json.gz": {"num_bytes": 30060421, "checksum": "3cfc894a1853e3d1f2daa314873b7919fa52b7208b590637f8face6536305770"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00059-of-00512.json.gz": {"num_bytes": 30038488, "checksum": "4f06ab7b5ce8e8c696445db4a3e32896b6396e3f67d7414a593e7398d752e564"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00060-of-00512.json.gz": {"num_bytes": 30129718, "checksum": "7923385ee0c6801073feb10437ee3c59e5f5dfe82c2311ad8c4ec670dcc0ec87"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00061-of-00512.json.gz": {"num_bytes": 30130505, "checksum": "5cd682e148b8488775622098214fc2009ef9c95355f46341bd78434f1b560fa2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00062-of-00512.json.gz": {"num_bytes": 29968130, "checksum": "53562fc23501f3a1d11c8ae6a59e719d6f4e67db8b8ea1d55e2b1b80849afd08"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00063-of-00512.json.gz": {"num_bytes": 30116532, "checksum": "008cc5c0cb7d60e84ffdfe2132f6bb49aafbb31083fd026067b3859326ca64fb"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00064-of-00512.json.gz": {"num_bytes": 30236194, "checksum": "8f9eee169071e80c94c248f1c37b7fa631bd75a7f6e401f6a963aecd8815910b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00065-of-00512.json.gz": {"num_bytes": 30077312, "checksum": "8c5e18ea3575cd350e98d062ef88d3fd1df068e4bd410be8732723bda03656c0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00066-of-00512.json.gz": {"num_bytes": 29920862, "checksum": "e377b8112dc6ff6834607c27b927636429e887f4ab8edc0824363941b7bb311d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00067-of-00512.json.gz": {"num_bytes": 30278223, "checksum": "ec2c2ac74cc3f4f814d645410cccda266151949dd36aae518b8082b948b47edb"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00068-of-00512.json.gz": {"num_bytes": 29940464, "checksum": "ddfc16a17cabf48a2c59fa8ef25ccd12d899d3462d08b45f2a301567ccc105c4"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00069-of-00512.json.gz": {"num_bytes": 29903118, "checksum": "66d9d1791cda56607b2561199503cef216df86b28d4519d5862905671a4ec4c5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00070-of-00512.json.gz": {"num_bytes": 30082323, "checksum": "8072d3bd5e19c005493c0332b73ca5be253397f54be90be1bb7b2ef8df7ad117"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00071-of-00512.json.gz": {"num_bytes": 30128276, "checksum": "b7c68af5a6dcac3fbb3dcbe12123d1045a79baf657a8b3bdada60c1a97404c48"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00072-of-00512.json.gz": {"num_bytes": 30458419, "checksum": "cfe5c6ae2ad1531271b0039042e033bdd7caf9604bfa219980ca27513cea755f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00073-of-00512.json.gz": {"num_bytes": 30366974, "checksum": "a132f5e85376b0d0a06c6ae6af9c226dcbc98394461578c4fbc6cd439ba6e721"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00074-of-00512.json.gz": {"num_bytes": 29987779, "checksum": "f905e808b50908a7d2a7f0944e7e6c01ffd97ec16e5f0b6ed7169a60d66b0100"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00075-of-00512.json.gz": {"num_bytes": 30070204, "checksum": "b57458683803936f6bc03b06fc26be9d1a09ba09517b5c1518676f468e404595"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00076-of-00512.json.gz": {"num_bytes": 30129238, "checksum": "81e88ec53e39d6191e40e5852564f592b745abf99c71ff78302292632f636792"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00077-of-00512.json.gz": {"num_bytes": 30051399, "checksum": "218b0f6e219e42113e35d99458861f8511266dee6c17d9e2780a17af8877f822"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00078-of-00512.json.gz": {"num_bytes": 30144230, "checksum": "c0a337619559362e0e1cd0fe87c9ced5c987313a7f3cb65eb44f8b861c41c616"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00079-of-00512.json.gz": {"num_bytes": 30544297, "checksum": "27e257efda6adbce01585b3b6cdeefa95d31f607012fed5dd4310bfb5a790ba7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00080-of-00512.json.gz": {"num_bytes": 30188866, "checksum": "26411f1a0a7b299d0bf6cf78db04b0bcc617894cd87d59e54614f3258dd393ee"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00081-of-00512.json.gz": {"num_bytes": 30418881, "checksum": "87a659f6b24560a754ccbfb6aee019484e48e3ddc7955a6c7a18aa9098952cfe"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00082-of-00512.json.gz": {"num_bytes": 30086460, "checksum": "708fe5108042b957688817625c84059c11700b18ddcea3814b86b6c8c66af8a5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00083-of-00512.json.gz": {"num_bytes": 30138639, "checksum": "8d8681519538afdb7622b677ca5d3ae2a643382bae9639e3ad90c82d36477653"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00084-of-00512.json.gz": {"num_bytes": 30228150, "checksum": "db708760b9d45e0b20c8dde9b0008f01761d9bb0f37a194845b4d097a60e477c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00085-of-00512.json.gz": {"num_bytes": 30004564, "checksum": "19ba55c7cbc44ae30a6497373fc15b548e5c45667f790c392857f6fdaa7e2bf6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00086-of-00512.json.gz": {"num_bytes": 29696360, "checksum": "4cb07dd259a084818f9a79a4fe4fb7b24ea1adda0cd4fd405ba003e7bd481f12"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00087-of-00512.json.gz": {"num_bytes": 29927300, "checksum": "7c3c07dbc9c57881a3c1abab85a927f1ba609c58da9dcec22d7415079cd336b6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00088-of-00512.json.gz": {"num_bytes": 30038333, "checksum": "59158c87d7e9e5011516f98dec1313758072ca6685c7ad9df5ee4a075d9ff8a2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00089-of-00512.json.gz": {"num_bytes": 30223506, "checksum": "d3f39f7e90b4a82257779290a3f2de5619049d69b2169577f1e3c81791d85419"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00090-of-00512.json.gz": {"num_bytes": 30266969, "checksum": "88ed3237aadff809cec186fa378e176774d3f32aef1a6d8bfdbc530f64e8aed4"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00091-of-00512.json.gz": {"num_bytes": 29885840, "checksum": "b9a247993a8eec31b3f853d1329ae79da29397dd27eb4acdc196b71c091335e3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00092-of-00512.json.gz": {"num_bytes": 29942337, "checksum": "3d83cc54c06cad8effdb7a38ed6666b5d912e6fffcf4c82471af064b0aabe05e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00093-of-00512.json.gz": {"num_bytes": 30129376, "checksum": "d72ed9855fa86ceb4089435da3d78e8d4151b92185f828329b534d1adf3821db"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00094-of-00512.json.gz": {"num_bytes": 29613450, "checksum": "f61f74aa65a81616b97cbc34a8be1b563f83f69709642b8156eb76cdda02103f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00095-of-00512.json.gz": {"num_bytes": 30469526, "checksum": "926d1ba2e4b191e75b0bce0cbe4c15f95f244445ec03a6095c009c34e36f897e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00096-of-00512.json.gz": {"num_bytes": 30126036, "checksum": "e74818ad94e408498644dc71f1ed967f356f539418222f1dfea467a21c99badc"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00097-of-00512.json.gz": {"num_bytes": 30374980, "checksum": "d9cc8827ee38bddd1a31e48b2b0064a567520e3c0f2e1be745acef57d267e4d5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00098-of-00512.json.gz": {"num_bytes": 29928579, "checksum": "090ad37fd9eaeb53308599f2da1053b19b1c6478adaea5a8a1c35d6c35340111"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00099-of-00512.json.gz": {"num_bytes": 29901456, "checksum": "c0e7d9a7cbc3b9b940077508441e471a1eb70e822479fcad726b900e6c196382"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00100-of-00512.json.gz": {"num_bytes": 30033459, "checksum": "b62033de618191de3200205e6e40725baf045e403060d10417211d47854d6bb0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00101-of-00512.json.gz": {"num_bytes": 30280468, "checksum": "8726d092785856ec690dcd8a9edcd968cd04af1cfafe8a83192e3c0782f02b4a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00102-of-00512.json.gz": {"num_bytes": 29805195, "checksum": "248edf4dd6c9a1137c7b45ab0b5a05a5fc93fd14cec17a5da4d758b9f7b359df"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00103-of-00512.json.gz": {"num_bytes": 29995494, "checksum": "d66b75c3f08a0db141d2c0162eb3dbc351e656ba1ba480e77eda051435d1390f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00104-of-00512.json.gz": {"num_bytes": 30318447, "checksum": "09bd2068c20d33783f39322c95756fd3dbd0da91f4380fae3822cb33b7d06779"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00105-of-00512.json.gz": {"num_bytes": 30209523, "checksum": "0a399ecb1116890e1a0189cd2842d64d8ed53213b1623ae38229a6ac4f5c1c76"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00106-of-00512.json.gz": {"num_bytes": 30476739, "checksum": "540f682a7c977d20f920b5af1ec7e40c14a0d54f1718b43271e22dece9cdce16"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00107-of-00512.json.gz": {"num_bytes": 30203291, "checksum": "0dd51deb74ab391c54b20862f7df561f74d00be2ee4fc13987f91771870c099b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00108-of-00512.json.gz": {"num_bytes": 30265100, "checksum": "172b09a108b154014077a415f644cd16db6a66f178bf780c120a6c4fecc3c0a8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00109-of-00512.json.gz": {"num_bytes": 30342649, "checksum": "214a8f147f2d77ec0f3889b0a2d782e5d44230878359e695e9523561e6723a1d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00110-of-00512.json.gz": {"num_bytes": 30152418, "checksum": "dc0d34ce7918b80ecef3528ec2b063edf7b12223c453ac7fb9d39232fecd81d7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00111-of-00512.json.gz": {"num_bytes": 30160329, "checksum": "d0594cb69d26f0e853575d86f92b1aa233b5bb236804a2f496a792fa031014ee"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00112-of-00512.json.gz": {"num_bytes": 30428351, "checksum": "2b0542d973bab88e696fb9efbe042167600da397d776ef65344dce868bbcb0b9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00113-of-00512.json.gz": {"num_bytes": 30200133, "checksum": "10dcb929692795fefcf4623040191d9cb6199fbb3b164648b62b9867e8392379"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00114-of-00512.json.gz": {"num_bytes": 30205273, "checksum": "f16631d5bcbbe133a01675286ca7667400ecc7e6df13d728015381d21ec71cfc"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00115-of-00512.json.gz": {"num_bytes": 30164849, "checksum": "bed27819db4bb7e02cb42cdda18acd232659a2eaa43eed910ba26d686cb3f837"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00116-of-00512.json.gz": {"num_bytes": 30117752, "checksum": "4eb4bec7adac3c2f431d356212f8a9d47136f0011f5f9e71dd29d82b1b823e2a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00117-of-00512.json.gz": {"num_bytes": 30062588, "checksum": "79639624734885b3051b10f052f5486d7124bbc4bcd18d99348f3683ee2fc54f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00118-of-00512.json.gz": {"num_bytes": 30125828, "checksum": "e922a4a5332a4182ddcf6ac8ba910024fe4fa878b524f7368b27373f75bbfe44"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00119-of-00512.json.gz": {"num_bytes": 30156741, "checksum": "a44aba8779b99ace2f212789389af058d12dfb0706221b296676d5e10528dd78"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00120-of-00512.json.gz": {"num_bytes": 30489925, "checksum": "82bec41bbea7bc5ddb67b3bccea51122da7d0922768f8bda7a0c9d489bd20cdb"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00121-of-00512.json.gz": {"num_bytes": 29606989, "checksum": "b49238f5b75aaf876657826cfbd4346d250f564a86bdb010aa1e85b44a969229"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00122-of-00512.json.gz": {"num_bytes": 29770557, "checksum": "0803ccbd505db47cd09b20d86cc6ad459c7a8d1c583a5ee756b0397369d8b6fc"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00123-of-00512.json.gz": {"num_bytes": 30248121, "checksum": "d73a1bf285a0355bd61a25891cd8c5fd9da66535ec515dc7e1602a769b994727"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00124-of-00512.json.gz": {"num_bytes": 30131013, "checksum": "65d2dcc7e63a28e1911717d149b907d0c74fda6e36db2840353a0290f7880324"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00125-of-00512.json.gz": {"num_bytes": 30348971, "checksum": "5dee3c7afe0364ccb8e36647d01e78ffe61690f29f29aa033efac9a0413c2a47"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00126-of-00512.json.gz": {"num_bytes": 30370074, "checksum": "1dc04b3755291842711623d1d6cf042e2d66987103a0c708f01c9136a8c42db6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00127-of-00512.json.gz": {"num_bytes": 30320846, "checksum": "e31a27ba25bdf13e6f929fd38d53409dd3f50be78ad955b69b1956709de5aedb"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00128-of-00512.json.gz": {"num_bytes": 30076235, "checksum": "122ee9d293428a7a823c17b3a432b5b2198fa2a68bbb246b97e981bd09f78f0c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00129-of-00512.json.gz": {"num_bytes": 30569486, "checksum": "918bf43ce3ab54d535dd02cbcd09f1081890be3287e23fd81bfa032beec61ebc"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00130-of-00512.json.gz": {"num_bytes": 30280169, "checksum": "ab0a53e8c10dfdd139281175b5fcfe3090fa238fcb383e27b1dcdfdbbe8a879c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00131-of-00512.json.gz": {"num_bytes": 30338899, "checksum": "e54771e12a6f3583c3accf9bcc01b598819231f367e7f80cbd44cf6683c5c852"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00132-of-00512.json.gz": {"num_bytes": 29969011, "checksum": "f69d7052ca7657fdebe547a6e196b109285d5d4e4f1a68f3900a37ba6fecc22f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00133-of-00512.json.gz": {"num_bytes": 30179558, "checksum": "cf2130dedafd8f47e97661a5b1555813433e3f7293b5c5cb222cf551d90a0604"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00134-of-00512.json.gz": {"num_bytes": 30080257, "checksum": "1a32902fc21633ae8d41e4e5518804f4c719dc8729b866ebc32d3c36fdadbc10"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00135-of-00512.json.gz": {"num_bytes": 30284972, "checksum": "6e3a78e7a530d91ee4578caf462a4c685a5f221f0cd8eb9639c9067e2b655a7f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00136-of-00512.json.gz": {"num_bytes": 30130265, "checksum": "defc57340cbaa5f325994a91b5134789c84a76a4ca7b9fdbf993b0e634735f05"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00137-of-00512.json.gz": {"num_bytes": 30146793, "checksum": "7ce5035f452eb2e1adeff36d0c6d6d65c245d139a86ef48bbe10c5275975183b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00138-of-00512.json.gz": {"num_bytes": 30180265, "checksum": "298849a53a8ea0e68d01cc137195bc36d686077bed722e1198337a1dee3c51cf"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00139-of-00512.json.gz": {"num_bytes": 30398387, "checksum": "ef2ac4b8f195141a79a357d934d5d97bd4d2c64027ec7509b5873a4ae32fcb9d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00140-of-00512.json.gz": {"num_bytes": 29652990, "checksum": "290f1c99b696e345aaa6ac6d5a882a87dcf5d3939b08ba859a359d2459498785"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00141-of-00512.json.gz": {"num_bytes": 30083642, "checksum": "fb6a38388a25261d86fbd8ffea63e06bcbcbd6846a4eb6f13fd09d7fe5a1fbc3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00142-of-00512.json.gz": {"num_bytes": 30131064, "checksum": "b61ccf6166ea4b777629bdc07d543f299bf7569deab18228ec5bb9edc8cd3eb5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00143-of-00512.json.gz": {"num_bytes": 30244435, "checksum": "22812c50efdfcf2c0fdcf593639dfea09ffee8068321c30effc669c8234d4f3b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00144-of-00512.json.gz": {"num_bytes": 29725094, "checksum": "79cfa65a3115193629d16606643d90dcf27d3108c320cc9e364ba19fdb9fb1d6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00145-of-00512.json.gz": {"num_bytes": 30335033, "checksum": "e836f0bc9acba85fd1721d19cc24054e97defb0d12678bdc0d086f40deb9b1a6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00146-of-00512.json.gz": {"num_bytes": 29905680, "checksum": "bf684871a235078390d6c6bb03fc2d5bbffec2b095806df652a19baf5e67135d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00147-of-00512.json.gz": {"num_bytes": 29852459, "checksum": "0e716de5b3b09ec287b039be0f0dd6edd7d541aa6d3f9d2be18768e1cd5f4cd8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00148-of-00512.json.gz": {"num_bytes": 30364788, "checksum": "4cef624e6b7c2b73dbfb47227e31681223a5a9369c4b7daef8606b796f010dd1"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00149-of-00512.json.gz": {"num_bytes": 30096278, "checksum": "fb448ccc7412f5ca8667004a70f3dd6e1b5e6cb7f6facc06564bd22b1d815593"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00150-of-00512.json.gz": {"num_bytes": 29776995, "checksum": "1e14268cf723bc7336b33896537643d21dbefc1f05ffd5201feb5fb1130f9683"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00151-of-00512.json.gz": {"num_bytes": 30205172, "checksum": "797224cf74063fbcaec741535278ccce141e6dbbdd69a2191d07f89816ab14fa"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00152-of-00512.json.gz": {"num_bytes": 29845034, "checksum": "77eeb2353f544c714deea68d4a781b498c40d7c1e27db3aade4987b381ca29c0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00153-of-00512.json.gz": {"num_bytes": 30258796, "checksum": "0fc581e92e70dda031d72a4aa0bbd65b1e9b28884f0ef5dd5e895cbecb270609"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00154-of-00512.json.gz": {"num_bytes": 30249734, "checksum": "ba10dd0a24bded170541e23078264b82b35bc99e402db594e2335e31905ededf"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00155-of-00512.json.gz": {"num_bytes": 30198742, "checksum": "fe285ac893126062bcbc20df75a9f65c57d3a7391354fa7e62b7f6a7122d6e77"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00156-of-00512.json.gz": {"num_bytes": 30168323, "checksum": "d21826b71bc85dbc496dd947ae9ee79d62885cffb3fa7c47409feee6ab247f17"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00157-of-00512.json.gz": {"num_bytes": 30241978, "checksum": "fc41765301b62849eda0b7b08f792e45f03db458fb92063af70c43d7cd0d0bb6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00158-of-00512.json.gz": {"num_bytes": 29959715, "checksum": "1eded3ce0bc099c7e198e9277719d578c3fb6c425bb2110cb0ca6ce469d1d19f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00159-of-00512.json.gz": {"num_bytes": 30109595, "checksum": "eccaab5b694c2f0017fe1d423637872d5587f6deb316796f7c0ff5517fa28178"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00160-of-00512.json.gz": {"num_bytes": 30201741, "checksum": "4ceee71372da6112101665f5bbf942a85f065feaab924c6e3f83498169bbe255"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00161-of-00512.json.gz": {"num_bytes": 30176266, "checksum": "6ed829daaad190b2d50b626d840edb750a063afad95315ffe7604a193183a489"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00162-of-00512.json.gz": {"num_bytes": 30018118, "checksum": "dcf8509a55213425a41706e5209ad411afb715fb9cd8c1a8b8edca23fab7d6cd"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00163-of-00512.json.gz": {"num_bytes": 30236016, "checksum": "d93cfaabcc7197637f233896b5799527f27d5b2dc60f0f0411ee51f05f09c500"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00164-of-00512.json.gz": {"num_bytes": 30150055, "checksum": "cc7de5ed3c774ff1dc350fbb5167dc1610c4f9a0dbc7c5d60ed4cf08aaf23ce3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00165-of-00512.json.gz": {"num_bytes": 30348056, "checksum": "b41c4a3b7b4e96262fe5c87d06fbeb000dc48cc1d304a475bb4f4e1af84a9afb"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00166-of-00512.json.gz": {"num_bytes": 30015834, "checksum": "0a0821b7628b9b019995a9f34223e2960ded84331ce1bb55089838becb8a170a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00167-of-00512.json.gz": {"num_bytes": 30282254, "checksum": "1285af56d024efe2166fa892878d471948e1d4c996922c7673e3c0f7f0f76bef"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00168-of-00512.json.gz": {"num_bytes": 29815124, "checksum": "29ec54ed647725ca3b9aec3bae341151a8e2b708cf21cd87b4389329298442b8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00169-of-00512.json.gz": {"num_bytes": 30346843, "checksum": "1791e3f8371a63f9f849b7bf430e70d3f4011dbdef572c166cc5d49d06162fd7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00170-of-00512.json.gz": {"num_bytes": 30175685, "checksum": "de8f82986addfc64b88fd3041d7ee6fdb64e6f770758146dc4c9309df348e965"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00171-of-00512.json.gz": {"num_bytes": 30145505, "checksum": "0dda47f679666862de6343e1109ed92866a42e8fa129ee69e9f0b73f18b6aecb"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00172-of-00512.json.gz": {"num_bytes": 30009998, "checksum": "2990dae6c16b7d60652439bed8b80ee4cf93972f33d8511d3d6aabaddfeca5cd"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00173-of-00512.json.gz": {"num_bytes": 30062185, "checksum": "e154a969bba2bf9430e0c8307561de78599fd2bd527cb1f15bbaf8f8e88cdf23"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00174-of-00512.json.gz": {"num_bytes": 30055129, "checksum": "e714ae153e8a927c88fe577d4c27017985d3ed7f3d0f5470f9a5f25c2e901a9c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00175-of-00512.json.gz": {"num_bytes": 30091082, "checksum": "5f47c663d1e15d94fb0057d303048be990c713f3285ada2c6233137b1d84d60f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00176-of-00512.json.gz": {"num_bytes": 30235767, "checksum": "20b05e4e99e5a05f6a4c29b304803b895bb8816caea6203643723ca587d66128"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00177-of-00512.json.gz": {"num_bytes": 30071950, "checksum": "29294e4b224df4695c9342c6f23d5495de9a0ca6a1be7217aa2211506e8ac7bc"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00178-of-00512.json.gz": {"num_bytes": 29932121, "checksum": "6022ed3b2ceef02324e40d3c7407622c95ead2cd3d3c41ab15ff9dd218265673"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00179-of-00512.json.gz": {"num_bytes": 30119251, "checksum": "42fa0aa883d9db4303a4981e4e308b2432b031fbccc98c3e1994ec775ba8023e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00180-of-00512.json.gz": {"num_bytes": 30175456, "checksum": "6fb2ebd61524846f6b1f746f9c6356045623beb4b685fe265a23446037c9cd9f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00181-of-00512.json.gz": {"num_bytes": 30029564, "checksum": "b779d721bb135fceaeddebb0dad1bdb43c9067a5e8595b3d544dfa7a084eb9f4"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00182-of-00512.json.gz": {"num_bytes": 30437016, "checksum": "b388fc0e862d7f6bb5b879ff7c69c301038faf5b542f6b40cbea4e2096a41e6a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00183-of-00512.json.gz": {"num_bytes": 29994048, "checksum": "8208eeca7bc76f8b1786c95939d321ca0c7ae190b1f12dae86738810e412aa8b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00184-of-00512.json.gz": {"num_bytes": 30338616, "checksum": "49859e75d999f65de99f9236e649a81989360f0328ba684671057b0dd7cf5e79"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00185-of-00512.json.gz": {"num_bytes": 30088874, "checksum": "ff6d32fdd471d3076a9367c175baab84a5d699ccd6dcfe00c755f0b714ca6074"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00186-of-00512.json.gz": {"num_bytes": 30193681, "checksum": "82508ed104fc57de3062258eaea57854ab9e1934437a88dc0d8a9921f3641bbc"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00187-of-00512.json.gz": {"num_bytes": 30171163, "checksum": "409d6576b25ad27455c755e5484e3f51d5d9788962efabe1c32e06bb3febacab"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00188-of-00512.json.gz": {"num_bytes": 30060432, "checksum": "fae94de96fa2962ef51e2ea90a5f760a5cee5de249bfd9f56d7c7b4e5c20f6de"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00189-of-00512.json.gz": {"num_bytes": 30180741, "checksum": "25293d5cba09980086f380d9e9ab44543adbbdcd05ed08601248b3a2b16d118c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00190-of-00512.json.gz": {"num_bytes": 30207152, "checksum": "ccfee160de15df5d88f0ff5a898a0c5b2d0ef4ebd6e6832715a9ef8a9904f88f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00191-of-00512.json.gz": {"num_bytes": 30143987, "checksum": "4c579619e465d9d97451801147202826a3855e772ea6dc4e9968e43ce2b8c05d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00192-of-00512.json.gz": {"num_bytes": 30072097, "checksum": "9c32ecb6d4ec9feb27c5b642879b464e68ca8804db161219503f624e7ca1166f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00193-of-00512.json.gz": {"num_bytes": 30172886, "checksum": "8442ddc3843c72aa169ca67801ff865ff85e4183beb38faa664f4f1d1c22a5d8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00194-of-00512.json.gz": {"num_bytes": 30037105, "checksum": "2942ecacb22cb9a2953c68f21ddf3368cd47ab1f2b2d8e1f5c76b1c849b28d91"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00195-of-00512.json.gz": {"num_bytes": 30014854, "checksum": "9e5c6815a5734403a7062bb27b2565d433a3520a401c836ac3f16e743a1dd949"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00196-of-00512.json.gz": {"num_bytes": 30020510, "checksum": "792712f0073c158b5f96f7a99d97970fca3819b69739d34d7d2b7f4b8b407b7f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00197-of-00512.json.gz": {"num_bytes": 30072566, "checksum": "3ece37e2d0d0b26fbd839b5d3facdfd70844945a06867fb68b141f6b1378462b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00198-of-00512.json.gz": {"num_bytes": 30036679, "checksum": "c3f37a9b89987dde4578b394b5c3916c2d4fd87e0902309b4c81af19b1d2d5ea"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00199-of-00512.json.gz": {"num_bytes": 30195178, "checksum": "ae01bb5515097a083afd498d8530e788d99671e7cf802c4402957d6252b2ec77"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00200-of-00512.json.gz": {"num_bytes": 30064374, "checksum": "2399d4869f3a8bb4a9adced5ec548a9a3fde1d4fbc4e3abd9a0a3b495fb9a8ef"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00201-of-00512.json.gz": {"num_bytes": 30136711, "checksum": "5c922040697bad8d7807d79f34f2b667eea63ceefba89b2d413fcd4d66497607"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00202-of-00512.json.gz": {"num_bytes": 29962983, "checksum": "e4df518d612a8614de73d5944a31d22ad06ec9ecd26fb52e500df71fe363c1be"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00203-of-00512.json.gz": {"num_bytes": 30178998, "checksum": "e84a98a176451fc82d940a64cdec821e320a648780edba6466b74a1966eca47e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00204-of-00512.json.gz": {"num_bytes": 29988832, "checksum": "c6dc56388bc7c57cbdee8280895ab80da7b4d49c9a0101a685229c50cad2e2e1"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00205-of-00512.json.gz": {"num_bytes": 30229414, "checksum": "e7e5175b6a7372377ba3a0db439911e189db459787d48588183ac1a0198c5fa7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00206-of-00512.json.gz": {"num_bytes": 29914929, "checksum": "eb263433133660ebe219cd5817dea3b546ef2fba0e15396b2768d7091117cdea"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00207-of-00512.json.gz": {"num_bytes": 29912800, "checksum": "7f8a5f62ba5912b64af5b02bd987b4d81727223ef8eff110022e89d01961366f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00208-of-00512.json.gz": {"num_bytes": 29900590, "checksum": "bc2af142244601bb7a96859dfd9885196940e675ca217cfc7c73ac9c614ea938"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00209-of-00512.json.gz": {"num_bytes": 30242768, "checksum": "fa51a4337faecfc790ca925802f87f10761552e16578b880ced80497f62bba60"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00210-of-00512.json.gz": {"num_bytes": 30039857, "checksum": "3adf7482ec6a3ad106c8edca3645a94032c33f84fcd26bd9876f2b8a1f6b5722"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00211-of-00512.json.gz": {"num_bytes": 29846856, "checksum": "8e931aaa9c1f069c0eca0b4605277610df9d2d0c07a0dbe6191fb7081b0e642a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00212-of-00512.json.gz": {"num_bytes": 30022172, "checksum": "21c8bba1c83544c27977b22b077fd77f8df9cd06bc4eb5e9e9a532c511498d36"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00213-of-00512.json.gz": {"num_bytes": 29877918, "checksum": "b64ebaa088df5c6230e69f207267a038705c38f4d327970e9117979e1c13d1ed"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00214-of-00512.json.gz": {"num_bytes": 29906552, "checksum": "55d833a2b78ad564e6532d1acd14511e8b48d703030e3bbc92d7c835c1ed38c7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00215-of-00512.json.gz": {"num_bytes": 30075441, "checksum": "999c77c136d3df83601e33c823f389b133f33c4c0b03736ceace617b526cb293"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00216-of-00512.json.gz": {"num_bytes": 30507152, "checksum": "0b23d4e57eaa101c78bab46151add537668d2722bf0c50470c1b434ec3389ae1"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00217-of-00512.json.gz": {"num_bytes": 30044236, "checksum": "6abacfd53e231a38c714d436018cef9a58f53320026c2ebb27d6caf08f02d7ac"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00218-of-00512.json.gz": {"num_bytes": 30047926, "checksum": "01120ef69493d84c44d112a41c69a851edaf89232679366e812f240fd26a0e47"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00219-of-00512.json.gz": {"num_bytes": 30349211, "checksum": "c4fc219559f0f076f634fc6812d4b13c229908c1ae45c3b74c059fb3b8124f63"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00220-of-00512.json.gz": {"num_bytes": 30063445, "checksum": "11f712439d54ef062cfa1225328fc4faaef5f6c9c0b0d87a0a81d25a71350e28"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00221-of-00512.json.gz": {"num_bytes": 30115660, "checksum": "9a344857ef4f9d141b57df38e25f717153b773436d72c23e10289ffe67c315eb"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00222-of-00512.json.gz": {"num_bytes": 30134562, "checksum": "227cd1847a948e388b404b5cda9289f05510d4e22f0ae5ec4d5a87a8f7f98a45"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00223-of-00512.json.gz": {"num_bytes": 30120819, "checksum": "e0029aa6b612a98f76e37d82107fcb90f2b57ae8d52beea172b5153b76334f20"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00224-of-00512.json.gz": {"num_bytes": 30371365, "checksum": "1ce5242d163ca12dbb22655eb841bf80750b552353af4f84973285d823d0add5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00225-of-00512.json.gz": {"num_bytes": 30319212, "checksum": "71cb82bb95107a7e0b7777a5fcaa0f76b465ba828ac47401babcf7289eeb2335"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00226-of-00512.json.gz": {"num_bytes": 30020940, "checksum": "b7b8d98ade41f52ece23e896bdc4c19ad034a92ba18adb5fac85c7271afbfa65"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00227-of-00512.json.gz": {"num_bytes": 30109958, "checksum": "b2ec382f44caf4e8e46fef2faf6bd2e4000420e6da2eb12a5d9f6e7efb4e1564"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00228-of-00512.json.gz": {"num_bytes": 29940895, "checksum": "ff86264683d0fdf9d689aa30e7889c4ceed21098b7c60a220db92d396614cb1d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00229-of-00512.json.gz": {"num_bytes": 30080588, "checksum": "3a5502cedd61501055eb16adb6ef861c75880524c5468a69cd346bc03e98e219"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00230-of-00512.json.gz": {"num_bytes": 30376399, "checksum": "6d3a4171a1febe9149f6900e3cca5a38046ca9d59214b548a4ef9de7de754bbd"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00231-of-00512.json.gz": {"num_bytes": 30031670, "checksum": "a2c8d9bb3eb260d5d8a7dcafc4703540332e2896e5127372d380d7efbd567a3a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00232-of-00512.json.gz": {"num_bytes": 30132612, "checksum": "c9dec917eff4d72c684d6f8373ca66839061e29d25f0aa5fd6fb7de5c30df469"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00233-of-00512.json.gz": {"num_bytes": 30178285, "checksum": "1eb83b8eb7e72b2b3e55420436bb17521b989d0627da46f8cc61fe9f420fd464"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00234-of-00512.json.gz": {"num_bytes": 29991258, "checksum": "5e14e2a9e8c0aba73feb9134c694e99baf57357bb524877322ff5181eedef1f2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00235-of-00512.json.gz": {"num_bytes": 30045172, "checksum": "50a118a072498b5338802cceacb97a9aa9242252e8d76d305cf5f0d928fd4af6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00236-of-00512.json.gz": {"num_bytes": 30403542, "checksum": "7d7605576975232579e422a1b72625ad6f9d714d27770725dc7b99ba258e1985"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00237-of-00512.json.gz": {"num_bytes": 30242989, "checksum": "22d152fa02c5a959e978ea4887dd873dfef7267af0a577b4d796ff0cb52d5c56"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00238-of-00512.json.gz": {"num_bytes": 30214634, "checksum": "6d0af6f396fa21867e899a7678c633e47bfe79bcbda29b8072c5d32ab20a9aa3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00239-of-00512.json.gz": {"num_bytes": 30255546, "checksum": "d35a93632638b6283053b121f0f30d47ea20b2747d871c3dd0beb13f4ffbcad9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00240-of-00512.json.gz": {"num_bytes": 30347604, "checksum": "fd052d532fcfe811d96f8433f79a684f68f76ec42bd959c76ae3b63aec0b2c3e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00241-of-00512.json.gz": {"num_bytes": 30135691, "checksum": "12c80c41dc4d6313bce4a171999ecda93ffc59f2c70cca363bce214cd12dc9f7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00242-of-00512.json.gz": {"num_bytes": 30229834, "checksum": "fca5b81914ac0c5fe0b0c1a554a1e62c64af5c98740df1f8ce8f48f2a62b6a48"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00243-of-00512.json.gz": {"num_bytes": 30053753, "checksum": "ba41c505579524e9d244354a70060c9a0131007e0b129f03e628bb7b7b512ca9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00244-of-00512.json.gz": {"num_bytes": 30216889, "checksum": "54a391c1d2de7627e739f3cd94eeccd50a80d56a40606f7c5392f6098df456cf"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00245-of-00512.json.gz": {"num_bytes": 29887569, "checksum": "c3263ea7e16e0036961dad28fef57ce4f0495219e59b4e800af82b67b3c6c506"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00246-of-00512.json.gz": {"num_bytes": 29906815, "checksum": "a3dcc92aed81708434edee84397010eae4ffeaa38b39aaf3919256f72deee625"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00247-of-00512.json.gz": {"num_bytes": 30074896, "checksum": "019e983a95908651bfae83e37bda5200b3888b03ab235fc8db2d5b16742f028f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00248-of-00512.json.gz": {"num_bytes": 30108081, "checksum": "6f68835ec02cf899f8f44a795b1e3117956ff5bb6c8946435d9861ae7a112df3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00249-of-00512.json.gz": {"num_bytes": 29957882, "checksum": "9bed6b7f56d93fa3973d4f177dde0973fa0eb6fe17d8d85279d865531613f963"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00250-of-00512.json.gz": {"num_bytes": 29822284, "checksum": "1848bef8d11360df55a576c64147e519327b1178f77d3ec14ab9522b33b1c423"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00251-of-00512.json.gz": {"num_bytes": 29956462, "checksum": "425f69c361a8671cf571df577ac0cfafb4894de494360084b7cbe9cb8869bc3f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00252-of-00512.json.gz": {"num_bytes": 29733712, "checksum": "7198e831e75eff1e116513f9cbe098c071f051c545b41d1943211a1d996a3c67"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00253-of-00512.json.gz": {"num_bytes": 30450662, "checksum": "0452804e723c919bd3c84217bb1dfc8764112fd70c5581f84520df7592f28ae9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00254-of-00512.json.gz": {"num_bytes": 29944765, "checksum": "dbbff2253d70094537de481344e5706315271fdfce7ebaddc8d277ed05ddfe24"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00255-of-00512.json.gz": {"num_bytes": 30321363, "checksum": "79173dd85d535cee71afb52f7775bbf7289509bc555efe21a8700d36f7e5da25"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00256-of-00512.json.gz": {"num_bytes": 29982818, "checksum": "bacd191568e72da06c564fc7476225ce83440de6aea6c85ebe7f5279f1c15846"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00257-of-00512.json.gz": {"num_bytes": 30338592, "checksum": "998287203665559c27a66e889611ed716b7a389e403b2e857086f548b2c47b39"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00258-of-00512.json.gz": {"num_bytes": 29911193, "checksum": "ed9829f41a71cc187d0ddfeafc9cbde8e362b52914c988708a1a5ffbd3c152af"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00259-of-00512.json.gz": {"num_bytes": 30227794, "checksum": "2fe86814499a3379601a179acca1d440b3c79467827ce9ef9787e1ab311904e0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00260-of-00512.json.gz": {"num_bytes": 30206902, "checksum": "c4efdad05d3f5e9f27884399ab0ec82081c26486e87f0ed5408a9eb80b223daf"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00261-of-00512.json.gz": {"num_bytes": 30035514, "checksum": "e47675a956a626a32b1870c61e6f98c3cfe9cc571901cf477abae982b4e63c96"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00262-of-00512.json.gz": {"num_bytes": 30406718, "checksum": "ae19c1389e26562322f745bafbd7839e7a95b3169743d48baa7ae7f2db2a0b5e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00263-of-00512.json.gz": {"num_bytes": 30266531, "checksum": "289c9fee87f12ea22ad5329f80cb379e5e9c22c5cb6639077748958228c62bf7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00264-of-00512.json.gz": {"num_bytes": 30100823, "checksum": "7c65dd5d90c6df49ca2dcbfdbf1b9fbb0789cb32043795942d88c5f2d7a99869"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00265-of-00512.json.gz": {"num_bytes": 29957109, "checksum": "e3a1b501b2cc3f5f2667ef179d7876db602daedefd0cd741c0898679b24984e6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00266-of-00512.json.gz": {"num_bytes": 30196603, "checksum": "9337dd8240f168da5f6a8b57c5c169a2a400a9a160eccc8a6e44e7b32004ff19"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00267-of-00512.json.gz": {"num_bytes": 30304605, "checksum": "513eea4e78c399cc045e25f13bb5f77ddb6c9b606522bed8216945c529894e8a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00268-of-00512.json.gz": {"num_bytes": 30312562, "checksum": "0503c5bf6848213c5fcb81a5c94307fc010d910a8989e104ad5fedca58c76f7e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00269-of-00512.json.gz": {"num_bytes": 30045257, "checksum": "59bd3011d12d7d70b5fd64bc2dd2016b1a9ca6f0d210dbb3e6c202bbbf74ced5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00270-of-00512.json.gz": {"num_bytes": 30027628, "checksum": "8d3ecf4c61acafc49b624d08b6aa31340643e030f6c2248f689e8a17d355359e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00271-of-00512.json.gz": {"num_bytes": 30014730, "checksum": "b2e4820a0a7287786f802b3b40602c8ca77c7813b5f50db8a336b89b89bbdf37"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00272-of-00512.json.gz": {"num_bytes": 30145705, "checksum": "20c73e4a9056a5201621a4799b86c323c5136af43caa63a74298a5c3bee890a6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00273-of-00512.json.gz": {"num_bytes": 30165945, "checksum": "8f07a91b6b40444635d869b94558fa68e3593626808bc6122d4e17403cf76101"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00274-of-00512.json.gz": {"num_bytes": 30097947, "checksum": "9530522c841d8f09ccb89f4f0238f7b9048c211e85b27449fb3c09d3bd2bab7b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00275-of-00512.json.gz": {"num_bytes": 30296359, "checksum": "51a358db81805a20df4f920baacf3adea05209282f800fbedfc7fa49638a072e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00276-of-00512.json.gz": {"num_bytes": 30311407, "checksum": "a51253cf73fb200053eb5fd5eca398a7a070fcaa27fc99b23389d09eef7fe5ba"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00277-of-00512.json.gz": {"num_bytes": 30372345, "checksum": "cc4f6d9040d8c4909d4ea5b661a7e54ba4775ff1c7c55db1ff686a56d428e2a5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00278-of-00512.json.gz": {"num_bytes": 30379507, "checksum": "1052defa657524e1211e67d775a32243b164eda431c4c6ed351f0c6727f21b16"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00279-of-00512.json.gz": {"num_bytes": 30195406, "checksum": "6f4fdc92c516ad779fd521afba7d8d5bcd40672e63028f43f70fff4d7605f5ba"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00280-of-00512.json.gz": {"num_bytes": 29902057, "checksum": "c26f89efd0977465f45fe321036d88e2d6ca3ee1edc4bafe4b40ad1895cfc0e3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00281-of-00512.json.gz": {"num_bytes": 29779702, "checksum": "094139d741b7a47faaaaf50093ab4edbef6ad1943985c6f453ce45a67a95b190"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00282-of-00512.json.gz": {"num_bytes": 30063500, "checksum": "280d69bfc795f1502a9e744d53d1a189051a1e771042721f8e6f74f6559e25a7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00283-of-00512.json.gz": {"num_bytes": 29956350, "checksum": "505e49b7eeab46c77a324959eeff103f8899da1efc4d0fef5c0e6c6f8879a721"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00284-of-00512.json.gz": {"num_bytes": 30146285, "checksum": "9b075f2cfdb9a90fcdc7f779a52b0c5dad36385214844d4fd9df1e528ae78b6a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00285-of-00512.json.gz": {"num_bytes": 30160056, "checksum": "d9b9f3cbb9ce2a0a0a1a2f7ce91e98621d48a7a900c278aeef437dc6c0a7cdf0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00286-of-00512.json.gz": {"num_bytes": 29844025, "checksum": "6de9ff1013484662305e414725be2d0a4a1873a941250b95b80b5dea8919cf95"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00287-of-00512.json.gz": {"num_bytes": 30089218, "checksum": "444ff132c4a5330653b7319d34b2c7f4ae3b960d8b510cbd7389e3881f65ac5d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00288-of-00512.json.gz": {"num_bytes": 30092170, "checksum": "46dc5b3b84e4387ad718fdf96b751354d7048e898ec664e0d3bdfc21ee841ec2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00289-of-00512.json.gz": {"num_bytes": 30365397, "checksum": "b42e35746112198143ac18509e4f0148772db75e19f5eea9ed0d7e2849dbba48"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00290-of-00512.json.gz": {"num_bytes": 30275920, "checksum": "25d99877235c4b9dacd5d1dd7e9d16bba76cdf6cb1725fa617209142873dca0f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00291-of-00512.json.gz": {"num_bytes": 30125784, "checksum": "51da68b6f2751a83e2534c342b6e9d69c419fb606b44c42b872d69f5f726df3c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00292-of-00512.json.gz": {"num_bytes": 30201021, "checksum": "1e0a42b5e7ea7049c3c86b96d37c5d1c36f3ba2e2dab02145a897ef056fa6a87"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00293-of-00512.json.gz": {"num_bytes": 30124224, "checksum": "8c744f5c6eb92c0de70649cd773c0ad147bc7a1487b2ae7f1107bce9d19da601"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00294-of-00512.json.gz": {"num_bytes": 30074708, "checksum": "b3cfa4c4408c1a9f39b48e18a62e112ec3c132b226efe0850f9e58e2a517aa97"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00295-of-00512.json.gz": {"num_bytes": 29990007, "checksum": "012f63e147d22e34249e930975a2d8958a8d0b17350a9f6e368d702189b40d5b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00296-of-00512.json.gz": {"num_bytes": 30093755, "checksum": "5573859cc485ae4535b83fd408dcc6a82f644832c93e6125db9a16dd6ded338f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00297-of-00512.json.gz": {"num_bytes": 30078472, "checksum": "25e694485171ba1347ccbd7916c1b87a0d46acfd13795a8aabb1cb57b5eb1221"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00298-of-00512.json.gz": {"num_bytes": 30327122, "checksum": "6d6832cb3b1c86b6392bc9ca52f69a0bb16bf71c3c7664d9fe668ee259a40a30"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00299-of-00512.json.gz": {"num_bytes": 30214180, "checksum": "9f3c3d87a525874ea117e36e0b30d7f5cc6c64564506808058a0788d74943634"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00300-of-00512.json.gz": {"num_bytes": 29895171, "checksum": "e99d296965da2f731ea660889ce834cd1d21edf427298bab3a059ff3ebc64a2d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00301-of-00512.json.gz": {"num_bytes": 30131063, "checksum": "e5eeb0f237cf986134c946bb3c2a4b5483fb9c88b3c2b16b9db26135043036d6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00302-of-00512.json.gz": {"num_bytes": 30184609, "checksum": "4ac9bf5ca6fac7f7293238852424340326347ceaa6f5dfa6fddef8003421bebd"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00303-of-00512.json.gz": {"num_bytes": 29956412, "checksum": "559019fe1ef1f7e77ac53ad98b3556965ebc524ecb80bbc3f26255d5ae6e3609"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00304-of-00512.json.gz": {"num_bytes": 29974071, "checksum": "3c54edc4b6a7e34048cbbadb55cb3b16496a4e6e7334b4ede4e1368daf4c5301"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00305-of-00512.json.gz": {"num_bytes": 30338106, "checksum": "1c91c0c5bcc2bec0a698318ad6f576a06db7885c20ed7f36782427b80580a75a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00306-of-00512.json.gz": {"num_bytes": 30178986, "checksum": "fff99f2758c2de57ccbfbfc6388f67e624d00d4a6cccb5820a7a8f5fcf02d386"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00307-of-00512.json.gz": {"num_bytes": 29493455, "checksum": "5d08c6e3909e21bed456ff9d06c983f14d3a277cb399a91047a692184f87c4c3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00308-of-00512.json.gz": {"num_bytes": 30228844, "checksum": "04bffac195e24383d06b0ab9ebf019959a4e7abe8e8e6a0cdfbf0a8e7c23c899"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00309-of-00512.json.gz": {"num_bytes": 30351688, "checksum": "3ce14d5104d1318c6a16d042735f0a71f4452897de60d17408181ec5b135bbb2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00310-of-00512.json.gz": {"num_bytes": 29993012, "checksum": "afad2f39bf4cb932e50d9a0be93940b423e7abcc3d67dac15b1939e4e40f4ce4"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00311-of-00512.json.gz": {"num_bytes": 30448951, "checksum": "a049c31ef6304084d33cb7bdd2e21ada0c60b40b1002b2369e60d36a5098c4b0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00312-of-00512.json.gz": {"num_bytes": 30034189, "checksum": "557d1e88400a6d1d8ee4d717a959239edacbdd3e18d8cd20c5c85b77174dc302"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00313-of-00512.json.gz": {"num_bytes": 30066486, "checksum": "e4823ea1e9a59d5db84564a5b90c28fd8058450f238c60ad689ffd6b673d65f8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00314-of-00512.json.gz": {"num_bytes": 30397706, "checksum": "1b4c0653e7ccf7fda0a53d8cbd5ddd57322ac83822e9d05bbdb9eb8ac979cf50"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00315-of-00512.json.gz": {"num_bytes": 30219107, "checksum": "9c364c9cab4ff7acdd1818b13de2f36713df8fa6c504ba15cdf47fe8e3c30206"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00316-of-00512.json.gz": {"num_bytes": 30098661, "checksum": "84dd8a8739b5abc39d8180f0894b1fbf2930d6d333d7c86b646f40763327397c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00317-of-00512.json.gz": {"num_bytes": 30178992, "checksum": "16e4791b4e5ab3719dacf79fedb0b88ed54346372874c37ccb71d86bc419edc3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00318-of-00512.json.gz": {"num_bytes": 30022982, "checksum": "98345a826aab12bdaf5e639205d5dcdc1da8fecd7cafc1982df89ac8d4df7ebf"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00319-of-00512.json.gz": {"num_bytes": 30360409, "checksum": "d53a39019a1627b42ae6bff68e283d37d0bb5f48b328c2c5cdcc1a3897f4e992"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00320-of-00512.json.gz": {"num_bytes": 30347267, "checksum": "c343a0eedf58484055e58762802ae8cc05f2cdb0b923785c493d056a2cbdb015"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00321-of-00512.json.gz": {"num_bytes": 29967877, "checksum": "cc5795d254ad749ccfe613034927bdf95529545ae1f277b694dd24a5996aca83"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00322-of-00512.json.gz": {"num_bytes": 29885538, "checksum": "d5eaaa1eea983bd37ed34651e6c16b746ff7c92e48038b234149fa6d04d3d866"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00323-of-00512.json.gz": {"num_bytes": 30308848, "checksum": "a42cfaef5e088fd6b24dfc121084a6cd038f5b0bfaecb9f33997ab22a97fb155"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00324-of-00512.json.gz": {"num_bytes": 30351634, "checksum": "0e2e6933f93466e9c8fe966f7770fe4c34caf182c713dad3206f4132eed1d41d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00325-of-00512.json.gz": {"num_bytes": 30077168, "checksum": "77cdbf7040ce7f38d735fef41813ce63aaa16fcd87fce80e6ca6bd56d350c369"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00326-of-00512.json.gz": {"num_bytes": 30031750, "checksum": "8d994c2dc1b766e3270dce3f0b8f6f8fe22d5c1e0e9780e1bfed52c1292b8641"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00327-of-00512.json.gz": {"num_bytes": 29845765, "checksum": "f6279e351d016769d6fb5482d01a15ba054d5fe6f9f1c4e92c0663cef0083002"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00328-of-00512.json.gz": {"num_bytes": 30253188, "checksum": "2ea84aafd94d1843a2cc4428279dbb079c6ae0aae6c00f90ee4b5ace3c827afd"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00329-of-00512.json.gz": {"num_bytes": 30124922, "checksum": "49e3d91126d53eada7bbd87bfe9eaae74f059c69cd70a3a3b8101f49c1aca154"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00330-of-00512.json.gz": {"num_bytes": 30026414, "checksum": "07442fc4f7fb1732362293bc15a6754d70ecf4743392cf89c4497b3cd96269fd"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00331-of-00512.json.gz": {"num_bytes": 29961847, "checksum": "f437c6f5f758a5d32c8fc949037060259162864c29aeaabf37032e79f5a1cf0b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00332-of-00512.json.gz": {"num_bytes": 30167166, "checksum": "96018497eb6dec020436c1333ff81980a64fb615997855fdd8cf35fe3f658db6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00333-of-00512.json.gz": {"num_bytes": 30192963, "checksum": "1c12ea6b9031049dbc84e4da6b5fdedf480e989385d758c88322c415a1cabbb0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00334-of-00512.json.gz": {"num_bytes": 29847008, "checksum": "c269285f15f626b4b15a7d1705ffa08e3f4d49ce13de8174b72f9f6276a1c6af"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00335-of-00512.json.gz": {"num_bytes": 30262244, "checksum": "179ee564e6fc644d9ee139bdb02d470a1172221b0f6e510ee5935683500f8257"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00336-of-00512.json.gz": {"num_bytes": 30262910, "checksum": "317933afdd8dc8a3a355e44ee3d84bbab12a2f30c98ea1172dde7074ed4c0557"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00337-of-00512.json.gz": {"num_bytes": 30155329, "checksum": "c5b850399252ec41b0fd9cb2da87ce25e5a44df9f44c6ed9d8c559a5729e5a0f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00338-of-00512.json.gz": {"num_bytes": 29952961, "checksum": "48083123ba97a6212e0501799bd01936f0795bdd4d9c2710b9aa67d54b29037e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00339-of-00512.json.gz": {"num_bytes": 30403399, "checksum": "313b60f985dcf591f34d351b758eedace655b6c6d3946dd2ddc55f34a9a97ae9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00340-of-00512.json.gz": {"num_bytes": 29917484, "checksum": "2c72290f3bd51dea2a2877d68a968dc2b75dadf99ab3cc2230e41be45f3515d3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00341-of-00512.json.gz": {"num_bytes": 29905522, "checksum": "1acd83a0da4a7a4912b589dbeb68b37396d0454371b2b71af4ae18b854d482ce"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00342-of-00512.json.gz": {"num_bytes": 30022369, "checksum": "8756be42335bba12d06de63e247659f8d603a092ff342360dfed645aec135c47"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00343-of-00512.json.gz": {"num_bytes": 30229313, "checksum": "863e29987a3ccfa08e14ae987c81367a53b9fe08795184db086117a9555e058b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00344-of-00512.json.gz": {"num_bytes": 29924335, "checksum": "aa9003a7cc3527fb658fd807c78890587a8b35634a1f0838bc221a6374205d20"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00345-of-00512.json.gz": {"num_bytes": 30229482, "checksum": "a7e88b015bcf7761217e9b3ffd413f13cac48f6afe083353436de6cbd0d0018d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00346-of-00512.json.gz": {"num_bytes": 30029147, "checksum": "b862ea62ac032c203c0038c061a44edabe4644be03b876ec7322e96762374940"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00347-of-00512.json.gz": {"num_bytes": 29808182, "checksum": "62915b86cbbf61a76f73d05509a8e839aae0b965134ef79022377625df7ef741"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00348-of-00512.json.gz": {"num_bytes": 30091116, "checksum": "6c384c2c6bc8340b88e085f8bbc2616be68c96fa7b8b88306b4500367d053a49"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00349-of-00512.json.gz": {"num_bytes": 29867618, "checksum": "bfb19508ecf8bd4d9a8847f0edab5acde6896182c27da706a6f2863bec43c152"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00350-of-00512.json.gz": {"num_bytes": 29723106, "checksum": "a645c62c94de9018175f15a0b38aa8bd2484601ee189b7c27d589288eb5af97e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00351-of-00512.json.gz": {"num_bytes": 30047620, "checksum": "991061a23834e6bb3dc0595cf0e8328e07746d10fbf7a7ba397c1410cb66175a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00352-of-00512.json.gz": {"num_bytes": 29808328, "checksum": "6c8e377a6cc82e81d66e2be3d23c1cdd42480015a68a1db458d542b7ff64ab7d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00353-of-00512.json.gz": {"num_bytes": 30040117, "checksum": "ead6f32d98a91c47fb9c21334143f02181efb0b831705baeebb9820d069598fe"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00354-of-00512.json.gz": {"num_bytes": 29953984, "checksum": "ba349e503d017abbc1c83da2314c0a4892a9f3e5e480173812578f44d9b5904c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00355-of-00512.json.gz": {"num_bytes": 30179912, "checksum": "2bfeab794bbe0432db52cc595d25864b17fdb0744a80d6d907f6f2ffc5c56b81"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00356-of-00512.json.gz": {"num_bytes": 30312163, "checksum": "d0dec696d28c601d3a1f75b0b6e6e711e00809f0d5ea915f63cb6d9b7adcc597"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00357-of-00512.json.gz": {"num_bytes": 29931515, "checksum": "d43c75371e32d0c1e65f43acc00aac3ca43762d4c6eb6bb61759ac5fca593a99"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00358-of-00512.json.gz": {"num_bytes": 29739788, "checksum": "96fef1b4a5d6a080ff5d4a10bc90911dcb2ddecb4be91d0c9620e6d2484e3ee3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00359-of-00512.json.gz": {"num_bytes": 29913841, "checksum": "05b065d2d13b787ddee4707be7e2be46173c23794b9e8c773d0da743f435db17"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00360-of-00512.json.gz": {"num_bytes": 29805295, "checksum": "826104b9f4c2634d128f15564bd4990057dfbbb4066f2a082039d243bab56935"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00361-of-00512.json.gz": {"num_bytes": 29839676, "checksum": "ee5ba4cb14ecee0c857828a866615c6bfe45f67b158173dcac44146a02d97738"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00362-of-00512.json.gz": {"num_bytes": 30154783, "checksum": "d67b49e6fa5dc293fbd3057b7ca0beb7e0bd1ff692cdad7f2dfb7abadc1f4599"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00363-of-00512.json.gz": {"num_bytes": 30126118, "checksum": "6940704da6cde5822d48dc806280b8d57e0593ba299731e68ca9c2a4f7cf65bd"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00364-of-00512.json.gz": {"num_bytes": 30184894, "checksum": "e740b4a0240e691f16a423fd658aa3c7539986695418af3b5a171a48524db74f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00365-of-00512.json.gz": {"num_bytes": 30386766, "checksum": "5a6a9461ef9ca579a849f6bef4d6225504a885aa797d3b2236ed8df6f5ea72ee"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00366-of-00512.json.gz": {"num_bytes": 30208411, "checksum": "8e0ce2447dfadaa4d41b991a2ce1be63b409e58e88944594dc8591bf9ab41403"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00367-of-00512.json.gz": {"num_bytes": 30266003, "checksum": "04ea00b46a583edea7740d74d719ef7f303b7f3873365b9ff4e94f08ef80832a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00368-of-00512.json.gz": {"num_bytes": 29993752, "checksum": "38b1a55dd4ff1b504d2dbc0b2ad54fe43ab16c8bdba55bd97f4a55dafa8c83dd"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00369-of-00512.json.gz": {"num_bytes": 29833222, "checksum": "a25c405918920ed00edf5f3007cb8895b59fb67618dfea266b048273303b9592"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00370-of-00512.json.gz": {"num_bytes": 29988999, "checksum": "2812e6d9865d77ca8ac2d1499ba86be1ceed868a1da2bd13fbd0967058a3516c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00371-of-00512.json.gz": {"num_bytes": 29866636, "checksum": "ecd1d3bdc41c3f41f8c9d3a63c75766c173f70ff117af748a08c221ca4273b18"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00372-of-00512.json.gz": {"num_bytes": 30296883, "checksum": "723d2c5ebbdd95ab84c53e458d81944b6907d08c7aec67300f012880624d0010"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00373-of-00512.json.gz": {"num_bytes": 30310322, "checksum": "ae45d088521f2faf9852cb169962176e84bbb81d5ba157d4228d348f7fcf60f4"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00374-of-00512.json.gz": {"num_bytes": 30340527, "checksum": "9b09c9e1b424fd05540b720c5a85f71eea43d743dc4ebb318e839125ccac9383"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00375-of-00512.json.gz": {"num_bytes": 30193692, "checksum": "c3ca4bb179cadf872f25f1cdb5c3667933bb8dfb7af21068a24b1b09c961dfa8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00376-of-00512.json.gz": {"num_bytes": 30184130, "checksum": "5d801f4bc20c4c6d8821ccfff06cb5dfe4214e571734feacbea3325462afa280"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00377-of-00512.json.gz": {"num_bytes": 30259301, "checksum": "ebf08508c24e29a8a14b72248f090d765b02ee7a31296811d0391f2a2e73c046"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00378-of-00512.json.gz": {"num_bytes": 29650049, "checksum": "c13e994e68b938ca069d2d412e7891cbaf2ee205d65b1c17c6acfea01adce157"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00379-of-00512.json.gz": {"num_bytes": 30265211, "checksum": "667da6f0650dd684aa50bc691b5783968ae8cab847dea14fc8d8bfe203e351f4"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00380-of-00512.json.gz": {"num_bytes": 30429631, "checksum": "7cf0e9ae00bec72f571d152730107efdd944176818600517fb2d0412a859d366"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00381-of-00512.json.gz": {"num_bytes": 29889471, "checksum": "f781b3128e92c54365be7771695555378067a65fb922e04062ab6f3f092ec827"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00382-of-00512.json.gz": {"num_bytes": 30029894, "checksum": "2d133def2bc4b840312ebe5c466c9f22729b67aa4c2a41dda2e6a9a55ddcddbb"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00383-of-00512.json.gz": {"num_bytes": 30249255, "checksum": "e8610abf7e2bd70b1067a1b2dbf392ac32be156945502629228969974d3899b2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00384-of-00512.json.gz": {"num_bytes": 30362665, "checksum": "f217071bd0c1b1bddb3342c85064d7ebb54bcde2512997636f0638a0b3641588"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00385-of-00512.json.gz": {"num_bytes": 30080234, "checksum": "2db4b15c7391b6e6d3791721ee574d09101df597110feebc59e4f0aff4df6c26"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00386-of-00512.json.gz": {"num_bytes": 29897704, "checksum": "035daed74487c5262b8cfbefdfaefd17f2834c7b4a1d293934d755e059b58f5b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00387-of-00512.json.gz": {"num_bytes": 30072139, "checksum": "73013fbd06eaf94a7c8a0f0de420f83bed56655fb2d4e5d93972e8ca1847d130"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00388-of-00512.json.gz": {"num_bytes": 30123843, "checksum": "5db846c3d0b36774ce771ddfa8c53a915767926a2ad48222256d839326336f19"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00389-of-00512.json.gz": {"num_bytes": 30278955, "checksum": "9e4c590e67b2fbd357af955e39864ffe73dda201d76759935fda80b10b463500"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00390-of-00512.json.gz": {"num_bytes": 30013591, "checksum": "90974ba6eff489e0f4f52187b6241120740c782945e86525cb5d1e551a54e322"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00391-of-00512.json.gz": {"num_bytes": 29925212, "checksum": "10fcd62813434e2557b5861fd8604f534952561065bee9dc525b1cd3f5b2730f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00392-of-00512.json.gz": {"num_bytes": 30016498, "checksum": "da88b36bd3f15551d8fad115a86f111cc5c3d9a3c6fa9497214aabec7bcd6aad"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00393-of-00512.json.gz": {"num_bytes": 30061083, "checksum": "1ed9881020f240e1277e6513bc2abf24ea48e9cb0046d7e87a6d3669c8b42a0f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00394-of-00512.json.gz": {"num_bytes": 30043459, "checksum": "a35c3de1b0c982df8471705574e6eb7cc730fff122ff17d1381f2c7b9f20d6bd"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00395-of-00512.json.gz": {"num_bytes": 29921106, "checksum": "f4cf52f8d6a1288773cc366469df140f885b233fb6aa1cb75387a450d88ec94f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00396-of-00512.json.gz": {"num_bytes": 30024980, "checksum": "5ebe04e54e4242d52aacb4c2e107dd10e609d5a7a6ff0425d9952bed98ef4921"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00397-of-00512.json.gz": {"num_bytes": 30096825, "checksum": "3ac381004d8257aa50fb28f0fd2171abbb93ad825c3f43422b9dbec6e1c6f31b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00398-of-00512.json.gz": {"num_bytes": 30059739, "checksum": "40c38af325f4d01ae7c74aa9cd8f8d1c96c6af851175f80d3c50d85c5f5d3585"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00399-of-00512.json.gz": {"num_bytes": 30049826, "checksum": "2ba0109b2d5b88422250bcbd2494cc6e11528710f38fa6e83a1f699b840b68a7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00400-of-00512.json.gz": {"num_bytes": 29953506, "checksum": "010610ba3af3dbfbcf2fac93136b7066fc58eb914dce9ae999722d0cfec4d331"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00401-of-00512.json.gz": {"num_bytes": 30271141, "checksum": "29587bb4be2c367f6479705b5c3c28716affeefc857ac1f77e4c33e55264def0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00402-of-00512.json.gz": {"num_bytes": 29861236, "checksum": "8e399149c335ec599f881fada448c9b4be22326357153c74b0de627078f1d43c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00403-of-00512.json.gz": {"num_bytes": 30175831, "checksum": "0d2800836914a1e2ef4a1aaea6e70d19699fc2555582ec670223177cac05a4fa"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00404-of-00512.json.gz": {"num_bytes": 30097682, "checksum": "f9665e9199978b123feb962ce347b30cc1520626c32dfef0ca3cd8895a45e445"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00405-of-00512.json.gz": {"num_bytes": 29810961, "checksum": "8ea29cf9f7774a16a4c2aaeff1b6353de2951073676a9c411f19b0a5fb755b07"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00406-of-00512.json.gz": {"num_bytes": 29963498, "checksum": "90b10c91f6e0006576ec9b426c424e50fc1726c25ae8eb91bf91bb9001ade2e8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00407-of-00512.json.gz": {"num_bytes": 30089554, "checksum": "cfa905514e4f19c4eb82e438f5eb987731004476f026f4bebbeeafbe519ec85f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00408-of-00512.json.gz": {"num_bytes": 30148002, "checksum": "dddada59e2ef306cdf83b7c9ce3c912792237852053a4ea683224438a242c5ff"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00409-of-00512.json.gz": {"num_bytes": 29989174, "checksum": "907667ac304b6cca7100a9606e915c003fee43f1640d5b01405beb16eac4c379"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00410-of-00512.json.gz": {"num_bytes": 30519580, "checksum": "acd5cd2ecc46927046c81c9bb3459dd72a98e346ebb59c13c0db08fbb60961a0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00411-of-00512.json.gz": {"num_bytes": 30408107, "checksum": "6a9c2d42717f853cd4a76fc5275e95e2a584b7465c6059f586f6a06417048a42"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00412-of-00512.json.gz": {"num_bytes": 29699198, "checksum": "29e76bdab47496ed61a102edd3c61c20e60ab52abeb8e6068f7aa4ad1868f4fc"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00413-of-00512.json.gz": {"num_bytes": 30065457, "checksum": "b4a33941d0b994b82e3be351542cb4a832742e050ebbd71481e7ba34c8dcbc3b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00414-of-00512.json.gz": {"num_bytes": 30342960, "checksum": "4ba7edb3c77a45f0e4cb7e969053db6f44ce8c0a8ef262582512814b1161d9ad"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00415-of-00512.json.gz": {"num_bytes": 30201576, "checksum": "25cb4eb4bdf3cd1b29289a23696be8bd41c5f577294e94607bea7b91252a04fd"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00416-of-00512.json.gz": {"num_bytes": 30021170, "checksum": "60472bd2a2896bfb57baabb583fc6cdd402a1d776f6a4c9bb58ed556e67cd76f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00417-of-00512.json.gz": {"num_bytes": 30237505, "checksum": "aea8fd33c2acf1cef890549b1f88b18a2eeb37f6d4dd22b552f735811ad0b8a1"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00418-of-00512.json.gz": {"num_bytes": 29999334, "checksum": "93583d771ce7f0e1d044de2919a3ffdd48b7b7dab0cd3b6dc459200dd53d8762"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00419-of-00512.json.gz": {"num_bytes": 30194801, "checksum": "cd36e129487272742f3e60ab6512dd79b3d1ce3c22490d2e47c00c2ae595cfc6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00420-of-00512.json.gz": {"num_bytes": 29903898, "checksum": "6f18a5ffc7efe5f555b02d3a31ed43714e09e73f7462206220d70450f47cd6f6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00421-of-00512.json.gz": {"num_bytes": 30015573, "checksum": "cfacef2cffd953425eaf4d7b2b6cf5d2637bf5d58c6ed2bd0002442795c7d36c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00422-of-00512.json.gz": {"num_bytes": 29966521, "checksum": "14f646b15948cf586ec1abd4bf4bf45bf180913e4d09049fa779bc7a196e455e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00423-of-00512.json.gz": {"num_bytes": 29972805, "checksum": "ad7d4ab443c7a8122976570891a225a44ff86d2299d70706066633a6204eb0de"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00424-of-00512.json.gz": {"num_bytes": 30317886, "checksum": "37c8bf3b535ea4053aa2424c846e3449f9eb27d5ff999e1e93b6cee0aa975333"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00425-of-00512.json.gz": {"num_bytes": 30059310, "checksum": "674ca5eaf6a88f76881c8a1c48e1e0f93794785ee5ea17fb70f49228d7f39614"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00426-of-00512.json.gz": {"num_bytes": 30182498, "checksum": "988d08cd18162d9a309155d2e75cd4980f76ab4c73ef8286edae94ca4628ebcf"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00427-of-00512.json.gz": {"num_bytes": 30253874, "checksum": "aa8c08a684ea0bbfda9297aea07429172a2fa4a161268b964421796173275b35"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00428-of-00512.json.gz": {"num_bytes": 30055421, "checksum": "b1ed26e826bee7fcbc31cf1c368c9a63eeedbea1c2fd0fb07370b461a03d1a7f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00429-of-00512.json.gz": {"num_bytes": 29830674, "checksum": "3efdc67ad7a108416dae47886e542da5c2ab1cd7e1aedd25c1c5d4e0607572f6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00430-of-00512.json.gz": {"num_bytes": 29938000, "checksum": "3221ef5e4c28d44c1da4fa04689f318217991c07aff4fdee5e1091fe8e1162ac"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00431-of-00512.json.gz": {"num_bytes": 29829687, "checksum": "225f4e22df1b45a7dc9fef2f5a44da8f8ee25608cbe34195e21b49c8cd10f3ed"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00432-of-00512.json.gz": {"num_bytes": 30006209, "checksum": "9fc53637db7b16c8cf6f824adf21d4602efab715ad78eab62c4be7981a8bbc1d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00433-of-00512.json.gz": {"num_bytes": 30656456, "checksum": "6bf7b701dc18f68d0facd7cdea49a26cdcfdd7829d5346eefe555485cfa7f336"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00434-of-00512.json.gz": {"num_bytes": 30138891, "checksum": "793532f72aa41c1dd7c549e9597fe8e73796c53eb5fe410a73de418ec446d686"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00435-of-00512.json.gz": {"num_bytes": 30430276, "checksum": "0d13d345ad12999fb4e7a9675e08bb1c90980fd193ed8530e4258e07bd6ea754"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00436-of-00512.json.gz": {"num_bytes": 30173309, "checksum": "fbce5fadb4b49bf833f77337929d873b2b25c3b564f7622f3672dde7a044e5d0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00437-of-00512.json.gz": {"num_bytes": 30142240, "checksum": "76c34800a3223f5fe0f1960f3d3c9dd9ecdc2e652493d71ef245415b5027c902"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00438-of-00512.json.gz": {"num_bytes": 29979673, "checksum": "4784c3787d24b9d46ad7c835683c6506c2e55c84835391e2aca0355f032a1888"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00439-of-00512.json.gz": {"num_bytes": 30169105, "checksum": "5012d03e637769d7494bd3cef0a8dfc8b38c995e0d5780089c15d6b1495b3a8e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00440-of-00512.json.gz": {"num_bytes": 30107004, "checksum": "529beaf4ad0251e35be574b1f623571526ec91a588ebd7df43e9d1cb99445f53"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00441-of-00512.json.gz": {"num_bytes": 30324563, "checksum": "f5e5fbf5e329f5bb0e83f758b8fc76516d65c3f91ad97e328187eaea83e4b667"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00442-of-00512.json.gz": {"num_bytes": 30335681, "checksum": "b8a26ed60f87a87347886b4467aa576ec5e8c106931589a1aa821b99fdabdb54"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00443-of-00512.json.gz": {"num_bytes": 30155655, "checksum": "e27bfb813fd6aba96ada81b095a559f0b7847cd25f7f8973663b19cdc5b8985a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00444-of-00512.json.gz": {"num_bytes": 30340540, "checksum": "705dec13ba2824d45e801bc2cf3e709d6492b1ff6de2f9ddefb5a57dbdada4ca"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00445-of-00512.json.gz": {"num_bytes": 30248960, "checksum": "09a6b83910369cf269c4f095607fb2f0ac0ec7e25b501f577fe13920a8573ee0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00446-of-00512.json.gz": {"num_bytes": 30316703, "checksum": "8f88b794c08bb492f50073337a30aafac0d05819505b507ab283dba0cf17d125"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00447-of-00512.json.gz": {"num_bytes": 30184407, "checksum": "38c819df823197bea6d647c3f78bcc15024aabba814cae322c1663c45fa8382e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00448-of-00512.json.gz": {"num_bytes": 30238484, "checksum": "8c0abfb8dca37a179b01dadd2227206cbe6e5b916d0111c0b00d2edc3951c7f6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00449-of-00512.json.gz": {"num_bytes": 30143151, "checksum": "9731e9644e5615d5d5ebdbacc6efa6382df856c8763b7485c9a5838864c1332f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00450-of-00512.json.gz": {"num_bytes": 30122606, "checksum": "3b746f616f21c91277cde8e6d0d7f792ead7874de7ecdf11830a4a56db3dc799"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00451-of-00512.json.gz": {"num_bytes": 30128179, "checksum": "d6cadfc64ee39c9beb93f0bf8c169ca9d9053e0f76e1c9697841438e20dddef3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00452-of-00512.json.gz": {"num_bytes": 29979326, "checksum": "42de19ffc3ec821fbf5ff686d1b36d189ad9ee5c4553a2ff0d003ee1a754c9c8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00453-of-00512.json.gz": {"num_bytes": 30118272, "checksum": "22f9b2d3a9f089f1015f74d1ca0aca8f2a4970595326d964817177cbe6859271"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00454-of-00512.json.gz": {"num_bytes": 30018294, "checksum": "17c16895edccbb8b40fcc52cbafc0c15957020eb530e071dcce34544d5958bd1"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00455-of-00512.json.gz": {"num_bytes": 30155903, "checksum": "8b9d49837b309c3389d03dd3bbae92395bf7086134fbc69d28d9fff60a90d4a3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00456-of-00512.json.gz": {"num_bytes": 30282104, "checksum": "ab63fd2efb0cc883d303241b3488a8135a196db7edc844458cfc1483898ceb3b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00457-of-00512.json.gz": {"num_bytes": 29920723, "checksum": "dbde2eeef90144b209ef5afa6d5165ad638ae57d919926a379a10fccf6850a61"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00458-of-00512.json.gz": {"num_bytes": 30163167, "checksum": "800307106f5861e0bc246bcaae214e6dadeee849905cac184ecfe6d0b560fa68"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00459-of-00512.json.gz": {"num_bytes": 30248893, "checksum": "3e78d327a9463929f33311e18116f5d1d2ae4926f7a600378875ba854cf5ee47"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00460-of-00512.json.gz": {"num_bytes": 29840067, "checksum": "047568a5dad00b04ca1ea4aa262c7a4af9b61e87bc4ea02ffd5c6c8c049bf8a5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00461-of-00512.json.gz": {"num_bytes": 30179062, "checksum": "ed8abe7b465bc19150b831632cb7afa298d6cb4beb9b6043a35a0f8afb5f730d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00462-of-00512.json.gz": {"num_bytes": 30266398, "checksum": "d7b74f5c1c1f7bb489700adcfb7e48400c4fcca7669e2d56396d9fabb5a63b91"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00463-of-00512.json.gz": {"num_bytes": 30158800, "checksum": "224815aee29f6d04ddbc7457c84338eef9b127a767e7b50ed77283ff166d4f93"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00464-of-00512.json.gz": {"num_bytes": 30393915, "checksum": "0dd019fd2c19936ce2e6410b65872f630131c5da7543c8e66fa87547fd1a2209"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00465-of-00512.json.gz": {"num_bytes": 30148939, "checksum": "6d74dc9d74d28c2b8ba8d43ba3d594af0cb176cfa7bf738f3933be2a9c37bb85"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00466-of-00512.json.gz": {"num_bytes": 30268228, "checksum": "0e201327066f28c19b082fe35e4fb3bd76c8fd2d32236d1d6e2309489152aa66"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00467-of-00512.json.gz": {"num_bytes": 30121937, "checksum": "7352e5a9ee66dcbeed2c9e1fbe6c9355f0e5dd1b30b592a9fd5690958945e5a9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00468-of-00512.json.gz": {"num_bytes": 30004669, "checksum": "53876848336ac57c082c9d5735bc1717f69ef38688b221d5e5ab9cd9cb4ec620"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00469-of-00512.json.gz": {"num_bytes": 30049860, "checksum": "a5a720b38f106dd5d2a2b7647748b52b4531ac12294e3b0d8dbc92062639c0c3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00470-of-00512.json.gz": {"num_bytes": 29961380, "checksum": "9611764fc4f84b92e86fa6f9ea41464f6c26b07d1c51241b627a3d155e99d163"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00471-of-00512.json.gz": {"num_bytes": 30449164, "checksum": "db508df549d518c3e8b99b2f0098ea93fead1e632f53d8ae2cebff1d3476577c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00472-of-00512.json.gz": {"num_bytes": 30312620, "checksum": "1993b5e292c6c60a3373aabe896f1a57afaad73fdce0ec60e30696368f7c0afa"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00473-of-00512.json.gz": {"num_bytes": 30406764, "checksum": "913045c61fb5a145379d9fe08c91ea63092b197400c0c87bfa65af91720b563c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00474-of-00512.json.gz": {"num_bytes": 30078563, "checksum": "c495119e150b083d709ca915abd760683793361ebf3e079b04efc9b7e1900379"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00475-of-00512.json.gz": {"num_bytes": 29860761, "checksum": "50bb5f40d2e91ab136aa63063fff860529c8961f2a38500a645b10339751589e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00476-of-00512.json.gz": {"num_bytes": 30199778, "checksum": "c969cfbb7ed7716f665b336b2ed9f7b10b532c7adc6d8a347964831a39cfef0e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00477-of-00512.json.gz": {"num_bytes": 30130742, "checksum": "54c8b89102cf882eda5208544a6c5d317c1defa8d997f9450ebd576e58f91830"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00478-of-00512.json.gz": {"num_bytes": 29901444, "checksum": "f669299d794ecc0523c64ad31af8fcce5cf3f880e87fd73f4c3f434425e9b238"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00479-of-00512.json.gz": {"num_bytes": 30587214, "checksum": "25d0fbd9027deaf140650f0b82a2316c37939f199fe7633b9f643684404f2029"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00480-of-00512.json.gz": {"num_bytes": 30145237, "checksum": "68a29728290e1199ce8d1ac060365bc443ea67c24292b2b04f1b4ca44ca7238d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00481-of-00512.json.gz": {"num_bytes": 30204159, "checksum": "1605034b89e33f6794c901adac1eb200bb489f76b9bae6bc56b01e9f6ab4c254"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00482-of-00512.json.gz": {"num_bytes": 30430794, "checksum": "2dce9df095e89ea6645fb599f518612511a62b6c475808ad004c32968b19bae8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00483-of-00512.json.gz": {"num_bytes": 30102412, "checksum": "c7c626977521b0d1f5bcc02c484b3eb4f517ba71006a4802df08a0f4cfb8ea9e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00484-of-00512.json.gz": {"num_bytes": 30171871, "checksum": "519ed997f1f1f1de7864b0bddf202b25e25bed349f63593a88337262d7705968"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00485-of-00512.json.gz": {"num_bytes": 30049539, "checksum": "8d2314fd3239ba3dfa99962c1d0a38e05edf9194e1faebae88f6b19ecab8fbf7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00486-of-00512.json.gz": {"num_bytes": 29949995, "checksum": "a7521e09cbe77098c23172427bfb931dd50f0c9d58b034fd1621687849a8d379"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00487-of-00512.json.gz": {"num_bytes": 30345072, "checksum": "ebc6254a4d241afb886b8df20819301121fcb234a32a1dd4ee8ae49571081f92"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00488-of-00512.json.gz": {"num_bytes": 30300622, "checksum": "509bba28ddf770d38554a2e846f2ce0d2af59e3662a6d6ec4dddb75fb509f8d5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00489-of-00512.json.gz": {"num_bytes": 29949909, "checksum": "996e61f8e674b0a016a568630ee13a7473f99a919437c225a4198d232861e628"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00490-of-00512.json.gz": {"num_bytes": 29995429, "checksum": "9730024ad352eb12f74ac446ed32b9c57898658954be5dd639184fc5264527cb"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00491-of-00512.json.gz": {"num_bytes": 30293919, "checksum": "65b2a7de3284e892441b0fe8e850d89de842355d78fa9944358b1ee5912a948f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00492-of-00512.json.gz": {"num_bytes": 30115831, "checksum": "26b535c3175bb86ef721593f81d9cf006d4c3749f156c63ccd2a2c04e1201236"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00493-of-00512.json.gz": {"num_bytes": 30187809, "checksum": "a0918223c5523da20bd8230de1985b0a3cbb1e239af3d62a83d720a3a528c567"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00494-of-00512.json.gz": {"num_bytes": 30149878, "checksum": "6e9a5e329f834e41b4a8a9a6809df3243e5bffc580327912288ad7f790b43ab7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00495-of-00512.json.gz": {"num_bytes": 29711944, "checksum": "3b9ba9d667e1241692ff9a654a68e98e8e94e32244a9419b2542137b63fb4705"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00496-of-00512.json.gz": {"num_bytes": 30114815, "checksum": "24b78cc36bb0abc67c998320e7029b6e7bbbee267a367eb538f23956c13f27a9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00497-of-00512.json.gz": {"num_bytes": 30048480, "checksum": "29c3606acf298498fc3498bd769544e2879afbd0d5c46cee298cb25058694aac"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00498-of-00512.json.gz": {"num_bytes": 29934973, "checksum": "8afaffea92dfad745be8aa8cd3de0ee97cbcc26fbad6c71d56683aef6a27055f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00499-of-00512.json.gz": {"num_bytes": 29796509, "checksum": "9cbbd8f6d8fe92207c4cb2f0422284726deca1bde7f30cb01cce7fcd4665b380"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00500-of-00512.json.gz": {"num_bytes": 30221736, "checksum": "902904aa9fadaecbe698402a27b4e68b00813e67b79f84d4c696cd9c72f08f55"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00501-of-00512.json.gz": {"num_bytes": 30108320, "checksum": "76e848f8dbc082158fc5d3a2f7c10cd6e03585667c00efc639f2c6f47d44aeb2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00502-of-00512.json.gz": {"num_bytes": 30381907, "checksum": "885bbc9788235abf33728737f72f267e60d1f5d4a77493cae76f161651d89579"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00503-of-00512.json.gz": {"num_bytes": 29983805, "checksum": "5134934392b13e3f84dd32dcb1c59f4d5416d6dfd925bf896f3eb61881d82136"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00504-of-00512.json.gz": {"num_bytes": 30041413, "checksum": "4978245a7f545d676bad6edfdfe60ffdad94de47af0fb10649fa39e9b068939e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00505-of-00512.json.gz": {"num_bytes": 30021620, "checksum": "64933c28ea3f608326f1c6ef56170886767f1ab4f9ecbc4bf3263c7043901fce"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00506-of-00512.json.gz": {"num_bytes": 30260343, "checksum": "84667dbe68ecf1f9bbdaba0e73eca6fe0444f6594a1e9a4b46e9812ae7bce7d0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00507-of-00512.json.gz": {"num_bytes": 30173739, "checksum": "dd6d44e4f344f3ab1cd61bacced7b5f1429cf6823fc9282452a539012bda028a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00508-of-00512.json.gz": {"num_bytes": 29903443, "checksum": "4afc46096ac2697867c3a75896c5ceb36617c4c21a749dded58a1ea4565e41df"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00509-of-00512.json.gz": {"num_bytes": 29862664, "checksum": "74a720dc16b389e8122d61aa94bc12a5bc4253ca6f39679781c938e2eb556878"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00510-of-00512.json.gz": {"num_bytes": 29744368, "checksum": "6a302049e7a1668c5fb2e4b5afca518fa53ba1a9dc717015ecb5768e85ec4139"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00511-of-00512.json.gz": {"num_bytes": 29896714, "checksum": "48b89e909c0e33fd59c9623f8517cdfa90fa35a4641f999c6f68e1cc9f2a309f"}}, "download_size": 15419740744, "post_processing_size": null, "dataset_size": 76331315892, "size_in_bytes": 91751056636}} \ No newline at end of file diff --git a/datasets/c4/dummy/en.noblocklist/0.0.0/dummy_data.zip b/datasets/c4/dummy/en.noblocklist/0.0.0/dummy_data.zip new file mode 100644 index 0000000000000000000000000000000000000000..7951eb50cff74d8d79eef2f8967a9b1ee5c6ad28 GIT binary patch literal 5689 zcmeI0cTkgS+QvgiiqwFJ^e%=TDMIKSq=t@!BAw6@KmqAZdXpv~T@(0q0scP-VRHfi zlz$fDk<&5LK{&hJ{iaBYR^xav3%j`fMRCi>)R7WO39&JHKcM*m1R7$S6)2E;ScO#O zb|SNCbUKOXq&n3I5NH&v!m1R!YvVzEDtl`6I`t_(={z)IuRSQ@H68^&yFwm6S%f72 zTTaMvTO#B*cOf&au{y-ULPeW--^seQ{wT|RWv>3Ww8>kQ0RM_ABRobd07kYQMjv5& ztv90!)nsTN10xQ>8cYTxw-O6vl=25)U}76sJ<+f_S@2*%-;yxRYzFm-_S~DYS=z!} zJu`$PRsMeKfw}545G=TS!#&0=>rCG;GN+o8`r&v|6nT z$gnb(#>F6FjV9rWuEQQ`%Ea{rJe@Sr`{(q%0@k0By|T;hhS@1Uzbp0-ZqGGns1LSw zt1}aZa?@507uu8b+cV0sF7SaeQ{PRE>VhV~!fMc7isdFMVs&e^n?Z(_8jthE(PX4BCgf-9h~(LkZ+*7s50?n~g}WSX8|&0g?~ zqi1n;|G@N_`ya3|(jjxphFDLX(PJjo8HW8fEm$@$BT z%aL{DkrmkbmTY>K#N!Jdj-59hQ4;S0n%{+;i-aq>Vk>H)61@meu9zIVHy~lW^S#Fe zciJa*iJPLF7r;IYFBb8Rx#nIo>?odHa-MfOBm9WZ7%r1WO4SpBlu6cP89hCxcC&+s z2=|7(!Ft2~V2c8GwYSjaGrahLR^|FMroM_icciLbvcBG!;VjaXcuU(-U8?Q7xKrzmm4YdLh_sB1*OhlTpuy|pkAM$cgQ~dHQeH;wL}qjt zx9h?p)~Fpi$RbuMgeaOVe7z#&;*UcViVbs5Zp@!8TrO72WjqbB6`?AGpU$u>eeO9X zXd?b7K;zeCbtW+rX!hQdeYQX;&9PUji(tl|HVwgI5O(;^|CTGY0)JQVOu(Q82Yp+R zNU&mRRBTQl$50zrJ(a=lnFaULpHq-ZcqIu4)z%18Dc^_Hoy&;t|x`FaY zK=!9FS4@l>k09J%!e#vf9@$2M<)5)a^+BJ0JKAO~Qq~vpC!1WDZT3Fej>*PVFAvhW zn#47>d$8l;FzuN)qaViI%s;SBS~<31`p6h)`Dk>!PF>G9d9$ysM1cRa>siOEI9z2v zr4Q>q&PuDRt#6}<*Hwtt!L$jkh_|$mI#+j%QfJ#DliVe{Jc?3;iddYAF47~UhF!RY zEJb6T7vfw}pxr!?q@vzZ=BpGfSWKrq+oog3d=FKIwcKN`|5R$=qXGhYlZlD|FQwsj zgAvmxVuRrRX26GNlA1Lw!Y|s;>Rq^!{#-Spti;}q&PSfNd4&Jf=F2@}^;Yg$>0y@p zIk#N6rADsviekuni*;`tO(pCoJ22pz$r9>UaW|Kfwmvbp(e75h$~tVYsB6mwCu53% z&p=Y;$eBCM5}uxo*_oDifZSHUaypeJQcAylQMq4WHF<8Iz-n&-&j_Sr%}g0+azI?u z9;z=sVM-%db~!V!8|Acr?q0)+L$1RI#W7BLm3t??{?eYc6K0tFK=Q((lwZj3GDKxw zKQJP4(lzMR*AF2BF4>JBQfu;mX~6PCg`Qk6f}|{HoW%$qp5J)Xk#$rs1d9*Q?6I(u zVLsMEu4&bJ%e%hSReS6sH(wh1aGZ5X{ z_uas0Sy|!`3DGa!J0Cr>TO5U0hjm?bi?4l+e<);nJxEVpoM>k?Xu!ZW4T{mzLqJh$ zxMx_BRDFK*cF9&iG#yeu;qOkd&#q90pIS#_^7JuJ$^l37QZ~JMR~`ya7|UXdy}a69 z+1KFS{>UQJdG0lJl&lZC&Zx~U>3Q|;rK-#*R0i-&I{vod^}tu$g}2`xq?&xyK>dL#Y=3lI7~|s_?&P0-va~fRx{KiuJ4xvEcid;`FV=Z z5y59fPkp2-UNdsdbc||XX@sN*NO<|LyM<ZYPp7Y$&Af59_5; zf(fZ&iM7)OQzm>b?a<22R5!CS?XpO;-s$_;6mjoT(ZRyxUYLYah}AHdJ3)TV0p4jc zKVukOlQU7fqRP*(2Mc7J2pqR)>bI^e(``=75zl3eP7XvIY>TH*In~?1SVPqvr3|^* zqBHv@aLu{Rq-bSw-@C5O+PY{yEBw^t*}_nvMz3(CGnl2}nU1&ra3D3(I5F#kJf656 z(IwnA8Q7@Er08O82-n)!axyGgjO2*(3P*>DVYc%vJ|dv3Sr|M7n2w53>zcD1lk0x` zn}YSt^w@Od36X}GGEW5~>E|q&?ad>y zRpjQ?h>XLlI~8@_kVfQq(0#LOZ7J00|&11QUNwdHcQLGBe@HE?H;M=rG&kNv-GncAu@K+2}_=yb%#!r_);vUYLUOT)3)kKvD{ zngk80XS=iceIr%QIK>KAR}szPAN%!F6Adgx@nagC1%L(1z>(?LL1e9JB4s8|gSMKe=hdmD=gWRZ?-)rV%9GsD)1Fu~_gO~$<) z`=aW|Fh8}dGm(KT8htC9N!qbFQ^a6XMV&P#BGYOANib&#vHluK6Lp{qCk182j-%V{ z9w%dV0}hk%0qu4;imFNC3Fzb3Ytc43Hr{DCN#VR6&kVY))_Je8+^0X**0gy2sAXl` z=Q-p7_N@}^mIp$>e6O5`(~bRydmpCtLwDDAj}bjh=Xi;4#0fG8|3RhI~r`xCu9%pL8}amo&jt3MEiUWxpKum*I*`h~Dx2>XSwUkLk!uwMxKA0rF{lM?Ii z=YYSD1OZ#p7potV;=i8?{zLftT=2(SdNCLLUiksae-{2Zfd0*tP*e5KJN%d{FY@j8 z$`4pX=i&b{?f$sgMO6Lq7;q6)zgK=h2>M{~!|(KS)clWv>%ZFf;*jyZ@&jav|GMvg ZedN$o#X)}=000O5qQe9LaKHUe{twuy+iL&- literal 0 HcmV?d00001 diff --git a/datasets/c4/dummy/en.noclean/0.0.0/dummy_data.zip b/datasets/c4/dummy/en.noclean/0.0.0/dummy_data.zip new file mode 100644 index 0000000000000000000000000000000000000000..99b4db9781c42701e23331eab2fc8ba14fa1c777 GIT binary patch literal 5689 zcmeI0XH-*L8iqqhiqwFJ6zPbeM~V=72dM!<_3oXs&U&Byei|xR*pz_tN_Lsi`hN1)7a@QV zV2N~eyl-M@hA`uS>JS6)Amvl0QfJ5ci1Z``U|{cK007?wG`LF8EE*AF8s$8J{u{K_j0@EEZG7+JO$-Gpyy zycnIS#zMLo7;y-eO{GDyi!ne(Nk0GvCbquiQ+3OuS$F2MOOor8Yk}P&o%hGB=hrcp zPGFG4ioY)1F_*l1g9H|Cx<$KYeoi&1jOBsEGSD0m;BZ=}y6s62i%9w@5NwP$UL)@Z zfIoJ_nwKD8)7LJajnSWL_!|s_F>bwZE0H%9%dA4rh5)TyAmK4I_3N@sCb_Z6&6X?t z(kx6RvC)VagE6>*%YeJ85^-HVcN8Vkl8@#G!biZc~4! z`|$1j&{)LR4{oF69H_NCBZFln&GjHM>()2Hxcu^~^%T0U-J5#0UjydGQgwZ+cY-Dz zd=k<@ng;Z%>j}8HdqMZy*XG7~L6u`l)96RWoS;^=0tqvkl{{OL!JHs-mVuC28&Js1 z)d{R<_i>kl%VWBow);e(oN5!}Qc+_oG$m0mfzc#*UN4_QjcS9s%2*^oE-n?#4NbvRRgfsP=hVFU zW|dxB$xcY`C1-wiRraeV$xdHlc(Ri$8RqmyQ%@KEy4(`hnTIo4vb3WH)hZIUEd zr)hviUZIy?KPV`o>&FRvDou4aXxABoyA@iCJ37OBhzV~=-U52#Nwhj10>Ao6%v^3* zh^QrxD96^bVAZuC9+`D_XuIWr7XRSi_#yOEI84C>TR{_@;7NdX!DQdQ2?^zy={h91 z`(|{T7!~O>3-)GsIfr-1IsKMlOX1{_(~RQ@;U+#~m~<*BRcA0#I!S|h==hY{)fOTw z)D`>=>mA#}bqd_2t^(&T@S=yB6)O{%ddhNK5h}V#db-07Q=f-QX_Ag|x>ua5o5Yp+ zl(5wYGD#QXENn`2s5b85j;}OS2qgO=Qq$AlR@`NW2Ca}k20nBNtmITpeigYDk=|=4E|v*t7Z{k1cDp4mLZnKPT1s7cAFYwPn|@Oo~OUz@bd&$e%23be2` zH8Z|^+LHC`FdAKD~4B%9~%NK9uJMws_7agt##KH^Yb0IKW}{< zi>u_T_-V!4NpWeZ`F$kuiZam(m^R)8@tzh^>*A(f;$%~3lrwLeOHqPQ7L8TbLAnQ5 zvk5hkC9ALSK%9#6wHikgmDQR`eH5bvis-baTC{DM?xRbw7CP*qp&wK|lpvJB|Y>DX|> z$*xDkCm|`a!XL9R>RI2=n7D5c)Ntk})B96Pm(XR$Marw7onWF+^Z z>=D`cWKAU5i?Y-H)(cG(l>Zu z0iryk7Z4sX<`Q`9*#t`s%1Cgh4g`SY{|2|D#m z%egs+2d?1M%uF$exX4$ptxb=tCI>;50UZ~eqHEvc9tj%X2-KAmBidRD?A5nPg<^De z5>V8@c3{PcRi_8<=WX~!(jaxCer^=IZ1Sb}DYZ04&z^86@3A+|XVI&*=c4h1u*}!l z%Bt*?eDv?{4$fUa&AFzAmhooO9}+to}<@8LPmXUL^bx0jcJvfjTy$qGh}o?c;?X0Li>5Uu!;%$P}8wVrB!BY~uTRX%NZ zKsSXFOh^?&td%B^JnD04i&l2Bs*&aTHnVv1-R@0P`29P05#GuA@h?Q zo|rAsCEONi(;?w8k-3^+&gJ2SB-12Ok^_z_?5#$yET`MNL_isnPHAl=%4@wK4akwe2PW5AUM}+r_MSQc!VP8_R220ga52Sj*cW4t|HEzm6?ApU-zj8@>gjLOP*2SXxD#$(PbO*cOa0^ix+gR-Rff(#3 z@F$We0T}gEM;4z?gz^c8Xu;AFqET$KM=vEo-&_Pgy55N&n7;rVoQUZ|)~FuHV;P@YTHzPYNR=VHHU`^ynt#j z?rhl=Rz-yRs%D-D_h!=QSz3?L4o@2+`cUPyRvd^7$K9tv9L2_-y~J^MSKCiFtKSGErkov2g1gm+>D>4bkGtfX4}k^C8? z&O!C>5q9Gzg#8O|c!l_G3I9Yd!83XZ|IFLp^!iP&-}L%Tuiy0gO|Snay)ZB-vHpD@ z@UNC2U|s6`>_Srf?_I$^g@5z~FXqzozTl6_^H=)2@UH{tFS>*pDu18hVy-;Tw?8V+ zf9@;~|Bq?+;$-Jh_2LfTJgWYvJpbUcJ;8 z(wlUUBIpf%$9p_SzkBD-cmMRw?5wqC_B?APv*-D(=haZb!lndV6x3x->)YhdFG2t# zz!K@`c;D303}MCt)gcDpwUy1laLQ+37bDV>5P*Swhyeh66VUi3gb%<6cslcs5|fM0o~As!A)%)2wAZ%M9CZv^&=bl;z}Ufjf7 zIWvGHR{VMEj=AF9A0)7J(=FOH^HZv6Wh@UQmVxGk0Eg2$)$KrnSVYoKfnaO0=^FVU z0Q{lXpk)ODhP`(AWPf+#NJg`{(pM{8pcmJhMvgh1x2;xF`AuZpS%bpa-^c ztu+;ba?w@{71)vV*)htp%=3aWQr=IF=zzw-LaNXnim0eKySnU$QzMCrV-Cerb=&%T zy~l4BMGd5gR(%cLpvuY37!Nf7fklun~+eRxt?Q! zyKUpU#Ep?o^I&g=mkW5uoU?Bjb`;JoIn6nq5pLr%hDoQAQgsI-rIR$6M^4YFU2P%4 zLOsE6vEH&h+@!!==_zpj3@>`9S+O>Ssi!Q*6``V=q^CRTF!O1olqTsUr+3Y{x>;Ol zKnYuYD3f$K&cdcdhidB{?&MlSg+Q_|A~ikzO~qYyXwVw@W8g!Vz)DWlZhn{#LLmy1+$7*B(3gsBSPr_;=fpSzC< z8i}|0X?!~^&%~z#Oh0(A&EzYlI`n9E5={HirXra2Ll58k-FBgt=j#lb_8%~3r*91u z4pK;ojL8mQA8chwOX(0$?M)Ew$U76uY^UCVip5axfE!oCPfHqP>pe;pce|zK(kdq> zkBQSLTaNDUJ2gl+7m^IMKS=hcwZK#)vn-EJd_SN6 z@f8oB^n))^uhRxR;`O;Nd&9uwy=uB1k=B+Le9|)sBIs^?>Q_v0V;-!4L*KG5zKHR! zzE~P6c=#n|lwHC&Xlq9M@2{QN6K(ShXlFJxRg;oY*VgCx!RxtAe{ItEXzTxnNn5~x z7S=Fx*p8a2?hc7=n1&x_>=i6_Qd*31TGGH{pkyyVdycWy4@)>C2wN%@$ZN8Cu_HWu z!mw6hFnSLc`}k{z(m$|63Ksyl@ppDu2!ar<6fc3N5e~STpbj_TmZjqiho4SB;D_`G4xyK{> zl9|fK$Bc#%Zm-}ne*TYbBEWLbS)h8LPk$V3u@oxl3Hp&u%+EA=9c@Kt;i{DdYF|y{ z9Nj(GakiiG$eq>;9{dFv^lCR>& zHE$=ym6euvk;H4tL~CH$co)PwT1c&nn|g_pO`&nlqHQik2|`&kR#^w>9$d{P)J&GF zzQzM_D$dtx8c$SKYcBOsj1nlK)0%13wq?4HD#cprw$pni*}pB1fZn=JMSz!Ff2ZE? z`Uqm3;K7Ff$0(BORZYS#TF|OpxT4-{6{57*&X&$wj;Cpu@Aby3JtMUit{SN!<_Fog zow+23Z}5m<$a#r&tshOs?Q!i0diSzoKi_iV+%BHQ&KRB^K*y4i+}~)AxTZB& zS9Eecm0-#FOy72d!|sJ!H46^8HZK&%DDid9-MG3-dsdE^p>q96^9z!`!9zq+=@=izfiMQ-rNywuymPO@PMLOi=m+N(4`6gRgm7S80 z{{8*oh3n@z*VIrl-fY?<*1M$VRlAoeGa^yxz%!}1I|erbUUL=Pd3TUv3QBg5=oXjuo>9^(@k_ishjoWD2H+vD_WK5>H3dRb&O%zQJ!qVjW zdRL;!Wn6PuH5fQQ;5}o`=&Zs%0m^LoNyqSD^rIP5hKaNq({V zw4sQTCv*p__bvwy<2=P=1tZ7LuQ1HASG_WfR{TI_!lbNPPj$GJKvKUhpSC}wn?eaD zq>3TdN)t#P_qnt~D?44)#BzO?S-j;SL%Axw{FRO%=KAN_UVcLX)JUU*%#U(-Vzxw= za9gEeBf=9R3pK%&YMT zR=3h((vZ{a7zZX35Uf^3a{U@nFYGpIv4*%_DIWEt!sy1^qK8S`<&31CGo`mSj>uM! z8&|{A53lZ&*Lp!3kYj-lOs}=RT;&z)KX(FzC3x+$(|`7-EYs1F&E5jJm3NNSjYB*P zSE{8RNcDs7&?dgfhc8TDsq~uHaMucEPB447-K2JS+hxnB<}M_klvzFyZR1? z1XH&kub3m(q&W+*Z*MUFg-g;StZIR?E*3RVLGD4PJKO_@TZqco#$qoH#b7^yKap${ zFrc34%Hs2hP(I@jEm&DWG>L8Z>7^v-n~UH_*E{h8^Ou0bQ!xX`8kGc&_&_=PTdYFz zOLDmy>7F4krCAT7MuqCqBGpkb>g)=pCO&r7=HbXfZJWxEO*Cf)E#aX8FQ6KXdpmZ8 zRS}`Ss+niP{h2g+mev!rqq8Q6fyVM$D-J}4_<}#eTRD=r}RR0*LIH)-HqpX32(&+(h2`XuaauMiS4HX>pj{yL1&>uQX008&fd-7lI(A(7j literal 0 HcmV?d00001 diff --git a/datasets/c4/dummy/realnewslike/0.0.0/dummy_data.zip b/datasets/c4/dummy/realnewslike/0.0.0/dummy_data.zip new file mode 100644 index 0000000000000000000000000000000000000000..935717a27637852129041d67ea8598f2e9c0c0fd GIT binary patch literal 5689 zcmeI0cTiMY5{Cx{7$is>5Ro7mamXV<7;*;5VF(f>Go%?n0m(^nk|a5a0*d5}B8+4t zN_>)&WRM`}g8Qt8&)wSE+WphMb?-T+>Q?tTw{G>XzgANMVvz&RE#G-YiZtcY)*=Lebjqeo;Ai*wi1NS(U|{WI007?|sC{>Y3%~_PI{oEH0tW!N z@v|dyehAXV)CR%HeQpp(O9(eNl!uqo*3}WgY4zZHoQBdV6V;OK|k-IPUY-?~nL2TH2DQ>TA@2)T;)V9oDSBvI9}I{sG; z?aFP0yzX=*vb5ONhQ>>Vt8tL$_1dc)1C?fuYKZ~H2idosIK&5Ua0y|^cnWu{9*oCr zDcI5B8cX5pR&X@FByP?!wbJNNxXLu3H>YLIjv%=ng_wjTOOrCR8OJ?68MZNc*$Q!4 z`o`u^5>GDi{zdt2zQx$7Z5)%WAtKG6hABO%x4{m1O{2fI=;(S1-h$JKp3M-O?Q_>E zCTvnoZf$IXgx5KDV{0$%SUO;a$n+-8&WZa34J^PEXLS9;!pEEgj=g=5lF;JqFaqTU z-&cB!S&Fozd|^bT0V9n1xQM*^gVv0L{C<;IKebLX8%c&kb=0zYwWo~pdoATBUeYrq z!H-6m<`rKRX_1y)uG5jAWK@S;@gsefx*$fQnqe_FXaB$jnv#(r0uvSb>bbS)p4nv2 z&orRrtW|XFTkIo#qZ!&%_RM1jhESf`B z+r+1p+m|ZRBhYE!6N%V6@EiWGISTH)-%B=zB)RG}utVPwl{`gjW`dyV<5xn96xwrC zIz)=CfviR)NL;peJs-jTHcM$LVK;VP0?c^6fPCCVrU?*}LdRYbWpC-(CtHV9fvQ1C zyrLeyD=xtq&>)@IwZ>i3=l+g{B@nZF95jfXg~<#> zjhjc7ZObp zg^3Q>uCTTm!ZRIja}$82j6)DX;8b*!a{ILTuyn_hKV&U$rADWsCRs7|jK*NV7I{*= zYGF^THbB4Y!5&6FJN1iN9n>Zmb=UETPt}hNbOa-72f`gw>-)0v;G& zYk9HE&EI?K2ndb$+-jx$;z#~cOG7$)1L9iNK2kdhbJt(0l6WA|3%x^~@H`(eH+iYj z3U^UYk%thzSAALdbTuK`LW;e5odQMJ;~p=$L7{T>JvI@hPA{mKE!U_i6S->#pZ&@q z?jBk>$6gzQ?kgvCr_mYgLLkhArEFrb<_Ds&o*vo{iC}LAm9B-=81?Y9 z5wfqLtj3ZJneMQg706ahsJl$mKHSx?POb^pGE%=aKzrqP}N; z=hK94@b=2~A+odK6cqnX1TPIA08mo`;g(d1K9W7tr*n<^OTDr#$RHLQ06_k;dT~l? z8fzjQUG9C?DdjVLVtp}Xaz6e|57+gL?8&vsVOIJdd(}QcApOi!y!qmfDo{!s4kQ-! z4o6{a6vwK5y!Ct)z;eEOR&JEXQpXl=lb`Ys&uEA3ya@<<3nJrTk9%Q&KPS^gCGIqNh;9FLq526PGFfwg0y7Avsd(t~m zj0Jbo(PQH+n@B>W7o)-S;=TY3Oe{T%ELDr6SvSVBCDHZCwSaD+&imt5^Xr&PCvaFo z`JYQS%q6ehK)!{Wu2C)-pHqx0Vz^*2bW}%p*z8s*u6tsHLgK!1cpKx5*GT&T(2w2l z<|P=^BlPEL-ggPYd%}+pw(NayU8to?jj@0> z2X*;Cfh|#wExk0;EH@-Q`NQ~-7GxAEpsd|R78x09TbuoGVkkj=#J+fg$0dR;_P>aCl``>&SFmx;J%gzWUFNrRexn?F3HRd&j3i z)b(js*W+<;_5$y@t<8;dLn_7;rqPd#*deVf1!AUDD|t3VgE@g_OasBQ){x+ts}sN| zw{ho#%VRp7Hv0r2>?#xE5|LvoR3(vczR^TPUN4VawQ{|x(pUsX?ulQlN2Q6j$7um1 zmbF@Js;)41ZSfHruZRhpv}c7hh^8LTGGpb}9PWvoE-n?$4N1mSmJ=(rV^_cVW|dY` z!B#-`1$%yWW%jElNseElxv~>2=xIh(^HEC?J`pj7*GZ3iO%qWr&G~gC+Ao;N;{-@~ z=SQjw_&=Apg!Dx7f%4IoQj1f?-jd`+Q?79xL+**I)S>djccsGYa9-HjT59+0S)Ii0 zcFv|tUo+uLw+JXZGBq#@?2nGF18u0;7rH9*jg>WKcVtfm64XH;&pL0cqz(*w9t25- zd{Sr5M_IzB`>6vx_P@Xz1>%d_A_q%XqY`H$K@GCc(x}pz+18>n3jVe2 zo*|cCKPV`o>BkPplBBpBxa)+$*{WTGGdja~h>2)P+5&rl#9AE=!C!sFW-iw+gx8RU zmtpCeGwYZWj?B8*x81Twi+=EH{19>~7%JzCC8v&#_rOCtW3q1FgoSX;bRFW|eKWdE z*bw133-zLVF$X$ipMFcXC3kYkamL{Ue-oEJR5FE_qB963nW)A%bbLzbVgnNt=n8rV ze8=)|oeXEGtH9|CqUfP|`N{;QuA&S_xROqyuFkOi)aRj6s>Gw5?iHu1CQ*ex1uWHp z4C2LDbL$c2y^7chPir-Jqh%7d zOlj9j61G^zPu6JW?GY{=dl)2J1kX9TIdd|5xkx#O{y4~5kfH!_Jjpo!rSlN4fpC+T z%BS7pM0C>M_@g_^RK9$QeV2MW-lQ*e3X)MTWdDQjZD&eZp7y{=zdkco+Li#pK)K|I z=xl%1{uZXx-Xv1>YaY?;&oqMVLcBiCFYQ^~YAz>re|_r1THiN*uZpHisHM3Xm-s}CKzq9`@Q zY)alChl#~dR!Msh12-gB&~mzpwI8WC24aLu(_3q znaP%lvd$KfPN94rwL|1a5qBtkIAC~6_0{wKLUrUF7!*_p=aIqpduS|Yeo?kWr;D4=CE(SX< pGA@3`^CIJi<@rew{&bxGN6De4gndTH008#cMS}?d;C%m2{sEGI+3f%T literal 0 HcmV?d00001 diff --git a/tests/test_dataset_common.py b/tests/test_dataset_common.py index 49d30c49a49..f319a90ed31 100644 --- a/tests/test_dataset_common.py +++ b/tests/test_dataset_common.py @@ -17,6 +17,7 @@ import os import tempfile import warnings +from contextlib import contextmanager from functools import wraps from multiprocessing import Pool from typing import List, Optional @@ -75,6 +76,26 @@ def wrapper(self, dataset_name): return test_case +@contextmanager +def prepare_only_one_shard(dataset_builder: DatasetBuilder): + old_split_generators = dataset_builder._split_generators + try: + + def one_shard_split_generators(*args, **kwargs): + split_generators = old_split_generators(*args, **kwargs) + # if there are many shards, only keep the first one + for split_generator in split_generators: + split_generator.gen_kwargs = { + k: v[:1] if isinstance(v, list) else v for k, v in split_generator.gen_kwargs.items() + } + return split_generators + + dataset_builder._split_generators = one_shard_split_generators + yield + finally: + dataset_builder._split_generators = old_split_generators + + def get_packaged_dataset_dummy_data_files(dataset_name, path_to_dummy_data): extensions = {"text": "txt", "json": "json", "pandas": "pkl", "csv": "csv", "parquet": "parquet"} return { @@ -157,12 +178,13 @@ def check_if_url_is_valid(url): dataset_builder.info.dataset_size = one_mega_byte # generate examples from dummy data - dataset_builder.download_and_prepare( - dl_manager=mock_dl_manager, - download_mode=GenerateMode.FORCE_REDOWNLOAD, - ignore_verifications=True, - try_from_hf_gcs=False, - ) + with prepare_only_one_shard(dataset_builder): + dataset_builder.download_and_prepare( + dl_manager=mock_dl_manager, + download_mode=GenerateMode.FORCE_REDOWNLOAD, + ignore_verifications=True, + try_from_hf_gcs=False, + ) # get dataset dataset = dataset_builder.as_dataset(ignore_verifications=True) From 003f411a00b66b3e70905a56b64fcd391ed2a1ee Mon Sep 17 00:00:00 2001 From: Quentin Lhoest Date: Thu, 1 Jul 2021 14:21:57 +0200 Subject: [PATCH 04/19] typo --- datasets/c4/README.md | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/datasets/c4/README.md b/datasets/c4/README.md index 4b24881da75..ee1ee99f98f 100644 --- a/datasets/c4/README.md +++ b/datasets/c4/README.md @@ -138,4 +138,4 @@ A colossal, cleaned version of Common Crawl's web crawl corpus. Based on Common ### Contributions -Thanks to [@dirkgr](https://github.com/dirkgr)[@lhoestq](https://github.com/lhoestq) for adding this dataset. +Thanks to [@dirkgr](https://github.com/dirkgr) and [@lhoestq](https://github.com/lhoestq) for adding this dataset. From 91c7147579efb87e357286d7654ee0b55b0d0774 Mon Sep 17 00:00:00 2001 From: Quentin Lhoest Date: Thu, 1 Jul 2021 14:26:00 +0200 Subject: [PATCH 05/19] fix tests --- tests/test_dataset_common.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/tests/test_dataset_common.py b/tests/test_dataset_common.py index f319a90ed31..cf9222803ef 100644 --- a/tests/test_dataset_common.py +++ b/tests/test_dataset_common.py @@ -86,7 +86,7 @@ def one_shard_split_generators(*args, **kwargs): # if there are many shards, only keep the first one for split_generator in split_generators: split_generator.gen_kwargs = { - k: v[:1] if isinstance(v, list) else v for k, v in split_generator.gen_kwargs.items() + k: v[:1] if v and isinstance(v, list) and isinstance(v[0], str) and "000-of-" in v[0] else v for k, v in split_generator.gen_kwargs.items() } return split_generators From e9d55dca01dbede6c4a34906a1f80abf115473f7 Mon Sep 17 00:00:00 2001 From: Quentin Lhoest Date: Thu, 1 Jul 2021 14:46:07 +0200 Subject: [PATCH 06/19] readme --- datasets/c4/README.md | 77 ++++++++++++++++++++++++++++++++++++------- 1 file changed, 65 insertions(+), 12 deletions(-) diff --git a/datasets/c4/README.md b/datasets/c4/README.md index ee1ee99f98f..e389e86c5f6 100644 --- a/datasets/c4/README.md +++ b/datasets/c4/README.md @@ -1,4 +1,30 @@ --- +pretty_name: C4 +annotations_creators: +- no-annotation +language_creators: +- found +languages: +- en +licenses: +- odc-by-1.0 +multilinguality: +- multilingual +size_categories: + en: + - 100M Date: Thu, 1 Jul 2021 14:47:57 +0200 Subject: [PATCH 07/19] style --- tests/test_dataset_common.py | 3 ++- 1 file changed, 2 insertions(+), 1 deletion(-) diff --git a/tests/test_dataset_common.py b/tests/test_dataset_common.py index cf9222803ef..359ea706651 100644 --- a/tests/test_dataset_common.py +++ b/tests/test_dataset_common.py @@ -86,7 +86,8 @@ def one_shard_split_generators(*args, **kwargs): # if there are many shards, only keep the first one for split_generator in split_generators: split_generator.gen_kwargs = { - k: v[:1] if v and isinstance(v, list) and isinstance(v[0], str) and "000-of-" in v[0] else v for k, v in split_generator.gen_kwargs.items() + k: v[:1] if v and isinstance(v, list) and isinstance(v[0], str) and "000-of-" in v[0] else v + for k, v in split_generator.gen_kwargs.items() } return split_generators From 0b9746cab82f1dbb6338268f22840808c8f7a6a3 Mon Sep 17 00:00:00 2001 From: Quentin Lhoest Date: Thu, 1 Jul 2021 15:00:47 +0200 Subject: [PATCH 08/19] infos --- datasets/c4/dataset_infos.json | 10469 +++++++++++++++++++++++++++++++ 1 file changed, 10469 insertions(+) create mode 100644 datasets/c4/dataset_infos.json diff --git a/datasets/c4/dataset_infos.json b/datasets/c4/dataset_infos.json new file mode 100644 index 00000000000..86514075daa --- /dev/null +++ b/datasets/c4/dataset_infos.json @@ -0,0 +1,10469 @@ +{ + "en": { + "description": "A colossal, cleaned version of Common Crawl's web crawl corpus.\n\nBased on Common Crawl dataset: \"https://commoncrawl.org\".\n\nThis is the processed version of Google's C4 dataset by AllenAI.\n\n", + "citation": "\n@article{2019t5,\n author = {Colin Raffel and Noam Shazeer and Adam Roberts and Katherine Lee and Sharan Narang and Michael Matena and Yanqi Zhou and Wei Li and Peter J. Liu},\n title = {Exploring the Limits of Transfer Learning with a Unified Text-to-Text Transformer},\n journal = {arXiv e-prints},\n year = {2019},\n archivePrefix = {arXiv},\n eprint = {1910.10683},\n}\n", + "homepage": "https://github.com/allenai/allennlp/discussions/5056", + "license": "", + "features": { + "text": { + "dtype": "string", + "id": null, + "_type": "Value" + }, + "timestamp": { + "dtype": "string", + "id": null, + "_type": "Value" + }, + "url": { + "dtype": "string", + "id": null, + "_type": "Value" + } + }, + "post_processed": null, + "supervised_keys": null, + "task_templates": null, + "builder_name": "c4", + "config_name": "en", + "version": { + "version_str": "0.0.0", + "description": null, + "major": 0, + "minor": 0, + "patch": 0 + }, + "splits": { + "train": { + "name": "train", + "num_bytes": 828589180707, + "num_examples": 364868892, + "dataset_name": "c4" + }, + "validation": { + "name": "validation", + "num_bytes": 825767266, + "num_examples": 364608, + "dataset_name": "c4" + } + }, + "download_checksums": { + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00000-of-01024.json.gz": { + "num_bytes": 319308785, + "checksum": "8ef8d75b0e045dec4aa5123a671b4564466b0707086a7ed1ba8721626dfffbc9" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00001-of-01024.json.gz": { + "num_bytes": 318039285, + "checksum": "b945059cd1a343cabe311881b7840a6f0363f570e745a0eff0e687e266f6b55d" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00002-of-01024.json.gz": { + "num_bytes": 319748667, + "checksum": "2967dc7e587ced6ecb9ba617ad2d4c44901467969de5bf5b0f5a9e5b70555d75" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00003-of-01024.json.gz": { + "num_bytes": 318564193, + "checksum": "b79d9abef5741578929be0d59db9ca652a8276207ef18a944b7a5f11fef5beb6" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00004-of-01024.json.gz": { + "num_bytes": 318579884, + "checksum": "cd9f98eac2bc6062f55d9a36bd744cc924a78ea2fd998830e0034e4456f5d014" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00005-of-01024.json.gz": { + "num_bytes": 318003681, + "checksum": "8ac5907a54dbc7ab9c14624448c7c3f6afed33af9d0a855f1eae955e62e255b9" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00006-of-01024.json.gz": { + "num_bytes": 318495137, + "checksum": "8fd9b9a4b74c9414466b245ebda7db041e7bd8603971de51b5db782bd758aac7" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00007-of-01024.json.gz": { + "num_bytes": 318417273, + "checksum": "41dd377a1ba6b72eab0260c39c626fe45ab6b649d42d57b311d3ba21a0337cd0" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00008-of-01024.json.gz": { + "num_bytes": 318131845, + "checksum": "64da652c235f089a0b52f6db5883ef5f1e9c31edc4c950332b34dd12439c99a5" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00009-of-01024.json.gz": { + "num_bytes": 318185592, + "checksum": "807a548efbb10153c9eff0df5733a97a1b51ab1743242530de1b02a8ea17ace7" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00010-of-01024.json.gz": { + "num_bytes": 319045292, + "checksum": "3bd0f6f664069c3bd964ce48ceae60ba47b55b54745a4b00c207bdb3a1926b17" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00011-of-01024.json.gz": { + "num_bytes": 319686980, + "checksum": "5baa0c010083459ba58e34b4e93bb758caa878f7db6fba0528921329fa1a6cc5" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00012-of-01024.json.gz": { + "num_bytes": 320119088, + "checksum": "fdee7442c06856e2c4b7665cc51978e9011b5e0a2112c30dd15bc9e53818842d" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00013-of-01024.json.gz": { + "num_bytes": 319474856, + "checksum": "a4ab3b24087781c3577945492525696e182ffd7ca5265b958f49803a02867ecf" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00014-of-01024.json.gz": { + "num_bytes": 319693210, + "checksum": "62215b2451e71b117018ef73570c944aff890624b384c538950b64c37f184c49" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00015-of-01024.json.gz": { + "num_bytes": 318427305, + "checksum": "9893c9f413a1223e7b535527829bcd6df3219929fb1abf8f2a114dd8f6ea0919" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00016-of-01024.json.gz": { + "num_bytes": 318785714, + "checksum": "bd0ade8b8a57348952ca31c39efdab538f54c852941a225ccd13d0a7170724e3" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00017-of-01024.json.gz": { + "num_bytes": 320134331, + "checksum": "4132cfff3f5126d9e783191a5ccc34e5d85938bebf0b8489657805277a227202" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00018-of-01024.json.gz": { + "num_bytes": 318653930, + "checksum": "4675ab1d77da3d676d9743dca15bfce8478498f7738f79816a25ed790d28fa46" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00019-of-01024.json.gz": { + "num_bytes": 319468974, + "checksum": "1d2f3a6aeb0f6c159295f283d302794cd3eb944cff3fe68691997bb2dc4c7780" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00020-of-01024.json.gz": { + "num_bytes": 319109754, + "checksum": "b5f26d832a0ec9b0489a27169d94496f5ea33c7fb046868c565c7b5a2407221b" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00021-of-01024.json.gz": { + "num_bytes": 318514423, + "checksum": "428da5a8d4585de16f6b3f30865a5ca7a8d1ddcd3b6002dcc1283368b0c3d60a" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00022-of-01024.json.gz": { + "num_bytes": 318715623, + "checksum": "9bc4812ba5e08c0b2d83cd3804129ba3d77cf84ba3d8828159788ee02e155a51" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00023-of-01024.json.gz": { + "num_bytes": 319874293, + "checksum": "38843ab4f5c60ed2b9ec0cdc65074eaca454014d5702edd809a266190689d2c3" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00024-of-01024.json.gz": { + "num_bytes": 318105764, + "checksum": "4fa0c7ec94445ea57dcecda7864b1346275e711c9820c2c39dbb9fdb95c97674" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00025-of-01024.json.gz": { + "num_bytes": 319122521, + "checksum": "0758514fa2e2c133c995c00d5f4abfc14b66582a4eedd0e721bdd95c4632a755" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00026-of-01024.json.gz": { + "num_bytes": 318116783, + "checksum": "56a73b9a556d6794d9c706e1b1c7e729fa13b711ddc25dd403b110eb5ed857f1" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00027-of-01024.json.gz": { + "num_bytes": 320171191, + "checksum": "fea1eabb734cda33d72f3d959234a240080b4fd42cc70494814a8429b087f9e1" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00028-of-01024.json.gz": { + "num_bytes": 319047090, + "checksum": "47d1c385952d6c18c431a7294339a030c213b8832f970ac987965b621c8181a1" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00029-of-01024.json.gz": { + "num_bytes": 318705639, + "checksum": "3c744d3dd915ceef3a93fd18c3ff5b117fb5118d1ced2089979b6cafc81c4525" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00030-of-01024.json.gz": { + "num_bytes": 318327902, + "checksum": "7f6959020242fdc841adfc10c102bbe79e2ef8502a09dac8451e0cec6f2add16" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00031-of-01024.json.gz": { + "num_bytes": 318990600, + "checksum": "e56f29011594c765192c34298558e7227a829313196748f9a16ec34ecdb76d23" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00032-of-01024.json.gz": { + "num_bytes": 320451482, + "checksum": "9ea843dfd85e449439f3106d657762daff8f326730fefb342455c43cb48144e3" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00033-of-01024.json.gz": { + "num_bytes": 319878207, + "checksum": "2633cdb7b058f126173608897f69add614659b0b21cf54ecc8a2f4a79bc16073" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00034-of-01024.json.gz": { + "num_bytes": 318701510, + "checksum": "853c4b9ff2d79621ed27a6be826dae198af609d9f9dbd1c2773b778241cf6137" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00035-of-01024.json.gz": { + "num_bytes": 318529104, + "checksum": "fb50dac3f35cb71472464f511e6b8aee72ded10b3b6896d0d1f74a18ded2b8d3" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00036-of-01024.json.gz": { + "num_bytes": 318849657, + "checksum": "5cef5cfd50cfafd58feb452b85324a3d8198fca48789f0ce69227755e72d8e53" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00037-of-01024.json.gz": { + "num_bytes": 319621215, + "checksum": "f0b67abf30e2d58d291aa9bcc9c8a03668afe819549802e4e591a261c171d970" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00038-of-01024.json.gz": { + "num_bytes": 318135467, + "checksum": "991bad578a83294d34a1b11649af07339aa8cb26d49330afa9fcbca0b87942c6" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00039-of-01024.json.gz": { + "num_bytes": 320131759, + "checksum": "abbbc21f81555e94484e6afe1975e13f67af19a820cd6f8d090c987a250bd4fd" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00040-of-01024.json.gz": { + "num_bytes": 320214476, + "checksum": "48020d2656709899abd2572b3424c0455df3c1089a69fe26b776aeb24f0da0ec" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00041-of-01024.json.gz": { + "num_bytes": 319581259, + "checksum": "db6fb8db7162ac87ea002c153ef0c54322f24c8f7ec263cfa290ac8c3683b194" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00042-of-01024.json.gz": { + "num_bytes": 318100985, + "checksum": "d499cba2383b16bb0f26b98416211eabf2599641ecd6708a5ef487692ca9e791" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00043-of-01024.json.gz": { + "num_bytes": 317803029, + "checksum": "dc6f1ccc3fcce79b16c5157f7125942e351d74744efc593f8372f8a408720340" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00044-of-01024.json.gz": { + "num_bytes": 318837063, + "checksum": "6170fced793461bd687640a658a085d02f971c2e609f6ff33b90df944fb56409" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00045-of-01024.json.gz": { + "num_bytes": 319659188, + "checksum": "b2f79e8600815578ec326cfc6c5242c2827cedbfac51772fdcf15ef5d027aa38" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00046-of-01024.json.gz": { + "num_bytes": 318771753, + "checksum": "e4b4a3e53ee66c280a5e7ee33602ea0e910903748db8c2adbbec4b48bab1580e" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00047-of-01024.json.gz": { + "num_bytes": 318088661, + "checksum": "bf8597fc359d8e9c721fd1d98b8ff3db5c011afd0fec9640670f31c7a7dddb79" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00048-of-01024.json.gz": { + "num_bytes": 317777133, + "checksum": "369db8e9646b8229a23044a7257c2face97b8e05738f0413b581892876f268e1" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00049-of-01024.json.gz": { + "num_bytes": 319329891, + "checksum": "5cb2aa0432984b355b0ec6aad92f926b2fb75aea2a0e08b97f4c6a62838e6cc8" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00050-of-01024.json.gz": { + "num_bytes": 318172322, + "checksum": "11a7cc48539ac97eaec87beacef9d9bbb71fc875a0bff0c9ff096044bff46a44" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00051-of-01024.json.gz": { + "num_bytes": 318704544, + "checksum": "ac2beee992c2b1ae8b1f162054e843e2b971bbd7cec45a0a7a7b7795fcdc7c26" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00052-of-01024.json.gz": { + "num_bytes": 320806303, + "checksum": "3a591fe9993c3d98a9e7949e98ca215ce164cd313fe53f3ce762c91b5fec7c53" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00053-of-01024.json.gz": { + "num_bytes": 320565764, + "checksum": "60e67c8e6f3bfdf8b490ecfe62c79a13c5d04d393fbac712a6cda49fd78e883b" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00054-of-01024.json.gz": { + "num_bytes": 320425170, + "checksum": "d69305c853e9e516f5fd4e2a9afb1939d829925f71102d8aa09387ded5d000df" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00055-of-01024.json.gz": { + "num_bytes": 318713224, + "checksum": "e01737df8097a1526d6c31d37d7aeb1b92c0a7253b39f6964fcc897bf0eba9fd" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00056-of-01024.json.gz": { + "num_bytes": 319441227, + "checksum": "fe516c8c0a9e59f9f035ac5fdd13e973d25dd6635eee05d648740d3e8c1fc742" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00057-of-01024.json.gz": { + "num_bytes": 319821142, + "checksum": "7e058ed9072e968e9c8b92f9b50dab318515873cca6c617b544dacab5a2f018e" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00058-of-01024.json.gz": { + "num_bytes": 318643105, + "checksum": "3479dc5a5b111b7f45f87e5a91c433907af97dbe15b9db1637bad666dcbdec40" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00059-of-01024.json.gz": { + "num_bytes": 318053548, + "checksum": "8208b0943f59b5914fa13d29108ede31a8d8d34bc6d603a2278ab8b80d28b1d0" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00060-of-01024.json.gz": { + "num_bytes": 317935826, + "checksum": "71324b62706aabd6faee682205cdedcd10dad289579b534d0e53f8d9b92bf2c0" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00061-of-01024.json.gz": { + "num_bytes": 318870698, + "checksum": "cdf0abc5804f0991871de48b249e30b666cb96f2254762a570c39904c5780f8e" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00062-of-01024.json.gz": { + "num_bytes": 318945246, + "checksum": "5ac676e16108446bd2980f9601c787eb754811a68e92ab6403c333820a6b9622" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00063-of-01024.json.gz": { + "num_bytes": 318827790, + "checksum": "a26f7cfe123cfdf3db7687996d0163212e70ff7635872b0754c03cbd5c31213a" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00064-of-01024.json.gz": { + "num_bytes": 318914155, + "checksum": "858a145617a5902ab02bc77e47ee2f036a6211384c4f2285767c7558eb93e245" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00065-of-01024.json.gz": { + "num_bytes": 319794084, + "checksum": "52742215df5aaca43bed5405a397571efe7c22107ee2caa8c05e3ed229796efa" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00066-of-01024.json.gz": { + "num_bytes": 320294453, + "checksum": "5b11cd54de0e95a75e53e4e32f72912cb01053d3fb609de6b7a45afafab414d0" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00067-of-01024.json.gz": { + "num_bytes": 319468309, + "checksum": "4c6c69b3eba9bcd6786d7dce893340f2d7093012ead04f3539352beccd2794ef" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00068-of-01024.json.gz": { + "num_bytes": 318800742, + "checksum": "ce94afc3c612e9de423a412147505ad7757216100becba2677bf5eaf443c4b6f" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00069-of-01024.json.gz": { + "num_bytes": 319416585, + "checksum": "ff3084a3e5a3960425a5c605274684c42fa638f99045527f77e74d165e52b6ea" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00070-of-01024.json.gz": { + "num_bytes": 319165846, + "checksum": "04c368b05f0ea42b3a51ed9bc0e817894f205c0ecd74084da015158d509ff2a3" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00071-of-01024.json.gz": { + "num_bytes": 318017381, + "checksum": "e8320e9982fa377b07c5b3e8a4451ac143b05ab7a4a03f748034b37fb998bfb0" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00072-of-01024.json.gz": { + "num_bytes": 318874499, + "checksum": "920f8d5ef2cae6bdbd52f724d0952e04146ff29f4aaec4dbf10bef7b66a98f40" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00073-of-01024.json.gz": { + "num_bytes": 317890112, + "checksum": "06a41bdb7bf0d52e2fe8e71f594de8d36d77880639ffdfb41e883237f76e8a0f" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00074-of-01024.json.gz": { + "num_bytes": 319201956, + "checksum": "e0267d6782d30f1619a82c49c20be1c8b5424e653c093e4652a5c8ed117c6533" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00075-of-01024.json.gz": { + "num_bytes": 320575937, + "checksum": "42108758abc3c3197e7dca8293eed3800f3e79ceae80d3208d90c7a9fd205594" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00076-of-01024.json.gz": { + "num_bytes": 320070510, + "checksum": "c904b6e6041e23edeb1d88b7b69f07a339b7ff9835d0c22e0b6c354519369842" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00077-of-01024.json.gz": { + "num_bytes": 319042024, + "checksum": "1eb2b70ad4d12b7587eeb1ce86477817ad992c08fecafe5ccafc26af6b5657f7" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00078-of-01024.json.gz": { + "num_bytes": 319997520, + "checksum": "070370654960e02f766c10321546b280e9933531b796c252a94999d645f360b2" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00079-of-01024.json.gz": { + "num_bytes": 320736487, + "checksum": "3aa4f007660706563030b590cef9be992c18ba7ec1876210bc92665ec42c4be2" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00080-of-01024.json.gz": { + "num_bytes": 320082337, + "checksum": "3b54eaf407bb593c2b16df99690446f26497530d21cf433a7d525e0eaebe9c3f" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00081-of-01024.json.gz": { + "num_bytes": 318008114, + "checksum": "d01975cdbd4360331b1a0f55e9b7e731d7d9fc70c7cdd0f33f1c772eff7aa03b" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00082-of-01024.json.gz": { + "num_bytes": 317829809, + "checksum": "2a65dd37027fae03819ea5a5f6c3b16d921706ad758442881dc1d15b08bc5048" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00083-of-01024.json.gz": { + "num_bytes": 319265318, + "checksum": "e14cf18c687f7eb304df6abef7235e263a5736c799d742524205dead2abfb043" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00084-of-01024.json.gz": { + "num_bytes": 319166958, + "checksum": "1dc3fa8702a4477e3a3128440b68d4cc17e6d2ce7f3c53da28d50a57b8332020" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00085-of-01024.json.gz": { + "num_bytes": 320338078, + "checksum": "0222db7b1ae14c9b10aacdb05d055d1432b6d035e3937df5640facd242c52aea" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00086-of-01024.json.gz": { + "num_bytes": 318941314, + "checksum": "55ddf7a27dc91bf8d932a5efec4aa458122ee337f2cb050e2c4b0ae8e770f3a9" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00087-of-01024.json.gz": { + "num_bytes": 319218368, + "checksum": "c61552d76bedbfa750c599a674d6732fb224c8a1e6c6583fca7ccabb20532920" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00088-of-01024.json.gz": { + "num_bytes": 318974308, + "checksum": "693fae3d50068ec39ad27a14335372c3e1530138cc65931edac5268dd62b7e96" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00089-of-01024.json.gz": { + "num_bytes": 318781044, + "checksum": "2d90b9318432a2313dfaec542c8b91431505035cca7416a63e3197ab26ad6e75" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00090-of-01024.json.gz": { + "num_bytes": 318569651, + "checksum": "ee674beda8ed39395e69c899f666990c5190dfad5494867e51fa727e4d38d86a" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00091-of-01024.json.gz": { + "num_bytes": 319683433, + "checksum": "add2489350310ce500dde6637518c747c156f95f079a34367842bf875a8fdf5b" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00092-of-01024.json.gz": { + "num_bytes": 318734793, + "checksum": "5cfd4f25e9effaa2f7381bfcf49f9263e10619811aeaa32a77d3fdfc13517006" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00093-of-01024.json.gz": { + "num_bytes": 319161014, + "checksum": "bed8774909bba5ac656ebaad6e5cacca9e5ea12c80a41fd5689e6798c74f3c89" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00094-of-01024.json.gz": { + "num_bytes": 320143246, + "checksum": "96abe370925f6962b4e75da530b5234eec21fab820d6cb02ae59b6070ab63859" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00095-of-01024.json.gz": { + "num_bytes": 319707377, + "checksum": "37b68cd632e8f86f364fd61c9581f48ad7602122b7f33c55103ac5bd727f015d" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00096-of-01024.json.gz": { + "num_bytes": 320159279, + "checksum": "fb93c7467f0361c1d4b186d5e25f4bce4f237adb33b4e0ef56f57831b4f97f81" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00097-of-01024.json.gz": { + "num_bytes": 319841818, + "checksum": "7f4d4a9536e37a0c2b9a1806fcb472784ff4d3840aa57e9603e74233b877fbac" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00098-of-01024.json.gz": { + "num_bytes": 321001731, + "checksum": "239b9fefebe3815c8d785bd48086013d1a6dcd76c142786502c674d2d874fb11" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00099-of-01024.json.gz": { + "num_bytes": 319475885, + "checksum": "0a610d25a547839b8b6dfc2fd964e3ca64b23f0edc52d311c89dcb5e8a44a2c5" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00100-of-01024.json.gz": { + "num_bytes": 319515329, + "checksum": "f24d17cbd27296a15f51b9edc713c74a6997bbe82267403fdb6282404c2f4e6d" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00101-of-01024.json.gz": { + "num_bytes": 318803422, + "checksum": "54b8b0c72ffa325abce3dd15bdcd0856b5594500c37f4bc6a6327721ba91e4bc" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00102-of-01024.json.gz": { + "num_bytes": 320934688, + "checksum": "24b99b4afa3b631a718a487d679026c91e2c936132df01df969e3173b49e091f" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00103-of-01024.json.gz": { + "num_bytes": 319835920, + "checksum": "a2c68654ba81fa55bc24beb4319c8905f7b532fcb6793a6a311344d4f98a82b9" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00104-of-01024.json.gz": { + "num_bytes": 319402378, + "checksum": "27764d82793e35b8a7be3a3fb0470d018243a89283b5501c0b76056de1879389" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00105-of-01024.json.gz": { + "num_bytes": 320100928, + "checksum": "3bb2499337ebe52b63a5f20ec6ca6283971937962439699bd5e483cf80fed02a" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00106-of-01024.json.gz": { + "num_bytes": 318707110, + "checksum": "83510312aa188431a8dda8746903d70cfc7ffdf5437e44c1f74b7670b78bd52b" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00107-of-01024.json.gz": { + "num_bytes": 319904239, + "checksum": "40d42c39dea8e4898efba1886aa3be67742501f7a51d5bc635b03a2c6c2bd63e" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00108-of-01024.json.gz": { + "num_bytes": 320050265, + "checksum": "88ce3ddae88e8024e76614a1b701c157f66fe39c6f0852a4869c5063876f6e87" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00109-of-01024.json.gz": { + "num_bytes": 318053254, + "checksum": "865a124b663037f36a5738f25c82f8bea2ab54d4bbf8255ca0d1d00d76f8b250" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00110-of-01024.json.gz": { + "num_bytes": 319794699, + "checksum": "b17e210c8ceef98219ee12eba5dddd2001ded0d417c93955743c238360d96e76" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00111-of-01024.json.gz": { + "num_bytes": 318761540, + "checksum": "05be318a057bb33bf9d7faca58569cdb0880fe8eeb0fc3f57f5999d5f2af55fd" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00112-of-01024.json.gz": { + "num_bytes": 319121509, + "checksum": "858dce8e43b06a0c1e26ab3e4f109814b6cc50c6b0e4d146ec79fda001ad471d" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00113-of-01024.json.gz": { + "num_bytes": 317916736, + "checksum": "2e3968e48cb15a3326457d5a6ad49838d20d38c8138c529eee51f94e6bf269e4" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00114-of-01024.json.gz": { + "num_bytes": 319319540, + "checksum": "b72dc8207d93848f4fcb265b3e618d0eb8649445f7b9187c5165f4adec3e0708" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00115-of-01024.json.gz": { + "num_bytes": 318863372, + "checksum": "85ef0bf3cb12bc2fede4158853ed2259dff5d25adf99b43e8c35d7e0b9d4fdd3" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00116-of-01024.json.gz": { + "num_bytes": 318898370, + "checksum": "a0c82c8b48e086be7396338cdda0fed52e8c4753f04fd086b9472c1bedfb150c" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00117-of-01024.json.gz": { + "num_bytes": 318153138, + "checksum": "531d5d03fd8099806d92fbff2a48a0d68dcf46325e732e698e9c142902d152f5" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00118-of-01024.json.gz": { + "num_bytes": 318966511, + "checksum": "24b1c5ebbd07d50043be0d5d5c5427e042bdc53280825260226a2823e9b7546b" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00119-of-01024.json.gz": { + "num_bytes": 318733748, + "checksum": "ce1fb1192b770e625430798aee94c93bd748ed474ff815a7f95cadebb826161a" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00120-of-01024.json.gz": { + "num_bytes": 319672996, + "checksum": "4c2a6874921ac4a626a9c8ac4c6e91dae58f1f5b52e79124b3abf254b7433119" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00121-of-01024.json.gz": { + "num_bytes": 318779046, + "checksum": "029d3ab92f3e1724e3708790148e63b4c211d2ddfd04e3d194b24145e97c922a" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00122-of-01024.json.gz": { + "num_bytes": 320861175, + "checksum": "4bb595140e5cf92147f99b58d236634ddfafbc0b160b4c88b337255482611ced" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00123-of-01024.json.gz": { + "num_bytes": 318338141, + "checksum": "d508261be287fa3d27e5f44524e22870269054213b61011ee8a6728a77910cc0" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00124-of-01024.json.gz": { + "num_bytes": 317655056, + "checksum": "7612cb9fdd9f4b3a4f8958087ace120d4a73cf26bd16289bb20fc871f5744f2c" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00125-of-01024.json.gz": { + "num_bytes": 317524610, + "checksum": "049ebe4971811bb1fdcfd10cc264b2074b3ace18536340644e718dcc3cf3affb" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00126-of-01024.json.gz": { + "num_bytes": 317902192, + "checksum": "d97bddf003b8f647c587fe9a9a9aed75ea604478e0b550d501ad7f07b6061b86" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00127-of-01024.json.gz": { + "num_bytes": 319243191, + "checksum": "6da4c882f88816a452af54ed217f84d6e4601c11a8e33bd47c49c0a1ea04f49a" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00128-of-01024.json.gz": { + "num_bytes": 318045852, + "checksum": "ea43f63e6ef3bb5723ce75bb51f7183a525d8ccb00c93f49aaf2d9b560f7bdbb" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00129-of-01024.json.gz": { + "num_bytes": 318436174, + "checksum": "72ceb525367d6e8d1c0fca94d99d4fe5353ead08a5d52bf00e30e3b596fa90a2" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00130-of-01024.json.gz": { + "num_bytes": 319017217, + "checksum": "92f1b2687bee78441eeb4e05bbec2a491469b23c3aad0d951fbbe35a3c27998a" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00131-of-01024.json.gz": { + "num_bytes": 319237739, + "checksum": "0fd07585a82b7d71ddabbc315195c84e2fa78a8319de7dea971cfcc9b38707b7" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00132-of-01024.json.gz": { + "num_bytes": 318123742, + "checksum": "c9f5604ca28ea2a9ae5267db50f6e3d1e576841abe840134b3817f370c057073" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00133-of-01024.json.gz": { + "num_bytes": 319009751, + "checksum": "7ec982de577e0eeff57dc60346ce35a7b35b3c4f037987316cfc071b0ed58a87" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00134-of-01024.json.gz": { + "num_bytes": 319750057, + "checksum": "2619d265d76d82f6b84e2686371e5b6d6c08058cbd5765dd2906af9f549af092" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00135-of-01024.json.gz": { + "num_bytes": 319068231, + "checksum": "5e1bf5b09f2cd132a7747116442d6f26ce0002eaeb9f56fb02bc00e3abee8716" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00136-of-01024.json.gz": { + "num_bytes": 317800994, + "checksum": "80ebbf64fbd91215da553e3a8d9442380cee6c3b09fbbf8353a0817993d15862" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00137-of-01024.json.gz": { + "num_bytes": 318954070, + "checksum": "3b5d2ccafe526a19c52ac0fee50109b6a95ac3c8f7f2272a9a0302c4219e82f7" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00138-of-01024.json.gz": { + "num_bytes": 318452853, + "checksum": "2dd88569a62003383a3bf70d68143f16f234535469bdc8ab01a8764f6babb5fb" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00139-of-01024.json.gz": { + "num_bytes": 320013821, + "checksum": "f32ca62f6a9d2c8a72901e6f2c08880c2d1907f52beb4e8fdc30f4c02c7ad10b" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00140-of-01024.json.gz": { + "num_bytes": 319510423, + "checksum": "7799838d8019d7cd71a505951f155bdfb862b4a3b3b77e182c706a624617169d" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00141-of-01024.json.gz": { + "num_bytes": 318339814, + "checksum": "1601f6dbcbf4e7f1db119b232e862f3c9fe29e9abe5827177458079299ed511e" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00142-of-01024.json.gz": { + "num_bytes": 318438444, + "checksum": "71d891be156e1b608733a3abe8f8dab7a6213c02931117b99889bc3fe8329d38" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00143-of-01024.json.gz": { + "num_bytes": 319413540, + "checksum": "88fb2e7c3d426a6bb5775041658c07005a469306af0d97df7d68f148b64cbfe8" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00144-of-01024.json.gz": { + "num_bytes": 319901095, + "checksum": "2734ff57f4265653b0b1f292f513017ba791c3091cf8ac0bbf6d75d0074e3386" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00145-of-01024.json.gz": { + "num_bytes": 318500183, + "checksum": "da2e6747f7230af5941c6bee262a606b4f7792da359dbf7516d82d8301cdf90f" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00146-of-01024.json.gz": { + "num_bytes": 319315120, + "checksum": "6daac97153d51addc8b1e43b686e3d641666df3a106270a141d734079db2ad35" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00147-of-01024.json.gz": { + "num_bytes": 320621434, + "checksum": "fb2584e0ce366ad30c8110591484b84798e9f06e8a27cd864e7800b8d5e2d225" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00148-of-01024.json.gz": { + "num_bytes": 318269045, + "checksum": "1c963c0ceb6cd776822352b186ae7e3d829ef334efcba0fbdd9182dde4deed05" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00149-of-01024.json.gz": { + "num_bytes": 318576426, + "checksum": "6a21397e0104c7fe0fcd9f1d43a8e546000596d896a95eb9b6c4ab92235e6a49" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00150-of-01024.json.gz": { + "num_bytes": 318447048, + "checksum": "075b113a73e6e21d7cac49391ee559ee8aaa2bb3338f709017077a4007a7bbb5" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00151-of-01024.json.gz": { + "num_bytes": 315388730, + "checksum": "bd47e3ac0209676d8a32490eb20ca8c07ca3c45c2beb88dae18b5c8d925f349a" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00152-of-01024.json.gz": { + "num_bytes": 319701880, + "checksum": "241d9cf003f49d95168ebdeccd8209230507d4dfd0d170fa1b57d2355240a95d" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00153-of-01024.json.gz": { + "num_bytes": 318370254, + "checksum": "3aa86900a749224dfed8a67960c166e43c3b9ef3ac7b49d28129b496c7193e30" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00154-of-01024.json.gz": { + "num_bytes": 320064875, + "checksum": "3160c723cea6717fa9f5a9eb627d76107040d084a64106973099fa0e8de48758" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00155-of-01024.json.gz": { + "num_bytes": 318089754, + "checksum": "5b6e76a85bb1093eaba698864a54a938329b04494f9f72c3c3bbb155174da5e4" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00156-of-01024.json.gz": { + "num_bytes": 320049467, + "checksum": "cc013e8aa7c1cf7fc28ebecc64d893d03b092a09d725b5e626851de0b311c814" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00157-of-01024.json.gz": { + "num_bytes": 319931950, + "checksum": "2a27b4c29455bcd813a84aa3a54100d16cb6bfed25171aa3c552ea452ae569e2" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00158-of-01024.json.gz": { + "num_bytes": 319963615, + "checksum": "e477f769ea1513cf607932a29d793fdf1722cdea757e00c814dad594329cfac7" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00159-of-01024.json.gz": { + "num_bytes": 319000491, + "checksum": "ff5d09415753c2aa4b51196e8f4bd6c77ba100ab281314aede118f501565cea2" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00160-of-01024.json.gz": { + "num_bytes": 319069618, + "checksum": "e08c35aef8a20dccad80f6bb1579d6d2ce80113c8bf8459730c69fb7048c3cc9" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00161-of-01024.json.gz": { + "num_bytes": 318750642, + "checksum": "13eef84873b58e29894f9bf68a4de72a530c1bfc80a5654262fe71420292b8ad" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00162-of-01024.json.gz": { + "num_bytes": 319847814, + "checksum": "a8579c6bcc906fe018881a8474724576c3d0f7f1787f1568b79e5accbd9f962c" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00163-of-01024.json.gz": { + "num_bytes": 320370365, + "checksum": "b97a74837ab9f659c13dcb4deb53c600584beb9e5ceed29e99974c4953f644c9" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00164-of-01024.json.gz": { + "num_bytes": 319894618, + "checksum": "9b63afffa2b84c91b749991ddb384399f1d408bd7b6b643e7329e49531ce9a53" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00165-of-01024.json.gz": { + "num_bytes": 320166197, + "checksum": "5b2414477dc4e2b080b34f3b98672bfe3de6028e7ad83c323a7dd1ee08c05a0b" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00166-of-01024.json.gz": { + "num_bytes": 319612575, + "checksum": "2cda682db53000c14fcb5d251bae4f50c8c4159348f8594c3ef020260f277a99" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00167-of-01024.json.gz": { + "num_bytes": 319183884, + "checksum": "5c406d7a8a404436039fde7c2019f0174ff8855caff319fa62bb7960d341b41a" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00168-of-01024.json.gz": { + "num_bytes": 319396348, + "checksum": "df6a422d57a2e1443d10d61b13ab2c5227734195c82b43e1ead2db723cdea293" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00169-of-01024.json.gz": { + "num_bytes": 319452933, + "checksum": "81c81138e7163072e3779dd10ea8af7dff12b705fa008665298e08cfc2699f03" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00170-of-01024.json.gz": { + "num_bytes": 317748609, + "checksum": "6586ae8862b8ac925f424afb6ba779e95a147323fb83fc8c4bb0813877b17718" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00171-of-01024.json.gz": { + "num_bytes": 319052376, + "checksum": "8b3cd21d8ffbe963ce935ef9e0b6efc45f4d5abab703fdfed19a1309b700dca8" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00172-of-01024.json.gz": { + "num_bytes": 319068859, + "checksum": "a42f5f5a10bfc84d51dd0855166959462faccd6a182af4c5d2115ff9995f5324" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00173-of-01024.json.gz": { + "num_bytes": 319142377, + "checksum": "e26514c5d6cea27c0cf7fcc1daadfa6f218ef9e62039c6d6fccfc31660c0c96f" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00174-of-01024.json.gz": { + "num_bytes": 319134484, + "checksum": "75349aa8c734ed894965500eab2fdf59657a63e40e5a53e822ef1e5a12838a02" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00175-of-01024.json.gz": { + "num_bytes": 318330467, + "checksum": "a3d0d14b28a5a3cc559d6d89e2ec09e49e92aa189e44e68dbb4ea47978e1eca1" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00176-of-01024.json.gz": { + "num_bytes": 318584643, + "checksum": "dd68b42e5bfc656b71fe5701bacb929edae84055131f1dd65bbf3f3ad734e57d" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00177-of-01024.json.gz": { + "num_bytes": 319275087, + "checksum": "05a8ff159006241cf938ef27b292f65906158ac25ac28919aa6761eaa634052f" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00178-of-01024.json.gz": { + "num_bytes": 318490550, + "checksum": "a3aa38083c85baada29b207240bcca1a0d562a93971b420428d039092e58bd31" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00179-of-01024.json.gz": { + "num_bytes": 319083249, + "checksum": "12858fecd1dec728eba2c8c4311b17e4f2ac1fdb27c23e9adcd9258c5c4fc777" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00180-of-01024.json.gz": { + "num_bytes": 319752094, + "checksum": "67e968cb8d3ebec2f68eddfc539ea7402aa72c9274034494a43ea7d207b69a88" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00181-of-01024.json.gz": { + "num_bytes": 320476195, + "checksum": "c1bd59eb7ca799e31bf037dc7c087c1ad94e4f88a4f12427c454510d97e1c803" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00182-of-01024.json.gz": { + "num_bytes": 318538551, + "checksum": "dbe7205a1919dca9d6936158d5653a20d239f2e547ec73280956da4f8c609220" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00183-of-01024.json.gz": { + "num_bytes": 319620265, + "checksum": "46f9e603e04040b59df8da6ee01d1c30588aa7233a00526d6f0fd84c4172ba93" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00184-of-01024.json.gz": { + "num_bytes": 318301621, + "checksum": "880a02eabae231da388a5782a7194eef0d0211c2d1314db0c56d740647a114c9" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00185-of-01024.json.gz": { + "num_bytes": 320515340, + "checksum": "f522147aed30ebb3ab352c92a9dd24cd2e8b93df1d4c4a6284d89ceaa2858509" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00186-of-01024.json.gz": { + "num_bytes": 318374733, + "checksum": "5005f1c42038769e225a626a88c10bd4f6af98dcc14deed475954b00c088bc53" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00187-of-01024.json.gz": { + "num_bytes": 319116182, + "checksum": "cbd7e0f486c6dac13090cd344337da1c336973e7ec75e32b0bd5b18b98f24bf8" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00188-of-01024.json.gz": { + "num_bytes": 318981305, + "checksum": "064ce8c30b7a960b20720c133c3dd3281d27752a66def44d5133ff8f1b8279e9" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00189-of-01024.json.gz": { + "num_bytes": 317036462, + "checksum": "acc052da4501691fdd28f269c633ed826840f2634be49b5e2c5e1273de0cb4a8" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00190-of-01024.json.gz": { + "num_bytes": 318061662, + "checksum": "5a436e97c59b8636ca5081b71ca6fe8f8a3a99dd3f426c79edb2bf53345ee810" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00191-of-01024.json.gz": { + "num_bytes": 318556228, + "checksum": "2eebc89381ff78ae63f311c98b07853cefcc42fbcc210995095d568a6ff70ead" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00192-of-01024.json.gz": { + "num_bytes": 317987733, + "checksum": "99de46c4702c06a2303262b185b92fad82e12e189c923d5b76d9d8f96faabfa5" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00193-of-01024.json.gz": { + "num_bytes": 320294532, + "checksum": "bccb7d8fc34d6cd6eb41e2a1c6234596b00a5517fdca7c47562fdee0e675377c" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00194-of-01024.json.gz": { + "num_bytes": 320852679, + "checksum": "bb1e7768a57145fdbca7957ed964648d1deab5edc5dfad4722a81ad411c5e0f9" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00195-of-01024.json.gz": { + "num_bytes": 319016077, + "checksum": "ac520468a5bd933dbac1aa5f7f21ba276bdce15abf99963ef9d73af294e81e70" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00196-of-01024.json.gz": { + "num_bytes": 319289881, + "checksum": "9eec5740115ab52ce98ac9efbed4fa1c5c06787fe93b4b28f6a1e4df06272870" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00197-of-01024.json.gz": { + "num_bytes": 320180232, + "checksum": "07a03763b84b4a86b4f71d725927d62c40925823ee454122a00fdb625ddb3a22" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00198-of-01024.json.gz": { + "num_bytes": 320004709, + "checksum": "a1b250b01289fdaf6dcd997ef31c59c580f81f961aa0fd88ae0d175bd07c02ab" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00199-of-01024.json.gz": { + "num_bytes": 321006991, + "checksum": "650e57c3dbbf4ed929da8c6c5d78f35fbac4644722a84d98f93342a8d33b2140" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00200-of-01024.json.gz": { + "num_bytes": 317913111, + "checksum": "42caf6dee42bd73d9e4bf0c7bb16383caa936b2e0a913489b9f0aef57b6004cb" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00201-of-01024.json.gz": { + "num_bytes": 317897148, + "checksum": "990974a82de2b1c27465f6d097d7a5718c5ff334271e722ab3736e7aa5b89d4b" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00202-of-01024.json.gz": { + "num_bytes": 319510250, + "checksum": "8467066f2417af774363d4984a37968a0189adfe3a581723eab15004930e621a" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00203-of-01024.json.gz": { + "num_bytes": 319762388, + "checksum": "4e7e20980dea2d5e77f380b24580f0df9319a0d1d73ec319e17d8cbe044e53de" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00204-of-01024.json.gz": { + "num_bytes": 317418128, + "checksum": "2c027c5225ea7ce3c31f5f32dda12b7c892c6fdc9c52da6d0af749171cdce738" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00205-of-01024.json.gz": { + "num_bytes": 320157174, + "checksum": "d953e79c60be0e2c3b072c2186a845a351392ef395fa95135f47e6b8491c6f88" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00206-of-01024.json.gz": { + "num_bytes": 320459080, + "checksum": "bc70c34931942ca143f7eb555e86458afcc36110aa9559151f31d781969d4458" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00207-of-01024.json.gz": { + "num_bytes": 317361718, + "checksum": "fad5ebd7a81bb737e12e9d4c803aea1a9e905d43a3fa87cace32a64eef01e8e3" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00208-of-01024.json.gz": { + "num_bytes": 319976693, + "checksum": "21381c727d945d8d3b4a275e3622bce64b07ed87d7f2371ac28b5d2023359cae" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00209-of-01024.json.gz": { + "num_bytes": 319550585, + "checksum": "8b74e5f1780c4bf12936ac3a86be7a3d11287866522da8275aa4232c1e3d8898" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00210-of-01024.json.gz": { + "num_bytes": 319574289, + "checksum": "1594bd49cde9641b49a1ad9373a53e10d65440000363f7532a7d326d17c44236" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00211-of-01024.json.gz": { + "num_bytes": 320615302, + "checksum": "5b6f7eddfa3a9ffb0d6668d10f398b1d86482b64daa9817ca0af549433071244" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00212-of-01024.json.gz": { + "num_bytes": 319395225, + "checksum": "db58fa453269c794fedb595c6193dea5a85c72ff8b2d43e77c9bb371b8c86b78" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00213-of-01024.json.gz": { + "num_bytes": 320131797, + "checksum": "1d21d19b5e36820559590b339c049be29f27505ab4e88572edbdb84b649e0b66" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00214-of-01024.json.gz": { + "num_bytes": 320153141, + "checksum": "55c9b4ff1cd8cc88738196f867aba620dec3c8b27b9a485c7e75d3129d76e9c7" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00215-of-01024.json.gz": { + "num_bytes": 320525443, + "checksum": "dfe9f44676c1abf0e2875924c094c0d788f8a0172d641d5f810258e948e37feb" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00216-of-01024.json.gz": { + "num_bytes": 320100146, + "checksum": "57f19f5437b0428d9f40799af14f8bfba8f6c82ebacaea8f6fc7531524a6d4af" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00217-of-01024.json.gz": { + "num_bytes": 320688377, + "checksum": "fad4f3143aa303c9c35165a15c6d90087c204c586fe20b0c0f45cf4238311b70" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00218-of-01024.json.gz": { + "num_bytes": 318896471, + "checksum": "aabd471960d6db1e93e1129410d9138d9d9efa3292af7491b3b6844c2bd3f543" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00219-of-01024.json.gz": { + "num_bytes": 319298204, + "checksum": "f676701589e39802779a0947585638347bb4fe55376a33c6d0afcdc40c5f8938" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00220-of-01024.json.gz": { + "num_bytes": 317757045, + "checksum": "f3d0994379d244054c5e2db366a081caee28d301aa6b0d9431e7d9eb1cb38c30" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00221-of-01024.json.gz": { + "num_bytes": 318568870, + "checksum": "8026854c8a8cc1d16b52a898b9dd8a8df7901dd8cdf285f5d937c4d5d45919f3" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00222-of-01024.json.gz": { + "num_bytes": 319096912, + "checksum": "71f76f898864de3ae60f7c0cdbc68d53cbfa04b2f8493c40d55e1cb56727b275" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00223-of-01024.json.gz": { + "num_bytes": 319350414, + "checksum": "ba01faf3fe41a738c255b5da83daf53a5858144557af6c6f8d6208a049e4245f" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00224-of-01024.json.gz": { + "num_bytes": 319007151, + "checksum": "94200d12c61f7c73a9e3a2bb089a05b017a215348d52018a34e3224578c0da06" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00225-of-01024.json.gz": { + "num_bytes": 319502985, + "checksum": "0b7ce650e555baa546bb329d7f0567a3dc0a7ec9d49149792032a86321a73d6e" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00226-of-01024.json.gz": { + "num_bytes": 317983607, + "checksum": "40cf6d4b3deb05cd97ebed01405d08ae67be6e896736e4f371d15e5404567599" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00227-of-01024.json.gz": { + "num_bytes": 320199564, + "checksum": "e65ee475e3b6682b57bfa3f7b9c1cdabf36a7282fc793865df63dbe6a6a3d1fe" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00228-of-01024.json.gz": { + "num_bytes": 318852183, + "checksum": "8b27f2fbb0233802229fc776cfcb0b6b43af3149d217d0ab00cca0f1286482e4" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00229-of-01024.json.gz": { + "num_bytes": 319407418, + "checksum": "f2d5199a0022134ae127c88f0ac20d1b2b8a88014a774b5432b41085c83ecb5b" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00230-of-01024.json.gz": { + "num_bytes": 320787790, + "checksum": "e1b040895ac6068dd1aa892ec93d733096afc4adda698379006ef89926491255" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00231-of-01024.json.gz": { + "num_bytes": 318220053, + "checksum": "648a6349206c50c17d4e3562fd6fcb0a723b4cb40005890173d5de0c7ecc2ade" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00232-of-01024.json.gz": { + "num_bytes": 319702777, + "checksum": "0a44b7cb4f354e1eede683a697aba4051c1542fd030dd59767065f5f0204554e" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00233-of-01024.json.gz": { + "num_bytes": 319154465, + "checksum": "4070448b7844776db6754bd33791900bf9ac8dbd81e4cd774a3055ada67f6fac" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00234-of-01024.json.gz": { + "num_bytes": 319846160, + "checksum": "b1e8c73078c347fa062ed408e81bbdcb2f714675bab2c082016e822e91ef63a9" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00235-of-01024.json.gz": { + "num_bytes": 317722912, + "checksum": "d8aa694e870157b2b5411f496db46dc71dfeed01a42973a65499596921198abf" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00236-of-01024.json.gz": { + "num_bytes": 318593592, + "checksum": "e0c4ff6c8a12128da88777074d0b097664cf2f2395913c4d82b0eecd501946f1" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00237-of-01024.json.gz": { + "num_bytes": 318902831, + "checksum": "adce772ed699d7e908ae1fe1ddf1d9875305c7875c93cedf1b3ea0bbc21ff922" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00238-of-01024.json.gz": { + "num_bytes": 318696723, + "checksum": "926f9fc42cd248077afec1f4b88603c646fc5ae47c4ee3e9b8a5f6b8b6ff7f46" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00239-of-01024.json.gz": { + "num_bytes": 318321822, + "checksum": "439d756b0ffc97ebecc6c48a7dc90da77de7ada05a6eae929db98057ea15bef1" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00240-of-01024.json.gz": { + "num_bytes": 318992553, + "checksum": "1f57af6ff9477263806c0827c0dd8e494e103b6f54eec2cd5f8f8327b01ee39b" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00241-of-01024.json.gz": { + "num_bytes": 319345185, + "checksum": "493932a44e09f4b311ac5bdb519111fad0982708d4b467688f2b1105316544eb" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00242-of-01024.json.gz": { + "num_bytes": 320108156, + "checksum": "de5603f1b276f1373011c8884f06af017c71b03c5de3b3bb89cd6d550a0d5902" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00243-of-01024.json.gz": { + "num_bytes": 319855563, + "checksum": "7c1b74de8ae3699c567edaa6e2d1a1f1ae82f4810e769c710a23cd2dfc536c60" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00244-of-01024.json.gz": { + "num_bytes": 318966332, + "checksum": "d3ada80bad9fa776374878bc7504138e14c161bc9798ea8114b0d187d4c815f9" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00245-of-01024.json.gz": { + "num_bytes": 319541864, + "checksum": "3fe5f26e32795c49743d1b2497c333be57248c9db2ce12fb93e103d1a9595347" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00246-of-01024.json.gz": { + "num_bytes": 318530369, + "checksum": "a0bdeb2dcb5dfb46f843c4086230ba918f2d3ec125654cb924ea11e7c75cafbd" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00247-of-01024.json.gz": { + "num_bytes": 319496627, + "checksum": "0c4099f832ada6b24ef6c1d15267cd3c179f5b3d79e3d813d944e3ebea908c99" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00248-of-01024.json.gz": { + "num_bytes": 319132981, + "checksum": "608b1cd27ad345f6511fb677c00d56b6e827f288877d68aea1bcad3b02dd040e" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00249-of-01024.json.gz": { + "num_bytes": 318529093, + "checksum": "8fd580be09f913cc3809e3b0e467e2faf657a5db6f71b75aa931043267b9b0f3" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00250-of-01024.json.gz": { + "num_bytes": 318248903, + "checksum": "faeac675c3634b0834939046e60cdfad6a13558d7a6799c5bde25567898d86a0" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00251-of-01024.json.gz": { + "num_bytes": 319184870, + "checksum": "038972e03db75417fc4cb25e54c3aee01e4f022eb0fab202142f539e4d866e28" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00252-of-01024.json.gz": { + "num_bytes": 319631399, + "checksum": "2fda0c2cec4624c6068556e16630c3551ef3110759bed59628913a9debd547a3" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00253-of-01024.json.gz": { + "num_bytes": 318275716, + "checksum": "b5da4bfa564fcc6c49a573b90e679d60c4e222249858f4e58fdb3727a5f279ec" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00254-of-01024.json.gz": { + "num_bytes": 318638865, + "checksum": "279eb2978fe94e1570318a247b82487c04d7494ceed74dccb1d7a5734ea84e5c" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00255-of-01024.json.gz": { + "num_bytes": 319640339, + "checksum": "aa0a1ef845d0df7d81d2588d53f29205a4e3858a0888c1b7d9c83eb2fe1d32a7" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00256-of-01024.json.gz": { + "num_bytes": 320353593, + "checksum": "407133ea3b32a9e004b992a1bccade0440a39d0bfbd12993ea78c6526c0864a8" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00257-of-01024.json.gz": { + "num_bytes": 318165587, + "checksum": "72b7a72b8402b22cb51db44c9e7859460366c7c9d33e16a4c038ad07f7ad8f3f" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00258-of-01024.json.gz": { + "num_bytes": 318003534, + "checksum": "e5f9f2f74b7f9958dc9535f04a8965749ca4bd68005a6efa36f480fb487ca930" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00259-of-01024.json.gz": { + "num_bytes": 318990454, + "checksum": "7cb3c284613537fc6b1a85d7187dfca30b37a7a1a5708094f17486e3184e2d62" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00260-of-01024.json.gz": { + "num_bytes": 319514850, + "checksum": "0067e36b7156196e2451cdf78dc8832352f2481a4740afbef9046104b6810bdc" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00261-of-01024.json.gz": { + "num_bytes": 318747661, + "checksum": "b1e4597420035c355abe15efc576751169e2b5e4c38e073c178346a7202d5ab2" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00262-of-01024.json.gz": { + "num_bytes": 319868329, + "checksum": "374f4b951e545968da45b5055af2aa0b128c1d65d6c854f5b8f7e02d22c352e2" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00263-of-01024.json.gz": { + "num_bytes": 319268788, + "checksum": "7168e635a32859a85a152b29bcd1f699257ee4e340517e218ea9b8dac3922210" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00264-of-01024.json.gz": { + "num_bytes": 319270640, + "checksum": "1da08b65c83e79a0f5b7215e5a4ee58f21383b69f09dd9a3ba95381ba3d56d25" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00265-of-01024.json.gz": { + "num_bytes": 318744354, + "checksum": "0c908e81d59b2099eda038731b387a0ad86fa3d168eb2955413dde9cf29d947b" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00266-of-01024.json.gz": { + "num_bytes": 318518406, + "checksum": "115e375464931638de4af669b7301b6112d18b23835f2db2b092f47545b1a855" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00267-of-01024.json.gz": { + "num_bytes": 318921711, + "checksum": "6d66c715137885a46f2472489b21751284ec8ecfde6dca6be3ec1ee75f6cd5af" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00268-of-01024.json.gz": { + "num_bytes": 317786222, + "checksum": "588865d8f9d3da5a70c958997060ce4792e175c8fc5323f1887787070c8c160f" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00269-of-01024.json.gz": { + "num_bytes": 319004956, + "checksum": "163ec7497602931de2eaffad320704e508e491937a2965e39907a086f640d975" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00270-of-01024.json.gz": { + "num_bytes": 319175186, + "checksum": "794e0e7ceccf28457a8ed5b0724337545661da16feafd0a53e4823b2cb1c92ae" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00271-of-01024.json.gz": { + "num_bytes": 319785821, + "checksum": "9c9ec0348f7d4ffc61e5f19f1f60c8382b33ca2fe4b852567cbc3c16024a4627" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00272-of-01024.json.gz": { + "num_bytes": 318933435, + "checksum": "883d85985237948018b13c20f4d4ee567c6ee36a135b326e8117d73dad4fe37a" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00273-of-01024.json.gz": { + "num_bytes": 318456664, + "checksum": "fdca13067e8e118e538b8de538e164fb5397724045a5b1b02764510c8de90969" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00274-of-01024.json.gz": { + "num_bytes": 318418161, + "checksum": "27556558fe8a91a4aea4800ba9b7e844336a7638c5b96e652fcdb359f631b04f" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00275-of-01024.json.gz": { + "num_bytes": 318437784, + "checksum": "6ad4e6a3e1cee04aee3051a66531e3f4aa97f7bbb7602c6aa5f46a727b319f2b" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00276-of-01024.json.gz": { + "num_bytes": 318470946, + "checksum": "145a4d85ddf1e72fcdb8477dcd2f70a5554d9cd9349e02e058d3e7837204b6ff" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00277-of-01024.json.gz": { + "num_bytes": 319580624, + "checksum": "7116de0dbc5c7f6621f7c107dded9d85788937a87f2d56efca32ae9f25fc6865" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00278-of-01024.json.gz": { + "num_bytes": 319619699, + "checksum": "8dabdf2d26035d30c22204e6f46f292c58f4a4c3b0b77a1826a43341d4282df9" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00279-of-01024.json.gz": { + "num_bytes": 319344020, + "checksum": "c2b7d5bf62be1772c6bb80f597b28d948cf3cdefb10b6df6f777f0ab7d8fb015" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00280-of-01024.json.gz": { + "num_bytes": 318997864, + "checksum": "025457720b0045e7bf01f9b4b847f28ef94af9ca250675efeee73eeb340a3f36" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00281-of-01024.json.gz": { + "num_bytes": 318718146, + "checksum": "2979c0ac06570a9ee437521778c514bd8755193b9f1ae6a5a671ef885243f019" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00282-of-01024.json.gz": { + "num_bytes": 318434530, + "checksum": "a17bca50ec20c364adb899a9073bbe3a1505f81803a58190efc5d4f3f78b58be" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00283-of-01024.json.gz": { + "num_bytes": 319317663, + "checksum": "9034f524fc5c2e246b22e2dee00b47e0c4da0316bc60d0a11d966c28db917f9b" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00284-of-01024.json.gz": { + "num_bytes": 318957832, + "checksum": "f08b96047e711831dfb8a44d90cb712d3e78c98dd28ec6b937ee83949bbef5b0" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00285-of-01024.json.gz": { + "num_bytes": 318643283, + "checksum": "c5df1f2e2dad46d71f8aadf856a5139020da8afc2ee010d53c0372ea09b2362d" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00286-of-01024.json.gz": { + "num_bytes": 318064839, + "checksum": "16f7fd6abcbc69750b8131bca3e38ddc40bd7c86c48122ad2a9a77cb9cfd552e" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00287-of-01024.json.gz": { + "num_bytes": 320328448, + "checksum": "41e82bd357b47a28f28a4a203d5b54263aadb3c9a08899f78302c727c56d8b38" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00288-of-01024.json.gz": { + "num_bytes": 319559271, + "checksum": "970b9df224b58ca50b3023d92f6be0c37dbda479155c29c535e457ef6f2bca0e" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00289-of-01024.json.gz": { + "num_bytes": 318786822, + "checksum": "36a6515e7f516335d3fe057bb6ed9890a2aea033e08edd8588b3168b3445b2f1" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00290-of-01024.json.gz": { + "num_bytes": 320634782, + "checksum": "7d19fc82b9a5aa0e0046cd17cd2c46f356f8a4a7d203d5e03e1f319156f05cb8" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00291-of-01024.json.gz": { + "num_bytes": 318746713, + "checksum": "86d610d4590bca69281348dbfaaec9e704fd6194141c50c71e84aad51ce26b91" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00292-of-01024.json.gz": { + "num_bytes": 320049630, + "checksum": "d045df646213e29d4e7de4ec8915eb3b65bb962f35b0d74abf00889bd5aae8ab" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00293-of-01024.json.gz": { + "num_bytes": 319966146, + "checksum": "c66fff1a64b495211bfdcea650ff76115f8c857b9154c1b869062e702714b9ec" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00294-of-01024.json.gz": { + "num_bytes": 318805332, + "checksum": "ef3d9204ec85a1e65ae48af7924f614403d297a15f232ba41eb0e4fe223e507f" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00295-of-01024.json.gz": { + "num_bytes": 318898465, + "checksum": "2a071fc28b1216f2dc0579528d9b04e597b5cdac9fd14719e312092242da190a" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00296-of-01024.json.gz": { + "num_bytes": 319406630, + "checksum": "ea71e9fd444860d70d3728f7e2213a4bccf3aa31a164c9acfa8df7a0b6619786" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00297-of-01024.json.gz": { + "num_bytes": 320312971, + "checksum": "ddaeba8aad38b7e9727c579cc44f15b3c82d292e2901b47b785e9c8d3d5cdb9d" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00298-of-01024.json.gz": { + "num_bytes": 320660744, + "checksum": "814460ccfda29b45edaee5f44e3c980889aee2ee52e4e5323931ea489fbe938e" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00299-of-01024.json.gz": { + "num_bytes": 319848186, + "checksum": "3b91fe32d3a731a5be3bf778eedfe13e8a7e26ba9eda51c278c5212aa7925681" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00300-of-01024.json.gz": { + "num_bytes": 319647278, + "checksum": "1e0424631f7f354bc63b3e71c5c6516c85343dafd3896acb9560eaf93b672799" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00301-of-01024.json.gz": { + "num_bytes": 319080252, + "checksum": "46c21af013f611729cc06ec033dbae80151987f9098e57fb98e2631f6fe76c8f" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00302-of-01024.json.gz": { + "num_bytes": 320028246, + "checksum": "d1ca8ad6e5bd6cb18db1f1be9154dbc8ba9df7ca02db4c1f8a7df9d40820d8ff" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00303-of-01024.json.gz": { + "num_bytes": 319388787, + "checksum": "bce87161f77464adfb1fc04fc2993211bcec502d7172b86f726daf7096b04f82" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00304-of-01024.json.gz": { + "num_bytes": 318627831, + "checksum": "235b8085cbeb7b13f8e1a5f6d2225a9461b7bcd76e21466a189c2411ff4c4107" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00305-of-01024.json.gz": { + "num_bytes": 318148428, + "checksum": "f13f124e0ea150da13ebeb3390c311b3db54018de0d640579307bbcf2c46068d" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00306-of-01024.json.gz": { + "num_bytes": 319451712, + "checksum": "de5c3fa2cd6a47551ab43268484d017602e2c3e1f66f43f1a1d8f95bac52cad5" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00307-of-01024.json.gz": { + "num_bytes": 319026244, + "checksum": "88769fbf393671db352227a64cb8ba6b4ba60c5bddb4a14294b1ad9a65a750cd" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00308-of-01024.json.gz": { + "num_bytes": 318447454, + "checksum": "555bcfc0ba4db0551ce5ffb18057027ee695af166856125aeb79f7ce013851cc" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00309-of-01024.json.gz": { + "num_bytes": 318147676, + "checksum": "bf28e60a7970c548190cf0f4fe56f27ea55a1ad8313fa353a8013f0a0e7919f1" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00310-of-01024.json.gz": { + "num_bytes": 318930650, + "checksum": "45a68c0ef70ecd10838d604d51fecd26e5199f5372022b9c2af461a71c24c6ef" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00311-of-01024.json.gz": { + "num_bytes": 319955339, + "checksum": "fb3c4e93166f1cb2ccc8a7b68da0246f0827d3a81bb5614c8c84f1c01c6d53c7" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00312-of-01024.json.gz": { + "num_bytes": 318554567, + "checksum": "0dce2ac88ba7ac5340d551add9fe7b1a30772a6cc082347c536427b48daca598" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00313-of-01024.json.gz": { + "num_bytes": 318978931, + "checksum": "c5f99dab085fb705769a514626c9af8a26cf846fdaee4b403a3d6f84c892cb66" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00314-of-01024.json.gz": { + "num_bytes": 318158197, + "checksum": "79de4fa2aed5e3efa71e75d13f08d7c1869aa59f42a819f4429430b3db6c1b27" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00315-of-01024.json.gz": { + "num_bytes": 319744521, + "checksum": "5a47a89a1537662a91853bbe2a5b3e243f5de74489f820621192cacef192593f" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00316-of-01024.json.gz": { + "num_bytes": 319861527, + "checksum": "1cd34f17f3ae3c8bf8e1636714a9ff600a26799d5ec02ba42abefa5db9d00e5e" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00317-of-01024.json.gz": { + "num_bytes": 319286030, + "checksum": "a3e34af81264a72b523b63fdc0268f450675f7993fa0885eb2b4c747b0d6703c" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00318-of-01024.json.gz": { + "num_bytes": 319054871, + "checksum": "02fa8cf278578108083bc9a3c5cf07b0a9d243f2162397091ede6c85a1df31e7" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00319-of-01024.json.gz": { + "num_bytes": 319943810, + "checksum": "93ef0d7f1610043a6f7634af73e89ee9f3d7e87828ad34558a4d688e6fa6b6dc" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00320-of-01024.json.gz": { + "num_bytes": 320037211, + "checksum": "06fbd99a3d64df293db2655f321117f1afcf1cda51e421edef9335a25cb1a902" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00321-of-01024.json.gz": { + "num_bytes": 318584237, + "checksum": "a224e4d902f7368f91d6a72fc9f5730996dc37de576bc2211eb632e3690f1b38" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00322-of-01024.json.gz": { + "num_bytes": 319686632, + "checksum": "57fba28c7104ff659f8a0f330ae89c68d3a392dd14a78247fa357a3bcc8b94dc" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00323-of-01024.json.gz": { + "num_bytes": 319834993, + "checksum": "e61c760cd3c42f71a1a7bb6adc4e0bc970bbf864b69e2a4a5d56bf0a14d4e0be" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00324-of-01024.json.gz": { + "num_bytes": 319243057, + "checksum": "61d21ab1e7729f172ade5ab6c0dcaf07eaeaee6e047ca1c24722c06ddd919678" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00325-of-01024.json.gz": { + "num_bytes": 318569583, + "checksum": "2192a891ecc2a6aa9f6ea64f1d76ce763e0a3963ae03c95275ccd626171835ce" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00326-of-01024.json.gz": { + "num_bytes": 319175980, + "checksum": "d35e4d5f8e924ad97520db51a2c361bbc02097721195932b6768e7460df092a6" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00327-of-01024.json.gz": { + "num_bytes": 319892298, + "checksum": "ce967065d3915d466982b5258e07ad2c46b02d7637057e0547586657ea0f53a4" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00328-of-01024.json.gz": { + "num_bytes": 318004026, + "checksum": "0676d556f46b1f057669d3378c6fc335db6e3ac67a02e11dce3823658730f4c5" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00329-of-01024.json.gz": { + "num_bytes": 319066225, + "checksum": "b00bb4bda957e1287b98c432165448b3899f9155363f7b61bfd0f0181181acfc" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00330-of-01024.json.gz": { + "num_bytes": 319268288, + "checksum": "d14d1883941966ef3b35203d06e6fa1bb485dd77118bd7b6c811b0d06fa72fae" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00331-of-01024.json.gz": { + "num_bytes": 319131311, + "checksum": "4d5d41c2b2242b299fb67fa8c9327db8b4f612bdf4ee9af4d4e45aba8cd1e409" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00332-of-01024.json.gz": { + "num_bytes": 318827508, + "checksum": "68cea08d4805b392bf4c2894a4501ee3fbbe9aac4b1b6533e686ea749ced2dcd" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00333-of-01024.json.gz": { + "num_bytes": 320572240, + "checksum": "06f211ae2fe1c4eef5e41caceda8ebbc289261057911fcf2583a59c730b7951a" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00334-of-01024.json.gz": { + "num_bytes": 318121862, + "checksum": "46c62769e04ce8acde4562ba24d72e245babacdfb50600da4e6217948ad71d24" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00335-of-01024.json.gz": { + "num_bytes": 318692168, + "checksum": "dca69a6976e7387a12c8da16b696ed4f604254693a3280be0f90fa694700b595" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00336-of-01024.json.gz": { + "num_bytes": 319479902, + "checksum": "c52969fad97f1dc0e1e115428e7dad1ac6cb6d804db0cd34f0fc7846b1b50c7f" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00337-of-01024.json.gz": { + "num_bytes": 319987407, + "checksum": "2c570f02aa6a6bac96be1e02663996c87f9a94c160f22101ce8ae1d549ae1de2" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00338-of-01024.json.gz": { + "num_bytes": 319051086, + "checksum": "77132df95b147c471ead74bef16ed4fa11e15209f518dd460110132358816834" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00339-of-01024.json.gz": { + "num_bytes": 319473192, + "checksum": "7f3ac20a72d395c02ed3cb50052821521dc2d8d97303d00e0d0982e2c29e7659" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00340-of-01024.json.gz": { + "num_bytes": 318423485, + "checksum": "d1127da89e960d939cfc06cf1985df415b60d4bf02b12b7fab02b796100feaee" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00341-of-01024.json.gz": { + "num_bytes": 320087690, + "checksum": "f753423f82157e95506566d3653d32af6a181e69ea0e10b4d4eb24b626d3ca49" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00342-of-01024.json.gz": { + "num_bytes": 319767100, + "checksum": "db7410e6a6ca74163098681038f497faa373e1d81434b45c1a2f273d467c0a2d" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00343-of-01024.json.gz": { + "num_bytes": 318389429, + "checksum": "7ea1e432a1ffbed8f4ad6cb985c5cf1b2584d8eb7d2fa091a2db3f104a3f7210" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00344-of-01024.json.gz": { + "num_bytes": 319117212, + "checksum": "c7317a81a6224dec9be07b41134ac7a7db4039b7c98b2061b20bb59b82ed0a1e" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00345-of-01024.json.gz": { + "num_bytes": 318504232, + "checksum": "1498efe8280609d9d66c324e332c9433c6351bb7b99c5891a8f27d6841410407" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00346-of-01024.json.gz": { + "num_bytes": 316721169, + "checksum": "0cbc6b494d653878c9d52a37572064b88356058ed291aa773e5f47259fbfc722" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00347-of-01024.json.gz": { + "num_bytes": 319007736, + "checksum": "6265505e19a42a01a159297d33b1a91cd0e042a31ba6a1a867404a143ae565a4" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00348-of-01024.json.gz": { + "num_bytes": 320167918, + "checksum": "cc8b29deb44c8348aa4d05836f89cbae995c946f38d9cb8e7fedbd4762168ba0" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00349-of-01024.json.gz": { + "num_bytes": 319901226, + "checksum": "2a0f2188b43ffedc8b95a8276c7647147587c5e544c9e6475e790f4b5e362992" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00350-of-01024.json.gz": { + "num_bytes": 318999223, + "checksum": "1fde48c503998872aa71fc524c7408dc84cbc1faa0d885895d5c57708a15fced" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00351-of-01024.json.gz": { + "num_bytes": 318935410, + "checksum": "72d577eabcd814a7ff61b894b3fe9089f483a793e692d3ab20ce4ee59921f975" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00352-of-01024.json.gz": { + "num_bytes": 318655907, + "checksum": "8686dc0e4ff7b35cbc4fa6f3abce50c06f8b95378031c132a117e1d458cb4616" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00353-of-01024.json.gz": { + "num_bytes": 320619683, + "checksum": "cd5816469ef54bfeb0db6b55a78e0d34eb2e1f82448a41f67dfb70061c3ea91e" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00354-of-01024.json.gz": { + "num_bytes": 319352400, + "checksum": "bf082c093423d562da4984b1f0428225d853a05b5f8fb3696273f36ebb5a235d" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00355-of-01024.json.gz": { + "num_bytes": 318868462, + "checksum": "3b8baeca48e55a2cd268d6aef75f7eed96ef10fceca593a5179d52a2b0121f8b" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00356-of-01024.json.gz": { + "num_bytes": 318903295, + "checksum": "4c9a9926a4bad6721807d99cc02a9b6bd28bb0a6254aa1c15527b745c56a06a2" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00357-of-01024.json.gz": { + "num_bytes": 318881446, + "checksum": "84b4c2e05bc162fef4824e97ba7a03b1cecb41eda08a3e0aedd264b66e859a30" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00358-of-01024.json.gz": { + "num_bytes": 318521100, + "checksum": "aee99528ffd0323fe81e4ed26ed1b9295baa2a3910771dd2a42f4f378fd82569" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00359-of-01024.json.gz": { + "num_bytes": 317796778, + "checksum": "7b01f2d5ae54f60c2aeb7b96bd366d21e558e2dac48c83a78df9850f37e02f1e" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00360-of-01024.json.gz": { + "num_bytes": 319502919, + "checksum": "5b54f9a050e6f9008a1806101ea553d90eead56c949a5f3f46c8ccb88812081b" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00361-of-01024.json.gz": { + "num_bytes": 318595505, + "checksum": "49f4164d66187d46adff7f9bbac97b232ab7906d812e571c2e0bf028895e7f47" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00362-of-01024.json.gz": { + "num_bytes": 318851572, + "checksum": "17accad3c0706c54530f128260cacbf986cbbb20427d4ba8d3444a3702a22c55" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00363-of-01024.json.gz": { + "num_bytes": 318555337, + "checksum": "2327866e541aa6aa73f7289c3ad82a19ff154d39657d98cb78a2f481a8765920" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00364-of-01024.json.gz": { + "num_bytes": 318641145, + "checksum": "6f52354d804e8d4a1af1f6c2c6b759ae115c4f23a63f1206a73e7e25acfbdd02" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00365-of-01024.json.gz": { + "num_bytes": 319212614, + "checksum": "8f1834eeacc9bbdee95b1f0a4078eb9488bd1a7c5693489bff7943869674cad3" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00366-of-01024.json.gz": { + "num_bytes": 319336585, + "checksum": "a9cf01b76104eebb4ef8462a924f61c262fa197a7c68a50e48d925cb81586e3f" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00367-of-01024.json.gz": { + "num_bytes": 319161263, + "checksum": "5ac822027d50c3196026fbaffc7d968e1ca702b947688a6f4d268b942b5067b5" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00368-of-01024.json.gz": { + "num_bytes": 317911640, + "checksum": "f9acffbe3c6617e85911ff9dcecec2378b3469ab4546a6973cceb460f9003cea" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00369-of-01024.json.gz": { + "num_bytes": 319585031, + "checksum": "9234553649cfa5265c5a9ccc88486402f88eb81275067c51d9deef16bbe7211f" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00370-of-01024.json.gz": { + "num_bytes": 318345879, + "checksum": "2fbb410346d31a33e8532602f4e3340fcc75c96be803250e9f0f1a6894ca0052" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00371-of-01024.json.gz": { + "num_bytes": 318996184, + "checksum": "b069b0c8a830ea841e82077548706f286308ef0420e163ff6d8312c8853af172" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00372-of-01024.json.gz": { + "num_bytes": 317989343, + "checksum": "bfd62e448d4d9f89353abaa384007b0b72bd860402ade3a9d938051a6446530b" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00373-of-01024.json.gz": { + "num_bytes": 319770759, + "checksum": "e4e176250aceb7362ce38d496556a46409e9872e69f45166afe71aa750de8fcb" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00374-of-01024.json.gz": { + "num_bytes": 319212902, + "checksum": "28aa4510c3ddb9ee0ac56aab3792bfe5e899531919ccc0214a4b68bbf2ba18a9" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00375-of-01024.json.gz": { + "num_bytes": 318968029, + "checksum": "35326b1f2280e07dd754e89dfa29989d0dfa5c78995d393b36a752d8364bfcd7" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00376-of-01024.json.gz": { + "num_bytes": 318685188, + "checksum": "0060dbaccf7f2f956fb8b57891cb176914ddac1bc485dd86c2fd110c46d174b9" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00377-of-01024.json.gz": { + "num_bytes": 319291982, + "checksum": "99fc38654197e506868e099c15b2cb15b93238dafd33f81a7d069b3e01c3b085" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00378-of-01024.json.gz": { + "num_bytes": 319259094, + "checksum": "9b8d97f9d57dd97373c4f57eae2b9c01a58e49017ee41d3969e94fb4dbabc260" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00379-of-01024.json.gz": { + "num_bytes": 320228224, + "checksum": "82913f2d182d2a57f6c93e9b229862cb72feaa6331d04cd4419113e1eb9d52cb" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00380-of-01024.json.gz": { + "num_bytes": 319738339, + "checksum": "e0de43f754ab97d103a02c708d1cd7e771ba079bd9e1f7c532a80a30bd5182ea" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00381-of-01024.json.gz": { + "num_bytes": 319210620, + "checksum": "df74823f78564b544677410508e675e2811905c56afe2a60d19d3e049dd65394" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00382-of-01024.json.gz": { + "num_bytes": 319810275, + "checksum": "f5d5291a695fe2cd228213fa2bf090bf6513c49c6911826aa43ecaefec0622ad" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00383-of-01024.json.gz": { + "num_bytes": 319190426, + "checksum": "a861ae79a66b72d6cd5e0a030daae52cffb85ba1272c36ae2be04a9b7c0287c4" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00384-of-01024.json.gz": { + "num_bytes": 318501845, + "checksum": "b8d0f5078ae82980f0f64120530bbeb20f627be0a8629d68885acb867091417f" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00385-of-01024.json.gz": { + "num_bytes": 319530458, + "checksum": "7da119f3f63e25ff63cacd8ba0d77987b2d576be1f4b86e7e45aa3f2d194624b" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00386-of-01024.json.gz": { + "num_bytes": 318938980, + "checksum": "c21f3de56fab26d7fb60bdb47c216b22793f67b8fa6d382520c79b88d1896f05" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00387-of-01024.json.gz": { + "num_bytes": 319207426, + "checksum": "e28b0884092f75836eed4d73ed24b7403d7b0530fc389386a68887420b0c2603" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00388-of-01024.json.gz": { + "num_bytes": 319835376, + "checksum": "b4f0db632cc9af66e8aea109c80d73a6281207e29ece131d5bf8b57ff8f81262" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00389-of-01024.json.gz": { + "num_bytes": 319346837, + "checksum": "413a8d8df1f6cf3094839b57231da5323f33f7115768c65d83f0af1574f71b6c" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00390-of-01024.json.gz": { + "num_bytes": 318632301, + "checksum": "a3e8664fbb3ec2af5a217225dbb7fcf3e93b427e5da1a88e35c04c319d61e4c3" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00391-of-01024.json.gz": { + "num_bytes": 319066082, + "checksum": "e22eed3415c90510e97768be5a685e0a8035e2635ef773c56e9ce2718c278658" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00392-of-01024.json.gz": { + "num_bytes": 318356286, + "checksum": "ddbf325390648d9d86f1e7901b75c99fe8db538d203de8dfb4c304282f82cd74" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00393-of-01024.json.gz": { + "num_bytes": 318048288, + "checksum": "974fd05f356c86be2f9109b0272eee69c5b2eaf0b16104cc573846c925d13b4b" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00394-of-01024.json.gz": { + "num_bytes": 319444683, + "checksum": "0d27d6f8c3b935cef23ea60abfa82bd6a4f5e2e061080419dc9c6bc455b9f868" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00395-of-01024.json.gz": { + "num_bytes": 318353166, + "checksum": "24d9956bd857484ffbabb3ba6f6ac688f48a94b50228238c7c9153a5c6878a7c" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00396-of-01024.json.gz": { + "num_bytes": 319960396, + "checksum": "9425f4f18e1690ded866c4b5313cbac8a6210092dc42f720200b7143b69eabe5" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00397-of-01024.json.gz": { + "num_bytes": 319030577, + "checksum": "dee166674b835b9849d281a87238aa136e14d26edaa72d0ecb6b7e82d556a72e" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00398-of-01024.json.gz": { + "num_bytes": 317664320, + "checksum": "f85e08272f73ce4aa602719d59205db54d230a6b7247830d78f91eac63d753be" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00399-of-01024.json.gz": { + "num_bytes": 319623875, + "checksum": "85dea0672a0362a08503b70623907c8c92bd105f788fbd7f3816212a9181e7c5" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00400-of-01024.json.gz": { + "num_bytes": 318840274, + "checksum": "a104345698500611cd1a71a6647555300d315490918740a8c6e3b8dcff315407" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00401-of-01024.json.gz": { + "num_bytes": 318336377, + "checksum": "808327d156e183e102fd75cfbdb7b5a1fbde3740168f59b767ea380608305b67" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00402-of-01024.json.gz": { + "num_bytes": 319270185, + "checksum": "b6a5f7c1ade628091fe86744a6011147ec32795ad694ccbc82929791b93aa307" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00403-of-01024.json.gz": { + "num_bytes": 318038520, + "checksum": "108904ab05b3ad23318f8aa0f7ddd00d97aae1872fb157eea73273e011cbec04" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00404-of-01024.json.gz": { + "num_bytes": 320933185, + "checksum": "cd0c068c0831218849149eaab8f8a98748823911c745ca0ea33ae839bd625e04" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00405-of-01024.json.gz": { + "num_bytes": 317694827, + "checksum": "d99909ccd59e2ec183b41a7c6d1bd5677798bd7fd784ab681546a7bf8292f353" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00406-of-01024.json.gz": { + "num_bytes": 317937468, + "checksum": "c7f2bd7a366b8c389e41fdfad4891068c86039e1a5fc3b8a0b993253badf33d2" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00407-of-01024.json.gz": { + "num_bytes": 320226074, + "checksum": "765db6f9f0c8c3d9bbb0499f0010928fe4f90d5915dfdd3b6d09d3dc78ad07a9" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00408-of-01024.json.gz": { + "num_bytes": 318613788, + "checksum": "165e78c858dfaf010307392474d4917846c9d21658558912e5ffc915803bd2fb" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00409-of-01024.json.gz": { + "num_bytes": 319212414, + "checksum": "5f7d5952aad1ae31413962983971b2b422d77c262ededd2ce1c1e186aeb6d87d" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00410-of-01024.json.gz": { + "num_bytes": 319023647, + "checksum": "24588d41f40e3fe389575b97d41ef761be46bc9a9b3965c5e3f994760f7a4070" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00411-of-01024.json.gz": { + "num_bytes": 318408922, + "checksum": "b35d4ada5a000f51169557b00e508706d51a7becd33370014ff07c8b8dac1af5" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00412-of-01024.json.gz": { + "num_bytes": 317166932, + "checksum": "d3ed1cae269ebefe4716843bd7954bf7e44ee889f72066afbdcd95f4e1f06703" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00413-of-01024.json.gz": { + "num_bytes": 318519121, + "checksum": "07fc61a7e164301113201e78c99d40289d88e0b463048e14aa5fe69c7490ccac" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00414-of-01024.json.gz": { + "num_bytes": 317417235, + "checksum": "c5a7222b2eb8e8fe690f29a0fff7e214ba94e4d9dae62f67281fe25dd385b721" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00415-of-01024.json.gz": { + "num_bytes": 319690993, + "checksum": "37052fff729bdff124577d5ba041906b2ea7420c5cb28195e6cfca0e41d560c8" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00416-of-01024.json.gz": { + "num_bytes": 319466518, + "checksum": "6e8ce2b9e6e8208ad7e43ce709454cb0b96572d793e0b11c15892f5df18f6137" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00417-of-01024.json.gz": { + "num_bytes": 319694381, + "checksum": "20892d7a33c31d7967ae0cf595a2108de96a61c0bbd773aebc5d3d083f6ed93b" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00418-of-01024.json.gz": { + "num_bytes": 319048918, + "checksum": "fd795ae8d53e632bb3e89a2becc5b801e10db781b14f2c0ed50b12def5376c8e" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00419-of-01024.json.gz": { + "num_bytes": 319791424, + "checksum": "5a8e56faaa0892249e5694ae01e2e4dcd22d9750a9aeea5ca390117c77b8de2d" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00420-of-01024.json.gz": { + "num_bytes": 318060925, + "checksum": "795ee64f4c9e2e35d9dc0c91ea593c9e41a3924162901fbf782dc7112f8094a8" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00421-of-01024.json.gz": { + "num_bytes": 319328927, + "checksum": "2670b7b6b53e9082c90e4a4e915f72673831ff15e9f55918a1244e0c19c8f963" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00422-of-01024.json.gz": { + "num_bytes": 320065363, + "checksum": "34df2d1afac2ae4699524492d6b93e4a2a1e551cb4a4ae35fc19353930afab8b" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00423-of-01024.json.gz": { + "num_bytes": 319349887, + "checksum": "a2b19afafb45cf30493ac2a3eb013e136e7213f63bd633374ca0d9fe2780efe9" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00424-of-01024.json.gz": { + "num_bytes": 317515288, + "checksum": "ec2a84fb16dd16f9547f0c3314a91968324f2c537118ca36e982b235e23527ee" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00425-of-01024.json.gz": { + "num_bytes": 319092219, + "checksum": "1ac0b93c0faae7d446add3af3173637a4b0d638dbd5285b0f4e1bf3abd0d1542" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00426-of-01024.json.gz": { + "num_bytes": 318421245, + "checksum": "bade501dc71c0b4968a9a7c833751cee5d8f7067a45dabd53aa03534df48886e" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00427-of-01024.json.gz": { + "num_bytes": 317847935, + "checksum": "7aef554aa2b120c4d787395e28aceba743e309f2540fab283e077a1429a2f7ef" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00428-of-01024.json.gz": { + "num_bytes": 318822008, + "checksum": "cd94547fe1953a1cc074d97558a70d1e55834606379a8f5e6e60e1b15b56fd35" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00429-of-01024.json.gz": { + "num_bytes": 318507684, + "checksum": "4d3c9245565a808058293558603c657d6e9a0c87b6d2d4b871b856cea2eb3a19" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00430-of-01024.json.gz": { + "num_bytes": 319042136, + "checksum": "9c5a4fe50db5d0822923fe29a5aa8ca6cb09e3629472b1bf61f670388b6c2076" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00431-of-01024.json.gz": { + "num_bytes": 318925124, + "checksum": "8f18b35bb952da090ade742753e30861ba39c6c54c8ff2d76b358ca7be475ed6" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00432-of-01024.json.gz": { + "num_bytes": 318680251, + "checksum": "7968c370d0efa4601ab8b5ee68e480b211fb969593608bf7e00a0153f00f99b3" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00433-of-01024.json.gz": { + "num_bytes": 317822797, + "checksum": "f62d7e74434d52c36b22f6a8cd56ed3937ed6aa03f140d0fbdf5e360632d51fe" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00434-of-01024.json.gz": { + "num_bytes": 320094364, + "checksum": "55d7678c7e197e165b4e09bf3f8ac159853120acbe5801ed6ab3ab0f801c11bb" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00435-of-01024.json.gz": { + "num_bytes": 319008936, + "checksum": "09b451c8ee06bc06507b3e75a60c544a6b70f27e3d07daa29c59803f785faaf5" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00436-of-01024.json.gz": { + "num_bytes": 319023456, + "checksum": "6fbcb93f9dfe65e12b7efeecc8af7823471787438b1ce90e5f48b68b2dcb1d14" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00437-of-01024.json.gz": { + "num_bytes": 319484997, + "checksum": "9e70c8c1ccbfe93ec9296811ae496a518dcafbf38c81b7972f885e297da9e726" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00438-of-01024.json.gz": { + "num_bytes": 320319141, + "checksum": "eaab759d8c603e8a2ad3ebacd99e30338fb904ba307aeaba0d2e0e63679cfadc" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00439-of-01024.json.gz": { + "num_bytes": 318410397, + "checksum": "7a03a92bf97b6750941c1070f933c68f1b2a3e13fb68b3a21a4726676ea75d34" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00440-of-01024.json.gz": { + "num_bytes": 319447470, + "checksum": "bc899e436da7b3bf13c1bfa2fd2bbf9d90b42a0c00f2971259a14d858ca3e5ef" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00441-of-01024.json.gz": { + "num_bytes": 317582955, + "checksum": "4d777860c2750e43038ef709d77bdc403b3b3bcf0f08e3c4562952c9ac70b113" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00442-of-01024.json.gz": { + "num_bytes": 319592118, + "checksum": "d9e5dc244bb6f0b629b2a929aedf506dadaf5eacc80f0997816b95279552fe8d" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00443-of-01024.json.gz": { + "num_bytes": 318104403, + "checksum": "56133bbd7cf96dbe87d48898b886a024af69ca405d7cea1799bbd30f185e9c1f" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00444-of-01024.json.gz": { + "num_bytes": 318547808, + "checksum": "8be0270c3cc96dd7f7b3aad08bde81ea245feff4a09923277fb0d38a7c095604" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00445-of-01024.json.gz": { + "num_bytes": 320463920, + "checksum": "e02316fcd355914e4d08ecf37036d4727ae9ebe45bdc5c98279aa3437c2c1eb0" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00446-of-01024.json.gz": { + "num_bytes": 319583221, + "checksum": "80c9b8c47665b2cef6c291b0eefdac5b14be1d7cd4a4c06c2e14cf48b42da92d" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00447-of-01024.json.gz": { + "num_bytes": 319546881, + "checksum": "a18d5aaca1717ec33fb1822a633268003bf88093dd7b48db080503c3d01b6ffb" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00448-of-01024.json.gz": { + "num_bytes": 320234711, + "checksum": "c41595d2b9cbf0e23fd65df1cb51499ee262d345d79d2625388cf149c3c39f8c" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00449-of-01024.json.gz": { + "num_bytes": 320043698, + "checksum": "3bef99334be9d39f41296f8f134c88f04fe66502da2d2639f0d6d2485338e607" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00450-of-01024.json.gz": { + "num_bytes": 318033740, + "checksum": "9cd05b1b70ffc3c004b4b4a2f21f91abee1395f3a485efd1aafda550193df9fc" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00451-of-01024.json.gz": { + "num_bytes": 318549622, + "checksum": "b2ef6cc4ac7c4c69fb1661d7ed9b2ce4da261c72f9e49dc3c934180501ef3a24" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00452-of-01024.json.gz": { + "num_bytes": 319317230, + "checksum": "89927f1fd79a5b1439988fd37e0377175176d9ed22d14611f67a81e185a336b3" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00453-of-01024.json.gz": { + "num_bytes": 318952561, + "checksum": "427f55bbcfb6c1a0ef12f96cb122f362b975169770ce1d392b763c4b4408cb34" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00454-of-01024.json.gz": { + "num_bytes": 317545286, + "checksum": "2fc3b172ea721bc92b0f7614e8fea61b0781e6f4f3e6b7263cf0190beef3ec52" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00455-of-01024.json.gz": { + "num_bytes": 318975631, + "checksum": "c96f688ecb19bdb1592b0124021fb80d48965303442de76751d82fa03ab8f6d5" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00456-of-01024.json.gz": { + "num_bytes": 320016575, + "checksum": "61d2be7a4b9e34cfb994ae2c120ed5a51a6669564046637445a46b9872812416" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00457-of-01024.json.gz": { + "num_bytes": 318236935, + "checksum": "a74dd51c3c490458ea0e61196d7e0085aff80d50cd149a673f54f661b364a671" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00458-of-01024.json.gz": { + "num_bytes": 318495925, + "checksum": "adf9cd717f2c79504dace22b5929d4c4064353e869457c20cc81a0b2db390c89" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00459-of-01024.json.gz": { + "num_bytes": 318956821, + "checksum": "d7be5bcb738a75586125e56a25aa234618528accda620eaac421beab6288b992" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00460-of-01024.json.gz": { + "num_bytes": 318968681, + "checksum": "6181280df5418fd9ebb52aa26a631100b6c3da0750dc5fbae152a6a44fccb942" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00461-of-01024.json.gz": { + "num_bytes": 320810761, + "checksum": "5e943c458674371dffb2466274b8f2a9df9902a370901ef97992bdf920cdae0a" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00462-of-01024.json.gz": { + "num_bytes": 320154899, + "checksum": "76b3d1b120cbb7cd71d004440e0c6bd9f9c4395424c568e8362973038017a90c" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00463-of-01024.json.gz": { + "num_bytes": 319247449, + "checksum": "9de2c86d85289113b24c2f7eb4771ec1391511930f5f26a12133d41faf0ce908" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00464-of-01024.json.gz": { + "num_bytes": 318150152, + "checksum": "85fce3104ef0b247798c1de8d9d616d3de754841fb6c49a01cca5b9da5efa94e" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00465-of-01024.json.gz": { + "num_bytes": 320342803, + "checksum": "ddf312f0b8de8f53ed556483fd998ae308d4829d18195a48869db6bf1866c332" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00466-of-01024.json.gz": { + "num_bytes": 318619029, + "checksum": "01239a1ff6ffe9032da320c5a7d1a93125d0724851e3e10746821c9452070887" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00467-of-01024.json.gz": { + "num_bytes": 317677227, + "checksum": "41783d20189a4bcfc33f543597a5473900e692ea13fa522f2724e27e810b4e9c" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00468-of-01024.json.gz": { + "num_bytes": 320038217, + "checksum": "7131b6f4dd423f2efe55c3f598893676300b31651cce7eed32ce633a015f8ca8" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00469-of-01024.json.gz": { + "num_bytes": 318359701, + "checksum": "925bc76c045f25532414f29820adb0cf1a56c54b406333a6f348c29e5efda9fe" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00470-of-01024.json.gz": { + "num_bytes": 319329235, + "checksum": "9be740483aa7bbaf94dce550f2c20404c89326f6ec4ebe1b7070f85f93507038" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00471-of-01024.json.gz": { + "num_bytes": 318792779, + "checksum": "0e3d9492f15dc9867bb0dc803bdf45608fbe67255014b4488902d7bf2e2554cc" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00472-of-01024.json.gz": { + "num_bytes": 319552622, + "checksum": "00484bbc10bace3dfd93b57fc53d6f5fac26b7dd54fd5b5428d75eb9e6dbb0e2" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00473-of-01024.json.gz": { + "num_bytes": 319466828, + "checksum": "5db5d585798e8ed8e4a3bc540871f1185f67125f397a12942d21b24e6b374519" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00474-of-01024.json.gz": { + "num_bytes": 320014669, + "checksum": "db07fd0e972c1a474806c1b4464ad4cefdd2e8fc15806ba0d259d4f9e594c3f1" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00475-of-01024.json.gz": { + "num_bytes": 320379280, + "checksum": "e6e36a9eed8be84c928980fffd8177b177182726c9e13b41a47343d431f76a7b" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00476-of-01024.json.gz": { + "num_bytes": 318820301, + "checksum": "0543ed2d0b3aaba0b0fccbf0311836143bd19175c5eed9bf0f024ffb9ce3c50a" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00477-of-01024.json.gz": { + "num_bytes": 320577830, + "checksum": "a62fd62ad771dbcfb7af73841e15a49e9d7239c53dbbbd84de2282131bca9c99" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00478-of-01024.json.gz": { + "num_bytes": 319593908, + "checksum": "beae9334a8e93e4b036c4a9b3c5b3a75fff17264177184d243d9e6da286dbe2b" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00479-of-01024.json.gz": { + "num_bytes": 319728825, + "checksum": "ae5b475c7be35d98b77d6c4aed5d61cbd1c98544c9a6e73a53ef2911757ab7f0" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00480-of-01024.json.gz": { + "num_bytes": 319903674, + "checksum": "51e0611378455d909e8b0f292eb62038848aa7afaa4f93c9c83061258b211a95" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00481-of-01024.json.gz": { + "num_bytes": 319998409, + "checksum": "68c640304ac952f544ea88c88d7c994c8d2955b95036f8352a67b57a836fa1bf" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00482-of-01024.json.gz": { + "num_bytes": 319047238, + "checksum": "74cefa57158d0008a06ae85b2a7a1c04d57a79b7ae3f7b4b3426dbe9918b36ca" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00483-of-01024.json.gz": { + "num_bytes": 318775875, + "checksum": "e99faa71222017521f1fc9999bbb0832df5c91f8b9f6e2ef501d3f827d3a1e85" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00484-of-01024.json.gz": { + "num_bytes": 319190491, + "checksum": "4518faae7c9d51a51f0b02cd895cf27e7c87a623b787346c844a8d9f0b52d6ce" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00485-of-01024.json.gz": { + "num_bytes": 318974502, + "checksum": "1bc8b207583b9f36169e0e9facd258de8eb73dee8bf831051dd1ab04b7726c6f" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00486-of-01024.json.gz": { + "num_bytes": 318599424, + "checksum": "0b1d9900e1921483b85305491f914b6b78fabcd0686a20695e61b89b7380a894" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00487-of-01024.json.gz": { + "num_bytes": 318958015, + "checksum": "c0c789c5f3b34d170d2aeb72642c70d2fa5eca567e7850d0c89b3d170f3bbf64" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00488-of-01024.json.gz": { + "num_bytes": 320205671, + "checksum": "6eef7a1ea80be43e84cb0c974215a477c909844899ac694afe1af2e8f4ac171c" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00489-of-01024.json.gz": { + "num_bytes": 319193967, + "checksum": "eccf5d7f682a76e11332f07e7d54a080f76c0be58a98a853a9fe90c815a22087" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00490-of-01024.json.gz": { + "num_bytes": 319833603, + "checksum": "afe99e32ba36134f23b59a2ee43965bf185432de947740fc19e26eef41027aef" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00491-of-01024.json.gz": { + "num_bytes": 318912982, + "checksum": "e981151b23b233bd3e5798f78658b5f52a73f69db39c30615f615069cf0c4984" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00492-of-01024.json.gz": { + "num_bytes": 320057824, + "checksum": "0cc5f7df318e0718fef93d24e7ff904b3e8e2728c4fc0b1d13893c81d8e6e2c7" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00493-of-01024.json.gz": { + "num_bytes": 317967559, + "checksum": "93749543b04a5a7093177d2a03acfc0bf6f26d5b53864ae35839a9421fb48169" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00494-of-01024.json.gz": { + "num_bytes": 320426917, + "checksum": "e461f56b461a4d5ce353c60889dcb99e10818985d3788440c6119bb145876277" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00495-of-01024.json.gz": { + "num_bytes": 319528392, + "checksum": "e530f3030ddbf7191bc4082e8209f63eb48733d7085d79a8469ce3611ccb79b9" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00496-of-01024.json.gz": { + "num_bytes": 317570766, + "checksum": "ddec34b528bd5314019d12089e600df27e781d78f43b6722b9c0202ccf385755" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00497-of-01024.json.gz": { + "num_bytes": 319154838, + "checksum": "e7438a08000fc7a158f887755cc496edcf51c8bdf2bc4a888ddd2c829bf8fa3b" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00498-of-01024.json.gz": { + "num_bytes": 317955368, + "checksum": "ad133d808ca5b6181bae1921ab1261d79630c09bf9d6c904db036f22e6f32e6c" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00499-of-01024.json.gz": { + "num_bytes": 318286671, + "checksum": "cb40879ea08db5a9eb6f2c23756574bda34deb9acf039b992f0ab90fdbb01594" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00500-of-01024.json.gz": { + "num_bytes": 318510936, + "checksum": "21e5f7468a907f38c3dc0a5c19f09921476f9186beff967e829329f191dad6b0" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00501-of-01024.json.gz": { + "num_bytes": 319611074, + "checksum": "38829434c8539bb9fa9ea32bfba3c6732c5021ffb60c16fc502fe61de83906ce" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00502-of-01024.json.gz": { + "num_bytes": 318630954, + "checksum": "22d1ca1edae179d2587495fcdf1d3e515c6f547cebafc54996c93a121731fd8d" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00503-of-01024.json.gz": { + "num_bytes": 318253198, + "checksum": "e95689993390086880e630ec4540e0629551076c0cad2c70f5aedd3aebfec181" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00504-of-01024.json.gz": { + "num_bytes": 319497151, + "checksum": "0cd7b986d247e010fd76fa2ab2b62d5f9eec292b28c1e7bd3e4c577042b598af" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00505-of-01024.json.gz": { + "num_bytes": 317498965, + "checksum": "f1504912fc53cc3690e26ec3babf736ddbeb8f7d9196dac83f757699310b30ad" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00506-of-01024.json.gz": { + "num_bytes": 319684193, + "checksum": "9f6defbac132e097cbf7cb7d181cb154bace6af48964fe09d111bc610fdcd2bc" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00507-of-01024.json.gz": { + "num_bytes": 318394726, + "checksum": "a58f39d0bef19abefc089342d8bb6d75dbb2c663f67127673ec395404bcf15ae" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00508-of-01024.json.gz": { + "num_bytes": 319013108, + "checksum": "176443b39840826bfb1db2cef2541449a6fd0c465ff9bbf0cb2479f07fb8baa8" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00509-of-01024.json.gz": { + "num_bytes": 319832758, + "checksum": "cce5a142cd7a121eba8c182d499442f4b0a397ea1484c33ccd79b1acbae832fb" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00510-of-01024.json.gz": { + "num_bytes": 318762241, + "checksum": "bfc910625f0fd6074955906bb86e789b0d0adcd1f8956cb8da276933dceac256" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00511-of-01024.json.gz": { + "num_bytes": 319240643, + "checksum": "ce53021b90d1c86e2d46293e7053aa174387d7408bf0cf907898be69b1a7befc" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00512-of-01024.json.gz": { + "num_bytes": 318353376, + "checksum": "e9333c6f73c30c9cb7f31794025eb9129455fac2edd64f8b3f22f879124c6a85" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00513-of-01024.json.gz": { + "num_bytes": 317653011, + "checksum": "d9450c6f541e82922b37d3b7cc25611707b44884f27825db4dbd65466b59e8b5" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00514-of-01024.json.gz": { + "num_bytes": 319391160, + "checksum": "20b77f5fc2a939fc291f901e8774acfbf04ffaacb08192b724673eadc9f83c12" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00515-of-01024.json.gz": { + "num_bytes": 317994258, + "checksum": "32ca1f60d0deb395538a93ce5044a48fde05864f2c26af42dc53405b6dc05031" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00516-of-01024.json.gz": { + "num_bytes": 318786801, + "checksum": "eba4f34749eef4da2b0729abbdfa2ada77bd65383c01213d4f86625670430a65" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00517-of-01024.json.gz": { + "num_bytes": 320010732, + "checksum": "617765f971b879182db7debf879025f8dad4fd8846b11728ee1230767c031c04" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00518-of-01024.json.gz": { + "num_bytes": 318681019, + "checksum": "6987893764c56b84fca014532824a05d4187db5c313be4f7bdcb363b7e8cc8db" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00519-of-01024.json.gz": { + "num_bytes": 319951543, + "checksum": "ba151c4734db52e7c220dbefe380825ac6d66a9c6abb901b8096a87d97a2deb5" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00520-of-01024.json.gz": { + "num_bytes": 317948056, + "checksum": "7e53ed26c3c068b0dedd026219b7cdab79775545ebbf31b5dadadb45364c9985" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00521-of-01024.json.gz": { + "num_bytes": 317993802, + "checksum": "4d1d4a5583430e373bd2cfd191e59cd8911953fbd73fa924e0c15be76499b54b" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00522-of-01024.json.gz": { + "num_bytes": 320189449, + "checksum": "71d851498785e312acf93861a43169794d4d576f5fe8b960303419316c8c898a" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00523-of-01024.json.gz": { + "num_bytes": 320443871, + "checksum": "587867d619115c2accb69322b197239b79f12de41ae80427fd369813ad8d81af" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00524-of-01024.json.gz": { + "num_bytes": 318192840, + "checksum": "7324c02db00b06d0f41d6e5ebfa4e4dd6554f5f4849d6de187ebb84162d0446d" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00525-of-01024.json.gz": { + "num_bytes": 319294602, + "checksum": "24ae3495e5b59883967c62b8fb3a4fa7525d33c40957fd5fa3be413d66c24eb5" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00526-of-01024.json.gz": { + "num_bytes": 319783465, + "checksum": "27cd95e7bc6a3f156f1f8f26dc5e490818fc4810562e3964a19fad401cceacd2" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00527-of-01024.json.gz": { + "num_bytes": 317240081, + "checksum": "6b84920fe7e28c01a03800512915c7a9e47816267ac652f9ee0314e3428bca72" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00528-of-01024.json.gz": { + "num_bytes": 318320694, + "checksum": "fec06589f714ffe1343cb6781898e29e5d0cb789deba3aa4a4ccf86514d3f690" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00529-of-01024.json.gz": { + "num_bytes": 318391515, + "checksum": "a98c34c04c1b6f0ca3acc9e10fdf4bd0ead2ea7271832ce4972df8677590918b" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00530-of-01024.json.gz": { + "num_bytes": 318473966, + "checksum": "1677d541c7bc10971c711f1eb030faa2e85e0967112ba57d7f04712908e4f040" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00531-of-01024.json.gz": { + "num_bytes": 319463272, + "checksum": "92b5d82a058554d3396a2b54504f45fa88581cb2951140c0f0bde67ed11bed0c" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00532-of-01024.json.gz": { + "num_bytes": 318228175, + "checksum": "291bb3d7613f7f00b6910a0de78dbab0d87602243c9c83014de341c131200853" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00533-of-01024.json.gz": { + "num_bytes": 318966937, + "checksum": "a0ce39eac6d6ecad3478373c264e88b2ea20b77fb2049537c229ad3da2769c85" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00534-of-01024.json.gz": { + "num_bytes": 318968162, + "checksum": "387db79d4aacf8fa4c512fb78023ff94a43d5d597d5a8c2ec6198e62e4b8c98b" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00535-of-01024.json.gz": { + "num_bytes": 319253588, + "checksum": "3ff8f4a926fdfb6201a94d75c17ec5afe662a339a65019eb5e1193c1238bd388" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00536-of-01024.json.gz": { + "num_bytes": 319662526, + "checksum": "0c805e83d8cfd979701df5714713d062e14853d7e2b0f77c0b414a626686cd33" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00537-of-01024.json.gz": { + "num_bytes": 319177095, + "checksum": "f9a0ac216e316075e5c2219449a954f989eb160ead2ca07ac9f3813274e18f2e" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00538-of-01024.json.gz": { + "num_bytes": 320109104, + "checksum": "a425ef4dddefb40bac5a8cd3191161a41737aea5088a614410d10d83bbab5e37" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00539-of-01024.json.gz": { + "num_bytes": 320600564, + "checksum": "3580ea8da9c4aff1296e89136c5d7f1a37d021e0b10f3ebd1e05612c092faebb" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00540-of-01024.json.gz": { + "num_bytes": 319993281, + "checksum": "ad8dc83bfbe7c8976f08708c5f0229cd4e1a2d80e272b225a8d208133b129dfc" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00541-of-01024.json.gz": { + "num_bytes": 318256020, + "checksum": "c7452669237323fdd09ce97624791a0261f3ec07d8a5f98e71a4b1252a2805e1" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00542-of-01024.json.gz": { + "num_bytes": 318843744, + "checksum": "1e5a11c25f82ce717302dbcd9acc1f8b916d83eca88d345d8434b1f88768137b" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00543-of-01024.json.gz": { + "num_bytes": 320482002, + "checksum": "bbf96edf50c913d5162ee154423242e7c8faf490ba229f325bac98a5e3eb9477" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00544-of-01024.json.gz": { + "num_bytes": 319059260, + "checksum": "22c04506b5744df8c71727fc6527fa2bc495a10a237c71762c66d09625d34097" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00545-of-01024.json.gz": { + "num_bytes": 317874034, + "checksum": "84a78bb62eb6f72de7a75325870d9ecd419f77c4f6728d29609b2f7ab1b8bcf7" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00546-of-01024.json.gz": { + "num_bytes": 319891407, + "checksum": "28631c527dc398c9626fc60b39ad94ed880b41c71f55b9c7c670f6a1837f98d8" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00547-of-01024.json.gz": { + "num_bytes": 319361268, + "checksum": "273b8598405def0165ceaf9723d1425c9b74368fc22a414616c7ac9327930225" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00548-of-01024.json.gz": { + "num_bytes": 318360761, + "checksum": "59990568c0ea055fab27f2b9cd028e1c7177df0479712d1e2d8372e9b017ccad" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00549-of-01024.json.gz": { + "num_bytes": 317320452, + "checksum": "fd1e361f28cf099df6088e26d06d79f7f62bd8bd89b4524b9baa80ea49a1a4a6" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00550-of-01024.json.gz": { + "num_bytes": 319017444, + "checksum": "4424833afcb143f6fdbfc2f5fa2508d6226a4a1df391969b2a751d2d0070158d" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00551-of-01024.json.gz": { + "num_bytes": 319118159, + "checksum": "77b78f94a8bc8f905cf8b1997df1fc3b8c6d77ce65fc28bef68c6083275a832b" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00552-of-01024.json.gz": { + "num_bytes": 320058125, + "checksum": "e7b71167c4ad947232b6acba26e4d3cc9214c25b50b853b5745333bba942f50f" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00553-of-01024.json.gz": { + "num_bytes": 319220671, + "checksum": "ce7891f3820ce065e3bd7afa006e90889428c80bd8e771d66fbbf023bb2a9eba" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00554-of-01024.json.gz": { + "num_bytes": 318858928, + "checksum": "015a707235f46f179a08d3f6674b6d368dc9612841e2bf39f700f11fef8e64c7" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00555-of-01024.json.gz": { + "num_bytes": 320490725, + "checksum": "041dd2e902ed04dfa143476da03d5fd00c30ce1259c0658150af5b77a5a092c0" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00556-of-01024.json.gz": { + "num_bytes": 319863694, + "checksum": "22e3d9e4dbdf2b1b822a7bc8c889f4747aa16c71f4c91436d028a228bffe4b87" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00557-of-01024.json.gz": { + "num_bytes": 318940362, + "checksum": "4cb8b113ad9687b7dee590242c5f50fb3ea3a8775c67492a8ce0cb5c15fc26d7" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00558-of-01024.json.gz": { + "num_bytes": 319797786, + "checksum": "ad157a34c6a8d496859f55b00c79fcedf7305d8502ca86a511026f39cdcaca59" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00559-of-01024.json.gz": { + "num_bytes": 320156705, + "checksum": "816d84753b71fae446428587f41de5b3490e88321f1fa0cfa2ef1fd5eef851e5" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00560-of-01024.json.gz": { + "num_bytes": 318346216, + "checksum": "0b1b3d26316f2c0e973ff19820793bcfffa957c3869f74f62fb40cb6839227e4" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00561-of-01024.json.gz": { + "num_bytes": 319571572, + "checksum": "4f92594382c897bf94211f1446dbb38c2cc1fff3647acba731dfe0ad89ba4061" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00562-of-01024.json.gz": { + "num_bytes": 319453711, + "checksum": "2a6ba0c64806add776081f417c8d1afdb324dd8b9aebb603372afd7fc2c4cd6e" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00563-of-01024.json.gz": { + "num_bytes": 318990092, + "checksum": "e3032365b9b86883c24bfe387d810c2d9fd1d0a55ff88acd1f5b5357246b13ba" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00564-of-01024.json.gz": { + "num_bytes": 319491917, + "checksum": "da6196ab8650fc9f8fa391b821ff070070946412277bd423c40d9fa1de325f93" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00565-of-01024.json.gz": { + "num_bytes": 318756269, + "checksum": "edeb5b13aa0d65354d78a5ca5d1698732e95f1fcba249c42825a0351d4a34f79" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00566-of-01024.json.gz": { + "num_bytes": 318461036, + "checksum": "f179addbca50d8612612b0e09138d7ecc89ba7ef2d6e857d7ef0b10223dc71d4" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00567-of-01024.json.gz": { + "num_bytes": 319625728, + "checksum": "eaa1d0ee28eb17c6ebe3d85c8af8b7adac28a720b2975f86ac83f3f4d2bffbcd" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00568-of-01024.json.gz": { + "num_bytes": 318428567, + "checksum": "3677e88545f2d76b601995cc3e2b6b12fcf65e350ed7eb4137ab4beef3d475c4" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00569-of-01024.json.gz": { + "num_bytes": 320114923, + "checksum": "2d8810d8bcfc0fc19d82313be6516b2fef4cf68f56b0448af48b512c98e1ae8c" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00570-of-01024.json.gz": { + "num_bytes": 319148416, + "checksum": "8e5356dc0fa2b4e5fa16b36a1586f16920306af1227c765e5d2f0818e74d30d2" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00571-of-01024.json.gz": { + "num_bytes": 318223973, + "checksum": "c87cf8b88e8e4fc0a664f4b3a381b78b317680253a83a672cb86e02adb43f2aa" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00572-of-01024.json.gz": { + "num_bytes": 318322508, + "checksum": "2bdc857dfeab99c8f83f0267ed5ed7529bca8ee086fce268534bc0264ff738f6" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00573-of-01024.json.gz": { + "num_bytes": 319203246, + "checksum": "564fc77dec25ce0d47f4e3d8d04bf114dc06119b28b3ab00d6092a799d496e51" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00574-of-01024.json.gz": { + "num_bytes": 318397937, + "checksum": "dc3f206e1b5da963184da72e47959844bb164335c76e3261f3a189a4b7b022cb" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00575-of-01024.json.gz": { + "num_bytes": 319183651, + "checksum": "7f0c46955e37d5d52b305f71b4ce4fca5368d72e8698e8b832ac0177f868e145" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00576-of-01024.json.gz": { + "num_bytes": 318690625, + "checksum": "b37d0fbd439bdc05021a71c192ce5e61ebce27448a17819bb53156d9d5f27e17" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00577-of-01024.json.gz": { + "num_bytes": 317926085, + "checksum": "3092d1ad70fb2d262ecb33f3fb6ea554af3ddd26498ba42b644c383f6d4bd1a4" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00578-of-01024.json.gz": { + "num_bytes": 319190472, + "checksum": "d9833fd591a618a167b31b7aaca420f3e719ded98987dbc0f46fd4bfd12564c5" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00579-of-01024.json.gz": { + "num_bytes": 318958744, + "checksum": "a11217af10c85ad828de38847eeddcde6af6899563585d581c20adaed3c9e7dd" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00580-of-01024.json.gz": { + "num_bytes": 319893900, + "checksum": "71e8be705bfa8563e33392d1c14decd84f52d6a0139b98344f1a0ed9bdc94198" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00581-of-01024.json.gz": { + "num_bytes": 320109861, + "checksum": "c5f13ba973803ef069762d22bc37ee02a4348af379c75848d93b2685fc4280cf" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00582-of-01024.json.gz": { + "num_bytes": 319238177, + "checksum": "da815527ca68b5c2ed604d00ccbcc7c631c60f33e3132f79212634a82c266844" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00583-of-01024.json.gz": { + "num_bytes": 319375634, + "checksum": "a332b791df0801f0b7227117f0ea3971563e8e420ae24dd94b38d532c1ab0573" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00584-of-01024.json.gz": { + "num_bytes": 318596018, + "checksum": "e6496d31f42921eaf9f85047e7c2eeb5fef46e01e99760fa676da96481d7d5bd" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00585-of-01024.json.gz": { + "num_bytes": 320156294, + "checksum": "08b978ec05d65edd22c301ddc6ab44174eeb7bef5c5997a84342b6faaa47a79b" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00586-of-01024.json.gz": { + "num_bytes": 318716838, + "checksum": "567ce600ad99e543507fdf27b9009fe1782bc867f44f3dabbeb93fab1208f337" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00587-of-01024.json.gz": { + "num_bytes": 320247814, + "checksum": "8f5c82f5eaac4a315d8615c9700cd81f3b9c2e1a17376d3b2482f8694dfe2492" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00588-of-01024.json.gz": { + "num_bytes": 319546079, + "checksum": "bae91422f87091b3974ca92781a14fae8f10c5c41de9c9132f745b3dcb8bc468" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00589-of-01024.json.gz": { + "num_bytes": 319771959, + "checksum": "babb615d77f80e5ef99aeed3889a26cef5c9918a7fe68b70a503815e69b0b189" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00590-of-01024.json.gz": { + "num_bytes": 318926571, + "checksum": "61f2ed732f3b2b5e24882f47b4eb84fea28bf89d112f6f173cbb50523a43c4b8" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00591-of-01024.json.gz": { + "num_bytes": 319669791, + "checksum": "3aa2e792ec775a52ee78447b81204867e58b0a46727bab4b7974977aaec2889d" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00592-of-01024.json.gz": { + "num_bytes": 320393142, + "checksum": "1419c263fb74409cb0e39ebd87b1c020ee6863a3a6f2f427be27d3c76b84043a" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00593-of-01024.json.gz": { + "num_bytes": 320977171, + "checksum": "4f16f33217c35a2b155d5b6fe8014c2e52014e63c419e7d3aaf71a35246c1323" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00594-of-01024.json.gz": { + "num_bytes": 318211092, + "checksum": "c9301ddcafea22d085ae48f551f486e73089a76c7990871f787064c61e4e60b4" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00595-of-01024.json.gz": { + "num_bytes": 318978629, + "checksum": "349e104763320eaae96ac3bc53c5fa7a73e7dec93b8cc3afaad108a97e7c170d" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00596-of-01024.json.gz": { + "num_bytes": 318573003, + "checksum": "0eb6c25cf57764ec3aa7f74d6d967c52003f872f2f3b140fe6d5ac6360241a8a" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00597-of-01024.json.gz": { + "num_bytes": 318931514, + "checksum": "b42b7b984aad729185ca9b3a6ffa856b2a79165ce2feebe519b10f8ff42c4ab9" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00598-of-01024.json.gz": { + "num_bytes": 319002677, + "checksum": "8306c5971408767b3735288fd0ee7ee7d01d9af4ef4cbec2e57c97b1f78e6d63" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00599-of-01024.json.gz": { + "num_bytes": 319637870, + "checksum": "844df34f2a263011f9d1d85eaad5a1d95243769e9cec5a104807dd55e1fe431c" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00600-of-01024.json.gz": { + "num_bytes": 318099852, + "checksum": "b05e66568a4472feee31f20918e9813aeae2d881f47b5281ff29fbcfedf4d5b2" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00601-of-01024.json.gz": { + "num_bytes": 319136069, + "checksum": "8dff2d56c9915d73e6154533e5de0ca9d867c5fdedcfeceb3e0ab22f3ba509cb" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00602-of-01024.json.gz": { + "num_bytes": 319369121, + "checksum": "45b2c1757260395afeb168b545892b315fa0bf14b3d144bfcab1fdaa6d79086f" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00603-of-01024.json.gz": { + "num_bytes": 319499076, + "checksum": "46edc9f556ccae692900b222b8e4843360dd5dbe0798a8ad9cb51c07a451dbb2" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00604-of-01024.json.gz": { + "num_bytes": 319132921, + "checksum": "0cba8c8738ea7ff9a08bd1bab215010b03c6c83fe35206d83344d78005bdee6b" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00605-of-01024.json.gz": { + "num_bytes": 319315562, + "checksum": "0dc0d37658fd672c8d72775bd8855dce9037cf9715feda35a76afb1f0e87bebb" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00606-of-01024.json.gz": { + "num_bytes": 319223528, + "checksum": "f679e437a3acda1a81013dc0f3fa93fde6c3309905e8142f8699a76bc04b7114" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00607-of-01024.json.gz": { + "num_bytes": 319326218, + "checksum": "7fe91f86f751b9aa3abf1c5ed0fdab89a76c7fa4eb7ab8b809ef29b0cf4a78d9" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00608-of-01024.json.gz": { + "num_bytes": 319393715, + "checksum": "a5daf706100eb797b5b0770fe0c790856637b22dc849aeda5b445ae5fa63cb3b" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00609-of-01024.json.gz": { + "num_bytes": 319554192, + "checksum": "4434338fe97d398d9565ae940c62539e868fa261be361ede1b5b0feb004160f8" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00610-of-01024.json.gz": { + "num_bytes": 319786301, + "checksum": "6b0d0e0457a721af6c67a31f5016432011e717302cfdc7ee39feb253fbae4754" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00611-of-01024.json.gz": { + "num_bytes": 319356910, + "checksum": "bfe201b1775270afef3a09fcfc074920cbb01093eef90d46f26b6b813d603994" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00612-of-01024.json.gz": { + "num_bytes": 318780229, + "checksum": "29248c4732fdfda2ba97ed38192ab391457e20fd70f713ef4a7cf084f9865846" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00613-of-01024.json.gz": { + "num_bytes": 320190496, + "checksum": "f5cb9be2442797d967b9041e48771196a6c0595933ef2102840b704e355f4d62" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00614-of-01024.json.gz": { + "num_bytes": 320245862, + "checksum": "89b74d0daea02fb69289ad259bbd0ddb1a64c5d6380848f7d51669be952f8a0b" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00615-of-01024.json.gz": { + "num_bytes": 316874605, + "checksum": "78600c8703d5ebf80c99c089bb7a7c1cde843a66d706fd219eeac304f80e8525" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00616-of-01024.json.gz": { + "num_bytes": 320237707, + "checksum": "630ee29d4dc4cd5062eeca7877e5c1b204b36eb0b3aeacadf036cdb75c1ce840" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00617-of-01024.json.gz": { + "num_bytes": 319739365, + "checksum": "d418fd284d06b1d2d9daebea3047ed06286640ac75d23893f1effc2ee9d7aa14" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00618-of-01024.json.gz": { + "num_bytes": 318634299, + "checksum": "f5d75d129ab6c0f052028cf0139c3cf20eed3a9c5cdb151cd88ae42d5d1a32d2" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00619-of-01024.json.gz": { + "num_bytes": 319086471, + "checksum": "c558908f6e08b0d02f377c9aed1655d80106f4cfe26e955774bb420d19b2f74f" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00620-of-01024.json.gz": { + "num_bytes": 320665446, + "checksum": "977f959e5b5eaa24081ce025d137647fffd65f1a54d2c45db9805a232e0c0364" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00621-of-01024.json.gz": { + "num_bytes": 318576410, + "checksum": "d07f3c31d7ec1c71b5ab9539a2ed49f6d5f46b48ee2e51800b9e28cee588a163" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00622-of-01024.json.gz": { + "num_bytes": 320053075, + "checksum": "58b897603eb83f789a1cfc6bf40a091093cbd8a0c20702018c411adc7b07a437" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00623-of-01024.json.gz": { + "num_bytes": 320045187, + "checksum": "3665d7579b3c57eb21ec9e55850e39307cc6f4ef8aa8b9937076ad6f142063a3" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00624-of-01024.json.gz": { + "num_bytes": 320136842, + "checksum": "35db069ae090e95c5a4d3db44eae73bcb29463c120584d7f6ccbe235983c5fef" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00625-of-01024.json.gz": { + "num_bytes": 317314201, + "checksum": "7f6ddbbc8815e8bd10c99361fd8113cbbd84ebd92799eb6958cf98af825d2aa3" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00626-of-01024.json.gz": { + "num_bytes": 320219970, + "checksum": "4e2c46d1e3a94957717bbbf1e1e4300bd27ac17e588d426e0ba688983e83f4e6" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00627-of-01024.json.gz": { + "num_bytes": 320083102, + "checksum": "851ce6dfa6a4d1a4e3b8bf439e36db9ceb59eefc60558d429e2fec80655e1775" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00628-of-01024.json.gz": { + "num_bytes": 320386844, + "checksum": "86d8927f16d0790a07d6c68e745501188d13887df4a137e937ae00497d07c055" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00629-of-01024.json.gz": { + "num_bytes": 319476643, + "checksum": "c48cff721137b641fe9d5bcf30462c7e4e3a3ae631b7b4e39979c8c77f0890ae" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00630-of-01024.json.gz": { + "num_bytes": 317961579, + "checksum": "cde626b34c6c8455227fbb18a577877b518f529b6c8e16881cfdf334f2875cd9" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00631-of-01024.json.gz": { + "num_bytes": 318952266, + "checksum": "0401582821f7b15f0b406f7ce00c56351b8e86a3c3282bdf4dd45b2f6146ea22" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00632-of-01024.json.gz": { + "num_bytes": 318261820, + "checksum": "be48396ef18ce0f3650eca86eb36039f90b51737f9848086494f34fa28d60e70" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00633-of-01024.json.gz": { + "num_bytes": 319748854, + "checksum": "9d5c342d82fcace21de2900202c3f2af47229aeae9d487a8b77b7f5b86c05f74" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00634-of-01024.json.gz": { + "num_bytes": 317806530, + "checksum": "00a70705afb91f6570d17257057c15b45386597b917061686f131bd41ddce421" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00635-of-01024.json.gz": { + "num_bytes": 320313573, + "checksum": "22a1286582d65975ed94f0ba25bf87e94d52a55214d0a51979a3e0fd9f95e3cb" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00636-of-01024.json.gz": { + "num_bytes": 318151690, + "checksum": "026c699ac6fa30f9e156a957026d8fa8df72daee3407c8fdc5e0bd7d6a3b50fe" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00637-of-01024.json.gz": { + "num_bytes": 318665365, + "checksum": "9bd931dfc074bc99df31d7fd31a5ac1dc8c8bc75f8e87b763545cd824edcdcbe" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00638-of-01024.json.gz": { + "num_bytes": 318521250, + "checksum": "4b30ad531f7502ef7bc6398ab286e5c6c63d340c22792da9258ea95b496d1c0d" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00639-of-01024.json.gz": { + "num_bytes": 319997068, + "checksum": "2bfdf36396e49ff625138d29925f54eb12b18d35f6d0bf5ca9e79194977cfb43" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00640-of-01024.json.gz": { + "num_bytes": 319355927, + "checksum": "d0d0ed7304b5d79318b5230a1ab48d3ed03183f1eb11d96070604a7008cd7b30" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00641-of-01024.json.gz": { + "num_bytes": 319002081, + "checksum": "1461ecb6b92819bfdc12808a5442d70f94538931f856c91dea602a23ba86ab98" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00642-of-01024.json.gz": { + "num_bytes": 317689465, + "checksum": "aa0af0169cf13db1f8133e8d76afeeae5f71d63d179794377a55b6c2eb938dc8" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00643-of-01024.json.gz": { + "num_bytes": 317523344, + "checksum": "5c060166e776f8efda48882c118dc0fd5e058d9ef40be578bad31e477114a16e" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00644-of-01024.json.gz": { + "num_bytes": 318876813, + "checksum": "ad98ee119742cb8a6efa1be46e9670969397c7bde10049886d7d6fceb82387ca" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00645-of-01024.json.gz": { + "num_bytes": 319981258, + "checksum": "8930ae8e14c124218793d2fd1bbfb1b624e918cb092b21c6ca74347abd9dea4c" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00646-of-01024.json.gz": { + "num_bytes": 319624889, + "checksum": "a40705c4f9a4db4d2d698cf96e43b99fa0790b886506300eb4986a26de7063e2" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00647-of-01024.json.gz": { + "num_bytes": 319240920, + "checksum": "7129182faeac82b47127458e92903a209acf8272166024e8313c167d6f358456" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00648-of-01024.json.gz": { + "num_bytes": 317305623, + "checksum": "3124091a6c438fecbfc948b1a35ffb1462287ae06866b02a6dbb1a6651ccf1e4" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00649-of-01024.json.gz": { + "num_bytes": 318998755, + "checksum": "fdb286cfe9e9091a57b31be61a56a425fae07d6b44f0b45f8743d7aab0e980dc" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00650-of-01024.json.gz": { + "num_bytes": 319612451, + "checksum": "ff88c4310f049344b8a3f701bce12d08ef5f9b037e82fef7f1f670b3d51e59c2" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00651-of-01024.json.gz": { + "num_bytes": 319098081, + "checksum": "9c3b1843082aae39b057bbc7364e69cbc39bbdf91d5bff4f52b12cf1a264adf2" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00652-of-01024.json.gz": { + "num_bytes": 317107981, + "checksum": "e6199d12a893ae5d05c5388ae7a679df419ef6a050c8e3ce3c15fe534943a774" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00653-of-01024.json.gz": { + "num_bytes": 319623884, + "checksum": "333ac93cf1f1f4da0f72c5e57b675052453b42dffe1e4d45ec680f4e3e075d97" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00654-of-01024.json.gz": { + "num_bytes": 319055728, + "checksum": "1efe352f2f2eba826231a5bff6c79390630b44039b226a5041a087e116b60f5e" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00655-of-01024.json.gz": { + "num_bytes": 318539829, + "checksum": "613c741cfb738017b3fa233512296d9127d661738721d3fccd806aad54d19d84" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00656-of-01024.json.gz": { + "num_bytes": 319970377, + "checksum": "51fa9b217b6bcf664c472cc2b258813e1f1d7a0f501c29b822221bccafa4e201" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00657-of-01024.json.gz": { + "num_bytes": 318548629, + "checksum": "c542c6fd2f3284d64f8d53b71ab8308bbba59f7f13e9d9eb20bbbaf13ad4782b" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00658-of-01024.json.gz": { + "num_bytes": 319845984, + "checksum": "b3d8fb6ed2258c463367108e2942742e88eac657c859cc8d128035110fc87e7e" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00659-of-01024.json.gz": { + "num_bytes": 318887872, + "checksum": "02feb4e03020d767a4468251786d4857d5dc833969626bee616c7882bfda9ce5" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00660-of-01024.json.gz": { + "num_bytes": 319854892, + "checksum": "a997d9187a185a29fb3bbeb1e696d32898efba8f5e9d6ed816493669f0c5ec02" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00661-of-01024.json.gz": { + "num_bytes": 317599289, + "checksum": "86d9189ebc534c99da5a4407624a623561b159f758fb04373a270887d0b45709" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00662-of-01024.json.gz": { + "num_bytes": 318138720, + "checksum": "9c626f7aebcc4fc9afd533b6c8a372d884d01f508ce49c01ddd830e4e9e8b2d0" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00663-of-01024.json.gz": { + "num_bytes": 318110835, + "checksum": "441d4dd0d5d2ea7b6098a3fe006b9d7afd526188824a3325d44538fc5655942c" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00664-of-01024.json.gz": { + "num_bytes": 318996945, + "checksum": "08ab0739c3565643b6a83d7091936f5d75a4d8418c956146114aa0315f205dd0" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00665-of-01024.json.gz": { + "num_bytes": 320612903, + "checksum": "1ab7bc2d0f7c6704c97848a9325015f06228339bc52cc1fb593d9c56145e7c48" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00666-of-01024.json.gz": { + "num_bytes": 319241006, + "checksum": "8b1213325ceb2a2c89dffb891a31317e903d08fff911e4ba1ae66fc3bcce9973" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00667-of-01024.json.gz": { + "num_bytes": 319650665, + "checksum": "14676f97937eb3d0734e5f121c5f63002ba2d2c62b6c41b4b46d2fcab9ea9614" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00668-of-01024.json.gz": { + "num_bytes": 319198651, + "checksum": "a406fceed5b7d17ff6d5773679c3df50e747215e39926228ddc9a60c6bf9d152" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00669-of-01024.json.gz": { + "num_bytes": 319363200, + "checksum": "1d3267d77f43d3d720dcd79c40bc3e8c0cd777d421b1b7d0e69e140199e34552" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00670-of-01024.json.gz": { + "num_bytes": 320079826, + "checksum": "85111c229b8fcc8428b3c13676bde8268f027fe06e1f576a3adcd82bce1603bb" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00671-of-01024.json.gz": { + "num_bytes": 319494773, + "checksum": "eeeed8d9f63a5c16ab9d62454fae5bef1896973cfa69cedfcfaac4565a793b27" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00672-of-01024.json.gz": { + "num_bytes": 318304853, + "checksum": "6793ec3ffbc147c36e471e1c06a664ac2143408c9ee46305694708eee0fb38cb" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00673-of-01024.json.gz": { + "num_bytes": 319031236, + "checksum": "3c886ff71973805a59312d8d43ee9e616bcfafd76c03a64d53ab548036b1fa90" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00674-of-01024.json.gz": { + "num_bytes": 318647345, + "checksum": "fd7f4efc0c8af611e7e137680342843d0471ca072421ab3c172a169ba2f5d217" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00675-of-01024.json.gz": { + "num_bytes": 318313871, + "checksum": "3b797b2ad717749a24866a97acb95aace0dd4e91ee7d51dcf1fdd46a9232b794" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00676-of-01024.json.gz": { + "num_bytes": 318858652, + "checksum": "2ccdf652fd413dc624643d35a76223e8a44e6241997841ec2d13ae11b56400fe" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00677-of-01024.json.gz": { + "num_bytes": 319236091, + "checksum": "bbf069c696f09e5467b17ba98479948a85101efa776094084e37581e72c01123" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00678-of-01024.json.gz": { + "num_bytes": 318996096, + "checksum": "3e3dd21861c713bd38d1803c32da1c0bc2496899648b4cffe1fa2e61b35ca056" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00679-of-01024.json.gz": { + "num_bytes": 319915466, + "checksum": "6ed56468a31564cb25668ceb5df325ff7138dd231afa85f676ac7af5e81e0642" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00680-of-01024.json.gz": { + "num_bytes": 318537417, + "checksum": "959ce407e7a892495c477b9e0071dff496fd20db9cfb04dd035ac59dd5b2f309" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00681-of-01024.json.gz": { + "num_bytes": 320181225, + "checksum": "0aa77d778f24bfdc8566b390a7a1ef1d7880a42b98b3e82e9b37ee3ed821a8e5" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00682-of-01024.json.gz": { + "num_bytes": 319087756, + "checksum": "a4da802570ee7bc27e752069612b633edf226078f48d5f55280f73a6dc934127" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00683-of-01024.json.gz": { + "num_bytes": 320019766, + "checksum": "587497efb7bcd4ca85ec0559e372ea285c1b95e3889d406f142cfe454d8e0e2f" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00684-of-01024.json.gz": { + "num_bytes": 318814245, + "checksum": "6e904f73976ca18aed3375d1c1b308d749b9a4405a333dd0a2cf85360822e205" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00685-of-01024.json.gz": { + "num_bytes": 318586686, + "checksum": "c51012772c5bae73821b67f72c035f22a40725d42bcf51e439bbdfcd84393ef2" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00686-of-01024.json.gz": { + "num_bytes": 319648436, + "checksum": "890b7408abd0cc04a84be3a3992d05714dbd30a9d33a8a9b05316a980fe51313" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00687-of-01024.json.gz": { + "num_bytes": 318909835, + "checksum": "b54b20c21ae9834b630a8aac057d47069cf137577d30b91fd1475f5824b61561" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00688-of-01024.json.gz": { + "num_bytes": 319381735, + "checksum": "422091d5ba0d44c64bb0c84ab4757318414bc01455a97f53190eddda89c2f3f4" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00689-of-01024.json.gz": { + "num_bytes": 318995026, + "checksum": "ad5080fbddc914c649027d5e2214f1d75e0cf0617eb3ca0b1fdb8ed9129f99cb" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00690-of-01024.json.gz": { + "num_bytes": 320745318, + "checksum": "d45492346bb4bf519e657356ecf1805b6b592683b98c20c93da2f07c50b06092" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00691-of-01024.json.gz": { + "num_bytes": 318575084, + "checksum": "43a07e8a98bc99f381558c938fc83acd4a37d565459c0f3f83aaadda816f66c8" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00692-of-01024.json.gz": { + "num_bytes": 320651368, + "checksum": "21a790ef1dcc9c6ffa071d1a2e21e330d6afcb45368dde9cfae8933c6d029742" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00693-of-01024.json.gz": { + "num_bytes": 318429145, + "checksum": "85558018ee61e33c4f3e05acc2029e69447a5717be880e9a0aa8fa715dbd0c05" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00694-of-01024.json.gz": { + "num_bytes": 319562061, + "checksum": "894f4c906a33c644ea80c3a00155ced807a62e1bcd9f6e254cb6c88efeedd142" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00695-of-01024.json.gz": { + "num_bytes": 318298964, + "checksum": "06eb05f651f1d2fff495c48475894420334070df10c051c7253b7afb0bc38291" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00696-of-01024.json.gz": { + "num_bytes": 317473664, + "checksum": "59ea4f951335553945a644f7628403ba1a99a27e0d93fcfe5db18cbc3dd48ce9" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00697-of-01024.json.gz": { + "num_bytes": 318839008, + "checksum": "f0203b0f2caa3287b8f7a64288af52bafbf033bcdf31dae54e501e4da47b9935" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00698-of-01024.json.gz": { + "num_bytes": 318288032, + "checksum": "fe2a581cd174429a81424e407aceb1d81b61d9796d74db4590327778fbd5016b" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00699-of-01024.json.gz": { + "num_bytes": 318696527, + "checksum": "edf3aabcdb28fa2feb532b3bd55cd167c2200a6d8e19f05152be194e48acf87b" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00700-of-01024.json.gz": { + "num_bytes": 318900366, + "checksum": "67d89417d1440afeeefd59a0993e4d12fb5731e917ec7f4e65d9319541b4b9e9" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00701-of-01024.json.gz": { + "num_bytes": 318901212, + "checksum": "64d302459e6871325282fd890d2922cb1fb25b47d677ce793bc065acc8d1bd07" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00702-of-01024.json.gz": { + "num_bytes": 318913325, + "checksum": "f0bb360189166a0bd717bad85edf06943333b1854687839864aef3ee02814795" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00703-of-01024.json.gz": { + "num_bytes": 318730274, + "checksum": "c4e027079b9cf9b1adae3e285c5cc5dafeee5c74cf3621c424b6df9801d508f5" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00704-of-01024.json.gz": { + "num_bytes": 320112232, + "checksum": "37540f6a00523cbf429764893aa15aae6a57e53c89cf51d82a815feef02b1210" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00705-of-01024.json.gz": { + "num_bytes": 319643559, + "checksum": "9dae018569fa4bf33674f67ba03732a2f85cfceb53ec2cbb9457eaea607b8dfa" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00706-of-01024.json.gz": { + "num_bytes": 319941519, + "checksum": "03926405dc629f0664a3d27c700a4fa2f606496f0b52a9bbf2fd2d75faae2f46" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00707-of-01024.json.gz": { + "num_bytes": 317628508, + "checksum": "fac92295e4c85f087d27e0a6f231d782be7b2448e99cfc42c09c0e1e20964c3f" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00708-of-01024.json.gz": { + "num_bytes": 318863059, + "checksum": "39d4880d3e47e65ab6351e94b015810d66295a86a9f08534260ccbef41fdaf04" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00709-of-01024.json.gz": { + "num_bytes": 318412651, + "checksum": "044fc99a1307737bc8d6d8a9b67997010309fc695eda6e8dd42e5b6bab2256d1" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00710-of-01024.json.gz": { + "num_bytes": 318631334, + "checksum": "0b2c93cf298051864b8660e57182b38408ad738cf930afc09afdde26d952f819" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00711-of-01024.json.gz": { + "num_bytes": 320587866, + "checksum": "f1f6bb9770b76742d0131495879fa38ed8aebe8a0b38463e7834f0697f174ede" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00712-of-01024.json.gz": { + "num_bytes": 318191204, + "checksum": "b6873a7d375aa29ff39ca17c3bbc7e328292b1671b59a35e7b01c0e992da90f6" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00713-of-01024.json.gz": { + "num_bytes": 319472539, + "checksum": "3bb12a0a806ecb8a5eeaa00188c655f399460609b8a19005a7141bbcb3a7a694" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00714-of-01024.json.gz": { + "num_bytes": 320196397, + "checksum": "ca6e1fa6f27c9dbadbbaa767fd21dddee7c84ca96bbb6735640ba2631668ad0e" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00715-of-01024.json.gz": { + "num_bytes": 320075706, + "checksum": "1a773eec7d738c0e1e253bfd4533f0c43c0d133e564c3458159e0c47d767689c" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00716-of-01024.json.gz": { + "num_bytes": 318736413, + "checksum": "c17a6b2115e56cc3d6bbbd94e8565fb14287057f80199528e6cba20adf557bf7" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00717-of-01024.json.gz": { + "num_bytes": 317351537, + "checksum": "cdba391e16c3bcb5569d978a8d11518103e7687714710ef4eba4f7c0821d67d5" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00718-of-01024.json.gz": { + "num_bytes": 318017965, + "checksum": "a25c494e4baead0af0afe6eabaa054bc15f80b6ca0ac8dadb1b354d72ffbe63b" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00719-of-01024.json.gz": { + "num_bytes": 318124432, + "checksum": "94f5dfbec85a8c5b22ff1368a16ec2eb7fb4be25c0c8f004096156ae40bfa2bd" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00720-of-01024.json.gz": { + "num_bytes": 318235852, + "checksum": "c0248326e698599dcad01eca25d747c138881c61b5636ba765b21f9cd0df996a" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00721-of-01024.json.gz": { + "num_bytes": 318817834, + "checksum": "c11df487a966e748cec522fae4ed76abf3e8cc9bcd28c301117fa52ddb83dc6d" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00722-of-01024.json.gz": { + "num_bytes": 318553851, + "checksum": "63d3d0c3f5dcdff29a0a6ef41e3a9df3fb505c73c8554839e3032293a78bae2e" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00723-of-01024.json.gz": { + "num_bytes": 320174720, + "checksum": "29c97bb8ff301080547255af29bb5019a2c1fbc74f0a2711e626461d5a5f0b54" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00724-of-01024.json.gz": { + "num_bytes": 317805413, + "checksum": "65f8932f3c77b0fee5f2224643a71ff95246720368fe66d45c22df25ea4b9c2d" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00725-of-01024.json.gz": { + "num_bytes": 319460597, + "checksum": "dc785a8aa3a1f4ed77512d51a9139dfb24b356b5499ae67dd5b860101b1e0e4b" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00726-of-01024.json.gz": { + "num_bytes": 320934004, + "checksum": "45d857536d3535d08cddb6cf50d08d89cc28138a5be082465c3a8c27c02ae2bd" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00727-of-01024.json.gz": { + "num_bytes": 318393879, + "checksum": "e4a02e43eeabbecb81b971f4201212104b6214078cafd9500d5b5f323595f060" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00728-of-01024.json.gz": { + "num_bytes": 318826577, + "checksum": "cfaa0d0c8dfb333899c73e0c2aa00dfdadd00e5b4a3d477e7518c4141899c8a7" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00729-of-01024.json.gz": { + "num_bytes": 320390067, + "checksum": "528fe99b0c8dc917ac0f02a555603f9ae81e690b4ce1040f65ebbad3390c0426" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00730-of-01024.json.gz": { + "num_bytes": 318156386, + "checksum": "786e6913b4417a87cd4cb1882e181d8b2e1eb4b4db5b4b9ad2120b5efdf3e2ba" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00731-of-01024.json.gz": { + "num_bytes": 320013543, + "checksum": "f28fc2794c280fc1de263b9b2a81e42423f8dac3af7c4fbd3b3aff888821ca9f" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00732-of-01024.json.gz": { + "num_bytes": 318753697, + "checksum": "69491eb25dbaef78235f769422e773de7a2578e678ecde29dcaa663f4ebfa78d" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00733-of-01024.json.gz": { + "num_bytes": 318640706, + "checksum": "dfde8960d738b873bcb75abe1661fcaa096d70c76aef21846b173b8adf049bbc" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00734-of-01024.json.gz": { + "num_bytes": 319447398, + "checksum": "145add76dcd73916b548e7e3b161757c1bdc1f22a0f127019f24827afd6f85e2" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00735-of-01024.json.gz": { + "num_bytes": 319868149, + "checksum": "dcd4ba95672630f89e75b70dc08cb918bbe896f5d32ffeba7d3e4921b27c1f4d" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00736-of-01024.json.gz": { + "num_bytes": 318404586, + "checksum": "4710b1569342b7aa7ca610d8b8cbb2248a1c5fcd8c6ab3b7f875657dff4779cd" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00737-of-01024.json.gz": { + "num_bytes": 319915151, + "checksum": "7091dc758fd14c206514663eed0ae446178ff38e76c4cb7e711c63d419506e49" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00738-of-01024.json.gz": { + "num_bytes": 319709793, + "checksum": "afe1a96ced49662b14bc60b4ff8fc1f610bbc6f3c515bb73f2fade7a0ba67678" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00739-of-01024.json.gz": { + "num_bytes": 319789716, + "checksum": "9e2332cfc994483d4b913c6556ca9c1698b95e81033b7bbc5a4f5271e5cce708" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00740-of-01024.json.gz": { + "num_bytes": 319102226, + "checksum": "61ddcc3af919b753638dd46f18f790d7783cdc3090dfddbbeb40faa93bed340e" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00741-of-01024.json.gz": { + "num_bytes": 318717589, + "checksum": "aa3038c23a37561f2ba92e95ffeaa3e3641c1a69f8688b724116edd128e9ba52" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00742-of-01024.json.gz": { + "num_bytes": 319456536, + "checksum": "ea9d23abfed6e3e8ab900291a3bc1faa27751ff94e35378f8c4eb07207036a9c" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00743-of-01024.json.gz": { + "num_bytes": 318641730, + "checksum": "6efcec6cd087be4eaa98491e463d0fb9c1253aca275971de08c56a20be9aa579" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00744-of-01024.json.gz": { + "num_bytes": 320264992, + "checksum": "71653351253c8f7fa18673a3f956bddebd158978708c5a4c9e9b5318f598e1f4" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00745-of-01024.json.gz": { + "num_bytes": 318665967, + "checksum": "347dfd824d6f4afe58c6f418ab5d332909038c880f4dcda7f774d3d7a588c3f3" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00746-of-01024.json.gz": { + "num_bytes": 320005833, + "checksum": "812bc3c082e3a65c8c77fc7767bb435f9be9a999961d84eadc9e0c602e5ce168" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00747-of-01024.json.gz": { + "num_bytes": 318575441, + "checksum": "a4414d376c69ae8dd5e60b206315cf920d5a797c6ef7c08fe0c4b4e28b4eb4ef" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00748-of-01024.json.gz": { + "num_bytes": 319266882, + "checksum": "f08aee694b85d5e7120652350bfafaa05495e609aa6d2fb0b913ed8a718d7dcf" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00749-of-01024.json.gz": { + "num_bytes": 320205042, + "checksum": "b3402b16a5cc817d89a19fd3456a50b5b6d5f3f555eea725167558cc85366d12" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00750-of-01024.json.gz": { + "num_bytes": 319198252, + "checksum": "6b95232f6d53cff8045bd5ebaa87d6e6c511a74dc646d2a960eb87e801ff4f2a" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00751-of-01024.json.gz": { + "num_bytes": 317855407, + "checksum": "badc9d82efdbc8db5dc328e8aa5e80155c52f00b105b136d8c5c948fe237d61d" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00752-of-01024.json.gz": { + "num_bytes": 320283992, + "checksum": "67c32eb497533d6fd20b206c38483d171275029ff525bba3da13b0c62e1ef073" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00753-of-01024.json.gz": { + "num_bytes": 321030653, + "checksum": "5e95b1cb54d7d7f12bec1559ababcab0c364a0af99e10a42a08357647ef5d3cc" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00754-of-01024.json.gz": { + "num_bytes": 319059779, + "checksum": "32cb59ad16dfda8a5b52615498fe2e6d85753fa44ab667af2f525a2467508da5" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00755-of-01024.json.gz": { + "num_bytes": 317737268, + "checksum": "0ad2fef2fe37d59b163e29c2287938a768ee87acc34752394809295d0710c602" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00756-of-01024.json.gz": { + "num_bytes": 317293218, + "checksum": "db737ceace329fb1f8fe1aca38db048a1dedcb5226a4132485f26afecdc6c3c8" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00757-of-01024.json.gz": { + "num_bytes": 319529375, + "checksum": "8b823e97964894189a13df393e1b3978342fb24bd81f07af6e54b7bfa2992796" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00758-of-01024.json.gz": { + "num_bytes": 319297548, + "checksum": "3f31d7ad99d88dde757a651b12db909a30cfcae5796fe3f85722598d92344ba5" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00759-of-01024.json.gz": { + "num_bytes": 318154496, + "checksum": "a4b780127d6f22aed49d155e234e21a847a60626143a8e7dc6e31a5f204e79f8" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00760-of-01024.json.gz": { + "num_bytes": 319386997, + "checksum": "020e68dc60004d0661de8a22fe2b9fa7f481fcecaef8fb06efa43093a2a9cc52" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00761-of-01024.json.gz": { + "num_bytes": 320035555, + "checksum": "8d7b5a97770a062276ca909a3bd20365cbaf3931fcbeb8b7e479f5ee03b47053" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00762-of-01024.json.gz": { + "num_bytes": 318099583, + "checksum": "b8fcbbf9b55cde2ff66ca046884870e1e5f2d2a729a8eedb253c16fe0d7658e0" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00763-of-01024.json.gz": { + "num_bytes": 318354409, + "checksum": "ce2d9e44161b13f6226cfb9f93ad42fa0edd18eeaee923c8ab31c25aec1fc976" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00764-of-01024.json.gz": { + "num_bytes": 319181291, + "checksum": "53ed1ef77f24bdd7c189aae0905d63be97f48aa3233fda139e59af53baab242a" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00765-of-01024.json.gz": { + "num_bytes": 318147738, + "checksum": "26b9b9ea2f94b322c03d1b83b25ab4e9a1a203fe9923728c5dd91f22d5f8fef5" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00766-of-01024.json.gz": { + "num_bytes": 317964368, + "checksum": "e59fec52abde3fb4cea58a5a4e511f4cc61e21062bfdd1e3ffd60131a847e0ea" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00767-of-01024.json.gz": { + "num_bytes": 318750919, + "checksum": "0e5eff983e793a3d7cdd1ec85a45d58e5e6ecf7a12cf83a01888e148ab08acf9" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00768-of-01024.json.gz": { + "num_bytes": 318978892, + "checksum": "171509b0bed8854b6de92fe146993be80ab31e0aa56953c7b0a66eeb738ff70a" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00769-of-01024.json.gz": { + "num_bytes": 319386097, + "checksum": "704e7daa85c0e3ac974d51a6e2cf6df2ee053613fd2b77b5fe16d10b29a50a4c" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00770-of-01024.json.gz": { + "num_bytes": 319623528, + "checksum": "e787064473427fe17ba95d9326d009e9723148fb314a7a9605dcb6698854dad5" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00771-of-01024.json.gz": { + "num_bytes": 318911381, + "checksum": "c54aaffd8162b30280e974e81e9d0669357b74394e0da2d1ca2ce613f5715e4a" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00772-of-01024.json.gz": { + "num_bytes": 319386949, + "checksum": "2f9c83681632482df6c65e4c70718c83f500305ee1d061626cdef35bd794a412" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00773-of-01024.json.gz": { + "num_bytes": 319962599, + "checksum": "f47c487ba09051c9a4bf320d69db9546e98948e3de68050ae2ba025c71e09146" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00774-of-01024.json.gz": { + "num_bytes": 320370991, + "checksum": "69a1eacfdb6f6fd49ea2b729a7ab291b96fd5bd42f993e2306d044871b069aa7" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00775-of-01024.json.gz": { + "num_bytes": 320433220, + "checksum": "d35934fb537d1283d40897d05c1486f629776fe9e4ef127694ecfd0221f860c5" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00776-of-01024.json.gz": { + "num_bytes": 318809986, + "checksum": "9079970aa1618b6be51caeab7a2cab26e61c30aa53af361a6184ef6249bf65a1" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00777-of-01024.json.gz": { + "num_bytes": 319617796, + "checksum": "5e200e354ece1713a32a3e1ebcea33412de814dd5843df3523afa1ec9a4d5275" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00778-of-01024.json.gz": { + "num_bytes": 318039278, + "checksum": "b79309eb335c0c860c85d2b724df52c3613f61b92ab6cd6276c2be8c25a7b01e" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00779-of-01024.json.gz": { + "num_bytes": 319078058, + "checksum": "fc6053d53255e4d4a4c22c42049ce3eabc224320a51c94c1116f3201f87b377b" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00780-of-01024.json.gz": { + "num_bytes": 317637428, + "checksum": "e38c933003910b02beef64af2d330f32af6e6f3b7346fa121e89045c136c13af" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00781-of-01024.json.gz": { + "num_bytes": 318792407, + "checksum": "b6795b4db199f7a7a92ef195aee3753e5e00df05fad2d8401b2b9feb56d71a76" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00782-of-01024.json.gz": { + "num_bytes": 319081289, + "checksum": "dc20640bded03596eeec689f1293be55e72d138cf0c576df9768c7631931ceb9" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00783-of-01024.json.gz": { + "num_bytes": 318663257, + "checksum": "ac2b4ee9ab8f25ec010a17358d2f3f1fb9d8d50c9f4b73357429277710e6564f" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00784-of-01024.json.gz": { + "num_bytes": 319687102, + "checksum": "fb93dee8a974f2ea204c240ed4c24e1b64f91ccb421070be305487e4e53ca083" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00785-of-01024.json.gz": { + "num_bytes": 318909034, + "checksum": "2f298b358cc619fa72097e3dbd9ac91e7dc3f7c5f9c4f2ff6881c988921d2a6c" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00786-of-01024.json.gz": { + "num_bytes": 319213094, + "checksum": "60ebe35e0f23ccc61fc0eedc891ea9deb43001beb8205d31360a05b5d58e31f0" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00787-of-01024.json.gz": { + "num_bytes": 318335621, + "checksum": "a7b0aa4dafdda2f3dc3c1832b71d4a92af08f99a70a315b4cf9f60c1768bf2c8" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00788-of-01024.json.gz": { + "num_bytes": 319444037, + "checksum": "874dda510a01a2f78e51d917d309bcf1a0f21e7e1ca46661f93931a6200b3d01" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00789-of-01024.json.gz": { + "num_bytes": 317955670, + "checksum": "ec949a05ec7750dacfdf692c1ba118a33454097fdcaa56626fb042eb93933811" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00790-of-01024.json.gz": { + "num_bytes": 319033823, + "checksum": "0939164a602d7c7140c619130977b6814639122d0038aff7bb840093def5172d" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00791-of-01024.json.gz": { + "num_bytes": 319366402, + "checksum": "fd6ea942b3402b5da4acb1a03bf59b17df402e90c47dbb66fb198ca2f4b5e1cc" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00792-of-01024.json.gz": { + "num_bytes": 319218667, + "checksum": "9e8af5aaa6d5ed915eae334c6101948fbcc7bcf6c8c6beaf80fd1adecd67b078" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00793-of-01024.json.gz": { + "num_bytes": 318865241, + "checksum": "675330d6736a677760d854dcdd9a174eb7c1d426f94e34836a048c2139befac0" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00794-of-01024.json.gz": { + "num_bytes": 319384084, + "checksum": "fd4c2623d9cbaed3fefd6bb88c2d88b58fe8f08e9e8ef0cea6bb22cac68dabd2" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00795-of-01024.json.gz": { + "num_bytes": 317654308, + "checksum": "157533ddb56290662e25cb60842327daec23e377e116496338c9313cbf6991b3" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00796-of-01024.json.gz": { + "num_bytes": 319298258, + "checksum": "fd90f055499095efa9cb848dee62406d25820f929554b0e07674d4c95db574b3" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00797-of-01024.json.gz": { + "num_bytes": 320048871, + "checksum": "e089a95e96a081dd76e38acf9506bfc7b86c682892d3a8774e9784019db39306" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00798-of-01024.json.gz": { + "num_bytes": 319291246, + "checksum": "e29133ab6f83c84a69752a451053dfe20887ea884e09cc373afd89bba7458664" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00799-of-01024.json.gz": { + "num_bytes": 319175282, + "checksum": "8f3f3a67946615bdf499d64341d200477280947e5be8538748e28db768115947" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00800-of-01024.json.gz": { + "num_bytes": 316687275, + "checksum": "c9a17dc92658ce5d062af25e5c8610a7fbae501627cfc7324ace7ca6a8d75d8d" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00801-of-01024.json.gz": { + "num_bytes": 318710698, + "checksum": "4b7d1e130fd8ba536da073069221f68d567492b2bff27d8769fb4ef124cec3a1" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00802-of-01024.json.gz": { + "num_bytes": 318914381, + "checksum": "9f186b8d08f5d3090b7c9eb8a6954cf3202caec7cbf5c308221333cd115af561" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00803-of-01024.json.gz": { + "num_bytes": 319111424, + "checksum": "117b0590a976805001a879c49c42db55579e5bb9a5d4db9ce20e42746f59d574" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00804-of-01024.json.gz": { + "num_bytes": 318186018, + "checksum": "ea376d6cc1043dee9a00e1eca1c431aa59755d8966162701817f9cf274a758c2" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00805-of-01024.json.gz": { + "num_bytes": 320382848, + "checksum": "1e69e7896202206f9f804b2497c4d99cca5c1d139efc782b8ede2cb88f68b48b" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00806-of-01024.json.gz": { + "num_bytes": 319508172, + "checksum": "9da7e230c7abed9beaed9d6090efa8ae1029a418dbbf6d04bb4386aafde3dbce" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00807-of-01024.json.gz": { + "num_bytes": 319995091, + "checksum": "2e3ba0dbe85c004c6a23b4caf340282e0d0004ab574a14bedc9c83c67cc2c0c9" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00808-of-01024.json.gz": { + "num_bytes": 319880961, + "checksum": "f53fd08fea0f874d727422357521176c6810a54abf4fcc7019357b50f1928daa" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00809-of-01024.json.gz": { + "num_bytes": 317100774, + "checksum": "dbeed220f330b489cc262fbd7cbe84f04ba8a5118ebbd8f48bc7a4f5f63ae7b8" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00810-of-01024.json.gz": { + "num_bytes": 319625750, + "checksum": "fe5dced88ccd54b258c6740d8988e10b128a869ecf28e7096e689c59fa147d4b" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00811-of-01024.json.gz": { + "num_bytes": 318375975, + "checksum": "e4bcc5571fdc4f51b733d975e78ff02939d3463264a02d7e651271ab91c81df8" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00812-of-01024.json.gz": { + "num_bytes": 319663092, + "checksum": "b1e41c198bc69d026ab997fdeaa4e687f7a8ddfca751add9bc85f00481708a63" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00813-of-01024.json.gz": { + "num_bytes": 319094357, + "checksum": "c07287aedf6854f581aaf83b75c4939aa4b10181977d4c4be97c20989ab8f992" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00814-of-01024.json.gz": { + "num_bytes": 319521327, + "checksum": "c96203ba5461ef92a7a2b0d4e598efda943b5b3adf42a7268c26f1c224410c01" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00815-of-01024.json.gz": { + "num_bytes": 319098749, + "checksum": "72f2e65c5b482be0d9e3a3d8f5cdb703cec7a515e927bc4411e2f6ff5085ed5d" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00816-of-01024.json.gz": { + "num_bytes": 320377295, + "checksum": "df95ac17a25cebb854088cca345f60c2634d07f088e45e251d7f9afdb334c0c7" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00817-of-01024.json.gz": { + "num_bytes": 319007451, + "checksum": "bad1cc25de4f66ff36c69284e6b615f68bdc25e45f08e04e33ee463a0c6ef0b5" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00818-of-01024.json.gz": { + "num_bytes": 319609737, + "checksum": "acf1b390f1c492d97bf027f06898f1dd5cf8cc6def41f4d43b38a0c99f4a85e7" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00819-of-01024.json.gz": { + "num_bytes": 319164157, + "checksum": "3d973eb401876c57e9cd1420fc938da9dd7b08f97d4596c66a8c159e2b56b1b3" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00820-of-01024.json.gz": { + "num_bytes": 320181073, + "checksum": "101d5f0079caa840b934c14800ba5cbb7fca22e9e6915b98b4dc5f37c57f5b4d" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00821-of-01024.json.gz": { + "num_bytes": 320949305, + "checksum": "34ba423c93c4262234e6e2005aba0436daa99b05570cff0a58e9d27b65d76896" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00822-of-01024.json.gz": { + "num_bytes": 318392521, + "checksum": "4a586e220fe34f544dd068f4e1c310459cabd5dbea9a991c21c09f70079eb4c9" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00823-of-01024.json.gz": { + "num_bytes": 318526893, + "checksum": "3b10a8e32a3a8f6541400d697516fcd3fffba3554e8d8a96451f01fc6b729d8b" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00824-of-01024.json.gz": { + "num_bytes": 318640792, + "checksum": "c921270db8004d309f91e3209340c476191793d47b3cfa9d19fdc602d43dfe65" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00825-of-01024.json.gz": { + "num_bytes": 319524026, + "checksum": "a6eb347db464976ba5d1aaa4fa64e103ba36520dd1e9c103644caf187be471a5" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00826-of-01024.json.gz": { + "num_bytes": 318469810, + "checksum": "dc5f88e6161ac06165f3cd4cb91a00cdff75d2f900e8f53d62bacfd833e352b0" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00827-of-01024.json.gz": { + "num_bytes": 319391185, + "checksum": "66a240be851d6622adf7801d9634a456e83e9edfd135601c0dc1aab48902d7cf" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00828-of-01024.json.gz": { + "num_bytes": 319625277, + "checksum": "2e989beeeb2a63bfb87a5a401619a8e4155a961b44441cb5f627c29f25962dd4" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00829-of-01024.json.gz": { + "num_bytes": 320001237, + "checksum": "0653e4052fb7a4ef503bdfbbee332d650492e99c130a85c04250e18d91cfd30c" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00830-of-01024.json.gz": { + "num_bytes": 319240468, + "checksum": "bd56e55e75a8237b5292fa65e5ecb0dfbabef6ef0dec6695b13522803210f40c" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00831-of-01024.json.gz": { + "num_bytes": 319174603, + "checksum": "ca9d6c643127a390823655256a45462ee6e75aa2485141f6530a3bdf6ce4f572" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00832-of-01024.json.gz": { + "num_bytes": 318909883, + "checksum": "e91c35d94e183515e660cd8c874c12bbf22e1fd683312446f02287b0d032fb68" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00833-of-01024.json.gz": { + "num_bytes": 319095835, + "checksum": "971d9a4f8bfce564d42dc0a80009acfa7d2f47557ac19836ab426defe1877714" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00834-of-01024.json.gz": { + "num_bytes": 318319786, + "checksum": "159412a58fb8deb59e039fa0102bdb746065cbc6b4d1d3da892930fbf8b0f178" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00835-of-01024.json.gz": { + "num_bytes": 319959334, + "checksum": "814518d53b3023e3b8ac22dad9d65dd50d455a4c7db1490022f447f793f4d24f" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00836-of-01024.json.gz": { + "num_bytes": 317642779, + "checksum": "19ad4fbaa3ff5c638b77980300b8c162c21a8237b87d054a30c46aee67d0ad94" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00837-of-01024.json.gz": { + "num_bytes": 320687986, + "checksum": "190de7948a4b163047ecdfc856e5f78bbff52ca883edfad26b32fbc0b57ffe36" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00838-of-01024.json.gz": { + "num_bytes": 319802866, + "checksum": "ccb4d342791a187f3bde225e008ff8cf70465f7fd3eacaa8bbce1ec4e52c2622" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00839-of-01024.json.gz": { + "num_bytes": 318621894, + "checksum": "3ff5cf5b33996a663df5783f3f41a5b5b2f6e08a2cf91e74cad3bf82291192fa" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00840-of-01024.json.gz": { + "num_bytes": 319757379, + "checksum": "8292e0854c01ca79ef03dcc1752ddc1f0df747ad67551b7c0fa5208b6aa3f822" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00841-of-01024.json.gz": { + "num_bytes": 318779722, + "checksum": "9eee9e089bd396adf5a276eddca9f6352e07f8c33877f85c1f65968aa0c06128" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00842-of-01024.json.gz": { + "num_bytes": 318692591, + "checksum": "caf3f40a144b43af08687e41a1eb7d08da1b78cd1600574566e11f29fde9cd34" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00843-of-01024.json.gz": { + "num_bytes": 318944616, + "checksum": "e74d624534091173546755ca236e5912cc8acf8cfef5f9c197b541ebe76f0818" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00844-of-01024.json.gz": { + "num_bytes": 319392887, + "checksum": "e47d3f44f996398b54f18729f4e81d88d04b19bc529847e86277a6a91ae74e6c" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00845-of-01024.json.gz": { + "num_bytes": 319215311, + "checksum": "de7cffe64f422b02668137272943537946c15539954b564345d6722c4eb06345" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00846-of-01024.json.gz": { + "num_bytes": 318129297, + "checksum": "1d5ea0ab8fcb3975735aa421d646cea4544087f60a79ec209b63c93b6318523f" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00847-of-01024.json.gz": { + "num_bytes": 318134095, + "checksum": "6fa4c50808df2aa8efebae3bbf832ba2b0be2f7113633fef720cffb3c50143a0" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00848-of-01024.json.gz": { + "num_bytes": 318521356, + "checksum": "3aeb657aa448af82551c653802c669c985c00b7daa593de07f80733ae5dee84d" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00849-of-01024.json.gz": { + "num_bytes": 319541694, + "checksum": "1cc016f58a4a2c54625214f028df05247ed319b8c1868c96c2efe8147a73d08a" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00850-of-01024.json.gz": { + "num_bytes": 318861613, + "checksum": "eb5fbe6eeb4b0281604df264a5b04a3a0db96ff0d04f252375a788a0d3345c67" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00851-of-01024.json.gz": { + "num_bytes": 319356648, + "checksum": "ffe1397f1d412979cc66820555ef27345f3a2a48b8bcfe682d48301135e8c12a" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00852-of-01024.json.gz": { + "num_bytes": 319662372, + "checksum": "fa78ed98d602276520e823e17adc7f796320d95e27e08d84d06e66e415b79161" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00853-of-01024.json.gz": { + "num_bytes": 317625507, + "checksum": "b10cff62fac5191b9cb5e2025227adb838088773e79bfec0937a34bb857e1b1f" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00854-of-01024.json.gz": { + "num_bytes": 319665550, + "checksum": "15441b2a7c09a477389a8fbd7401c549dc8281f2bd44251b1546077301e24624" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00855-of-01024.json.gz": { + "num_bytes": 319059897, + "checksum": "f6127845b162181dd7157dd316021a4e6b5d41393c66d3e577491cdb74657f2e" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00856-of-01024.json.gz": { + "num_bytes": 319243991, + "checksum": "ec9f0884c5ddf82550105f969222d3ee8b0d4907a0a2540ea6c8c67c2d2e9179" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00857-of-01024.json.gz": { + "num_bytes": 318546680, + "checksum": "840205fa73336ff51d75008ce8c530164ebcef3b50f1ad8deab879a67acf8d5e" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00858-of-01024.json.gz": { + "num_bytes": 318306547, + "checksum": "e9b3819e9dc98d66a61f8f4e8f6ecb03099c79ae87a175fe1ae484174b173b44" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00859-of-01024.json.gz": { + "num_bytes": 319088302, + "checksum": "eced8de72f8755fa0dfb690c626cefcacf5fbbce97029d4589058913c31b9339" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00860-of-01024.json.gz": { + "num_bytes": 319704792, + "checksum": "90a169718609f16abe120c4b63a20adc0bbedba51de14b004d34dabe530339f0" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00861-of-01024.json.gz": { + "num_bytes": 318444445, + "checksum": "d020840f09fa426ee15d19f05e5afd9cf674048e0dc4438dae0b6f02c7227d9f" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00862-of-01024.json.gz": { + "num_bytes": 318606300, + "checksum": "e02bf9d3f1a398972f7d78b9b1aaff9a92146554a1358ea1b16ce7873a9f8fd8" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00863-of-01024.json.gz": { + "num_bytes": 319273730, + "checksum": "c977f143cbb5e61160ce76f1cabf7bea6c158abb7e159ec3362aad1cc7af0ade" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00864-of-01024.json.gz": { + "num_bytes": 318143165, + "checksum": "bdf20dbde61f0663feb70be419c39c60acdc7ecbbe1430d47bf79ae2e114f168" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00865-of-01024.json.gz": { + "num_bytes": 319041356, + "checksum": "11c9c068ec5c1b612494c1473b7cace67a55ee66155559b19035df180ee260a1" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00866-of-01024.json.gz": { + "num_bytes": 319758401, + "checksum": "ab4436f283af0ef2d33b93cf026907cf68255beee9d9dc1d6c542dee9c3f48a3" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00867-of-01024.json.gz": { + "num_bytes": 318991336, + "checksum": "56beb5edbca3b66981f5f8e65f2a13a0f6e99e68ff50cc263cc529a4d8ebf371" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00868-of-01024.json.gz": { + "num_bytes": 319984390, + "checksum": "b9368d2ae0eff869c70c1a1214126c1d084f56887102d3d46e450b2c934102be" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00869-of-01024.json.gz": { + "num_bytes": 319462888, + "checksum": "68ab404e0ca2247686eb264a0d7feeb9d2460162434f5babb2b1da82d865343e" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00870-of-01024.json.gz": { + "num_bytes": 318426018, + "checksum": "2d60208a558f6ba92d6c6307e1ab626acd7ff3b7bc25963b09e87e464751c42b" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00871-of-01024.json.gz": { + "num_bytes": 320233396, + "checksum": "ee2517922079c713605dafffe6bc0db0a947abf64ff92c409aa1015b92cdb099" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00872-of-01024.json.gz": { + "num_bytes": 319570251, + "checksum": "83ca4f125bd628cb28210fb874db717635009e36c60b42237bda48fcb611a53f" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00873-of-01024.json.gz": { + "num_bytes": 318755978, + "checksum": "d94ce49fd17da5f70d1a89bc9e5323daa54f0b8417e1ee5d991467c80c068ec7" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00874-of-01024.json.gz": { + "num_bytes": 318986904, + "checksum": "f634915d1b529d9d728fd96993bb151dc07016767cd44ceeedddec73eaf37074" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00875-of-01024.json.gz": { + "num_bytes": 319116193, + "checksum": "6367b1216e1c6ab18af66471d866f39caeb9a538209134a9e6bbbcb81bc51db7" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00876-of-01024.json.gz": { + "num_bytes": 320829257, + "checksum": "c9ad4ab8c6e5995aaacd72ebc6654b43b4756804bf3cea808610f9b618f98fac" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00877-of-01024.json.gz": { + "num_bytes": 320082625, + "checksum": "835ae7d54732c309bc9aff231268474af66653b06ad6ca17b54dab6f4a7d30c5" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00878-of-01024.json.gz": { + "num_bytes": 318964554, + "checksum": "49c761449d5052dd6c408268c77196bffc5125eb5189390f73ba0ce8550f0175" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00879-of-01024.json.gz": { + "num_bytes": 318699617, + "checksum": "521e1c5fa967a6f29641e7c4c2b210acda0736b32f318e24aef0e587895ed492" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00880-of-01024.json.gz": { + "num_bytes": 318723630, + "checksum": "dee1814b24f9bbc3aa3430cd80302b08b863eb1b92698158960b6be216845843" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00881-of-01024.json.gz": { + "num_bytes": 319839271, + "checksum": "9e57ea6a0e3d8a7798a0cb3e6344e1711e8fd879e2e396294718ff360fc7c4df" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00882-of-01024.json.gz": { + "num_bytes": 317773196, + "checksum": "2e5e5749618e53668222c7d310929e2177772dd7c14592e61dc86f163e353c8a" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00883-of-01024.json.gz": { + "num_bytes": 320262049, + "checksum": "f80afaa4495a2d41ad4d7380b79040569179b24ef5c2df17f75ce8e135d786b1" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00884-of-01024.json.gz": { + "num_bytes": 319146213, + "checksum": "77338479b420dab9316a4737fc243de84b5e88392cbbb46fa0619045a42432cc" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00885-of-01024.json.gz": { + "num_bytes": 319022605, + "checksum": "3a67fee2fb77e64aa13fd595d7786b432203f36712ff723ec5999a341834b38c" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00886-of-01024.json.gz": { + "num_bytes": 318624429, + "checksum": "2afe387f2500c57294acf1403a8c27f27f6c7c2d228dee0f1ed70a02c438f838" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00887-of-01024.json.gz": { + "num_bytes": 318733911, + "checksum": "3fe087b3441f74730ab137ba9486650cfedfe2d724573c3d166565d7d1e40938" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00888-of-01024.json.gz": { + "num_bytes": 319926754, + "checksum": "dd2df1977458cac34ef1e52059bbc28738e541761d7ad11c0ffc8ef3ca061190" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00889-of-01024.json.gz": { + "num_bytes": 319085344, + "checksum": "4172244cc3fc4a4e9e09f04f8097cbc678aebaedb9d1fb97b1daae16b0b8ef45" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00890-of-01024.json.gz": { + "num_bytes": 319838671, + "checksum": "8ffaf34eb8209e7ec250303298f9eebd2833fedcf80414c20331e8dbed42251c" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00891-of-01024.json.gz": { + "num_bytes": 318169092, + "checksum": "daaf74ba5d12a7415da94be0f4454336aa3d86ad5cd300dbe30cef596835ac8e" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00892-of-01024.json.gz": { + "num_bytes": 319662776, + "checksum": "6d99c0419a6c9633620fb0aa7b7610cc5d06696e839a1a52953fd7db7a18e053" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00893-of-01024.json.gz": { + "num_bytes": 319541919, + "checksum": "5f246aeacef0dc8d40a036bb1eeecf278f66d7215a134fb746d30f3420d18c18" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00894-of-01024.json.gz": { + "num_bytes": 319528897, + "checksum": "9975fd5d23d25938f00de3fc9240d77c27b4784c2f443b1914652a06d3b59fcf" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00895-of-01024.json.gz": { + "num_bytes": 317548307, + "checksum": "7af9e2abfaebd4afe05a0e28d3e6e3126800a8b9b7ad49de360e42f2eb2c8506" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00896-of-01024.json.gz": { + "num_bytes": 320278601, + "checksum": "1941689d6a0e449423faad6e41714f33d5b23cdb1bb73961a888a87678fc74b0" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00897-of-01024.json.gz": { + "num_bytes": 320161831, + "checksum": "3d951cb1ae4a9b3c6ff70555139435febda83d24bb04ea27b229a05424b470c2" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00898-of-01024.json.gz": { + "num_bytes": 319341305, + "checksum": "3227b97aa9ff57b62be2a26fd8131e9ea45f7731673acb43432e529ea4978a25" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00899-of-01024.json.gz": { + "num_bytes": 319658969, + "checksum": "c746f8bd5fffac933640ff39db0b9d7b022edb28d7a4b3237d8c69fd919b7b48" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00900-of-01024.json.gz": { + "num_bytes": 317494627, + "checksum": "0327f0c57a668b2b34e72f4c53d4cfaeed787d879843d0bba27b5be58d1ee5fe" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00901-of-01024.json.gz": { + "num_bytes": 319683481, + "checksum": "886449092779ee26fccd11e0c89c36e449346dc6b1f0a7cb15b6b53c897790a3" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00902-of-01024.json.gz": { + "num_bytes": 320228529, + "checksum": "6960d8539df78e98858ba8cebb2e637b6c2ef20890b5f2af1cbf4621b52c364e" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00903-of-01024.json.gz": { + "num_bytes": 318961279, + "checksum": "4ddb3c9e9276d220f1d4dfc32bb61a090e895e9e3c9f53c169db99a024e7cd95" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00904-of-01024.json.gz": { + "num_bytes": 319926290, + "checksum": "69a941cbbcb673efdb254c162854fcfff6fe1132182210235b91d1d21ed4d2ed" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00905-of-01024.json.gz": { + "num_bytes": 317982280, + "checksum": "1d9613f366b91102d018e57894df520aaf1910aa98e06cf369d9676e498610c5" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00906-of-01024.json.gz": { + "num_bytes": 319012210, + "checksum": "4855989c814582f5cc0a5e9b8f9d1f642ae33de81625d4bbafaafb709c1cd260" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00907-of-01024.json.gz": { + "num_bytes": 318515420, + "checksum": "8f34dbaa454215922a29fea975357e4e705381a65e4dcaf8b0d8c200f9a277bd" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00908-of-01024.json.gz": { + "num_bytes": 319286320, + "checksum": "536bf0610a2c14d1d59aea0b52fdc29cec19cd7eaa4c3a5e5fec04dee103b29e" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00909-of-01024.json.gz": { + "num_bytes": 319938295, + "checksum": "3bb3943183f579c15d0d30440f6c82d0c9c64d6ded398dfc7c67502d73868781" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00910-of-01024.json.gz": { + "num_bytes": 318423425, + "checksum": "adbdcf170531c725b54c1e5713676b789589b2fb77310f3e64a0cc30b83602ee" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00911-of-01024.json.gz": { + "num_bytes": 319578185, + "checksum": "a1342a95ce77013820c36e7d038ed47ca4d40cdf3584a66abc310132435b25fd" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00912-of-01024.json.gz": { + "num_bytes": 319154715, + "checksum": "4973afcb1d7b4816e3a3df1b9ce1e48a0eea4fe8ead5f83ea753e46a934e5ddc" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00913-of-01024.json.gz": { + "num_bytes": 319011218, + "checksum": "c9a158f69a123859569e1cdd475355afda32d7e5c48001591f0b6c20dc17d572" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00914-of-01024.json.gz": { + "num_bytes": 320027387, + "checksum": "61f6c0f839908e7d3105a6926c501bcacd293d1ba50c3b8639ee227c9a8270b1" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00915-of-01024.json.gz": { + "num_bytes": 320280632, + "checksum": "a74fb91d8f7d79b09017a7f996b6ca5d59e4ecad9fec354ac977c0076d53fc66" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00916-of-01024.json.gz": { + "num_bytes": 319278877, + "checksum": "cbbb8dc274fabb4435db5fef5da1d91671e1a4c7f3f652742324f9632b01c5dd" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00917-of-01024.json.gz": { + "num_bytes": 319616831, + "checksum": "31e62cbd6209fb7831078e4a262d1b25c0590f9425c62b2b208d4030ed5722d4" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00918-of-01024.json.gz": { + "num_bytes": 318635363, + "checksum": "95e5c2f51abc9ef4c0422e91b77f79ff83c8cc38e585df621fbc0dfef48a84c7" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00919-of-01024.json.gz": { + "num_bytes": 318885096, + "checksum": "ea5960d4fbc7d5e7097edbf2c9c706e6b7c7e9d3e36633be9bd68c4038955f10" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00920-of-01024.json.gz": { + "num_bytes": 319228627, + "checksum": "73b721ae576dcfa83bd963e49530f73d76b788a669e3abc1c02189900c80cf02" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00921-of-01024.json.gz": { + "num_bytes": 319557114, + "checksum": "710c65cd504e87b5019c01f658e669d1e023473d879913a9522760d33546cf24" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00922-of-01024.json.gz": { + "num_bytes": 319356053, + "checksum": "f0b54b3c6b51a356debc9414df0438ee525ae5114cbb7c8176634b7493095022" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00923-of-01024.json.gz": { + "num_bytes": 319766600, + "checksum": "d5b80091c8113c283d91ff5826b46068b96c423c0dc74a646e2c8d1c5d815cea" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00924-of-01024.json.gz": { + "num_bytes": 319733540, + "checksum": "56a54c7d4114c21c1657df0d295839c2bd4904cd1b651104e2a155c2bf1b5aca" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00925-of-01024.json.gz": { + "num_bytes": 318944357, + "checksum": "4d396c29cd1d9ba16016fac37c333c0a872f6cb0e9faae7966e53f6e5c879d67" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00926-of-01024.json.gz": { + "num_bytes": 320276135, + "checksum": "39a64c261a76d5e13f187f12c886b22e2db08fba968bc9d0c1cb0d3c241abda7" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00927-of-01024.json.gz": { + "num_bytes": 319181837, + "checksum": "86db529dd52fb67173588fcbc9f0e52c99ad6dd34e44865150bc6c962de5b3c1" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00928-of-01024.json.gz": { + "num_bytes": 318966114, + "checksum": "d232df8033ddaa7397dbcfa8ba4ded9421ee9bfc091c725b311fd963b29f13eb" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00929-of-01024.json.gz": { + "num_bytes": 320087917, + "checksum": "fca6bfe8fe17c867681c58df081f2186dcc6bf22e46ce3783f85b918644c0b6a" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00930-of-01024.json.gz": { + "num_bytes": 318921677, + "checksum": "b8031359e758cd835c44e81303e04ef7b2137d2e1a9472d7e04552c353d883c7" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00931-of-01024.json.gz": { + "num_bytes": 318978028, + "checksum": "bb5f2ea8a2e56c69813bdc08cb243c0763126e7b5f6c5cb57e7f4767d2126f89" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00932-of-01024.json.gz": { + "num_bytes": 318627424, + "checksum": "f6fd2065ce202d5347243a2b396707bb606be20c1829989bd7dff6d9fb7adec9" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00933-of-01024.json.gz": { + "num_bytes": 320226802, + "checksum": "b303d2ece81c1f7b882703b915765212796518010aea6a108a441dd0a84a6128" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00934-of-01024.json.gz": { + "num_bytes": 319908526, + "checksum": "e5b05714922d132073122e83933853f52f0046c9f51f985cfbdbd310e8d677de" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00935-of-01024.json.gz": { + "num_bytes": 318941663, + "checksum": "4296055a31409a778c516afe25a8108f23dfffaf13cac33e5ed834a37c46b37c" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00936-of-01024.json.gz": { + "num_bytes": 318430860, + "checksum": "4634630c012ed184b264ea01c97f7bb3f1af030f2466f1d99d20bb0472f74511" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00937-of-01024.json.gz": { + "num_bytes": 318008229, + "checksum": "131cc9a2fef4ebe81749f1844b7c4b194b97de7db4f5253ce59207e68d8b4df8" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00938-of-01024.json.gz": { + "num_bytes": 319099506, + "checksum": "fff55e3b2ff8b53e56ab99def626a7334ce67d2414351b2e83d84298052dd9b6" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00939-of-01024.json.gz": { + "num_bytes": 320457851, + "checksum": "8431e38c86516ed88d5c028f4a1dad32b02bcccdc03f9687d18f8312e493bcb7" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00940-of-01024.json.gz": { + "num_bytes": 320607829, + "checksum": "a68c577555781adc777c09c68f623431469d67e9b66af7b0813f09a512b7d777" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00941-of-01024.json.gz": { + "num_bytes": 318923471, + "checksum": "807ffde4034b6b95a5eacb71f093686586ca11e417517894cca99dfe7b12563d" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00942-of-01024.json.gz": { + "num_bytes": 319880902, + "checksum": "d03d04f619a8f3afbefa6d67986f50d5ee264c45de36c0ba67b069e343e002ad" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00943-of-01024.json.gz": { + "num_bytes": 319079341, + "checksum": "e482c4dee03a34a1a5756e6def26134c9a3f18ee386f5569d6cbf16d3875a429" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00944-of-01024.json.gz": { + "num_bytes": 319436318, + "checksum": "6241f9f35640598c05bc5cd00d8cc024dde59c0065c8935da229a8a583de32fd" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00945-of-01024.json.gz": { + "num_bytes": 318998098, + "checksum": "85f192c1ee9734da0f1dcad31c2b8111076977582e139ecc1ba959bf2df6b262" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00946-of-01024.json.gz": { + "num_bytes": 321951470, + "checksum": "44bccedf6a8db115bb6563d6775ff03c67511ce4e23a2de77e79edcb568c9fa1" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00947-of-01024.json.gz": { + "num_bytes": 318689631, + "checksum": "36f0bfa191ad7d51452d51249c724150f8c3774142df3720f176f2772f42f3fc" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00948-of-01024.json.gz": { + "num_bytes": 320347661, + "checksum": "f4a7afa90b6d81a4cdc99100b75b4d3174c4d5d670042766c3e0418b7a97ef80" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00949-of-01024.json.gz": { + "num_bytes": 318054841, + "checksum": "f39d0c9bfc0a562ede67b8cfc57e6974a8a999e2bbc1b6940f107169b4f06e4a" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00950-of-01024.json.gz": { + "num_bytes": 319722042, + "checksum": "bf376260e5a838b3b901ceb22f922829619be710718446ee95c24400cbc73495" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00951-of-01024.json.gz": { + "num_bytes": 318315382, + "checksum": "987cd895f63bb74c9d4ce229ee853c7bce53c75c324366a0d06377c36030e39f" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00952-of-01024.json.gz": { + "num_bytes": 319247792, + "checksum": "d218dda02748a22821c2ecccf1cbb136dc8772a25ddfacc7ab354fc089470e87" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00953-of-01024.json.gz": { + "num_bytes": 318411551, + "checksum": "698768f3d7959b33fa74a3827e995b0c184bb3b4c46eba667d7dc3365fdd07f3" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00954-of-01024.json.gz": { + "num_bytes": 318809810, + "checksum": "651d9ff43d5a3f7f5945ccf26b9410018248bf64956f3485c50b0df9034fb2ee" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00955-of-01024.json.gz": { + "num_bytes": 319761211, + "checksum": "29fa5c68fb8d3719e5f5f17568ce888522de64499554b5f0f4dafafb4ee5b40b" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00956-of-01024.json.gz": { + "num_bytes": 319255736, + "checksum": "333a90a9c13f71e41a7cdd4784684bc142c79ef99155b9d62d062db318798b93" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00957-of-01024.json.gz": { + "num_bytes": 319504417, + "checksum": "730c90615fca09c81d9644cfae40d325851bb9bbc1af696caaadd67d8282ab5b" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00958-of-01024.json.gz": { + "num_bytes": 319066016, + "checksum": "bb565af6529720ba2a3e989769b33d978ef49cb2aae49c60f2ff98a981414280" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00959-of-01024.json.gz": { + "num_bytes": 319887940, + "checksum": "8992783693dd0ad5ce07427f6b5739c818f13952d90bb61312ec98f9c813f313" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00960-of-01024.json.gz": { + "num_bytes": 318051437, + "checksum": "4773edbc822ff8d51ec13af6c371214aea7545047d9babeeac0b29180d52fa0b" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00961-of-01024.json.gz": { + "num_bytes": 318373291, + "checksum": "ff33854746566f7d3b4ba9eadd1329ece48c034345fda000d9af73cb26d197af" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00962-of-01024.json.gz": { + "num_bytes": 318572513, + "checksum": "a6d07f7caf55fda0df74a22b454d196fb2e29312d433bc5506b00448c22b579c" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00963-of-01024.json.gz": { + "num_bytes": 319488084, + "checksum": "453f666c6578376508b1fe8bd3fb8ea5bf030aca5cfedf383cd23b27de15228f" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00964-of-01024.json.gz": { + "num_bytes": 318905670, + "checksum": "74f64ed6583e6a4df4b3c3f8a76263a2d63905d51d5680d9683d86f5039d5b56" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00965-of-01024.json.gz": { + "num_bytes": 319452844, + "checksum": "88016c1a0663b89dc3d76689c827c82a6d128401ae05f7b70c8727d75302cd47" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00966-of-01024.json.gz": { + "num_bytes": 319334588, + "checksum": "dd9300bdc27513dd62578e1cf3c8302647b49c61185c282a684011d788c43d17" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00967-of-01024.json.gz": { + "num_bytes": 317872396, + "checksum": "90747ee63ac7d8176fde1f2afce8deb7e39bf19e682e17d0fcc1711d09d5f1d8" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00968-of-01024.json.gz": { + "num_bytes": 318988069, + "checksum": "2cc785d650013d35d5d31b1e85c5530b197687c69117881362bf6b98f47c22fa" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00969-of-01024.json.gz": { + "num_bytes": 318324244, + "checksum": "83750d93c788ad32a256862b8173db3549eedf52ac131f09f662f1fe0f46bd13" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00970-of-01024.json.gz": { + "num_bytes": 319494164, + "checksum": "e0e46e185851ec569dc13a18519988ad926bdcd9bf448eff00aebf6df141f5cf" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00971-of-01024.json.gz": { + "num_bytes": 318714665, + "checksum": "941c9bf116353230417950d292c38b12b00935184162227eaec01870ab7f4510" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00972-of-01024.json.gz": { + "num_bytes": 319518275, + "checksum": "de30e19a155a6f4303afb0311416aa84cc3baf5a09cef55b8e2adc2a4f478f6e" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00973-of-01024.json.gz": { + "num_bytes": 318092574, + "checksum": "f70bf6727f1f308d93684ca41e9c2c68dfbd737a90da6375b58f162e8470fdea" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00974-of-01024.json.gz": { + "num_bytes": 318555677, + "checksum": "109fe184ac9498ac571cd9c6cb38ae5ed566b0e98e8b7718984656a70cc6b224" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00975-of-01024.json.gz": { + "num_bytes": 319045215, + "checksum": "03c4257851857450f7397ac3d627a60ffc98708ad5aac6e1f73e6ce818fe7be8" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00976-of-01024.json.gz": { + "num_bytes": 319172031, + "checksum": "7d98fa662aa9d0ff7ed50cc72195bdda2147212b34a3d22f0f757a4eb158d5b7" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00977-of-01024.json.gz": { + "num_bytes": 318650530, + "checksum": "bb8ccc07ecc6fd39ae97136418efc543efe5541e85910a7f333ee5cebaa3b595" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00978-of-01024.json.gz": { + "num_bytes": 318609909, + "checksum": "40b49f3fbb2fce73bb1851304b290fc7fb400d13c2448ac7e5e559dccfda7ce5" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00979-of-01024.json.gz": { + "num_bytes": 318881197, + "checksum": "b29f96cfba574428cb66f54b20c4a848bc83438256167afdaed576a3931117a0" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00980-of-01024.json.gz": { + "num_bytes": 318506081, + "checksum": "a15996adaaf41e5615cb5c7fa2ef1b4e3003836542d0851d1c6907522f534fee" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00981-of-01024.json.gz": { + "num_bytes": 320000305, + "checksum": "38e282b433c4e3dcc9fc2b056f6ddbe4eb857c5137f7c51301d53ca259d6bdc2" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00982-of-01024.json.gz": { + "num_bytes": 319959158, + "checksum": "97d5e58088a87a15b71db975d5e09b69daf497b7dff3ef809e1b8292caa27905" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00983-of-01024.json.gz": { + "num_bytes": 318921242, + "checksum": "f062e04f89132576ac1969fdaa43db761a0ff7e4269a6f173d87fa011a4c289b" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00984-of-01024.json.gz": { + "num_bytes": 319577980, + "checksum": "e52a6c08d5243717f21120b4c3ebc8fcf77168928945adf68bc665392a6e8d11" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00985-of-01024.json.gz": { + "num_bytes": 319812101, + "checksum": "8b4f5645ae0e0b190af4ca5335c57735ae919d3c6402438af506c7907f1d1494" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00986-of-01024.json.gz": { + "num_bytes": 319582409, + "checksum": "3654109968d918aa4d8db17cb7057111c42894cfc7eee093df13036cfb3ac6fa" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00987-of-01024.json.gz": { + "num_bytes": 319957581, + "checksum": "4b9e6febb461940b993c50945a2ed06736c6786aa8f758565ff545814ebfddcd" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00988-of-01024.json.gz": { + "num_bytes": 320346479, + "checksum": "2891565dd75fd4354777b4f4f393983180584ee9c64b5d9b4557dbf26a3c4cfd" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00989-of-01024.json.gz": { + "num_bytes": 318546717, + "checksum": "929d0236c9fb77d638e0a18aa97b00004316bbb0ef3c4323e39f61aaf7c0af53" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00990-of-01024.json.gz": { + "num_bytes": 319606761, + "checksum": "6ebd2552ecdcce7b194d4f6d5b5e66ede9d65da4e4999ee8ec4705d847e473ac" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00991-of-01024.json.gz": { + "num_bytes": 319117521, + "checksum": "1b3496964d0a895b347529ddb7b712d211c9419317fb41cdd6e20bba43f39f05" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00992-of-01024.json.gz": { + "num_bytes": 317781551, + "checksum": "9f9cfb5f9152b9a60121b03c24d944129c1ee43e862112fe3896e2772fef99a2" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00993-of-01024.json.gz": { + "num_bytes": 319341839, + "checksum": "fb329b7470ae127efe1be4adc960b06eec4f55bbcbe1f3f0f0b794d70a8aca14" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00994-of-01024.json.gz": { + "num_bytes": 320357337, + "checksum": "bbe9a60c3c2b3b5b11a5d531d1d85f0a90ebe3dbc79189b3825e169ae302932f" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00995-of-01024.json.gz": { + "num_bytes": 317824612, + "checksum": "26643091ae3425b63036453ffca7ed82c85c24b6a24264197e6516b68a39a4c4" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00996-of-01024.json.gz": { + "num_bytes": 320453890, + "checksum": "db33809437e62bf1f086f40e4d66ad0133db7c7d406b2ce52ce5d9c9b0809961" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00997-of-01024.json.gz": { + "num_bytes": 319469732, + "checksum": "3447b74f09dc4d63dd04d6bbd4382147071504338e6ea428b37c3a5174877537" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00998-of-01024.json.gz": { + "num_bytes": 319562604, + "checksum": "270a1c19e6321541398836d3d982c2e396db99abf94317912714251d1f68e8ac" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00999-of-01024.json.gz": { + "num_bytes": 318895764, + "checksum": "d68f8f4d85d91679c20e972b2b1955d41a8f6601873bb311a2621f4b3f3152a2" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.01000-of-01024.json.gz": { + "num_bytes": 317697031, + "checksum": "68b47464ca3e97e9d3f4075b656f804c1bab667f231701db9cce1f0b0a921088" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.01001-of-01024.json.gz": { + "num_bytes": 318915840, + "checksum": "582216879b058ccd4d0ca2edccaa2db49b64459371f8798a1d9c66c06a0cf908" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.01002-of-01024.json.gz": { + "num_bytes": 317811256, + "checksum": "6864299a7d0174f92abc696dc293524291623891b86cd69132348fdf78760a4e" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.01003-of-01024.json.gz": { + "num_bytes": 318605529, + "checksum": "4ef35b7546266f99eae5f332cbe3e284801c5d7b39f840297d67e71c036edf62" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.01004-of-01024.json.gz": { + "num_bytes": 319379897, + "checksum": "040dfa80eaf8355370d8a50692bc3ad03a1d57272af340d70031a4398f37b9ee" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.01005-of-01024.json.gz": { + "num_bytes": 319515177, + "checksum": "012ac70ef2715181ec1fb578a2366d68e786d3a9ea41c59c08d7c494b89b429c" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.01006-of-01024.json.gz": { + "num_bytes": 320078217, + "checksum": "46030d85d8333ae224320fa54e487f3770de7de280cd0001344136b0bd87c431" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.01007-of-01024.json.gz": { + "num_bytes": 318526753, + "checksum": "dd432d865ef3dba4b5af30e42b11ace96900bd7b97af053ea892292e75bd142c" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.01008-of-01024.json.gz": { + "num_bytes": 319407137, + "checksum": "165cd3a688be6f9f5a4cedde198a9dda4f9d3dbc1d275d1e99411f3ee96a0d62" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.01009-of-01024.json.gz": { + "num_bytes": 319763066, + "checksum": "e44e86d497f8471e53531374b0e6ee61aac54996b6af64a4af0f5620673f9f7d" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.01010-of-01024.json.gz": { + "num_bytes": 318653930, + "checksum": "61115f16e718d3a2b66574cc17841aa5d02739762138abe3c9a7f325cf9f2e31" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.01011-of-01024.json.gz": { + "num_bytes": 320037079, + "checksum": "65e18df845f1e6cce1bb92a45f71274dca94d3f0ece1d556116085b5c0e6338f" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.01012-of-01024.json.gz": { + "num_bytes": 319753418, + "checksum": "cd5a8ee1bc7d9ad58e98aa6fe56d60501115592519a19efcf9fa370668c6327b" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.01013-of-01024.json.gz": { + "num_bytes": 318657671, + "checksum": "986ead2c1b37f4094aa6f7a7882824ff013e6393323d5290d7f3e9215589d07b" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.01014-of-01024.json.gz": { + "num_bytes": 318028602, + "checksum": "3c82c0611fb1fb0f635eaedd2bbe7cfc9d53d1ae967a9cbd0416def046e4b104" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.01015-of-01024.json.gz": { + "num_bytes": 319164504, + "checksum": "5eb5cf76022b12d8751a2fce5c4d4831066785a68edd7b3cd3dfc10017f91621" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.01016-of-01024.json.gz": { + "num_bytes": 318474894, + "checksum": "a99d827be814e27d948264d6ae55c6a032a664f3ff0ef6ae94bda90f7faf29bc" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.01017-of-01024.json.gz": { + "num_bytes": 319516762, + "checksum": "7eac25ebb9383a4592023634b852d88a128604c494972a8fd9e2b183fbb303a2" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.01018-of-01024.json.gz": { + "num_bytes": 319433935, + "checksum": "35adb751748043a36f22b412d3ea0e01166037cd96216f516abc547e9d2609ea" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.01019-of-01024.json.gz": { + "num_bytes": 320305440, + "checksum": "54c4d52564221e48dc5354cb51d447658707ab8edaa3d6d8fec5ec379a29d462" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.01020-of-01024.json.gz": { + "num_bytes": 317445661, + "checksum": "edf1c6ab9900d75b91738fc7e9e3db8cdde3f9ef2234ff249833b5cdb04c65a2" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.01021-of-01024.json.gz": { + "num_bytes": 318134525, + "checksum": "1c5e670ec9d815637e9bdbd75289c7ef7f3ecf384e32f403ae8a9fe2595cc983" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.01022-of-01024.json.gz": { + "num_bytes": 319809162, + "checksum": "9def881764ca614c88ceabb41032d3e145f06c843a7ceebd87dba6b93c974a6e" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.01023-of-01024.json.gz": { + "num_bytes": 318155801, + "checksum": "552a6a2be423c0ecbb767611074200c5b85c1cf76c8640c79e3be5e967b293b5" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-validation.00000-of-00008.json.gz": { + "num_bytes": 40471190, + "checksum": "1f25b6af12da84115301d4ee93ea5246c8fea5bb4a2008472794d95b917cc97f" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-validation.00001-of-00008.json.gz": { + "num_bytes": 40675053, + "checksum": "db4c23d7a336032de37dfe2f3ed39653c8afd94004d4e8d9c73c03222299292c" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-validation.00002-of-00008.json.gz": { + "num_bytes": 41175078, + "checksum": "4bf6b248b0f910dcde2cdf2118d6369d8208c8f9515ec29ab73e531f380b18e2" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-validation.00003-of-00008.json.gz": { + "num_bytes": 40728516, + "checksum": "082b72c1ec600502df2e4403df6884390c85627ffdf37a5b700397c9a1ac6b8e" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-validation.00004-of-00008.json.gz": { + "num_bytes": 40920200, + "checksum": "37c2ce46864db0b6f1fe89220ebf4ef811ea10485c8336f1712227bbbdb530e1" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-validation.00005-of-00008.json.gz": { + "num_bytes": 40921460, + "checksum": "00b164e59df49df5dc1df170db99bb0d9207a6329cb9272ed8b6ef7a55058359" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-validation.00006-of-00008.json.gz": { + "num_bytes": 40549809, + "checksum": "86896a9baffe0ab9df39a2901f0e515009989ca1fec9a42583d718ce16166b5a" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-validation.00007-of-00008.json.gz": { + "num_bytes": 40446172, + "checksum": "0bf87534c7050091c60466df50f174c3147d052ec7dc645da9574c902445beaf" + } + }, + "download_size": 327104523018, + "post_processing_size": null, + "dataset_size": 1658004128680, + "size_in_bytes": 1985108651698 + }, + "en.noblocklist": { + "description": "A colossal, cleaned version of Common Crawl's web crawl corpus.\n\nBased on Common Crawl dataset: \"https://commoncrawl.org\".\n\nThis is the processed version of Google's C4 dataset by AllenAI.\n\n", + "citation": "\n@article{2019t5,\n author = {Colin Raffel and Noam Shazeer and Adam Roberts and Katherine Lee and Sharan Narang and Michael Matena and Yanqi Zhou and Wei Li and Peter J. Liu},\n title = {Exploring the Limits of Transfer Learning with a Unified Text-to-Text Transformer},\n journal = {arXiv e-prints},\n year = {2019},\n archivePrefix = {arXiv},\n eprint = {1910.10683},\n}\n", + "homepage": "https://github.com/allenai/allennlp/discussions/5056", + "license": "", + "features": { + "text": { + "dtype": "string", + "id": null, + "_type": "Value" + }, + "timestamp": { + "dtype": "string", + "id": null, + "_type": "Value" + }, + "url": { + "dtype": "string", + "id": null, + "_type": "Value" + } + }, + "post_processed": null, + "supervised_keys": null, + "task_templates": null, + "builder_name": "c4", + "config_name": "en.noblocklist", + "version": { + "version_str": "0.0.0", + "description": null, + "major": 0, + "minor": 0, + "patch": 0 + }, + "splits": { + "train": { + "name": "train", + "num_bytes": 1029628201361, + "num_examples": 393391519, + "dataset_name": "c4" + }, + "validation": { + "name": "validation", + "num_bytes": 1025606012, + "num_examples": 393226, + "dataset_name": "c4" + } + }, + "download_checksums": { + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00000-of-01024.json.gz": { + "num_bytes": 396728190, + "checksum": "06fcf4d9bf6ae45fac94245952f000c924d2a0b5cc8841c916b3ee949333410d" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00001-of-01024.json.gz": { + "num_bytes": 395686133, + "checksum": "8a0b64c5efb1db1ebcc0a664c801221049f5812652dc1a727a0e9f8d0df0cd0e" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00002-of-01024.json.gz": { + "num_bytes": 397762165, + "checksum": "087fabf9563297a6eab8bc39b68c0c6d15169032001d3a17c9bd964080759f2c" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00003-of-01024.json.gz": { + "num_bytes": 395307518, + "checksum": "1e5b89200528320e354f60be0868a3ab6dbbe667a6b16b48e4739b988a6360e8" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00004-of-01024.json.gz": { + "num_bytes": 396280504, + "checksum": "8291badbe84854960c0ddac3d6c226cb519268d1b3fd267bd72cfb4f10800de1" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00005-of-01024.json.gz": { + "num_bytes": 396636600, + "checksum": "c74226ceada7d78e3e7a2ad931d0a99df93f4cc4377ec69d4f1fab4164c3d845" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00006-of-01024.json.gz": { + "num_bytes": 395364336, + "checksum": "4e52e99dfc4e55c41226978b4dbf48fac2f886b9b0446bc3bd576f32bdd7cfea" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00007-of-01024.json.gz": { + "num_bytes": 396428805, + "checksum": "283ae93ecc3f8daefa9c47651ded763dc5f339ddc619c8cb5e32dce9cb9cfe4c" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00008-of-01024.json.gz": { + "num_bytes": 395030041, + "checksum": "d3fc7fffdf9c2172d233bea3bb7dc485d753319e6196672d0186b8ba04a1d903" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00009-of-01024.json.gz": { + "num_bytes": 398255693, + "checksum": "61e10cef5c2cab162fb1d26f97fd9d76b30c9ee989c01ef8597d2a4e35b303da" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00010-of-01024.json.gz": { + "num_bytes": 397825333, + "checksum": "f72040887c2a2c17564c2c6a9a4b5ff95fce6a0eed4f0800cdeff8277af651ff" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00011-of-01024.json.gz": { + "num_bytes": 397877458, + "checksum": "ee34ff11164e10a86f76593205cb13986c70ea3d3a8849174a6dfb5b4ec91262" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00012-of-01024.json.gz": { + "num_bytes": 398317059, + "checksum": "7a3ef558efaca3e5d19e9ad02b47dd61f9639dd806130b62d66e9c3341c0edce" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00013-of-01024.json.gz": { + "num_bytes": 398518794, + "checksum": "f5a6c18992ab2b59a9c02469d20768bf5757624e03bcaf92957ce736a3a9edb5" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00014-of-01024.json.gz": { + "num_bytes": 397026214, + "checksum": "c174b625c1534c69814f8e4879169b58af96f801dbb433113740af0d78535abd" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00015-of-01024.json.gz": { + "num_bytes": 395621683, + "checksum": "4e8e52a602d4eb4b27104780f4a36617505505fb66a82f36e90631a4e668f5b9" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00016-of-01024.json.gz": { + "num_bytes": 398138551, + "checksum": "a3e7a95b16f09e09e45f1c3bed3524415581e21b065d8efcc66cece705dee4d2" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00017-of-01024.json.gz": { + "num_bytes": 398720813, + "checksum": "79cdb89052e8dcecd1f1319e47f4c4ae1d350ab81777a9ba8077cebdb558e795" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00018-of-01024.json.gz": { + "num_bytes": 398538940, + "checksum": "8da6aac3a794ce326b5a3971fb75a2ee848f008940d4f1bedd724ce7c5874278" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00019-of-01024.json.gz": { + "num_bytes": 396834319, + "checksum": "b57c93502949dad9001e89847947f6c65943927eb519e16de4eaf5590b235faa" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00020-of-01024.json.gz": { + "num_bytes": 396402861, + "checksum": "05e14c7e21df3d4af7be7a597fa22463868464d6475282376536e12e82367401" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00021-of-01024.json.gz": { + "num_bytes": 397560852, + "checksum": "756d15d8b07414dffd7cff3efde606aa62cf8f73b85d8e1cd17408d6a339414b" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00022-of-01024.json.gz": { + "num_bytes": 397210987, + "checksum": "60aa08d9c5d813d5f2448d910bc23a705cdd0828a9403c18ec223e53623889cb" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00023-of-01024.json.gz": { + "num_bytes": 397563062, + "checksum": "bd865213ffb2b40c2cd3eb16724b68c0f37e29f68215990dc84d91852c7c0d72" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00024-of-01024.json.gz": { + "num_bytes": 395799120, + "checksum": "08ff3615ecea3eb5b55703e123475c95afbecfe7107eedf05750147c9ffd12ef" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00025-of-01024.json.gz": { + "num_bytes": 398336372, + "checksum": "e3e30b97e585fd881b3a1b006775854a11a2b967d992e7eea886338d8beefb13" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00026-of-01024.json.gz": { + "num_bytes": 396819084, + "checksum": "fddc9e1a8405c5e05e63ce98b19c7833c0fd46392b4b55532b317e7f81426590" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00027-of-01024.json.gz": { + "num_bytes": 397912380, + "checksum": "d3e597b3a96b993840e47adb761cce2f2ae1c96aefcbd6c250198dedaecde15a" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00028-of-01024.json.gz": { + "num_bytes": 399078461, + "checksum": "abd6d2341b6c61cdb89b80a8b9bfd938bb6d8a423a89e6a9f997c22c6479d537" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00029-of-01024.json.gz": { + "num_bytes": 397303107, + "checksum": "ee35a3af1056cdab79b644f6352150aeb6fb19a630cd6bc893a072e35fbfbad2" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00030-of-01024.json.gz": { + "num_bytes": 396602401, + "checksum": "1d04d4bc295aee2ab80b24f587f8c483599db7d5a8157acc99a1d8b001f8353e" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00031-of-01024.json.gz": { + "num_bytes": 395941329, + "checksum": "cf1dd244555511245c0e6a5b1dc9c24f747b8377674aa3690677ce08ebb8c26f" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00032-of-01024.json.gz": { + "num_bytes": 398049663, + "checksum": "c83e5572647eba5ab14fdc4dcba8efb6981740b99b8f634e2c6b1942a051c249" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00033-of-01024.json.gz": { + "num_bytes": 398044404, + "checksum": "b76815aadcf4ad802071428864ce0b406cabd73dfc2be5e20b44885ec6a85419" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00034-of-01024.json.gz": { + "num_bytes": 396885224, + "checksum": "da00d92418fbdb9799d8f16977b3a33f67cb98a31808544cb68cf3b42ea9adf1" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00035-of-01024.json.gz": { + "num_bytes": 396185021, + "checksum": "265ad43ce00666c83fd441d35ff29ba1ebf7d62442cc3e3c176091b4c725ea9d" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00036-of-01024.json.gz": { + "num_bytes": 396702503, + "checksum": "4733156df48f2dd0f2e859fef28f56d12a84e8012085ca9318073ae647b0fcdc" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00037-of-01024.json.gz": { + "num_bytes": 397582277, + "checksum": "7d62d03c3496ee2e17ab6b9635710efef9e4cefb88ddccdc16ed720a414c38c2" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00038-of-01024.json.gz": { + "num_bytes": 396186761, + "checksum": "670affddf8fcca6933af3f5b30efd1bf490c3e38c3e90f2e8e9a464994d613f1" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00039-of-01024.json.gz": { + "num_bytes": 397056953, + "checksum": "4acbd97f9c8fd9a930a6f4284a11cfe37f6cca3b5858ae3c2cde747dae35e0d2" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00040-of-01024.json.gz": { + "num_bytes": 397809786, + "checksum": "d350e48a36bb1ba3125f72a07ed8024d26eae6d89ecac686ac0bdf3d5d89e1a7" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00041-of-01024.json.gz": { + "num_bytes": 396944358, + "checksum": "817a58dc40440b8b1f54d129db08ae9124e0293e5a0e45f034fbffb2140d90c0" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00042-of-01024.json.gz": { + "num_bytes": 394327995, + "checksum": "6bd6bc1269c2dd81db466ae9c41f76b8b8cf71cc7bd6e131452fa1a1318ff459" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00043-of-01024.json.gz": { + "num_bytes": 396476043, + "checksum": "f3525d9c861d984ea0cdacba7fddffaef058d8f95aa99ef1f09f9f0792fde5e3" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00044-of-01024.json.gz": { + "num_bytes": 396893614, + "checksum": "292ca2b6b9ba41567fe7cc60e5424aa1f3e431ac874d06ae8eb98794563a7d35" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00045-of-01024.json.gz": { + "num_bytes": 395885483, + "checksum": "ea2c8fac41ededba7da8bf2bb48463d83f148e5c0970a689876d4932ab18a3c7" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00046-of-01024.json.gz": { + "num_bytes": 396963386, + "checksum": "97672d9bca357cd2721f51301aa37d37a271dd3ca7487244c057570b995da66d" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00047-of-01024.json.gz": { + "num_bytes": 395856712, + "checksum": "52c517670ba4eefb262cb71373d6370f86ddeb0aea7391a47a22d52a55bff7a8" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00048-of-01024.json.gz": { + "num_bytes": 396091027, + "checksum": "49f5b68e29c55eb50da941eab1cf446c7d8c9d0b30290318977edb39ef0b887f" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00049-of-01024.json.gz": { + "num_bytes": 396892998, + "checksum": "82a51eb6f301c00d927ca7920338247038cf4e9e0072d74c02bac897701f5859" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00050-of-01024.json.gz": { + "num_bytes": 396308050, + "checksum": "d72f92ecd27b716cd90cc4abe562d25fe6d49740b4a3d1fb9beac2526a61988e" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00051-of-01024.json.gz": { + "num_bytes": 396137777, + "checksum": "a956e4d086077f7ab309ff10b0eaf4833e4d3ed74435293e96588f4361e1536d" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00052-of-01024.json.gz": { + "num_bytes": 398302544, + "checksum": "5a54f7faa07661ea6a5f0585ca49ad66c8f7025fd9627b3af832dc886d50f78e" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00053-of-01024.json.gz": { + "num_bytes": 399616791, + "checksum": "7f8fa496d50a0b7c399faff4c1864e24717b3f9c86b2552536c8f91e3e0cf9d6" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00054-of-01024.json.gz": { + "num_bytes": 397332881, + "checksum": "ab862f26b4fa38b6c16d8cfd0d63a9f0973827e45915e85aefb95d4e182b7b9c" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00055-of-01024.json.gz": { + "num_bytes": 397075146, + "checksum": "cb67aa9229bec8b88e496829aa0a60ca1c3ff4a2293632cf7782b69aa71aebfd" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00056-of-01024.json.gz": { + "num_bytes": 397827600, + "checksum": "2f63e3ec40d32237d4a50c873b966d7fc2c16ef5c04a2bcfc33328b128654e7c" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00057-of-01024.json.gz": { + "num_bytes": 397533583, + "checksum": "7c90bf39bddf8ad0c6a8bb3dff02caea8bbc2abbd76047c5d523930d2a00dbc9" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00058-of-01024.json.gz": { + "num_bytes": 396411363, + "checksum": "ee6059f3c8a2df34858a0110a06ec4e9673555fa56c1a2b40930337ba5b1b39c" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00059-of-01024.json.gz": { + "num_bytes": 396735510, + "checksum": "d9dbe2421edba1820294e757d88aa25455db42ce8992f8933b51cd84cfc35a36" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00060-of-01024.json.gz": { + "num_bytes": 395694553, + "checksum": "b05d6502fc95587fa7047fac64978d6be13761dcc6954629332812e5937c2731" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00061-of-01024.json.gz": { + "num_bytes": 397740757, + "checksum": "39303faa5dc33995dfec683b44fc24066ecccdf6b5001b9c0644d8e9899d45f5" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00062-of-01024.json.gz": { + "num_bytes": 397358263, + "checksum": "fe27dd467cc2c34abe5b0bb34473ee68859f2198eeb78304e1d2e54460a67383" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00063-of-01024.json.gz": { + "num_bytes": 396826654, + "checksum": "1da2c414bd03e5547d8c9c7447e42b8dcff5f6ca8ba35c53076f2895e8ea63f6" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00064-of-01024.json.gz": { + "num_bytes": 395781869, + "checksum": "af96de4d6b5bc1ab0527efa33a73d7eb788dca15829acbb7291ce72ad05e6c66" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00065-of-01024.json.gz": { + "num_bytes": 398192274, + "checksum": "7f46ccfc1703fee106e932bc9a1bc5dedf7de944172cfa34ec9b31413bf0bbda" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00066-of-01024.json.gz": { + "num_bytes": 397133438, + "checksum": "dd3b67d8578927d7474dae76bdca35f35a2aa125fc50873e4a9f6e73d7a81831" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00067-of-01024.json.gz": { + "num_bytes": 397204214, + "checksum": "4cdc87a7c9fea33e15d638e5c921f45149212769bfba5f59f0a5943398ca0d55" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00068-of-01024.json.gz": { + "num_bytes": 396489592, + "checksum": "64d175c23574998f8c5d28ce3d3f3934144b1fd4f6527ede1aa3420c28bb90d0" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00069-of-01024.json.gz": { + "num_bytes": 397697351, + "checksum": "3329857f531c9fa22d98bd567638f0564f73062da1478ca84385246f71baabff" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00070-of-01024.json.gz": { + "num_bytes": 398449973, + "checksum": "bd13494aa03a95d943a01f3436f62c46ee3390b30f6ff0fec0636f3c0b09fa1b" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00071-of-01024.json.gz": { + "num_bytes": 395498960, + "checksum": "5e69529ae82c305acbf1f58a7021b4e3fc67285a871dcbcaaff0781d0e721070" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00072-of-01024.json.gz": { + "num_bytes": 396170387, + "checksum": "9b9c7e11b9bb2cf6ea0fcdfd58754f522a95070feae74c29559522e12e1b41f4" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00073-of-01024.json.gz": { + "num_bytes": 395915819, + "checksum": "87a2069589fee8de23730b8b994ba59d63d5128175b5326ba0a8c8ac9e01a3dd" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00074-of-01024.json.gz": { + "num_bytes": 396986018, + "checksum": "e073efb3f00db65c1ee14e8bfa6e8c807f7827d0f3dd4d4026f823bc6f61b1cc" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00075-of-01024.json.gz": { + "num_bytes": 398555103, + "checksum": "a1793748c7979e241ca34291c843ca3cc90dd7643f04810b6cd324220efbd6e7" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00076-of-01024.json.gz": { + "num_bytes": 396357420, + "checksum": "7b1cd69788ca9a7e614de70a8b908183f41f316eaadf3b0236a7c4e126db9844" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00077-of-01024.json.gz": { + "num_bytes": 396666167, + "checksum": "aec828d3c2a1f7fa970de328a8fd1a85a90493dbcbec4f50816ccbc2275a1fac" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00078-of-01024.json.gz": { + "num_bytes": 398167446, + "checksum": "e14bdf5af810574aca7c6f3daa67e503f24ab1705435a62129c66c248667ee97" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00079-of-01024.json.gz": { + "num_bytes": 399696096, + "checksum": "b63756f81b8b19ecdc9bf227045df10840cbf973b60bd8ffdf28f58a53cdb028" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00080-of-01024.json.gz": { + "num_bytes": 398755610, + "checksum": "dfc118f680b79260e7ece75f27c0459484eb8458f2422df9f1918f726b54ccb6" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00081-of-01024.json.gz": { + "num_bytes": 396606787, + "checksum": "17d6a503947f5132728f53ea62fd093f55bf2dc6a32316a5c0413353cf13eff3" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00082-of-01024.json.gz": { + "num_bytes": 395714484, + "checksum": "8ca41818ee6a0ffd5b00714779289c18cd97d620258c5d3d741c482b72344300" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00083-of-01024.json.gz": { + "num_bytes": 396807173, + "checksum": "12d87c0a948f32f788497858751c3ef22f289136e6ae58518a97a2e976f5cdc8" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00084-of-01024.json.gz": { + "num_bytes": 397241529, + "checksum": "7c3da4ca4d2b2077f0ab7be511038255732fc88d954f2f17cb0f3ab144216206" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00085-of-01024.json.gz": { + "num_bytes": 398357369, + "checksum": "26df55183e78f8d69fb16e21d07edf98659b69bcb3c48f340da6a5bc44007f4d" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00086-of-01024.json.gz": { + "num_bytes": 396997317, + "checksum": "09f0641e9075cb88800d0eaae3f7b99b047552edbc71d1fd2d8594f645d22c2a" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00087-of-01024.json.gz": { + "num_bytes": 397978000, + "checksum": "c9437ef5f58a46b8a6d8efcae37fa658da3f2c4f1cad0f9cf47fbcd09bb82f8c" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00088-of-01024.json.gz": { + "num_bytes": 398468913, + "checksum": "be187fc14017f666b84ed7049c169c1a28654441c2f523eee8b655b3b9d9ba8e" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00089-of-01024.json.gz": { + "num_bytes": 397071121, + "checksum": "637c3f964ee2c750a0a175f2e5d24b786a37d37701f10616b448804d68b72f4e" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00090-of-01024.json.gz": { + "num_bytes": 395753807, + "checksum": "8eef7ff1a8080aebe5226cc3539baac46ab64d93f8e3ffb6e8b7ab3346e151dc" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00091-of-01024.json.gz": { + "num_bytes": 397039764, + "checksum": "a2904ae5bf69b393a697afd62ae9b8a560c1f076e8a141e6f3feef29cb5d1352" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00092-of-01024.json.gz": { + "num_bytes": 397058578, + "checksum": "eb4d7e2712a9983bc1581133fa8eaa2e1d28b314861833bd8d810d615ec1ed81" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00093-of-01024.json.gz": { + "num_bytes": 395855981, + "checksum": "5c9a7573a5644d89d46666306d333ff1e4af3213f287cb9adb48ef87a023d479" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00094-of-01024.json.gz": { + "num_bytes": 399516118, + "checksum": "de7ae1508815e48ba031762c084cf6946b084871463821407090d23c197c6474" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00095-of-01024.json.gz": { + "num_bytes": 398236235, + "checksum": "616cef1f21ef078ffb9fc2b4148735668debdd15a8bc1be281183ba3659e9fcd" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00096-of-01024.json.gz": { + "num_bytes": 399526010, + "checksum": "eb754381b8a6f3c74dda5ee5852958f7b69c707a3908cbaa9410c972e002a0cb" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00097-of-01024.json.gz": { + "num_bytes": 397935028, + "checksum": "6d6d2ca80708b7c6ad4240a042dddc2170060e8976c2e7b4ace446d2f2395076" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00098-of-01024.json.gz": { + "num_bytes": 398645934, + "checksum": "568db6971230fb42df8973ecb5a2a6d77204aa8cf0bdf47b386c04370da8dfd1" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00099-of-01024.json.gz": { + "num_bytes": 398110916, + "checksum": "9bacb381e3b06976619e816e40ac2ccd3bcf3cb9ecd30c294b388cfb75c8bf77" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00100-of-01024.json.gz": { + "num_bytes": 397631228, + "checksum": "7d515ac0f767736600a216ebe7280b9751f16e70df969ba601d1aaae15f201e5" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00101-of-01024.json.gz": { + "num_bytes": 395102356, + "checksum": "87c5c81e154e136f3e090ba91682ad54fe678653f86f6f32002ae5ec3c9aa743" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00102-of-01024.json.gz": { + "num_bytes": 398926159, + "checksum": "2df85a9ac13812c3870180901dbba99b52e53fc045da019160a3f06d0dfa5e95" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00103-of-01024.json.gz": { + "num_bytes": 398383820, + "checksum": "8134d12e84ed4a58a5f8f6eff8a4349f7d6ded6a1d7539b5c23193571569d6c7" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00104-of-01024.json.gz": { + "num_bytes": 396628542, + "checksum": "208f0cb3365b0243d70e7b4e52ff977e9b11d8e451adea521a5bf6e10cd40ee0" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00105-of-01024.json.gz": { + "num_bytes": 398737797, + "checksum": "855ac7b8cb621a240319ef00197d2f20338d17db71a1aec68fb66930bc17c59c" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00106-of-01024.json.gz": { + "num_bytes": 397281064, + "checksum": "544d5d91d066f2450bfe622ce55bdfe16a300aee9c05aaffae8a645966bc695e" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00107-of-01024.json.gz": { + "num_bytes": 397919761, + "checksum": "f4af405c0f19c9139d93b3073f3fe328be998c9dc6f74afc7e21ad068964b92c" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00108-of-01024.json.gz": { + "num_bytes": 398810219, + "checksum": "bdfce29353c6caa33b178bdebbf7e48526c391bc6c71180e3fa378b723879563" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00109-of-01024.json.gz": { + "num_bytes": 396605124, + "checksum": "ed6acc172bc9af0e31170f5533001a8fcd344e6732a4b3a714b7ad43740f25f4" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00110-of-01024.json.gz": { + "num_bytes": 397491755, + "checksum": "428b6c91f12c4f7032fa692bbe887f1a4c02635eb88b91d876da4c71f3da5e4e" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00111-of-01024.json.gz": { + "num_bytes": 395754897, + "checksum": "a723863559edf291fd8a6c2736cc1cefed70dd3c8625b967df049ce0d373f68a" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00112-of-01024.json.gz": { + "num_bytes": 398567649, + "checksum": "a90ddc9ccfbca20b9c75bd2b7d63ee6abd03236a0f0dd2827eb9f7350d9c3931" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00113-of-01024.json.gz": { + "num_bytes": 396706569, + "checksum": "479052b6b9edcc2bbda40b982976e7e28d84fad7b2dce46b017f4e3d1f61e0d2" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00114-of-01024.json.gz": { + "num_bytes": 397384355, + "checksum": "a95984e4c261a3057d1bc51939aefd9413853111e19030b19c5d26f778be00ba" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00115-of-01024.json.gz": { + "num_bytes": 397702826, + "checksum": "5eaf7fc2c9d4b2ee3e216c215da7f4fc7558e89d6993033b95a940a78061ab05" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00116-of-01024.json.gz": { + "num_bytes": 397252590, + "checksum": "268033cbbdf3be9790cb6010791693f1b490af06f9fef91b0b307420a4e30a08" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00117-of-01024.json.gz": { + "num_bytes": 395506730, + "checksum": "cb80908eee1054ddaf7e2e5d66c9a41505025c2b6dc7fe6aa287db0a9f3829ff" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00118-of-01024.json.gz": { + "num_bytes": 396452136, + "checksum": "d75bf895c88ff2e9c4031c1f65b067222cfbb1a937d685ab4dd33369f5f5ff7b" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00119-of-01024.json.gz": { + "num_bytes": 396777389, + "checksum": "2c00362f4d99cef2bae2f13f17b79ec56a5ef8aca18ffd56a12fea2308e5017b" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00120-of-01024.json.gz": { + "num_bytes": 397730478, + "checksum": "e31296949f7ce2e2a74fd2443552cb64b9f3cddcca691097a56992f51033fd11" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00121-of-01024.json.gz": { + "num_bytes": 396593647, + "checksum": "c2f0f81e3c835848a47532d8fd1c215a624f47740196a7bb45b5099916853014" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00122-of-01024.json.gz": { + "num_bytes": 396576172, + "checksum": "72edb7581a623e20f26cae4885f3b9d7f329581921253ca4d7ceedfbca17b7b9" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00123-of-01024.json.gz": { + "num_bytes": 397378329, + "checksum": "4f045ce7bd077b7f878012aead8c51073022448de66d2e35a755d4c8c4a6f59d" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00124-of-01024.json.gz": { + "num_bytes": 396545003, + "checksum": "dc7949657328520d31a27d8e267c2ab07cd4e8639036d4b1bb59454c309f862d" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00125-of-01024.json.gz": { + "num_bytes": 397630505, + "checksum": "530bd95e5ef9a1d5989c595e60e0ab11583e0f42d16b2bd37c49ed09a67af207" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00126-of-01024.json.gz": { + "num_bytes": 395483747, + "checksum": "d9df071edec6959ba842509f72ad43be3ea3f529b60d48f3dfbf390908887a5f" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00127-of-01024.json.gz": { + "num_bytes": 397295159, + "checksum": "02b61f5bc7d1d241484c4f04fd517960ae755a69f35192bdd5bb471baeba5614" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00128-of-01024.json.gz": { + "num_bytes": 396276865, + "checksum": "0c7d618df232c36ba018269ddf3b2863cd6d63bb7fabeaae33fd508715bd8ce2" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00129-of-01024.json.gz": { + "num_bytes": 395314703, + "checksum": "03443afda032187d2dc2e696ce6eaecbf2219e6dabbdd593379e97c0e00e3112" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00130-of-01024.json.gz": { + "num_bytes": 397411481, + "checksum": "8969873d5efd3df0cef1742e4bc67f2df7a5b5d9e641f7a12e77c7e8e96a1bf1" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00131-of-01024.json.gz": { + "num_bytes": 396925311, + "checksum": "31adc39ea4eda8667662608bdad6bb32bbc82b1ee1ad53ceb4df50924a933bdf" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00132-of-01024.json.gz": { + "num_bytes": 395826124, + "checksum": "d2f035ba2c388fec2d847bd43449c885eadd0bcab5fb8afdf031a53e72c4ec32" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00133-of-01024.json.gz": { + "num_bytes": 398892794, + "checksum": "b7ed60983058a5f9f0ef72602789f50359f415ecbe60dc967e7a869866d833b6" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00134-of-01024.json.gz": { + "num_bytes": 398206890, + "checksum": "9ba78624879aabb72bae0b4119fa2625793915382031ed897a0b4c3f2863b8aa" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00135-of-01024.json.gz": { + "num_bytes": 397161888, + "checksum": "9fa6fee55f5e8f887dcc64d94cc65ada6f283a580edc7926cb159b80d0084ea8" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00136-of-01024.json.gz": { + "num_bytes": 396185585, + "checksum": "81a1fcafcedfdd9bcb32d2467d9c963cc7d8b2f32e13e52ee04db41b0d3f5483" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00137-of-01024.json.gz": { + "num_bytes": 396933735, + "checksum": "c7558304b614e1cff13b0f6e967fc5ef77e4953a1eea1f39ed925c33076d7723" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00138-of-01024.json.gz": { + "num_bytes": 396371698, + "checksum": "3e896da8bf296403f7b4061ba0b24d3c3978993de4854fabd688cfce9fbf7bba" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00139-of-01024.json.gz": { + "num_bytes": 397289537, + "checksum": "1a5ffa3aaf565ccf4db7444983643ad06e386938a0a2d313aecdb972c36111e4" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00140-of-01024.json.gz": { + "num_bytes": 396983259, + "checksum": "4047916916fd9dd7b76a8cbc595d52803344467135f744b23bd10296004a47d7" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00141-of-01024.json.gz": { + "num_bytes": 394947050, + "checksum": "7edfc9e5870d80d470e3797e8bef5183e9d170eab410ab50957e946dde2e8199" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00142-of-01024.json.gz": { + "num_bytes": 396852755, + "checksum": "4affc3a24616858fab84211e3825e90a1ea7d9c8f2cfabbe9a5c9b24c21a116b" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00143-of-01024.json.gz": { + "num_bytes": 397579248, + "checksum": "d5aa9ba68e9b30576bd640f647d4069b6c56db276cc5229573440e4a38a7f1e9" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00144-of-01024.json.gz": { + "num_bytes": 398800367, + "checksum": "fa104e63eb7a8a6b066a5f00bf05b3ea095bad35a902bc728251f096173f1417" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00145-of-01024.json.gz": { + "num_bytes": 396709510, + "checksum": "b615ecd58821b1697c82094cb3435375924263827c342ab1b87e53907d4aa63b" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00146-of-01024.json.gz": { + "num_bytes": 396042389, + "checksum": "6004c782f3235490865b6634b2c4840a989745b70ef2da674e75c62aeedf8a6f" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00147-of-01024.json.gz": { + "num_bytes": 399840661, + "checksum": "5e8b46726f7ff2c3dfd381fb252f1b4bddf9436fd9ffd10fa300cb0fbe76998c" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00148-of-01024.json.gz": { + "num_bytes": 397098215, + "checksum": "0851cb274aff2ec4f781c82af11c94f8938a797aca5097fb0089299cb4c75aff" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00149-of-01024.json.gz": { + "num_bytes": 397540697, + "checksum": "7cadf4ef9b0e29d9e8f68474464dc072b78e909a0f03c74e61b67912ff9b551d" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00150-of-01024.json.gz": { + "num_bytes": 396347701, + "checksum": "521e4f67d12ae47b8f2a02b6f77e0c85cdf9a0efbcb45602d09ae116110ebe66" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00151-of-01024.json.gz": { + "num_bytes": 394890490, + "checksum": "2255bf3e1940ea28da9656028dee26865a9ee682cbaab4d5aeb34c081062f8fe" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00152-of-01024.json.gz": { + "num_bytes": 399584675, + "checksum": "f8ca4aaf5706ffb0f5518c7461d9045d18c645df068aa436137299e5ca77df82" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00153-of-01024.json.gz": { + "num_bytes": 395606567, + "checksum": "24f0e81dc3140f063ac89173fc262b01f2420133025b114f29632262cdd2e7fa" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00154-of-01024.json.gz": { + "num_bytes": 397925578, + "checksum": "5f40a87b15b0acebbd324e7c5cd2c0f31f911558d57f774f278634db94f2d5f7" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00155-of-01024.json.gz": { + "num_bytes": 395428741, + "checksum": "36281c154f187a09a83822878da815cd9b7f659a41cd90ac64653b437e798c72" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00156-of-01024.json.gz": { + "num_bytes": 396799274, + "checksum": "0fb66965107e54c9fed0013962763e874b940b0e174d775b21fa5e688fa53b33" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00157-of-01024.json.gz": { + "num_bytes": 397321211, + "checksum": "014d1443a4940fe95089bf87e245817d3a90c50e3e371a703098f5b9c3f6c759" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00158-of-01024.json.gz": { + "num_bytes": 398736992, + "checksum": "f912d27d68318fc0089fbaf8e0481ebe8dc5d2963cb89ed315f3bec637460bfc" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00159-of-01024.json.gz": { + "num_bytes": 397250687, + "checksum": "1bfd02a301b09bfd53058522d0613e1fbecb788d3173eb30b58115cd1cbdb477" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00160-of-01024.json.gz": { + "num_bytes": 397492158, + "checksum": "149a7bd76e9ea41185d99d21df870ddd4f32857fdd628cee927d6bee7d6a527d" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00161-of-01024.json.gz": { + "num_bytes": 398383574, + "checksum": "0c385b4c9b33574cdc75070309a0aed46aa7b2e3b8754a7692035a3c5a04f916" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00162-of-01024.json.gz": { + "num_bytes": 397126197, + "checksum": "5c012b2a6bbc9413914ed1420b6150a5549cd74185bf2788d8809005034d433f" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00163-of-01024.json.gz": { + "num_bytes": 398201223, + "checksum": "79448c338e86cea2609399705268fc6011cb21c4f0aff82e3fb7660391ce85c4" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00164-of-01024.json.gz": { + "num_bytes": 397914908, + "checksum": "dfb89631dce146ab4713a03f184e864472eb133b2cd04db8b4bccab688e9e287" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00165-of-01024.json.gz": { + "num_bytes": 398142696, + "checksum": "74acc88d6612aae7bdf5187d3b9eddcdb04cf60f1cc350661ffa50219a747f9f" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00166-of-01024.json.gz": { + "num_bytes": 397533050, + "checksum": "757d23402b3a155cfcb6b30bdc305c8014c9b64ba4e067753664670c2c5e9534" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00167-of-01024.json.gz": { + "num_bytes": 396241119, + "checksum": "521bd7a9dcfa0390c35e50a3d0cde3ea627ca538dfc419a97ed83b251d8a3005" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00168-of-01024.json.gz": { + "num_bytes": 396041761, + "checksum": "dc540ec27d5999f6a4c71f075ae1ec64ea84415c720cd2b6ef3fdac925e576da" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00169-of-01024.json.gz": { + "num_bytes": 396350882, + "checksum": "36d5d35075a82038dfdd5abd29a839f4e9ab79d51f0bbc635d3dcf3f5f1e2732" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00170-of-01024.json.gz": { + "num_bytes": 396885157, + "checksum": "db9a3f6a7e085007eee381357ea9e4d5d6f702580d38220860967ec441ba3525" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00171-of-01024.json.gz": { + "num_bytes": 397266368, + "checksum": "7f8098cb6532bc888d3c1f0ea5072cf8419ce1689b9ffe1c370ca20071e7e1c2" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00172-of-01024.json.gz": { + "num_bytes": 397140430, + "checksum": "90ae7e2551b1f3bf2e5ccf4fb3fac8fa3512add5e299ba7c90319611baf8c840" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00173-of-01024.json.gz": { + "num_bytes": 397069631, + "checksum": "a86f5ab72e1a9b1d491988154fd6400e6ee8c74378a9e64276df438a3c4edf9f" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00174-of-01024.json.gz": { + "num_bytes": 396743897, + "checksum": "451cfe8e14c17113a2f6673ece27e01f8d54bed1b57d1b20cb84f125879939ec" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00175-of-01024.json.gz": { + "num_bytes": 395780705, + "checksum": "3252e9781545bc3f9f19ac6e8fdb87d81cdc5a94838798daf6037c9f4f473db4" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00176-of-01024.json.gz": { + "num_bytes": 396205053, + "checksum": "49d1648d37150b90632a6459828eedd82deb2fce7f108bf4e1b050f2f9ad1668" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00177-of-01024.json.gz": { + "num_bytes": 396248718, + "checksum": "99346ccda762ae85038a10baba937ef8ef668a0beab483c4005dce77e331768b" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00178-of-01024.json.gz": { + "num_bytes": 396634813, + "checksum": "8d3bb1610ce79cf359d75f32e7624b6203140ed3eb276362b040615e9ffd4b54" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00179-of-01024.json.gz": { + "num_bytes": 396524113, + "checksum": "971e5c9499425294cf5945436b2ee419379a75bdd72d4cd6a33b1d17c17de298" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00180-of-01024.json.gz": { + "num_bytes": 397938782, + "checksum": "dd6b3e60219788b82ab3fc63a9e65f38f64aa2f7b294135ec2d16b36350f1f40" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00181-of-01024.json.gz": { + "num_bytes": 399155769, + "checksum": "c6a806d627a9d197789bfc6257a92b0223ca51e724c3c2ad10fe2397dbe30848" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00182-of-01024.json.gz": { + "num_bytes": 396136228, + "checksum": "2c48e3237253eaad9afc121e6946a9e1856bbe82c5a7cb287b05cff3e6ea8e8d" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00183-of-01024.json.gz": { + "num_bytes": 397083292, + "checksum": "52645e03ab47da01bb40226eb90042be914f1170688ae940314871e16cbb1037" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00184-of-01024.json.gz": { + "num_bytes": 397402964, + "checksum": "1edbdb41edeabc108f0147e18b439a75e390e0a843ed915f1cbf73a7c7f7867d" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00185-of-01024.json.gz": { + "num_bytes": 398411052, + "checksum": "ef071e52174a19597e567696262470906275c2cd1cbbb0b1e98864999ea2d463" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00186-of-01024.json.gz": { + "num_bytes": 397122443, + "checksum": "0d87080bc08f7f8a1952a7df57ce2bdbf61e40c05b61937c8c19ae0ecd952b1b" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00187-of-01024.json.gz": { + "num_bytes": 397244868, + "checksum": "4aed75ea9f885fc3dab599c19c7bb98f7d57ce2b2ec11ac8ab3258fa479fc0db" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00188-of-01024.json.gz": { + "num_bytes": 395677432, + "checksum": "342882e436ea826cda9fd38c0caca68bb35444a2a07596f8de0e53a3e2169f59" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00189-of-01024.json.gz": { + "num_bytes": 393653750, + "checksum": "22ed9e389f6c8410c9bde898d97ad798c236c2da4d0b2c76b86d013f8686da03" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00190-of-01024.json.gz": { + "num_bytes": 395437920, + "checksum": "b3f9ba5834d4f0280d6defd3bd50fdf961bee6be4c71ed47046cf4e115acab01" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00191-of-01024.json.gz": { + "num_bytes": 396944861, + "checksum": "4e7ed636a60edc44b5ba709dcd83bf4263ad8d5a06a02827d3d27191bf3731a3" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00192-of-01024.json.gz": { + "num_bytes": 396611165, + "checksum": "4fea34466d9b470bf0bc44455183b2c61994c4e71e4bfb684dff3b5e3870d1e4" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00193-of-01024.json.gz": { + "num_bytes": 398283211, + "checksum": "4c4e6d31f455831330971ed1e0c33221203401b817adbda5b53de16f8299a9ba" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00194-of-01024.json.gz": { + "num_bytes": 398915952, + "checksum": "dfd0b1ceb2a437da8cd38c9c791af809e94f2e36ab4399b2a45a5b916f4ccaa9" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00195-of-01024.json.gz": { + "num_bytes": 396352694, + "checksum": "0ccd90ced34b3ff28c21d015a87eca3f31eae2bf31f11f25ac073139f9d50c22" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00196-of-01024.json.gz": { + "num_bytes": 398582922, + "checksum": "f22e59765cec074a0c687c500f4e6348250d0e418d12dcba211e39c133aaf290" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00197-of-01024.json.gz": { + "num_bytes": 398839554, + "checksum": "95fa68cd75d77a1b5bb526dd5ef16a2f04a3520604f734baeb6e2d95608b5973" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00198-of-01024.json.gz": { + "num_bytes": 396202192, + "checksum": "f0e6343e8105178b38f75eade6774aa6e85b62a271622fcfcbe2745f1cae11ec" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00199-of-01024.json.gz": { + "num_bytes": 398029364, + "checksum": "4c58736410c8d3c7174ce011e2f281cb16e4949d756ff4ace86b4a9d4795c04e" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00200-of-01024.json.gz": { + "num_bytes": 395867629, + "checksum": "1cb798ee6609e670053987d881d130d5b73db19d9f37fecff7a6da41152aba05" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00201-of-01024.json.gz": { + "num_bytes": 396858169, + "checksum": "7357eb22b2aa75c55885252c62d12e08cf8f7ef285c0052cf1d706c3f0f74fef" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00202-of-01024.json.gz": { + "num_bytes": 397955766, + "checksum": "8901d0f27c4c11916cda7cf806cd00000771b6351954c8503bc312cca5ad3a10" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00203-of-01024.json.gz": { + "num_bytes": 397737882, + "checksum": "ed51917fc8936701b681cfc49ef95b2dab451ca597e76b34ba90be9405a1a0b8" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00204-of-01024.json.gz": { + "num_bytes": 396094006, + "checksum": "88692bb8da78347cb97c0e0849d1a10a97b1686cde1f75626236b89bd507e2b0" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00205-of-01024.json.gz": { + "num_bytes": 399027636, + "checksum": "fb17fe19d1f0fcaa43fb31a3ad9b105b3d93fa287351c7f93fb599edb7f40bc3" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00206-of-01024.json.gz": { + "num_bytes": 399406254, + "checksum": "668d2a9927080b686a4d728236e4cfc780b262f9045dfe9575cfc48cb69d6adb" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00207-of-01024.json.gz": { + "num_bytes": 396291803, + "checksum": "928f451dddfe42bb2ca791dbc61c36ddc618006ef709eaccbc2beb665c8427e4" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00208-of-01024.json.gz": { + "num_bytes": 397807368, + "checksum": "11e8627b758588056b61d31de07c50092222013a38ba802b7a9ae34b6b8b84a6" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00209-of-01024.json.gz": { + "num_bytes": 398085408, + "checksum": "d49d31d1719698ab7a2b9ee91d887f3192c8fc1b6108152a75b39de2a0ad25a6" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00210-of-01024.json.gz": { + "num_bytes": 397670254, + "checksum": "049b3294c3e22e6db6c115979a4a55f0650966c600ca17250e91b241cc97bbd4" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00211-of-01024.json.gz": { + "num_bytes": 399643598, + "checksum": "7772f26fd90f47033670e7f1d3f6fe092116486bb9a991577f9560b54ed3832c" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00212-of-01024.json.gz": { + "num_bytes": 397390768, + "checksum": "7a24e4a70f43f6227fe6491fcc7bb6b2a19cae203521c803bedf8882c995d7e6" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00213-of-01024.json.gz": { + "num_bytes": 398657925, + "checksum": "21d0ee8d1a01957b56ac503aa88c6f3269b4e4692762a3f929fe0e7069be8c0a" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00214-of-01024.json.gz": { + "num_bytes": 398282324, + "checksum": "ede2d9824d8f99dd578a36ea82caae942ebcafd99f308cf5d0ff8aa4a56f0a05" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00215-of-01024.json.gz": { + "num_bytes": 399178235, + "checksum": "82516fa361dec02c7ed59ea2d0510d9ee4187609b449dca649a04141b12bc037" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00216-of-01024.json.gz": { + "num_bytes": 397630870, + "checksum": "4a6d5e60354b7b93f005010c6fc55c0a81596e98a116cdeec99e1ab4e58fd03e" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00217-of-01024.json.gz": { + "num_bytes": 398628848, + "checksum": "02dffb623b628a3a3ea38084fe6bb840aafab8419feed3d1f2bd3598cfa80aab" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00218-of-01024.json.gz": { + "num_bytes": 395087998, + "checksum": "e1e9a7ac7a922d6a9bb90f82cb48dff11ab7208dac08511e9613cd2726ca67ec" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00219-of-01024.json.gz": { + "num_bytes": 397622792, + "checksum": "955afc7d45a080ae137e9dc25ba3d85629a6a14c3d9bbe4065aa37d710345b7a" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00220-of-01024.json.gz": { + "num_bytes": 395112655, + "checksum": "a3560918bec20087e9908009a362957ecb06401924789e20b36c26e363db5ae7" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00221-of-01024.json.gz": { + "num_bytes": 397132000, + "checksum": "d8459bb5b6fb6b341b24fe517cfc5dc099765ad70c3383bae913229e06cf99e0" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00222-of-01024.json.gz": { + "num_bytes": 397138513, + "checksum": "20d3c6219921dc9c2928d637000e488635fd9a12b5636de5a6a7e52c1b67d781" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00223-of-01024.json.gz": { + "num_bytes": 397167661, + "checksum": "43a18accd194646893324537991e0162f6f98a9cec5ff59fe8fb510d81d707bc" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00224-of-01024.json.gz": { + "num_bytes": 397905941, + "checksum": "a516485cbefdef2e31a493cd8827a5f936f10674ff3525b71d414e17f48241c3" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00225-of-01024.json.gz": { + "num_bytes": 397218123, + "checksum": "791c85c78c5e7f3557855a1fc71acd860521710515b89f92e54e02960549f46e" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00226-of-01024.json.gz": { + "num_bytes": 396619135, + "checksum": "52a36037696e6245efad80e00d1f123c36dbd79e7ff52b1fb99f579e712d2b30" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00227-of-01024.json.gz": { + "num_bytes": 396654998, + "checksum": "e31123ab579fe95bd50afa10d52a51e9c15a4af28c06583fb5aeac4e3418f129" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00228-of-01024.json.gz": { + "num_bytes": 396899165, + "checksum": "86481361fff334dee3183fac8ab3f346e44ab3e6e7b35bbd7e6e062b2d2fa0d7" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00229-of-01024.json.gz": { + "num_bytes": 397489378, + "checksum": "bbb717711fb4c78ebe8a0476296a21a50285ec41d9fb9f08d5d66d899577e04a" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00230-of-01024.json.gz": { + "num_bytes": 397462301, + "checksum": "054414aac29b5c8faee71a918f2586ad3fce8ee44c71e7a2e2af4b91e0169523" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00231-of-01024.json.gz": { + "num_bytes": 396097584, + "checksum": "8136e320fccba75a493954fefbb560f92532be44a6e0990404edae659d48ce1e" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00232-of-01024.json.gz": { + "num_bytes": 398984795, + "checksum": "3d9362aab157beef3b5fcd4a0a0236d59de635a565b1c86423f45b26e8b437b5" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00233-of-01024.json.gz": { + "num_bytes": 397258012, + "checksum": "e1a532922477d17f7cbea7db72c2391d26b4db580e526ebd5a90be23607a8d31" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00234-of-01024.json.gz": { + "num_bytes": 398350453, + "checksum": "c464829565bcaafdba165b2d886be4580f3c0a516b5417853ffc4fe30049cffe" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00235-of-01024.json.gz": { + "num_bytes": 397147353, + "checksum": "573a6a1d33ccc6c5b605d381f04d73989504bb6d24514b938e92c3d4f61501e8" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00236-of-01024.json.gz": { + "num_bytes": 396963006, + "checksum": "21318462014bc185d0da7cbd342fddd07521401ca2b73e47eb5cb4bd42a82bbe" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00237-of-01024.json.gz": { + "num_bytes": 397087111, + "checksum": "49459c97b078726bf8377748d4bb2066bdfa47e2717315a9b3c8075cfc4b9b10" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00238-of-01024.json.gz": { + "num_bytes": 396984031, + "checksum": "befb46e9f928876edc580c60ea4242f63cf6df77c6c107fec6e4280d279e348d" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00239-of-01024.json.gz": { + "num_bytes": 395915197, + "checksum": "dc5ab17e04e4f2678771094af67909dcaa8be36a6cb047cfa66e75f986c91312" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00240-of-01024.json.gz": { + "num_bytes": 398321096, + "checksum": "25b92f7a499e9aaf0496a57f6292a7f65941b34dd6c78f14b08358d180070029" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00241-of-01024.json.gz": { + "num_bytes": 396626980, + "checksum": "1ae21ee5585ec718763a3c7bd70d9338aaf77d0e02f92a41f6ed213d1eefa5b4" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00242-of-01024.json.gz": { + "num_bytes": 398220596, + "checksum": "c29f98174a0c02a817d5cfa3ebb2a92d5f49df8a34fa40abd360f1b39b4bde05" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00243-of-01024.json.gz": { + "num_bytes": 398250083, + "checksum": "819387c95ea7183b1f9e1e78d077de65023c4809198ef3a0c946f46f8b6c19b4" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00244-of-01024.json.gz": { + "num_bytes": 396943969, + "checksum": "7a0b0b984d7afc4181827705212f917cf4ac12412f640a2c8120513763cdb390" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00245-of-01024.json.gz": { + "num_bytes": 398365865, + "checksum": "a424157137a5eeca89819d600deea2a1619ea8f5ae1ed395c88ac600a85e3afa" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00246-of-01024.json.gz": { + "num_bytes": 397285385, + "checksum": "73029f721bdaccd9d126e871973e70a551f48f077f5903656b305ea9885c4798" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00247-of-01024.json.gz": { + "num_bytes": 397132841, + "checksum": "b223cf1270d2c728592ec65b09599bbdef8d64f7df2eb525e114f86268500daa" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00248-of-01024.json.gz": { + "num_bytes": 396316645, + "checksum": "94102d9bcc086ed5b203bc0c6b830dd245c9bf6c695b23b19922b2a98eeb6a52" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00249-of-01024.json.gz": { + "num_bytes": 396644237, + "checksum": "36be793f4d76070ba1c696b3274e6dbab43f415c8fbaf752145cc99af6558680" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00250-of-01024.json.gz": { + "num_bytes": 395860541, + "checksum": "313febcf026d2cd1495fdd3d5ba3b492ce5d5749153e189672b6d9dff3e26a61" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00251-of-01024.json.gz": { + "num_bytes": 396709140, + "checksum": "7e2480b3d5869ba35007c40e18585f3fa208cdf8e004078cc8de4fac36773507" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00252-of-01024.json.gz": { + "num_bytes": 396508847, + "checksum": "25df46ae56c0d4a6f945922e31fc697d12e0b7c525be9bc2b8eced802641488d" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00253-of-01024.json.gz": { + "num_bytes": 396364816, + "checksum": "6b2125b9eab9bf893e7f8913a6beedbeeef5de53893fbd6172f706e33bab5177" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00254-of-01024.json.gz": { + "num_bytes": 396122930, + "checksum": "7947e5152c5305863e2d664622e3de49f9386b4384eb09630c5bfcad21fb458e" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00255-of-01024.json.gz": { + "num_bytes": 396929803, + "checksum": "a1ec8c609ac969c24e2524f0f3dc31ef43ca0147ffe66569d3135e4f28394325" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00256-of-01024.json.gz": { + "num_bytes": 398432943, + "checksum": "3fd0373f5a8974a3499c436d96ea73be95f5619b8388dc316f51aff01e9ecad7" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00257-of-01024.json.gz": { + "num_bytes": 396003748, + "checksum": "516cf3626076f083962983b2d6c596ef355609492f2e81c6c3cdec01acf8c5d7" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00258-of-01024.json.gz": { + "num_bytes": 393890690, + "checksum": "700760a7764f890c8aae337e7ee458c8467eb9048347edd237e341dd2bd5d236" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00259-of-01024.json.gz": { + "num_bytes": 398130606, + "checksum": "d868f8ef5e1cc971ffd00908bdc7eace32ec151d7405d7cac5fac22df9ea10c0" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00260-of-01024.json.gz": { + "num_bytes": 399765969, + "checksum": "7d5eb3b88eb8a0291ae70c1997458cf5aecac645397e50a67fab3d1193064353" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00261-of-01024.json.gz": { + "num_bytes": 397418895, + "checksum": "ca607c9e13d7cfb73a29ee3131f77e6bef3130d8627037cef9f57ed459185f0a" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00262-of-01024.json.gz": { + "num_bytes": 397925991, + "checksum": "ca789394ab4398c41490ec6147a41ffc8847155ea9ff74d7ff8b3402ed0634e8" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00263-of-01024.json.gz": { + "num_bytes": 397082336, + "checksum": "aac81d1bf0ade80758c14d01842b9b06c89ebf2fcdb9a06b1472bf2f70bbc348" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00264-of-01024.json.gz": { + "num_bytes": 398101079, + "checksum": "3cf56a2989b5c3f26ba94124cc534f5c9ae9770bdc6a3431dd745603b480ab19" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00265-of-01024.json.gz": { + "num_bytes": 396949669, + "checksum": "d4f252a6c2f43833d6d89bf69337449b4cae5dc88fd08fb20b35fe7194a50ddb" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00266-of-01024.json.gz": { + "num_bytes": 396242007, + "checksum": "71c745968d8ee4a0d64f38930a76e65d68ea094ba3e0b963d5d6878f65f51b34" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00267-of-01024.json.gz": { + "num_bytes": 398342031, + "checksum": "706a560c862979594265925c3200d4bd0981a9eaa279841f2cba673634f7074b" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00268-of-01024.json.gz": { + "num_bytes": 396399468, + "checksum": "eb3dea553c37f220b3b9b5f377d5a4ef94243b3c0b6b46981e3e5b7ba5b4a935" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00269-of-01024.json.gz": { + "num_bytes": 397181296, + "checksum": "4f0feae035dacaeb720ca3b6ea17685144895a0d78cfa358e30983f8d6c4ec76" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00270-of-01024.json.gz": { + "num_bytes": 395712883, + "checksum": "6e0f6de1e5a5c6d4bf23d0539ee72ecc2b4285da2b0f1ec2cdcc443d2e22aa88" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00271-of-01024.json.gz": { + "num_bytes": 398066980, + "checksum": "4c5cd1ef1917ed762d7d8c5c54e1da05db74e45721697df8b0626e0aeac96966" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00272-of-01024.json.gz": { + "num_bytes": 396667308, + "checksum": "77a33c37a5d88e419e2b31cf560d53f129a38e5bc2306b5baccc187b7e94e589" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00273-of-01024.json.gz": { + "num_bytes": 396020214, + "checksum": "b18e40c00b8e0e02dfac40ea0519964e231c8a2f28bc1294b044fb090f41a9fb" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00274-of-01024.json.gz": { + "num_bytes": 396300833, + "checksum": "34c8945a6ebac564fe87881d6968d05363a89985f297692a3df7104128b9c26c" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00275-of-01024.json.gz": { + "num_bytes": 395206463, + "checksum": "1e41d7e2a6117224dc23fbaae8e9d20df9d7744adb4687d2b0e570bf8d9e47f2" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00276-of-01024.json.gz": { + "num_bytes": 396667995, + "checksum": "45973b91c2f1140f79265a24f484fc6d6653f43f83d5bd2d18954892dfa4dfae" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00277-of-01024.json.gz": { + "num_bytes": 398134029, + "checksum": "b7da91889b6695cf01bceddfc139b23f9465bda5cad54088b84a1f5a4d7a4f9a" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00278-of-01024.json.gz": { + "num_bytes": 397422615, + "checksum": "e794a2903bda1f3c082e8f590383c714a518c202ecb99eda5513d6b320f70e86" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00279-of-01024.json.gz": { + "num_bytes": 398776175, + "checksum": "a5528d3e33151138ef9bdc2433744f1797de2b20673a570de5bd4d81b306354a" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00280-of-01024.json.gz": { + "num_bytes": 396208086, + "checksum": "1be2d8c3d0eca510fac7b06a5401b2b8873bc6dfbf85a3c736301756f9681309" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00281-of-01024.json.gz": { + "num_bytes": 396893734, + "checksum": "1db3e9017561d38a91c417ffef875b7a948c4f64c51b90b0983c71bc9d950903" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00282-of-01024.json.gz": { + "num_bytes": 397411883, + "checksum": "4e23d39fcec2c310cbde3fdc5d9c185046086877ac03bbf9d772b092614f93da" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00283-of-01024.json.gz": { + "num_bytes": 397906911, + "checksum": "850eb5e60b84bca4d2f10b2e511fdb2661e3d08444a07db1782ad85c754fe808" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00284-of-01024.json.gz": { + "num_bytes": 396043261, + "checksum": "fea24050c6aec13eb706a6f3854b4debde62b1b842f2992fc027820c66218b0f" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00285-of-01024.json.gz": { + "num_bytes": 396961329, + "checksum": "6052f82887cd2362320f72f6545d2e5b5a775e9bef95783c9b9995ecb7a5ecc4" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00286-of-01024.json.gz": { + "num_bytes": 395697481, + "checksum": "f4361838b5b679c8306447364166c1c3083af392b4c8793399c122af09c7312a" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00287-of-01024.json.gz": { + "num_bytes": 398773520, + "checksum": "9add91f23f31ff8c5d8d84e6a0af75fc6fa08ceef8ccd9b633d8c49aa1d0104d" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00288-of-01024.json.gz": { + "num_bytes": 397684645, + "checksum": "64dc94555a122353c3a3c9999e67d17b0e4b682096ba80be2258c791ce1c2b9d" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00289-of-01024.json.gz": { + "num_bytes": 396655864, + "checksum": "2472c76b1cbcfc3cb82126795673126e8f532119a03722a304396ceee9b7db3a" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00290-of-01024.json.gz": { + "num_bytes": 397415313, + "checksum": "960b71edbdc6a6a62a0d3cc1069bbbfb11893cc017aba543e10c9a23cb759d1b" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00291-of-01024.json.gz": { + "num_bytes": 395617977, + "checksum": "96e582d7a750bee597331f373ec2e16d3a9686f48a49d39765d39550c8cbbad8" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00292-of-01024.json.gz": { + "num_bytes": 399332500, + "checksum": "cd6ec4941aa5babbe274684945bf899447ec2459b8f7076ec8c74d2b3fe794c5" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00293-of-01024.json.gz": { + "num_bytes": 397021546, + "checksum": "d0d0c4d80e75c5d02103b49027d9e2e6f7db74c12f8b53f600d7fe420b2d0a7a" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00294-of-01024.json.gz": { + "num_bytes": 396272726, + "checksum": "caf5708a6989f867ec6c4c56f338aca9f3a43a1806a27ef473d9b0f219001cb4" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00295-of-01024.json.gz": { + "num_bytes": 395233811, + "checksum": "a7b5f904e34c0b370238e6beb19149d4bb96d0cce43a1eca3bfaf181952ede53" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00296-of-01024.json.gz": { + "num_bytes": 396480926, + "checksum": "4fcf284d98c2f7b63e47573e9d084eeec2516fbfa62be42c3ff94e1cf518e313" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00297-of-01024.json.gz": { + "num_bytes": 398883718, + "checksum": "c1cb458076497e7dee645f50281d1af2fe5dad556d28a2cbbd73abe6537c8a9d" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00298-of-01024.json.gz": { + "num_bytes": 398733629, + "checksum": "4a612c715025292e62860fb0018e9fa2d3fade692342746d044be6297e25a034" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00299-of-01024.json.gz": { + "num_bytes": 398155026, + "checksum": "d33f4043fad9551f92084a45b7f54d920ded9d6fec271cbbf85f71b021f9ee4f" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00300-of-01024.json.gz": { + "num_bytes": 398612975, + "checksum": "61b1181b796a2f40db3cb6954f2890397c3722c486dccd4075d74679cf61a70c" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00301-of-01024.json.gz": { + "num_bytes": 395385748, + "checksum": "95a78e9d3cece0620430c85822fedf4021ebd88ece57d6714933c268d3b6af6c" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00302-of-01024.json.gz": { + "num_bytes": 397620059, + "checksum": "321aed402a5e779febe9766294ad040a3f8dcf57bae68648c03d3c59023aafa3" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00303-of-01024.json.gz": { + "num_bytes": 396549027, + "checksum": "4198f6a2b5bdaf90ac4251f013908123a5964429870ccd6b245a9069278c4e17" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00304-of-01024.json.gz": { + "num_bytes": 396596460, + "checksum": "74a6440e93d18d0d6d0622ab7d8832d7ccc91c03297faf20c8090d16f7c042d6" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00305-of-01024.json.gz": { + "num_bytes": 394881271, + "checksum": "654deec494bba4eece19c27140426049574cf529c93ccb422fcc09fe4496af15" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00306-of-01024.json.gz": { + "num_bytes": 397760377, + "checksum": "e0840cbc94db6cfc35df66d413a11261756392dd59b0fdf89d9ff166ec76f3e5" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00307-of-01024.json.gz": { + "num_bytes": 396671816, + "checksum": "31ceb8cfcd09fda621a9a483b09dfb43f5436e867363f6736ea3f710a6af10fa" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00308-of-01024.json.gz": { + "num_bytes": 395961013, + "checksum": "8c1e5acc3f964eaa5aff300731a74dde84ed0671cd764b121ea638fb08c3dd0b" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00309-of-01024.json.gz": { + "num_bytes": 396035179, + "checksum": "7d555942b1bcb2518aa5ff9c0549d98fabe7bb563cdc6c73d3f11e6a0bc502b4" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00310-of-01024.json.gz": { + "num_bytes": 397140669, + "checksum": "859eeb7a9d2ed03d5299bbf7f1c3e719236477950d7601112a458ea5a2adf7c9" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00311-of-01024.json.gz": { + "num_bytes": 398170419, + "checksum": "1e7661637b0a4445119ba403e4f8ede129c829fb7d1907ca7660870b536b8b29" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00312-of-01024.json.gz": { + "num_bytes": 395605627, + "checksum": "87a3ccd2ac9deff1ac4a5dd02bba269a48692d4598c5899630e8d2e4136dbb99" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00313-of-01024.json.gz": { + "num_bytes": 397081206, + "checksum": "c6952116cf573a6e20c849cf1b7d8d0edf3b9d00fc7e717e7bacde915c4c52a8" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00314-of-01024.json.gz": { + "num_bytes": 395555727, + "checksum": "762066fd85c596ee01b3b8070708517cc5759bb1e3c4bb65f4645fd62b550d13" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00315-of-01024.json.gz": { + "num_bytes": 397871218, + "checksum": "814f19cc5e81144f5bfd7037f5f522dd5c44faf150c10337c675174a5965a5b9" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00316-of-01024.json.gz": { + "num_bytes": 398577523, + "checksum": "27643c7c3c0a1a78c9003b936ea27785709a2df80d09817278a179eecaedc352" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00317-of-01024.json.gz": { + "num_bytes": 396388623, + "checksum": "5f840180e2017c41c6b1c865784788dc3b002478a9ecb43c3859174af788ba5b" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00318-of-01024.json.gz": { + "num_bytes": 396173471, + "checksum": "2aeab99fbc84a2640a05081e2c7438451e75f76cbece3cbe5d82e85463a61966" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00319-of-01024.json.gz": { + "num_bytes": 397912127, + "checksum": "fda805ed19f4b996b048386f4bd73924dc965a069e85b8b4452a54a1372375fb" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00320-of-01024.json.gz": { + "num_bytes": 398765416, + "checksum": "bce244d024c076911c1c6dbd35609be5442c8b0440690e2cbb342ac64bdc494b" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00321-of-01024.json.gz": { + "num_bytes": 396005962, + "checksum": "763584ee096223b8aeffb1576ec6e4f3bea674ec4de40fa163c2f2221b3701d9" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00322-of-01024.json.gz": { + "num_bytes": 398615672, + "checksum": "5c12ec1d0c450fb7515c586f24311bad145050dfc64180d65bacbd346c2ce9c4" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00323-of-01024.json.gz": { + "num_bytes": 397861187, + "checksum": "93326f43273fb963593e0b1caab1e9588387291c23d5c14b5ae40b46b199998c" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00324-of-01024.json.gz": { + "num_bytes": 396679008, + "checksum": "6ebfe6e28851e6d79cfdbf370602373fc2136e88936eece302ecaa8ef8251827" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00325-of-01024.json.gz": { + "num_bytes": 396358086, + "checksum": "51190fbfd48479842ec3c7d910b5519e01ff797ca0143c39be142c1650c5e893" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00326-of-01024.json.gz": { + "num_bytes": 396490692, + "checksum": "f4d9bbfd1bbc6e939fce9a2df26e45c79be73dbe2650fe79af395bdaa39cd121" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00327-of-01024.json.gz": { + "num_bytes": 398354656, + "checksum": "c70c824b6c16e5fad922ec9b8d363d97bed90501522b641b0eb0f66b8c086325" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00328-of-01024.json.gz": { + "num_bytes": 397326336, + "checksum": "7e6008433a0e5bc6eed28a13b9dba17246e7d65ca96c31092086c3546a3a397b" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00329-of-01024.json.gz": { + "num_bytes": 396390524, + "checksum": "f379d844a35172424554bb82a65c790c354b76c0e7abfd868225d1968017d1a5" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00330-of-01024.json.gz": { + "num_bytes": 398259199, + "checksum": "ea15be4a83c3de66c42410e13e5ef9c93baf86099a8eded1c1d10b0cd5ad0f29" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00331-of-01024.json.gz": { + "num_bytes": 397618860, + "checksum": "7b6aad6224ead9ee3a0c860cfd991301ef5e97093b23c76d713e73f4911d0e44" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00332-of-01024.json.gz": { + "num_bytes": 396743573, + "checksum": "bc5333d383020d2296aa0f6ec940ab586a367efe50d1c597f9db55ca72fa66e0" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00333-of-01024.json.gz": { + "num_bytes": 397460128, + "checksum": "095b3a85a9598009638622ca21cb00142efa0d68196c8c3a8bb922cccb465e8c" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00334-of-01024.json.gz": { + "num_bytes": 396900262, + "checksum": "6f005575f4843b84f4512e1b7c1b748edf497e4e9f55eaae47f9b4637161ccab" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00335-of-01024.json.gz": { + "num_bytes": 396106895, + "checksum": "66bfe399d0859f71c20db01de53ca7bf997b33afcd3d181f181d9f265a2c2fa2" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00336-of-01024.json.gz": { + "num_bytes": 397732616, + "checksum": "1f1e0435de870b98b119e91edd4a0d32d078dbb810f919a70b85360cd860f0cc" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00337-of-01024.json.gz": { + "num_bytes": 397834763, + "checksum": "1db4bcdaa6fca612c3f1b38dad6d5402679ca21aa6a545850d61bcda10103697" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00338-of-01024.json.gz": { + "num_bytes": 396712179, + "checksum": "810c104a8862699c490fc8625a7be4115872fe2de4d8c061e095dc5a81eb4d19" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00339-of-01024.json.gz": { + "num_bytes": 396838831, + "checksum": "9bbc616d5c4aba46475957a22544dbdb0557f8de31cdf919718fbfe55bc70ac8" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00340-of-01024.json.gz": { + "num_bytes": 395587861, + "checksum": "48c8411ee2b5fc8cffe1589ed204d0ac8a12b5b3bb1857373f84bae984d49e8b" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00341-of-01024.json.gz": { + "num_bytes": 398093153, + "checksum": "4ff8ba83e489580da2401aaa23ca3329befe8fc08b6f299b612950c358688604" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00342-of-01024.json.gz": { + "num_bytes": 397248009, + "checksum": "c72e063f95d10ce661b4bc97538eccf6da6ad493b7e54da555a46e4a47aabbed" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00343-of-01024.json.gz": { + "num_bytes": 395939409, + "checksum": "249eb2080c55402aab34a31a442b06bcaa25d2df3f4319ea1a5f50dc6bb709b0" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00344-of-01024.json.gz": { + "num_bytes": 397608807, + "checksum": "8cc57604fcc5fa920b0d16df6e8d8b7f4ca88c0c76c86f9ac81f42a615b330e7" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00345-of-01024.json.gz": { + "num_bytes": 395751274, + "checksum": "13fbc76e49a8b856f7563b945bef10d786a86caff63b4cebea50416ca34932ad" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00346-of-01024.json.gz": { + "num_bytes": 395516794, + "checksum": "61d43da2e3e7770016ba7235eaa74a1e6a180e64cd2cfacefed5c34e8b72eca7" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00347-of-01024.json.gz": { + "num_bytes": 396180000, + "checksum": "4a0ca2103de168d05d0090c8800d47f216cc167a9cfe9e736403aedf040c5e46" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00348-of-01024.json.gz": { + "num_bytes": 398461180, + "checksum": "a56396961496499ac289a85d126b916132e787d0dc4fbd9961aca7dbbc7cfcff" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00349-of-01024.json.gz": { + "num_bytes": 398049366, + "checksum": "ca012572c575f6a8e6ad6453296ff93f22118995c17928e76b655da44ce5810b" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00350-of-01024.json.gz": { + "num_bytes": 396532962, + "checksum": "bb35d17862201063b46d8745dc182756d1bb09e809c4c355452ab1967e655491" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00351-of-01024.json.gz": { + "num_bytes": 396576223, + "checksum": "19ea45ab2fe5487d2a69cca7c9a1db7a09c8d5dfdf130412bbcd241cc60a61c5" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00352-of-01024.json.gz": { + "num_bytes": 395956381, + "checksum": "bb5869b8649fffadd5f1945ca9a79588e84081a8fc45b7e4cb5507149b5be2d9" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00353-of-01024.json.gz": { + "num_bytes": 398903623, + "checksum": "cb16a7ecadd28a8b5622c4e581f463f0ae2fe20a3e6582fa6885d76e7523715a" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00354-of-01024.json.gz": { + "num_bytes": 397316693, + "checksum": "42aea18548695c458ddc229d8c837356845609aca3bb64ce6e07b185443b9468" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00355-of-01024.json.gz": { + "num_bytes": 396240550, + "checksum": "1577d76807548d83427293b9f534a3261fb72a345569f0491a1fd2691047bd92" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00356-of-01024.json.gz": { + "num_bytes": 396132315, + "checksum": "b6e17a39292e082e517082b23b381305ebe889c2530fb5eb74a2683d36d07a86" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00357-of-01024.json.gz": { + "num_bytes": 395948117, + "checksum": "524ebed10c881f52f155db5d6690806f5a97aa8f811deadae916323b50427ed5" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00358-of-01024.json.gz": { + "num_bytes": 397397242, + "checksum": "8e23d852bc3a0dda4684d5fd511003ad6f18232e5f54e32638c8db62e9d18c6b" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00359-of-01024.json.gz": { + "num_bytes": 396141321, + "checksum": "345c34dafbc59f5e93355c8b2e6fcde6bf59bc9e1ebbf5cb962d54228e6d3204" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00360-of-01024.json.gz": { + "num_bytes": 397258644, + "checksum": "51db06055d95e2b43fddebf8c2b7d76b7572745f129d89fe005f8e5d3f12b758" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00361-of-01024.json.gz": { + "num_bytes": 397913411, + "checksum": "2c0f6054fef084d3e7cd10e2de0b1d3a48dc716af1e9146548195df128bdaba9" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00362-of-01024.json.gz": { + "num_bytes": 397722576, + "checksum": "664b390b20498eb6e78fc09604b3a947fc1847a01e3eaae4c7861d1dde3b90fb" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00363-of-01024.json.gz": { + "num_bytes": 395416894, + "checksum": "c57529884c6d4977a279a097c0dfbcc31d52048cdcf64950182c743583d7989a" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00364-of-01024.json.gz": { + "num_bytes": 397028679, + "checksum": "ed4f252d63c679f6e3f35847e0871c3360e072b0d6963f662d7e808b6615457f" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00365-of-01024.json.gz": { + "num_bytes": 397574891, + "checksum": "68e8e44a531d98897245fee90ad349f4fdee891b2f68dfda78a1dedcc9474326" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00366-of-01024.json.gz": { + "num_bytes": 396905692, + "checksum": "9e88b888d85633671e009ed7093763b934a42054ed6a1252222dc64781a20e22" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00367-of-01024.json.gz": { + "num_bytes": 396802011, + "checksum": "2abaf3f3946788258b8543fa2ccccc0c20e6980b9d26a38decd356e67f575fa1" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00368-of-01024.json.gz": { + "num_bytes": 395630737, + "checksum": "b4960e3395d8a1bf8350f57e5f6280b00443a4c6b85e6fd47478fbbfc1733caf" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00369-of-01024.json.gz": { + "num_bytes": 396228047, + "checksum": "08e8210426e6c6ef9746675592a3eea4a92eff9aa4bb7ffc6bf6ba54bc411f72" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00370-of-01024.json.gz": { + "num_bytes": 396548482, + "checksum": "10e0305ac4d1e410d749637e0c03386d969563f8eb73bbbc376fc1d21025e4ee" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00371-of-01024.json.gz": { + "num_bytes": 397344482, + "checksum": "03df0f4aa5c377f6b45db3c3b863240bfb1211ddb226bc055433fbcd9ee8e873" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00372-of-01024.json.gz": { + "num_bytes": 395872223, + "checksum": "9b70549213cb01595179928cdb020daaf7bcd2085c5e947d111f3cc66e406d2c" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00373-of-01024.json.gz": { + "num_bytes": 397399096, + "checksum": "945c204cdb107669a8d1252a91323eb300c902bdd6c6a8167a90805ec02cba9b" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00374-of-01024.json.gz": { + "num_bytes": 397755002, + "checksum": "8353d4383f73caceb5d112f260b37d1349dc7898af2d05b98ffe17d22aea97ca" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00375-of-01024.json.gz": { + "num_bytes": 396534763, + "checksum": "a3de41388a6d8ce3b605c6586e47b74a565dd2f54175551987bda0a0ff95036f" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00376-of-01024.json.gz": { + "num_bytes": 395594630, + "checksum": "7cadf813f2b31a1bfe44fdfc84aef4eb65e889c2616c56b189890734c22b731f" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00377-of-01024.json.gz": { + "num_bytes": 398241040, + "checksum": "15df154b52cb4d9314dbc4ac26ca4b4df7125b12131d538fd480f8a6b3fbdfc8" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00378-of-01024.json.gz": { + "num_bytes": 397217224, + "checksum": "208ce680427f62d78dad857bee91122a79f968589b4e44f2f89919e91f4dea30" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00379-of-01024.json.gz": { + "num_bytes": 398504097, + "checksum": "0052fe7f27e720423b6143f401b8618428d913b22fc2af2950874785e2ef7528" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00380-of-01024.json.gz": { + "num_bytes": 397494149, + "checksum": "15c4f07a2629c7bd79b243c97367e3e18de02b5ab09eccc0f85b1eba0e0b071a" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00381-of-01024.json.gz": { + "num_bytes": 397190859, + "checksum": "77c71b4a79ac2f462040ea0e8408fdb8f719fac0f09fadb760ed00b709e9dea5" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00382-of-01024.json.gz": { + "num_bytes": 398126420, + "checksum": "aa44d029398c33f733065c489ab3ded9395f6e53263407173b6e9c27b6fb9c45" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00383-of-01024.json.gz": { + "num_bytes": 399108296, + "checksum": "f507161fbe96f8abe9dedccba2458448719e6b153bcc1256ecee6b4b9c82256e" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00384-of-01024.json.gz": { + "num_bytes": 396156787, + "checksum": "83c236bbc8508fb81992c837751a4d8ad4b9bc138dd1f4bb5c1fcc68203e12da" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00385-of-01024.json.gz": { + "num_bytes": 396878483, + "checksum": "df45b4749951a46695f88789fc536617ee3470083e55562292f606e09185e4a6" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00386-of-01024.json.gz": { + "num_bytes": 397495799, + "checksum": "a8240c9e7266e47bda8880e38ac8a5afa8541aed4b989d6642b31497716a51ac" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00387-of-01024.json.gz": { + "num_bytes": 397062301, + "checksum": "e6fd54ea6f17d5570fa4cc97554813a7a33bd4e44cbc456b27b0c87c1af22c60" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00388-of-01024.json.gz": { + "num_bytes": 397074091, + "checksum": "fdc2a134df4a669deb839f26947c86b7e7a4bc7596a6a1c25562cb97fbb6b089" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00389-of-01024.json.gz": { + "num_bytes": 397056868, + "checksum": "e7390f0007582a3460fa67375b2628c85a1aa85954796d8e6584fadcb35761cc" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00390-of-01024.json.gz": { + "num_bytes": 396404332, + "checksum": "820a97060abd3172852f38e1636706c8389adad8495de56f4c3a2c3ba6008235" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00391-of-01024.json.gz": { + "num_bytes": 397125489, + "checksum": "68732c5ab9f4b6945e79ce2a1b45b97a97822d6a107aa79aa9135f29d91173ab" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00392-of-01024.json.gz": { + "num_bytes": 394992472, + "checksum": "c9d1e8cfd481631a76544e5880ceee9990e7553c88c5978a91b48ec8aa47717d" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00393-of-01024.json.gz": { + "num_bytes": 394778146, + "checksum": "7a5ec4f0878f676a3ac2c417f512186066d793f28d611f97135c3626b3b60fdd" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00394-of-01024.json.gz": { + "num_bytes": 397024190, + "checksum": "44e32db5a39684ab1789cfe97b6e9cbd3c539390e7a4c8ec9298e7177945452b" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00395-of-01024.json.gz": { + "num_bytes": 396537190, + "checksum": "601ec281240753ac5793ec7cb83802a788c4d88e56dfd83e6c875cf2ef9bd8f1" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00396-of-01024.json.gz": { + "num_bytes": 398049705, + "checksum": "b1024b69e191b2c7073f5f4f3ea51e8710be54db8603ce8aaabbfb919ea6694d" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00397-of-01024.json.gz": { + "num_bytes": 396670567, + "checksum": "11357bc600f9b0c443f124c7fa4046d10cf03e19016e5ba8cdde884d2ff76c9b" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00398-of-01024.json.gz": { + "num_bytes": 394706629, + "checksum": "778eca6d845b9a7d49e22941b959a95e5e4d2d9714720f27b810230d136acfde" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00399-of-01024.json.gz": { + "num_bytes": 398257272, + "checksum": "27c2a30af83975d32469e85fb2e27953a3aa9f97514f621063325cb9af1829fa" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00400-of-01024.json.gz": { + "num_bytes": 398732278, + "checksum": "aff9a39748526a03d3476288cdbce122c3683baf113362e9085895609d03c3c8" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00401-of-01024.json.gz": { + "num_bytes": 396372632, + "checksum": "a6af262bb962eb1c45d2003ee1bb2be1a3a12cb3e53d4ffe58b4b68dd852957f" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00402-of-01024.json.gz": { + "num_bytes": 396783625, + "checksum": "db9aca12012da21fc5a0619a47e9c3075959786d6d6d74f6a244af1cb33c402d" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00403-of-01024.json.gz": { + "num_bytes": 396950960, + "checksum": "b3566f7b9251f6aea9343d1344151f10fc104464f92e8f10a97742defffc2244" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00404-of-01024.json.gz": { + "num_bytes": 398481154, + "checksum": "897904040b5887620b9996cf89656f5bff329a430a8c3dfd6802d0c879675376" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00405-of-01024.json.gz": { + "num_bytes": 396065216, + "checksum": "45e0108549ab06d9a8ad5c45dc53250798d0e58f7e940080a754106801250009" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00406-of-01024.json.gz": { + "num_bytes": 395637879, + "checksum": "bda70f3a19b19e2ffdd1c3a26b959945b447acd450cab49e72ce727d2218af5f" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00407-of-01024.json.gz": { + "num_bytes": 398356109, + "checksum": "1df9e8b4715d9a3f02a0b06aef6095f81d38acd1be0b4fa402acaac0258c3116" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00408-of-01024.json.gz": { + "num_bytes": 396041456, + "checksum": "e89ebf354280543204e78f4308a8f8751cc26094524628cd8e9cb691d9911b82" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00409-of-01024.json.gz": { + "num_bytes": 396254329, + "checksum": "15729474174d6a5adb5935f25afa6de2f03a8dd2f73b780e23795ede92f5762d" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00410-of-01024.json.gz": { + "num_bytes": 397850848, + "checksum": "98f1b8fc845e0005b76d7eac70a430ce98e6989569344ea92266f8391b1396fe" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00411-of-01024.json.gz": { + "num_bytes": 395527322, + "checksum": "52b2e31f2adb61c8e703c6758016cbfc650f8104dcd5f78867c81434be155ea6" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00412-of-01024.json.gz": { + "num_bytes": 396155992, + "checksum": "7b6b4192f9bec4fdeaf9d6dcabd9cbba6b4c8ebb42d26730fea21bad139823c0" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00413-of-01024.json.gz": { + "num_bytes": 395766377, + "checksum": "775d1fac6b1708ba0384d922640b2f372b3ee146fc79fbe692ff69a7c6c699b1" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00414-of-01024.json.gz": { + "num_bytes": 394860848, + "checksum": "0386d8a8e0cc9d5d613b1f84085791de57ad05751d94d25681d86dff5cec1afb" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00415-of-01024.json.gz": { + "num_bytes": 397566065, + "checksum": "1957b0d185943b1952dc66e78f0a7d449f49f8f55fc0978bf77e8dde10f4714d" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00416-of-01024.json.gz": { + "num_bytes": 396297306, + "checksum": "3f8796934edb79d172e682511a5ed7666aa09ff541ce55e2c66406bdb6eeda9d" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00417-of-01024.json.gz": { + "num_bytes": 398314475, + "checksum": "8da08075b966c04aa7859275eefd34c78cd2b9edc366684733d027ad6d619ba7" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00418-of-01024.json.gz": { + "num_bytes": 396296110, + "checksum": "efe43733ebfc7b65c646aee68b883cf40124c1446a28e70ff2bfa9e1bb1377cc" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00419-of-01024.json.gz": { + "num_bytes": 397614415, + "checksum": "c0f02d78715de9c3ea0c684dad36a506386081fed2011ec298ca0ee623c7792e" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00420-of-01024.json.gz": { + "num_bytes": 395133656, + "checksum": "6237f5797a35dcdd89a0b70cac4dedcfb3fe418560f8dbbf6cad685f11c870b2" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00421-of-01024.json.gz": { + "num_bytes": 397061849, + "checksum": "ee37899a6a49269026633ec79577491ff4b11e219e0236dcba68eb168279067b" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00422-of-01024.json.gz": { + "num_bytes": 396539584, + "checksum": "e5914a4b97c27da82eaee2f4f67a165de946bb38a00d6126b1527f5eb1200417" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00423-of-01024.json.gz": { + "num_bytes": 397715346, + "checksum": "b99e628f8790a7baa8ee7828e31f2ec72374f9a8390c1d64c9b8092b10d9c7fe" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00424-of-01024.json.gz": { + "num_bytes": 396335469, + "checksum": "9cb3b9eb00760bb68f3df4b66b96f1e5798c338231500472fd64c49cd87c6599" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00425-of-01024.json.gz": { + "num_bytes": 396714466, + "checksum": "f28d4901ccde8eb7afcede9732ab94fd18c49e0e3731659ef587058d6ea2ab28" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00426-of-01024.json.gz": { + "num_bytes": 395566563, + "checksum": "9ab75a89a425ce974fd36e936476a30db913c2d7c9ca6e5522b91ffbcbbe30cf" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00427-of-01024.json.gz": { + "num_bytes": 395379035, + "checksum": "5e1ca658bea5ba5506afbb9ae5a5da4d35cdc3a215478c68e11652a7d5d918f5" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00428-of-01024.json.gz": { + "num_bytes": 396419259, + "checksum": "d740b37b576bcde0e1c8eee27c3bfb3b58c1a0d3c5b471001804b2a37f277ac9" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00429-of-01024.json.gz": { + "num_bytes": 397116774, + "checksum": "d1c10b0ba72aa2d4cb4640d1263c32868190942b1e93b4bb4e9798e25f10ba67" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00430-of-01024.json.gz": { + "num_bytes": 396634586, + "checksum": "11dec038b4c1c35d32d000915812b6ec8da9abbbec2e15f7493551198b6a1ef3" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00431-of-01024.json.gz": { + "num_bytes": 396704705, + "checksum": "efdfdef444cf68fc05090107033ffe2ac906b6efe2fc138e90f47cd4bd0b6204" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00432-of-01024.json.gz": { + "num_bytes": 396264701, + "checksum": "fa649c2e2dbc992408c3a60327e5d5ace4697c84010446bb286e544eb6c604be" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00433-of-01024.json.gz": { + "num_bytes": 396887722, + "checksum": "3d5fd3fbf209dfff2057143a3dcf7eceeccb1e85967a9a85a992f465e3522335" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00434-of-01024.json.gz": { + "num_bytes": 398856291, + "checksum": "ab6dc5343b052da901f4671c1cb3173850fbc6bbfac2623ca14936b2b83d9667" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00435-of-01024.json.gz": { + "num_bytes": 395888569, + "checksum": "26abd1e2263af02f998705501bd02ead2edc3d7f68fadc7b198e7fcf4dffc454" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00436-of-01024.json.gz": { + "num_bytes": 396976077, + "checksum": "a5dadf6ec93e8dcd62b0e1de3cb03c866147bafe0da8e631341663ccc03bb801" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00437-of-01024.json.gz": { + "num_bytes": 395809168, + "checksum": "7f98e98270f9b88570b5e498511ee65d07428db604af349ef9107dbcf65ac4e5" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00438-of-01024.json.gz": { + "num_bytes": 399136723, + "checksum": "0e03ec507b90b38d5b6d7dfe27d40e127efdc9a0bae349bea2e743375ea29b9d" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00439-of-01024.json.gz": { + "num_bytes": 396435416, + "checksum": "5f868ba66ea32a23be4a926fda0a86d0d2ab4948326e1ebac615fa16a2a6864d" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00440-of-01024.json.gz": { + "num_bytes": 397487165, + "checksum": "d30005787e7472313982cf2860e0a0764900b82a7bf616da27e6c1c3298eb215" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00441-of-01024.json.gz": { + "num_bytes": 395968030, + "checksum": "181461b447d88040130c3348ae7d22f220e0f97ace030d6f54301a9a3d483fc7" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00442-of-01024.json.gz": { + "num_bytes": 396909150, + "checksum": "0854cd3454047e0c6a0746ef21e0cbbb22fbdf4349c2e668f4fa1e49add183c1" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00443-of-01024.json.gz": { + "num_bytes": 396271897, + "checksum": "2493db29dd3cadef3719576c34213496eff807df5ae8cf538f13e84d403fec77" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00444-of-01024.json.gz": { + "num_bytes": 395540084, + "checksum": "5e717d9e0c1b6f728df0f206e422a0958a537dddf31fffa4d699e5bf4b3c2b16" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00445-of-01024.json.gz": { + "num_bytes": 398750991, + "checksum": "b8af9d413da48fb5f9a9174b12ad253b2eb2c1ed7709cab710d66710841568e3" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00446-of-01024.json.gz": { + "num_bytes": 397575547, + "checksum": "2bad5a914cb9f2e5e99d76afbf85eef66c18e7c1cf2e11c5d455792ae86ab441" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00447-of-01024.json.gz": { + "num_bytes": 398035036, + "checksum": "d834925674a33ed5eb8fcb335fd81b95e4ab882010e434e3fb9323e0f23be2bc" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00448-of-01024.json.gz": { + "num_bytes": 398658613, + "checksum": "16f3ac40180e47b9b97998f5d1d7c0e9336e2fee5612a3397fd161937f7a2b07" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00449-of-01024.json.gz": { + "num_bytes": 397934476, + "checksum": "09dd3d5a529f62b10d1ec97f37ed142315190fb437be3f50987ee955b11f7672" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00450-of-01024.json.gz": { + "num_bytes": 396444119, + "checksum": "8a25c11e0adc5fdf50944767fbfbf01a9c35b3c0e07205c7c06288d1f68b4c10" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00451-of-01024.json.gz": { + "num_bytes": 395963541, + "checksum": "f3ac2e295ca4b3ca1f55c8b500ea2588f1519163cec381297ad4bef390fbbe1c" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00452-of-01024.json.gz": { + "num_bytes": 396594911, + "checksum": "25a57709e934077c2972f0f8a1a9db7afe9b7558ab023bd6ee5224b2f8cd770a" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00453-of-01024.json.gz": { + "num_bytes": 396745507, + "checksum": "75c1a4803bb58efe5df885bccd13596d46dd1f3ea30899a7e83812167b990bde" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00454-of-01024.json.gz": { + "num_bytes": 396193342, + "checksum": "c151679573ea5f5b52e26e8b50da7e14760d1ec15c63a5b864b648190efd48f4" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00455-of-01024.json.gz": { + "num_bytes": 398096160, + "checksum": "7f86270b13ee4133adaa06de809f26ef581229407813fca05db521d9d36880dd" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00456-of-01024.json.gz": { + "num_bytes": 398965570, + "checksum": "d5b292189c5d318e0ad622eec1e764993084d0477147f51f29acd637935fec5c" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00457-of-01024.json.gz": { + "num_bytes": 396672892, + "checksum": "8b490f615b3ed701390ed671d5645dec4aa3fc576a032da8f9d434087c1eb8c0" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00458-of-01024.json.gz": { + "num_bytes": 396911580, + "checksum": "8bcadc16baaa4e36fe17ffc0862c264230385e18bbd861671ad5fd8cbb86404d" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00459-of-01024.json.gz": { + "num_bytes": 395969213, + "checksum": "b8ff8371a01d7bd1782044058ee0f53d4d1275ebca0870ba16104c1c4b12f07c" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00460-of-01024.json.gz": { + "num_bytes": 396928338, + "checksum": "23dde1fe55277467d6d2385684b71e90e9066e6a3c349a1da30a1487e87c8539" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00461-of-01024.json.gz": { + "num_bytes": 400009637, + "checksum": "34b98d46d207c5b6ea7416fab6f3cfcb1444cdc19376464ae9abb9296fd14c3b" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00462-of-01024.json.gz": { + "num_bytes": 398107677, + "checksum": "2031735c0f38ce43e37a5bb1b9728fc37c758fc4af71758c3d3b9535716a3253" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00463-of-01024.json.gz": { + "num_bytes": 395503017, + "checksum": "7820184904183fad9a61b6c638df9de11d4624bb3aca08885b842255172cecee" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00464-of-01024.json.gz": { + "num_bytes": 397493281, + "checksum": "b39b1b1e6686014a3c62e74912ec3b915dfc161b62e2d1108410354e6dec760a" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00465-of-01024.json.gz": { + "num_bytes": 397080149, + "checksum": "a65cc7f590cc498da334d5a8653e818421e09e5e6ce2e8bc2a29ac67a02c3d43" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00466-of-01024.json.gz": { + "num_bytes": 396633690, + "checksum": "15d891873ba02923893cbc8c42adc0468bb39161f898a810037cc2e9f82e0796" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00467-of-01024.json.gz": { + "num_bytes": 395045117, + "checksum": "711686ff5478ec35ccaaf1549b7a33b941e322585f702257dfe2d31630245ba9" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00468-of-01024.json.gz": { + "num_bytes": 399486439, + "checksum": "59c4599c8610f4c54778daedbb358f5e26fa527f8f94c3364b70565ebc90571e" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00469-of-01024.json.gz": { + "num_bytes": 396170105, + "checksum": "4263dbb03135c2d8b16fb323208f98fe1a1ff1223e76a7ba085f881411a0ab95" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00470-of-01024.json.gz": { + "num_bytes": 397479432, + "checksum": "2db90de8f4d2bde9af453478ed4667166f636af701bb487095311f99b28e59bd" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00471-of-01024.json.gz": { + "num_bytes": 396679096, + "checksum": "caea3c4744adb89f006d9b0d9ef93241a55c1fc165cb0cd62b6d07fa3a40cdc0" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00472-of-01024.json.gz": { + "num_bytes": 397080237, + "checksum": "34995676d953f4c95f8bd4f54fba8f92b86189cd73298ab77ee2702611b86e5e" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00473-of-01024.json.gz": { + "num_bytes": 397881706, + "checksum": "c0fc6c68ae509d8273e7ca0efbe24f1452a57dcb000f44f550fe9600fd305e62" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00474-of-01024.json.gz": { + "num_bytes": 397705270, + "checksum": "50aeb620f8c03a2e4f2346a0c79a4509adfae084ffbeff0b86d8892b858a821d" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00475-of-01024.json.gz": { + "num_bytes": 397201717, + "checksum": "4fa508d23abd417bdb0b0e7a61f9aedfb770609214cd85b10b4bde7ced7f12b4" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00476-of-01024.json.gz": { + "num_bytes": 397522775, + "checksum": "27da6164865687041e4f53d9ecec2edc877b147da5b424acbac2c69480132a08" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00477-of-01024.json.gz": { + "num_bytes": 397323156, + "checksum": "e40115fc4901a3930494652ce9ee7abb0c3f41abc6d6c58c81fa75a0ee752db8" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00478-of-01024.json.gz": { + "num_bytes": 397380721, + "checksum": "79a16b7016aed0eec375ca383eb316765687f12421f786b2e133faa5690ef197" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00479-of-01024.json.gz": { + "num_bytes": 396828680, + "checksum": "08185ce3c3e5b01552be7d8f08ed5b27a6b1b121bb2d7d70a78b7074fee02fa3" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00480-of-01024.json.gz": { + "num_bytes": 398678311, + "checksum": "37a5804dafb2f4aff9e393af5b127c3577ab8a5dd23f1e41f2304b25a4c428a6" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00481-of-01024.json.gz": { + "num_bytes": 397654112, + "checksum": "47ce12535b753d8936ce3b569675e76cb6f638bfb74a93caf201f3ffc409d71a" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00482-of-01024.json.gz": { + "num_bytes": 396387301, + "checksum": "1d07828a199bb1e1c0c8342ba99e484093557188370d1ced90803c2615d24b7b" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00483-of-01024.json.gz": { + "num_bytes": 397178863, + "checksum": "b6499612fac654798010e11c27ee8a25fc05d1dbed8aaf2338fd0ea377dc4732" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00484-of-01024.json.gz": { + "num_bytes": 395826769, + "checksum": "ce197ad5a226249bbba53c34b9f3c83508b542853748c3094a5b98befb537f2d" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00485-of-01024.json.gz": { + "num_bytes": 397100006, + "checksum": "f483044a4a0418b695e0b989f0fd03bfa79df01b649991f2356443bcb29d0820" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00486-of-01024.json.gz": { + "num_bytes": 397658615, + "checksum": "297beef7b85dc128a6a58d834c5fd1b24bd7fe84c7a317500461720c742235f1" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00487-of-01024.json.gz": { + "num_bytes": 396904673, + "checksum": "06751938694fad1645ed575208e8e2c1efebb7165b4feb2d0ea871dc348741f8" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00488-of-01024.json.gz": { + "num_bytes": 398019631, + "checksum": "eb58bf8b011fedf15835841317e445e9e757c9939b4453a013233f020f98a697" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00489-of-01024.json.gz": { + "num_bytes": 395822836, + "checksum": "b339e33e7affbdaf691852d3668ff79adf8476a3c33eb86ad9f4ad4a6ebbf3dc" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00490-of-01024.json.gz": { + "num_bytes": 398410737, + "checksum": "4d8356cf804474538772c5520e77e75ac750dce3e6b103c9feab49ccd46a58ff" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00491-of-01024.json.gz": { + "num_bytes": 396607853, + "checksum": "1757097fb884d03aa288a05870016b1c2b9f1700ac5913d85c9821cf2e367702" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00492-of-01024.json.gz": { + "num_bytes": 397612443, + "checksum": "92e98e431a378e0402d81299c49209c66d39b0ba7ae63711f8d6ecf542f5fdf7" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00493-of-01024.json.gz": { + "num_bytes": 395595466, + "checksum": "d839e1763aa6ebc7cbcf1b870d947ba45b0b4ac95b0adbe4941a0b121690a311" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00494-of-01024.json.gz": { + "num_bytes": 400397068, + "checksum": "31caeb5f0ef694c06ce434df44c01f4a91fcd48e4acb4f1bf167eae6e59a02de" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00495-of-01024.json.gz": { + "num_bytes": 396458630, + "checksum": "26291dfcae5145cdc306317ecf95851a3f693b4a7c6e132e55384ec69d85ef3c" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00496-of-01024.json.gz": { + "num_bytes": 395037560, + "checksum": "b32344b92f81006ad9e2e471f5ef8133e87924c5150145b13d51c3d7a0f68c46" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00497-of-01024.json.gz": { + "num_bytes": 396247929, + "checksum": "0396f0bb16b06ff130e955f260233ec868ada1daef6e8cbd480ce388628d49b9" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00498-of-01024.json.gz": { + "num_bytes": 394798084, + "checksum": "28d43d4e7bbce4e20167741ea2bbc3f17981aa51f9c040cfc41c522e732c6d32" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00499-of-01024.json.gz": { + "num_bytes": 396699883, + "checksum": "c6f6deff919b375fb08c74e159c25aa66362e4cddb0700f9b1e0e2701293ae70" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00500-of-01024.json.gz": { + "num_bytes": 397014521, + "checksum": "7ee22957fdfad0880f132f47860612331afce7a48975b9312233ba8ddf537bed" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00501-of-01024.json.gz": { + "num_bytes": 399063718, + "checksum": "ec94186b620037002819cd40347e6aaf67cb847848483790cd687222c9addbbf" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00502-of-01024.json.gz": { + "num_bytes": 396938850, + "checksum": "a218de10cee75c4bb5a7102fbe208e6e65142ba5f960ecdc2b56b6f85fa30840" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00503-of-01024.json.gz": { + "num_bytes": 394631309, + "checksum": "8189de9454986f63253fa1ad44c63d5c2f692ff4bc3a848c7c2fd02e08f4e1b9" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00504-of-01024.json.gz": { + "num_bytes": 397884411, + "checksum": "b7b268545c27573840bf8a6abb7361c209f92f9b5f0f8028fffd49b0c773854b" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00505-of-01024.json.gz": { + "num_bytes": 395784113, + "checksum": "b9f1610be9f045c15e43a7343bd2918743a71585a7122a4e781533dd39a73132" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00506-of-01024.json.gz": { + "num_bytes": 397939195, + "checksum": "f07b77d1be71c5922321e8683140f9a63a90903f1fbd1515d908807e12fc4597" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00507-of-01024.json.gz": { + "num_bytes": 395925741, + "checksum": "23e9927e9e83fd03e9d99c3fac05f1bf63d6c296a2b02d1aa208798d27d8dc1c" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00508-of-01024.json.gz": { + "num_bytes": 397426015, + "checksum": "f4b8a74c610cea50a6b144337f65fcfed11fff21df6683503f25d4b82e29a4e4" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00509-of-01024.json.gz": { + "num_bytes": 399072341, + "checksum": "c3069ae9658273cbaeaed1730f171837c8d3042e31d1093cf0f519f601309a41" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00510-of-01024.json.gz": { + "num_bytes": 395859781, + "checksum": "e5863648f64423397ca1a7838df18aeddbb3d5d3a2551321fd99a480508fa86f" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00511-of-01024.json.gz": { + "num_bytes": 396948832, + "checksum": "a2209ec05a794f083cf163c102c6ddd8d5e5627674686950e17e586128a81e60" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00512-of-01024.json.gz": { + "num_bytes": 396585426, + "checksum": "1c6fdb002dab490e6ddd7fe6023b2124bb944b7ebe95ee3b7faca9a92f4b5de3" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00513-of-01024.json.gz": { + "num_bytes": 396789970, + "checksum": "83b02c0cf9ffea9d021adc102269c30a33ab3a803d331ba8d39aaa9b3b7acb43" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00514-of-01024.json.gz": { + "num_bytes": 397131474, + "checksum": "783f25460641cd3532c3bb3920c7d3f0c68b5e674d44cba33b1ed755608cf8ba" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00515-of-01024.json.gz": { + "num_bytes": 396127068, + "checksum": "61e5b9947f77d929442f23fe84465d88044631aa1eb6438a0b86372cba7286fa" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00516-of-01024.json.gz": { + "num_bytes": 397526020, + "checksum": "539b032f528d1ec3a8e8420514ef2118f05482297b052f6d28876a8bf776a080" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00517-of-01024.json.gz": { + "num_bytes": 397748661, + "checksum": "03b85a51aa7bcde672cc017fcbb0f11976cbd1447fc0ccb4f4bc822b2b04b27b" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00518-of-01024.json.gz": { + "num_bytes": 397915751, + "checksum": "80dec6dc7d15459c113c16f23978c38cdc1157ca18468d8a00e0d2192bb2ffd9" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00519-of-01024.json.gz": { + "num_bytes": 397847480, + "checksum": "7125e7915fd03c6312cfe448e4e7a8629249765c13d8558b17c240c2aef713b4" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00520-of-01024.json.gz": { + "num_bytes": 396232144, + "checksum": "27974f9766c18fd0b652c94eafa3493243c8e1b25b6e850e857ab6246b193b48" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00521-of-01024.json.gz": { + "num_bytes": 395111538, + "checksum": "61406e92a8f9a6ab800b3dd25cbac842e3487a4c7db7b1bb2070a41d627367a0" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00522-of-01024.json.gz": { + "num_bytes": 397690206, + "checksum": "b2e29801d120132a5fbbd3662a54290e46ff5e178b3146ebfc2169facf72e7e4" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00523-of-01024.json.gz": { + "num_bytes": 398274007, + "checksum": "79905dbc45756c9f1c225120709d39cbf3caf435e322a531a4add690a1d0440c" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00524-of-01024.json.gz": { + "num_bytes": 395689218, + "checksum": "1dc3086cb869abb13862970186f6a77cb29b687cd49518173f639c148d937f6b" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00525-of-01024.json.gz": { + "num_bytes": 397979085, + "checksum": "6958bbc6029c00229fb0059d016a6b7a2bd21cfdc69392893423d2657c35c7c5" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00526-of-01024.json.gz": { + "num_bytes": 398473877, + "checksum": "895f42c4e7569f0db3832af13e56499f65fff74e93fc0cdf60c1c4b4b08881c9" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00527-of-01024.json.gz": { + "num_bytes": 395879939, + "checksum": "e84e72048b56878b1ff904ee83d92c208e15b16663b99a9d763edc23c2e0e55f" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00528-of-01024.json.gz": { + "num_bytes": 396472889, + "checksum": "badcc3cda339c61936591e9333787ea032c42d7ff2288fdaff791bdc8504ce96" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00529-of-01024.json.gz": { + "num_bytes": 396983038, + "checksum": "ad20643f9d50c7c508fa136ceed0039ce39708e0e7a5e743c1981f1000bc3c4e" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00530-of-01024.json.gz": { + "num_bytes": 395774249, + "checksum": "9453fa3fd296150b436f0146171ea8317512c6735ee9434622a83765a5d9e310" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00531-of-01024.json.gz": { + "num_bytes": 396171120, + "checksum": "3e3c230ab6beda13e4dd4747c7c6291e57b1ccb4a96ac2edb46ffdb4c3cb05b5" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00532-of-01024.json.gz": { + "num_bytes": 396200411, + "checksum": "e9b52c3dad233fd1c4310cf5f76c2e6d0788ed084abcf931f99ab7002976d75b" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00533-of-01024.json.gz": { + "num_bytes": 395580851, + "checksum": "e135cc4420d9f4d17ab523f7db8c559021a46a9a6bcdd21a6c4075047465906e" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00534-of-01024.json.gz": { + "num_bytes": 397459281, + "checksum": "bb4f32ee1c1bedf4582b0f4f9ec7644be73fa25bf18cca7506e3c26e98818bad" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00535-of-01024.json.gz": { + "num_bytes": 397344480, + "checksum": "3766ddf8313c5cee08a575fa96bdde06a5b293f1964e58293ea583d72bd18e20" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00536-of-01024.json.gz": { + "num_bytes": 396588089, + "checksum": "56d236a4250f9488d80b93c0c005962d018da256ea5632c7e16ae26c54188749" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00537-of-01024.json.gz": { + "num_bytes": 397606873, + "checksum": "d7ec24ef99de2769937b89e0ca7e291eca2bd0438d501d9228d5ab035f49d83e" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00538-of-01024.json.gz": { + "num_bytes": 397608864, + "checksum": "1a60378a0f1a200b11f85577bbd0f373ae47022eab16fad53da492ca1ed35bfd" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00539-of-01024.json.gz": { + "num_bytes": 398377669, + "checksum": "787d263107eb09e852b015c17d1d0f54d8b93e78292c0c1e60cf99f27535c608" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00540-of-01024.json.gz": { + "num_bytes": 398516980, + "checksum": "dce03ef0813ef66e27df8730da7e341b49bf7e684bffd3a9cf700905501d1d72" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00541-of-01024.json.gz": { + "num_bytes": 395557685, + "checksum": "e4035222d65124bd3e33372b76b65c2dad9e696701607ceeb5968d483595645c" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00542-of-01024.json.gz": { + "num_bytes": 395725875, + "checksum": "4e7ae0b1c0c4d514e0208e21336d095fea5970475077d6690a917faadb2b72b4" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00543-of-01024.json.gz": { + "num_bytes": 397625187, + "checksum": "a96ac467b6ace74a08f7dbc4bb8e3fc57fae36abc8975d6b60a7b7353ca9ca88" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00544-of-01024.json.gz": { + "num_bytes": 397078230, + "checksum": "337470c84cde5d02bc6a89003a6796de9e63db269e7800637ef2d220d75bd3ae" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00545-of-01024.json.gz": { + "num_bytes": 396145060, + "checksum": "da65d66aa4cfff77c754f8017eedd92cb82494b9425c2d5c5491d64603b2231e" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00546-of-01024.json.gz": { + "num_bytes": 396093007, + "checksum": "399f7b70d1c1b45ce315f396d5fa0db2c69e41c522b0514e19bcc6802b953b1f" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00547-of-01024.json.gz": { + "num_bytes": 397457696, + "checksum": "47fc8fd82271e6b1fb074512da45dc005e22cb7f0aca3b7b621ea87613aeff9b" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00548-of-01024.json.gz": { + "num_bytes": 396246097, + "checksum": "3108770b39746852d7c048d9a8777722480505bbf4592732c7d1f231e2505c55" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00549-of-01024.json.gz": { + "num_bytes": 393096516, + "checksum": "9bb2b88775593afe4060349985ff4417a37f1ba9b4ef33399c58644c01a92b89" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00550-of-01024.json.gz": { + "num_bytes": 396631619, + "checksum": "cbb55d645d145ecc2ff9b96524463f82d5548c0bdf42381fc6faaad256e7ead7" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00551-of-01024.json.gz": { + "num_bytes": 396806780, + "checksum": "ece03d7f12daa39473b6b8d5faed08a3f751efb9b1ee99f69c5188633d4a0f43" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00552-of-01024.json.gz": { + "num_bytes": 398608968, + "checksum": "7fbbde9c39d67d8d7f9f16c0848188b743c6ff5bc44e6339d5fd88c32e1aafef" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00553-of-01024.json.gz": { + "num_bytes": 397696672, + "checksum": "85f9c5c5fbcfd06f715b520a1a3a63a014b1831d2f65de5f02cfea49a18ddf63" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00554-of-01024.json.gz": { + "num_bytes": 397122204, + "checksum": "78e3d43c3d2b71d8483788a085cd5706648767de7a2fc4aab707d6a05257ff00" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00555-of-01024.json.gz": { + "num_bytes": 398704893, + "checksum": "113e5fd99ada6ca96c086487b6e4012bad711d1d482d580e22d3af5b9d118572" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00556-of-01024.json.gz": { + "num_bytes": 398099675, + "checksum": "c7a816f8f2f74b4554ac17ffc41e67ebbcabb7c8b0c94292b4569bea372bea3d" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00557-of-01024.json.gz": { + "num_bytes": 396538561, + "checksum": "7af6d2c9886481a0d393e026739b5ad7d0fc358ecc216d2fc124160402d4b50a" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00558-of-01024.json.gz": { + "num_bytes": 397660839, + "checksum": "c1033428189671d4e1ba55c822040f307748c6ec31b80be3e4ed8e7a4325066b" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00559-of-01024.json.gz": { + "num_bytes": 398754128, + "checksum": "69c9f88840166363f2b7ddaef05ac9d10441fd184d8451abfde76eb105572342" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00560-of-01024.json.gz": { + "num_bytes": 394988981, + "checksum": "a2dc4fc315a0db8f1a868d631d2941ab2806f44c2ae698e94bb7e8308bd67c70" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00561-of-01024.json.gz": { + "num_bytes": 395801300, + "checksum": "dc1b2b4594e3fc7f8795f7649d1c524405edce56d617f1e214692565de8c8937" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00562-of-01024.json.gz": { + "num_bytes": 398322250, + "checksum": "c23404fef6a6b5b887cc2dddfe341e983939ae36078d62842919a3739c96b43a" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00563-of-01024.json.gz": { + "num_bytes": 397584845, + "checksum": "c909fe429772c8198f904496ea6cf239d669c6c787889cefcb7623e08a988db0" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00564-of-01024.json.gz": { + "num_bytes": 396436964, + "checksum": "8e7cb1863057a3b9929af4da29b4e1cca1f71c254f5eba91a657d9e8c1fd6dea" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00565-of-01024.json.gz": { + "num_bytes": 396486039, + "checksum": "23ba56e78c4edc4d58fd7fbfcf784b29037204a641e43a9894c95c68bdb982fc" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00566-of-01024.json.gz": { + "num_bytes": 395358745, + "checksum": "71259a300ff096b49e3461c91824a8185037ca85ef2018dff2617f335ab304b6" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00567-of-01024.json.gz": { + "num_bytes": 396405726, + "checksum": "d9b56ed523376681dd81cb9831727467461bdfb87c80d3932937338370093033" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00568-of-01024.json.gz": { + "num_bytes": 397509797, + "checksum": "c650aad13a48d5b0c51162ad19c9eb3135559d0a3318dba701a90e8138a8cd24" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00569-of-01024.json.gz": { + "num_bytes": 396514261, + "checksum": "d71e4126c2deffae8ee55077cee9dd2b70ce27adec767bce06e02afb23b42416" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00570-of-01024.json.gz": { + "num_bytes": 397072833, + "checksum": "519a32e1bdf7f5b97e1a438242a79218317e04e44021dc61aa65c526d35ce8ed" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00571-of-01024.json.gz": { + "num_bytes": 397170114, + "checksum": "919a9659156cafb26b87190fc00b9d33c4fd536dd35544cbef8e5ddc018ae365" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00572-of-01024.json.gz": { + "num_bytes": 396475017, + "checksum": "3d7e4e548f01c9ad5fc99b4342cbf9a9004737058dd93aae8b7d95b2c00856bf" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00573-of-01024.json.gz": { + "num_bytes": 396749955, + "checksum": "032f8e37328c9f0fc046e5a6ff5a79cbb744f3100c4cbea78e397c449471bb10" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00574-of-01024.json.gz": { + "num_bytes": 396036505, + "checksum": "8e795341527712be32a69307ce8cbd2d6195c6b2fea596d326a279734505198e" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00575-of-01024.json.gz": { + "num_bytes": 396722381, + "checksum": "45a43576cfc61842bde146eaa566b4f22a128c3c2eb8f30c59a6b6cae4bcd4e7" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00576-of-01024.json.gz": { + "num_bytes": 396163377, + "checksum": "38429d2d6176ee42ddd495e052c01735a9a7f0076cde107d24a0a9c7a26bf2a1" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00577-of-01024.json.gz": { + "num_bytes": 396813305, + "checksum": "eae77c319bba236feaffc9f74eaa38e911fa48eb06f4794c9b1a6d17edab91a7" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00578-of-01024.json.gz": { + "num_bytes": 397797226, + "checksum": "1dd2b3d7e99fde8903bc12625568ec4fc6fe653737b3af5e9c71432e311cf5f0" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00579-of-01024.json.gz": { + "num_bytes": 396012631, + "checksum": "d9322e66701b4ada3788b91a07e87b03af6c91eb4cfaaefee23c0330987a1840" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00580-of-01024.json.gz": { + "num_bytes": 397943129, + "checksum": "23deb32e1b0f07a55a5cf1572cb8e313ce716c748a07f58bd90cbae97290d0a0" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00581-of-01024.json.gz": { + "num_bytes": 397614648, + "checksum": "6193f8b848c7930fc04b9f2429dbccf36f1b291271b3eaf646c655433bf3ff9f" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00582-of-01024.json.gz": { + "num_bytes": 396659280, + "checksum": "40997ef02c7040356cd1c5acd8e6a5121e00b31253713cad4f529ab2922affc9" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00583-of-01024.json.gz": { + "num_bytes": 397686445, + "checksum": "5cd21271e4ae036f8d1e0c320330a6c93a8b1ffbb9293a80c56c2d7f123f9ee7" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00584-of-01024.json.gz": { + "num_bytes": 395500815, + "checksum": "c25befb7c735b2340b092a04375d2109c1b876d2b0057dd8d4ed4beac87118ad" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00585-of-01024.json.gz": { + "num_bytes": 398413461, + "checksum": "073f632e95c218fdf17274fc21915c94f56bdfbb58a6b1a0550de249ce4d2129" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00586-of-01024.json.gz": { + "num_bytes": 396849745, + "checksum": "647cbe9bd7709c0d8a01485096fd88ad0fc09b27de324eae141a8d841536b71b" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00587-of-01024.json.gz": { + "num_bytes": 398567154, + "checksum": "557af97a8d2b2656149bc25ee5b362116d173e6a48911b860ec10d512b4b763d" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00588-of-01024.json.gz": { + "num_bytes": 398086388, + "checksum": "9e9afa15ee3534e497c9fc7c8cd967388183193dade3d1ec82a8e2b0e82c5118" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00589-of-01024.json.gz": { + "num_bytes": 397335823, + "checksum": "ed8a1d0b9c55f465b5d4a4e5ea022f6d17aaa8b82569be7cfec55629c1bf26c6" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00590-of-01024.json.gz": { + "num_bytes": 394931693, + "checksum": "3fbe539fcf64f0d914c19b383de9953b0605d4a69f48801145f0db1972f9c6b6" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00591-of-01024.json.gz": { + "num_bytes": 397828770, + "checksum": "9165de8866384d3d03c3876c39c96706e33a24b9f95acc09999c2dbfb85cd9cf" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00592-of-01024.json.gz": { + "num_bytes": 398782493, + "checksum": "433a9cb730d7ab024b56ad662a3ea53633f7ff26c625051c4c02f252beeb87a6" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00593-of-01024.json.gz": { + "num_bytes": 399264489, + "checksum": "4a7e5f40aa8b692cfa0519d33a868e9a05e579ad430204bc13c48b533eadc5ce" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00594-of-01024.json.gz": { + "num_bytes": 396629833, + "checksum": "521d5e90550dbc97ab26a18a0b75da81e38ce2083ff5fd93340fded2e54e1ca1" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00595-of-01024.json.gz": { + "num_bytes": 396916313, + "checksum": "30c9be1d99ce0a41b214fdbd5115988c82ca317d4aceb30c19fbca05e0a409e0" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00596-of-01024.json.gz": { + "num_bytes": 397013253, + "checksum": "b16bd9d7d893b4a71056575fa0799bef96120c03cfc6e2a88c292469a67f2614" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00597-of-01024.json.gz": { + "num_bytes": 395980036, + "checksum": "3bd15089b6fff342df2b3109d7ebadca35cead4f44ca5b1b55e55d8892aab82f" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00598-of-01024.json.gz": { + "num_bytes": 396295935, + "checksum": "6252d951a9570baea9767cf3350a6d09ac5a5fc34ba80eae3b5c40adb8361ab9" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00599-of-01024.json.gz": { + "num_bytes": 398608239, + "checksum": "b265a385cdd5e64d1fb2ffce739e72f2fe2cc8944621f20e2084dc52b91cdd9d" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00600-of-01024.json.gz": { + "num_bytes": 396563743, + "checksum": "43d12028cbe738e8f450911f6a55dcb00f8742cefc2a2c4da5f9e9220b0572c1" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00601-of-01024.json.gz": { + "num_bytes": 398256993, + "checksum": "9368dcfc581e6d572d899ef25b129bc0268901a2fa009500174a0985bcf330df" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00602-of-01024.json.gz": { + "num_bytes": 396202546, + "checksum": "3cc57d7afd161fcd411f73da8369d98db4c6d8e30643ee01450adef21e8ea3ea" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00603-of-01024.json.gz": { + "num_bytes": 396338425, + "checksum": "cc21fc5b8ed6e5115bd8924954d685ed52cd5b773ab63d37188343443c95851a" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00604-of-01024.json.gz": { + "num_bytes": 397597307, + "checksum": "d24f6d807ae35037e695e19917ed446f74448166fa464c862e31fe7ba2bea196" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00605-of-01024.json.gz": { + "num_bytes": 398278313, + "checksum": "99166183c752aed8d0f2cc9c010f1ebdd4fb93d40e936fd6c082eb3542baa956" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00606-of-01024.json.gz": { + "num_bytes": 396590468, + "checksum": "657ce79340c15524a5897459a6cf712fa4127def2445f7eb3de21c9b46db3794" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00607-of-01024.json.gz": { + "num_bytes": 396603228, + "checksum": "3705441435f18d1e4aeea9e794e1216fcd29b48213763a554808e3d3697951a6" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00608-of-01024.json.gz": { + "num_bytes": 397280580, + "checksum": "be0bef2c16e9bdd0387276402dc99fe5a9a0a7a105a44e88bdb783139f2de474" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00609-of-01024.json.gz": { + "num_bytes": 398284528, + "checksum": "3a7c7a8cb01f6d7589152a1483682a5fa99e119490f3e70d8a02f582f2e2b19c" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00610-of-01024.json.gz": { + "num_bytes": 398872039, + "checksum": "c349aac5b64227397ec2870992ac9e4fac9fe39f1fd4e0a7b8c727e171655e14" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00611-of-01024.json.gz": { + "num_bytes": 398736440, + "checksum": "63ca5eb2d27632b3b4dde8e40f9925e71e21ef737262bcda7a99324a67e0fab5" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00612-of-01024.json.gz": { + "num_bytes": 395170895, + "checksum": "3b4bb3e14ee981a9edb9828ce40b86b5d83dfafcc1a5e0e02642cb40924bd6ed" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00613-of-01024.json.gz": { + "num_bytes": 398443337, + "checksum": "e95adbd7d55024b7e62145860f217a6f04f5fcef79ac23e92dd9e14f9a0b2a30" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00614-of-01024.json.gz": { + "num_bytes": 398854661, + "checksum": "def8cb789f8f79fa169e855816c5e4bc7d5c253e565502691a9abb826d7436d4" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00615-of-01024.json.gz": { + "num_bytes": 395505189, + "checksum": "6775ca6aa4f834289396a438906b90936ed0ff6390213dac2b0861f40d7761e7" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00616-of-01024.json.gz": { + "num_bytes": 398999454, + "checksum": "6cd5efddacb09cc80ec1eb79f93b562044787903b3cb1c879be2acec64a9dbdb" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00617-of-01024.json.gz": { + "num_bytes": 398570431, + "checksum": "26d1f587377446e8b1499be7a3b6776d437baa40353fb04c591203a420eb0cc2" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00618-of-01024.json.gz": { + "num_bytes": 397064982, + "checksum": "e59a87fd1cd3d87fff4b15c3a9331521d7587ac7f4a7fd51ec3906b484ef9ad0" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00619-of-01024.json.gz": { + "num_bytes": 396676338, + "checksum": "8077c3a15d93579d0fbf00bd9d117bf4f50092c5be3acf46c7d4433ef7be9dfc" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00620-of-01024.json.gz": { + "num_bytes": 398186471, + "checksum": "ee3fb91d7797ebf1daf8dcb81563b7dae7b161d97732efd35e3eb6ebea732ee2" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00621-of-01024.json.gz": { + "num_bytes": 396467968, + "checksum": "386adb83129a7306ef4da37c1cbedc39b3971e7633d516d406a982f307577e67" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00622-of-01024.json.gz": { + "num_bytes": 398293882, + "checksum": "b708cad0e04c56174d0feec84d7224a4490cb8db023d38e57398cad89b78568f" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00623-of-01024.json.gz": { + "num_bytes": 397396780, + "checksum": "c50c4568c6f103b3e6a3702cbd915ecb530df954df808156bc38a98f36a0b944" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00624-of-01024.json.gz": { + "num_bytes": 396971282, + "checksum": "11351ef83c9fb883d6c0f484af5c10f0d686b7ac4a2f08fae9ac3d9837df0a0b" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00625-of-01024.json.gz": { + "num_bytes": 395882440, + "checksum": "dfa97ea7949c9bbf7af43d43ac5c8d0034bdbd1ad572895159b7c7846ab89676" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00626-of-01024.json.gz": { + "num_bytes": 398292846, + "checksum": "fbc9c23dc286ad6fd7f01f344de97ef5789733af581de278488869bd36f3b246" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00627-of-01024.json.gz": { + "num_bytes": 399890427, + "checksum": "f43bbde36b8bd34ed9998b99b42c85434b8bbc8bbaa1cf5b38cec6393099c23f" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00628-of-01024.json.gz": { + "num_bytes": 399589466, + "checksum": "c50058a4937912b678d33d34ff91e2287e8701365f4f71fce61f9002652556cf" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00629-of-01024.json.gz": { + "num_bytes": 397355095, + "checksum": "051c4631d0587b6f65827410ad2f2121c05c849a009274415bc5e7f72db42d44" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00630-of-01024.json.gz": { + "num_bytes": 397860559, + "checksum": "07b48a86a8a3245fe5b78f6943c8970c839942b8d86abf173507225b0d1520d0" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00631-of-01024.json.gz": { + "num_bytes": 396161304, + "checksum": "70a03f0308105de5266c4a40803b51f99888b362b71409719b7f71f73761b590" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00632-of-01024.json.gz": { + "num_bytes": 395620184, + "checksum": "c6923984c419f08bb4e6effc27dd25dd986513034338debc9b238592dad9f607" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00633-of-01024.json.gz": { + "num_bytes": 397572527, + "checksum": "900fc701703234031e825a1eb2d11b364f1dda97eb0c7943e17ef278695f7bea" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00634-of-01024.json.gz": { + "num_bytes": 396215174, + "checksum": "0cc838e395581933123fc57c6690afbdd2be1b67d213336d9b8c08b3876f8458" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00635-of-01024.json.gz": { + "num_bytes": 399176005, + "checksum": "5a3daa1bd0be8c997da56257f063a7d1c7b2b271648a46615b26ca4beeb42863" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00636-of-01024.json.gz": { + "num_bytes": 396035356, + "checksum": "9d21ce1c8b5a7c1330cc95b1f45286fb8578d5dcec0686724ff6e25a97f38a7e" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00637-of-01024.json.gz": { + "num_bytes": 397214839, + "checksum": "83cd34e1ba09c268b515fda7699e12bfa2531fb7e60e2f861946ffdc01e54a04" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00638-of-01024.json.gz": { + "num_bytes": 396292535, + "checksum": "82a7bae9a7d35fa707bcb6d90f7b244f1509e112dfdbd604c9be1f8b8ce7150b" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00639-of-01024.json.gz": { + "num_bytes": 398009954, + "checksum": "b6d7ebd102c67960413caf5fcdc5b4aea728b6d3d6369ab8dd3cd6bee6c769de" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00640-of-01024.json.gz": { + "num_bytes": 397558496, + "checksum": "151c55d019fd84fdc0eab73d24984e5d88ac964c86f89a361a03dc776a22b5b4" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00641-of-01024.json.gz": { + "num_bytes": 398031508, + "checksum": "e0e87304a8ac408adca2badf2564ec52caf155295ea303a121c30f3b1ce797b7" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00642-of-01024.json.gz": { + "num_bytes": 396594124, + "checksum": "73d08c99b6b96d96b82d88267b2a392a7dda2084ba5142b8eefd0d23212702d5" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00643-of-01024.json.gz": { + "num_bytes": 394552252, + "checksum": "ebccf3b935d63c30f626d317af250b6bd0f04ef5e1cced829287ba64fbb0d25f" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00644-of-01024.json.gz": { + "num_bytes": 397586341, + "checksum": "674c0965a9a880c057b6f2dbb785a4a6ae048954d44ba4f5266dd5e65095d06e" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00645-of-01024.json.gz": { + "num_bytes": 397950976, + "checksum": "7ac8d4dacd682a2977818f01d860c3dfa5a5e5a78f7d2d95be0353a675452e93" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00646-of-01024.json.gz": { + "num_bytes": 397511840, + "checksum": "452a9cc03facf9151552f914f9a8a3507a96fd8ea40f7d04951a29ecbf6aa1e5" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00647-of-01024.json.gz": { + "num_bytes": 396692070, + "checksum": "5a795a238203444596c711bcedc634e653e5240c9a800a9884c51f878340b494" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00648-of-01024.json.gz": { + "num_bytes": 392707626, + "checksum": "9cc366c37950624df6af318ee52a97d32a40e278fcb519cbe8545b04bee3204e" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00649-of-01024.json.gz": { + "num_bytes": 396283284, + "checksum": "4ddeec31a30b5c563838b17e1115ad30041e08c70a94f299ea324ee4b71fd82b" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00650-of-01024.json.gz": { + "num_bytes": 396349662, + "checksum": "f5bc63114ec9d73d6cea7f8e38a95031ae2bcde849b27440afd840a3e72aac13" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00651-of-01024.json.gz": { + "num_bytes": 397187042, + "checksum": "7199c0242b2654509af187c9c8bbfc22cc5067aafa1ff69949b1f0e5b718425b" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00652-of-01024.json.gz": { + "num_bytes": 396263026, + "checksum": "c9e62b6df7213ea5b71913fbf736403f33c51e5a868bf1035cebcc39d80635bb" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00653-of-01024.json.gz": { + "num_bytes": 398689010, + "checksum": "f3bcc9eca4d71043e920db6399a032f916c23b1da329d2ef86434a74f8e7b318" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00654-of-01024.json.gz": { + "num_bytes": 396938678, + "checksum": "fb41df26e1f68e1e9d12ae8740535ca66e80910320be2270d680fec40d6fe9a7" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00655-of-01024.json.gz": { + "num_bytes": 395995226, + "checksum": "018b40ddf6d88c4c346c8018439d16f6ca66ee0720970e84ddc34b1010ae35d7" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00656-of-01024.json.gz": { + "num_bytes": 397860049, + "checksum": "8f3847e9bb5a8145e2959b340f86cc06f85e6646f32d5d785c5c90ec11a9f404" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00657-of-01024.json.gz": { + "num_bytes": 397142407, + "checksum": "a1ae8735a39bd099dac2e50c22e312f1a010f2644774ef53c995f3437c0a5524" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00658-of-01024.json.gz": { + "num_bytes": 397827609, + "checksum": "f6154377cfff2453392fb899f81514a7c0ffd40dbc35d8842d61a115d0aeef35" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00659-of-01024.json.gz": { + "num_bytes": 396861858, + "checksum": "4299633524667921549573c469a73e33abae89d107375d5ccc6a6d987c2a2a26" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00660-of-01024.json.gz": { + "num_bytes": 397773823, + "checksum": "44eaf6c1739d8a9c13c54750c473ac04aaf9d2223d8893cd8094f1769b1f6f8c" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00661-of-01024.json.gz": { + "num_bytes": 396311257, + "checksum": "18edb60444b660c7cc68dbe59ac71989be0e20ff13639725a5f05e4d4d512514" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00662-of-01024.json.gz": { + "num_bytes": 396176936, + "checksum": "7b60541181fbb92f361fbdf0bee80d086c75279610aab792a7b3877d49a3e1bb" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00663-of-01024.json.gz": { + "num_bytes": 396274985, + "checksum": "59e057ee5f5e8c7267138c18c5c88f3ca24d30f86c484e4bb0c0a4eb5169c4a4" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00664-of-01024.json.gz": { + "num_bytes": 397483935, + "checksum": "585f45d3ac3f88c3bf1c86e01daa46537f8f5c5165521412de0e67393cb6da33" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00665-of-01024.json.gz": { + "num_bytes": 398831104, + "checksum": "e403d2f4ff6e74abc9639749f93f77cc868453908c10821fea7fafdbcc981a06" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00666-of-01024.json.gz": { + "num_bytes": 397668116, + "checksum": "f9bbafa396a466b24630a259a01804b2857c1dde2fa3cec60b2967a88ad9f528" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00667-of-01024.json.gz": { + "num_bytes": 398123165, + "checksum": "ed693d5ecb9dfcaf545e831b5769b877e927125794cae61a0ec7821c3c85dfe6" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00668-of-01024.json.gz": { + "num_bytes": 398152096, + "checksum": "51c33c07d503743704f564bc6a372c2f6f8f13a1ddd00b0b9a2c44c94cc57444" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00669-of-01024.json.gz": { + "num_bytes": 397927981, + "checksum": "d356b5268ba39e38ffccd20e95803f3218407e0a1ca3b4d1165ff82796ec1bae" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00670-of-01024.json.gz": { + "num_bytes": 399074605, + "checksum": "bb96ea8154ae01275a9197709820e670c4e6212c740e92a7f1cfb7c618a49bea" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00671-of-01024.json.gz": { + "num_bytes": 397864381, + "checksum": "afca3dbcaefdc368e996259fd595b77fd98a885ec005a93069a01b83227c827b" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00672-of-01024.json.gz": { + "num_bytes": 396077133, + "checksum": "3da96ebd1b28b55b03bbab8e85f78295cffdad9020f869cb456da27058ffa090" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00673-of-01024.json.gz": { + "num_bytes": 396943842, + "checksum": "6a4c344a8af68a95e20d58b64fff8fe616c2a406cf26f642cdfea65fce5883d1" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00674-of-01024.json.gz": { + "num_bytes": 396975969, + "checksum": "e6b0f7727d78143fa180abb76e617b37660b35f6323f19bf1dcbc78fb9374508" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00675-of-01024.json.gz": { + "num_bytes": 396692800, + "checksum": "e4ed97b19c6d83e618a3fcaff75460d828ca419b1e62842a1493b0ec4c9703e5" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00676-of-01024.json.gz": { + "num_bytes": 396514400, + "checksum": "a5672f1561ab85f071395de43e702791aaacff77a9f67f6ec9e14b12aba675b2" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00677-of-01024.json.gz": { + "num_bytes": 395939125, + "checksum": "3dacd3bb90b5e645d1b9a962d8df87f571b0fcf227996068535bb98a68f9191d" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00678-of-01024.json.gz": { + "num_bytes": 397022852, + "checksum": "c1a0ef31342161369b7fb709be17e3c86191c1a52cb04b704fc58190818302c3" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00679-of-01024.json.gz": { + "num_bytes": 398325372, + "checksum": "47ddd1056ad977407f61b2eac3ff803d17b1aa8fa0719279bf911caf49bbb7c8" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00680-of-01024.json.gz": { + "num_bytes": 395502228, + "checksum": "cbb93f322d684ed558cbf8d92b9f83958ba772fe4177093a334b4596343f3cd4" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00681-of-01024.json.gz": { + "num_bytes": 397981781, + "checksum": "9ec2dec493733846a1ec9f68ff5130cd461d7ab9c07b22d4aae94463bcf03146" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00682-of-01024.json.gz": { + "num_bytes": 395265758, + "checksum": "7731cb9a2898c730a650e5d1b358886ed562228928aefe55d991cfaaa61a9a99" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00683-of-01024.json.gz": { + "num_bytes": 398783283, + "checksum": "6f2bb48070e809ac17fc90e1117d63bd8c7cd0079d9e44c9f262c4ce60f5d373" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00684-of-01024.json.gz": { + "num_bytes": 396160769, + "checksum": "fd07413637b97b68cb3a7a6cb86c4656017b7841728e806485ae196294e79f8c" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00685-of-01024.json.gz": { + "num_bytes": 395594461, + "checksum": "939925a9169da729891fbeef926f420b80bcc60e0f170bcf9a2095449a22d424" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00686-of-01024.json.gz": { + "num_bytes": 398275260, + "checksum": "13836c45719ba10f2d581cf17cdab1daa4cc207a49db2b4786b451605842ac4b" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00687-of-01024.json.gz": { + "num_bytes": 395256765, + "checksum": "0c0d0e6c1e3cb9a024c184a8510066a005c031a15af74d117d0e736a358a91d0" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00688-of-01024.json.gz": { + "num_bytes": 396635904, + "checksum": "2462e084563f8b8de68c6e826289949ff8ebf8cfaf323344c07ab93e56373539" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00689-of-01024.json.gz": { + "num_bytes": 397749444, + "checksum": "d03746220f3374c80102ed39d8f6ae0daec40fc1b23312c08ecdee82a65ac6df" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00690-of-01024.json.gz": { + "num_bytes": 399380060, + "checksum": "217d032ecce8d0b7e448befe83aa051a3bfab8cb0e167d043b6abc833f5e9b4a" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00691-of-01024.json.gz": { + "num_bytes": 396975651, + "checksum": "354fe9bc07aefc55cbbf8752f53ad69d45761da928bc8deb6fee1de9e244e93e" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00692-of-01024.json.gz": { + "num_bytes": 399720848, + "checksum": "21f88940b6cbceefd66ea5e8d466467806370ae24a5833ca308cd840daf5ff8d" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00693-of-01024.json.gz": { + "num_bytes": 396787846, + "checksum": "c8d28980ffa1eff4459d2fbf0043a1f8eeaf840a3b1d1ea4989b2192c7a82041" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00694-of-01024.json.gz": { + "num_bytes": 397945967, + "checksum": "1936570da24c4bab9fe0559826f1cc509c4ab6eb3679e26d697efa6e7e5c8a81" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00695-of-01024.json.gz": { + "num_bytes": 396349049, + "checksum": "8e497506f84513272a8a0694e7d4efb004b1e3b515887e3b5762f59b6c659dc3" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00696-of-01024.json.gz": { + "num_bytes": 394901418, + "checksum": "9e1d6cc187ff67ee734bbadc6cbd57eae05634a448edfde184fa8d6fc3259836" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00697-of-01024.json.gz": { + "num_bytes": 399142528, + "checksum": "9584496113a8612620748aaba35e185b8f47b7c96b4ff0dc7bfdd6024a3faa14" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00698-of-01024.json.gz": { + "num_bytes": 395923784, + "checksum": "83a3c57b3870ed9beeaf3ec8ab694e0be458106f3128b14b2a44a036e89d32b1" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00699-of-01024.json.gz": { + "num_bytes": 397137494, + "checksum": "0befea64fe749d79592e337bc359bcef70ca8816d0126ebf89d4b8fbfbdcbec6" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00700-of-01024.json.gz": { + "num_bytes": 396554785, + "checksum": "34739b543636aeadb6dcce3e7c97ca49026cc9897c13add6b592fe60e5c40338" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00701-of-01024.json.gz": { + "num_bytes": 398091188, + "checksum": "c9bcc7c9e91de707ee548e67452d6970af2e19bef91f966b19fa71504e5305fc" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00702-of-01024.json.gz": { + "num_bytes": 396039798, + "checksum": "fcda5f8ddc5ed163db84aa70c565f8181731af9a29918a2ece0436d3146d7125" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00703-of-01024.json.gz": { + "num_bytes": 396889704, + "checksum": "c80445d442a766d2e87ecf5804e87bf7f8b23c2238476fc2b51f657400739306" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00704-of-01024.json.gz": { + "num_bytes": 399465260, + "checksum": "0bb73674d579523fcbe079fbea7190138911711f023404ae46ea7b685fc09c73" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00705-of-01024.json.gz": { + "num_bytes": 398579507, + "checksum": "97d6fd9cea2a47913c6ee9d1e34c3440858f25f3d670cc81c8f83f2346fce6e2" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00706-of-01024.json.gz": { + "num_bytes": 398761590, + "checksum": "2f4836001b8b80066ae09b6e385ed0048770c13ba2410e0f0309ab4b9200e37d" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00707-of-01024.json.gz": { + "num_bytes": 395576626, + "checksum": "8e0c0c635a7a7c32d4fdb1a7906ee95a9f334a55b2ff3881cdc7d5e816a9c817" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00708-of-01024.json.gz": { + "num_bytes": 395930921, + "checksum": "e6978b92f333230972e2b4c31cb86b5286fb899948c7680c7a9cbe75a9d60296" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00709-of-01024.json.gz": { + "num_bytes": 395734676, + "checksum": "13071a3527071f06570c6cfa485073f2f3980c83cac782db6bf66a75dd865df3" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00710-of-01024.json.gz": { + "num_bytes": 396501107, + "checksum": "6562cb3675a42a58b8c8b2a232043adf532fe49420e30c3c237a6d8889a8de30" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00711-of-01024.json.gz": { + "num_bytes": 398422179, + "checksum": "f38b59c4739d3c15e5bf5dbc0965d1a5dcc0f49a3c89eb7a6822003aaa1ae7c3" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00712-of-01024.json.gz": { + "num_bytes": 395905103, + "checksum": "500b4914f3c42d5e24ced7d36dbd3143c49e4fd5dfc3d53a172d1a55ae738889" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00713-of-01024.json.gz": { + "num_bytes": 396009909, + "checksum": "4f50bfa762db1435a89195fd180615e9f569c1668e128d343c87c40ac5cf60ef" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00714-of-01024.json.gz": { + "num_bytes": 396963447, + "checksum": "fd9eea7dfb93916a3798a8b69d29fb5d4bf0fec448b8a24427f729e7a41205e8" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00715-of-01024.json.gz": { + "num_bytes": 397474378, + "checksum": "3c61bcf6f24e21d2584bb4ae008230540d9a375e35f3c4ba1668621b80d85c5d" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00716-of-01024.json.gz": { + "num_bytes": 396285471, + "checksum": "c554e562a369d9696219ea8b0e363907c50f626d7c410a26515e07de801da74a" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00717-of-01024.json.gz": { + "num_bytes": 394827995, + "checksum": "f8b4678c21d93c19d50cb576f0910050d24dfd606238bbf8013c45f98defda12" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00718-of-01024.json.gz": { + "num_bytes": 395517823, + "checksum": "1bf63affd6914d98e197b6e1ce526cae7754ecdc750184154d3cb8e3bdd21a9d" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00719-of-01024.json.gz": { + "num_bytes": 395561934, + "checksum": "c04b162d984ff2ada9f39aa6c0fac04a1531fbde05175f856d2e3ca2797a448a" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00720-of-01024.json.gz": { + "num_bytes": 396227762, + "checksum": "25da2ac7c1f3cbc361807f67e8826ffa95f4caa25f81f66832cbd0a08f1a51f5" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00721-of-01024.json.gz": { + "num_bytes": 397716450, + "checksum": "28180c6396deaf34e2a197f5cad1b53ba1c9532db8b5c21dd7d81332b2793181" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00722-of-01024.json.gz": { + "num_bytes": 398022279, + "checksum": "9c3a8038a7f9431b90f67ea0d3b77353d0508b09865f49af575b6aaf5e32d6b7" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00723-of-01024.json.gz": { + "num_bytes": 398064523, + "checksum": "4b18959f604bd5f379a73b52947261cb8d63f2243f5afeb5807a13669ef4a800" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00724-of-01024.json.gz": { + "num_bytes": 394747045, + "checksum": "615f13a1b2a6942931519b7a7f6aba286f6045aad65b041c2c6643ce906de1a6" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00725-of-01024.json.gz": { + "num_bytes": 396726374, + "checksum": "4099a416eccbb56818efda68bd027c993c1a5fa1a8e722bc268041fd3f804cfb" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00726-of-01024.json.gz": { + "num_bytes": 397361407, + "checksum": "152d5e2bad0de3b6b48fb26066891b160ea79c4c382ce6aec6047196e3b08ef6" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00727-of-01024.json.gz": { + "num_bytes": 395542925, + "checksum": "ce1d46b0cd7d9e4075db3feab71d2f72939817ebf45819e73ec277c9cc07307b" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00728-of-01024.json.gz": { + "num_bytes": 396647931, + "checksum": "c859626b14584c1bab396c867ad5eb11ff3af39628206b03612ee2d2b3058497" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00729-of-01024.json.gz": { + "num_bytes": 398272080, + "checksum": "758fbdc5bf6d66a36d69d31141742b2a917bf0341494b844f22ab82cd54e7ead" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00730-of-01024.json.gz": { + "num_bytes": 395977662, + "checksum": "56a7fcb59ece26d4b19be0bd5e6c2d0f05e4b1b23e8ce7b4fab064a29b229c02" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00731-of-01024.json.gz": { + "num_bytes": 397530948, + "checksum": "bf0f4dc8796a737daf80b977a6e3656cb1e244fc40d6df92852da45e53e6cfdd" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00732-of-01024.json.gz": { + "num_bytes": 398314575, + "checksum": "1862bcc85d48f59283eae56836e5598f20287ce36a185252abb24bcfbd1377cc" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00733-of-01024.json.gz": { + "num_bytes": 398547748, + "checksum": "476389cb582df3c214f3f5a45268bdb47b581a432c08723bd811daa5f5990083" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00734-of-01024.json.gz": { + "num_bytes": 397380175, + "checksum": "2b6fd36a8f8bc3edfcd8a486de44d2f3132f7b8f4bb2d4c93453dbf1a1b6667a" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00735-of-01024.json.gz": { + "num_bytes": 399584382, + "checksum": "3e0a067fef0b40edcd23ce6680efc07253660b8c00699630bb7629b9d803a198" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00736-of-01024.json.gz": { + "num_bytes": 395312038, + "checksum": "e4f92413c837d269481ecc0b5d0fc87548bd2ae718ef7f9bff18674ece289bc7" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00737-of-01024.json.gz": { + "num_bytes": 396820243, + "checksum": "e61680c57505f027ef8cbd28a45e706936befa2ab40a24a63e638019a1717b63" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00738-of-01024.json.gz": { + "num_bytes": 397691872, + "checksum": "d3acc0c9c76ef2df89f49896744dac53f488f830d3d42f0c481f2321ed60fa67" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00739-of-01024.json.gz": { + "num_bytes": 397912166, + "checksum": "18d281ed9831f28c4c54256a844ab2cff7a5b681da1b7c8eab2565b106381aa9" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00740-of-01024.json.gz": { + "num_bytes": 397093867, + "checksum": "6a65230910384587f5e7f34b52c2a6d9a86a8b1f7a23d26f890b6e810c051815" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00741-of-01024.json.gz": { + "num_bytes": 396371058, + "checksum": "26eb40e98075ab716b4edec76d1723a679e648258d6812119b46f7522dfa9b07" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00742-of-01024.json.gz": { + "num_bytes": 398346941, + "checksum": "466043ec98eb806916806cff7495f0bae89cfeb2835204ea34328030b92a27f2" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00743-of-01024.json.gz": { + "num_bytes": 397366055, + "checksum": "d98d31aaadf95dd0d1cf0548db515c8e77c95bbc4b611ae9ab5650429c171889" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00744-of-01024.json.gz": { + "num_bytes": 398722902, + "checksum": "a43c80ab3bd8d12d12b4ea41d9054b90214fd3ea2ef957f317d6ed6fa7b60e34" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00745-of-01024.json.gz": { + "num_bytes": 397562514, + "checksum": "1e6dad94e0f90bfa0fdc5557c58873aaa95fa9ce1c7b70a1fe76817289cff78b" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00746-of-01024.json.gz": { + "num_bytes": 397731351, + "checksum": "21fefd6cffa9032c9ca7cec91cd775c83bbd37419ae236eeec9589f8bc4be0dc" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00747-of-01024.json.gz": { + "num_bytes": 397781450, + "checksum": "b84c74bf1caecf92777fb85129bb009eb3a27fbab1b97af567f36a8bf100e704" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00748-of-01024.json.gz": { + "num_bytes": 397425031, + "checksum": "fe9bb225f6d03b44e552ec985c844e5012e90c4ad99f699ec4ed4297db91349d" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00749-of-01024.json.gz": { + "num_bytes": 397925850, + "checksum": "3913b2955fee02e2ba716d843559bc4bf4e85a2884ae4495446a379f857a30e1" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00750-of-01024.json.gz": { + "num_bytes": 397089489, + "checksum": "773486144d3008cb3207c3c8b65fe6081c9e64dda09728d3586bc82e6bb73fca" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00751-of-01024.json.gz": { + "num_bytes": 394819424, + "checksum": "d728b117a7b74150b03ed7d562514c2e45ccc03b0bceb120eddfa8333166a923" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00752-of-01024.json.gz": { + "num_bytes": 397199683, + "checksum": "6c10c3f4e3737db6a70375bd605139de61ae8b09a1aa91dd1cfdb82c183f0cb3" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00753-of-01024.json.gz": { + "num_bytes": 399197199, + "checksum": "101c4ed5426b586a4aeeb7dbd377306eae9eec2eaf934e79d25583abff70b15b" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00754-of-01024.json.gz": { + "num_bytes": 396415619, + "checksum": "732f4dedcf1266bcabf15a6a1cdead617ea37d428d8cfbccb5a9dd7521133075" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00755-of-01024.json.gz": { + "num_bytes": 394564662, + "checksum": "a23f1bb1de23554efff68e730d85802a6491936fb54e256744af641f97ec155b" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00756-of-01024.json.gz": { + "num_bytes": 395577258, + "checksum": "2f4275994a103dca517d4eb3656009c8138930079e00303c7b8746ab6094fd19" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00757-of-01024.json.gz": { + "num_bytes": 397161772, + "checksum": "ab16360173283b22a7e19d181fbf55a6a8d07f0d9007b51aa159c1e81661f5e1" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00758-of-01024.json.gz": { + "num_bytes": 397545456, + "checksum": "ff5a6292bc557aa9895de39697e8aea5843fa5a00c83c7983eaa36640d446ecf" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00759-of-01024.json.gz": { + "num_bytes": 395470957, + "checksum": "66a64accfa6c281d2bdfa7b6846397f56c2d4f8a22ae8925a07af853e42f5521" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00760-of-01024.json.gz": { + "num_bytes": 397328304, + "checksum": "46778c90bcc6da96cf02e66956a1bcabcb9a95bad538cfc0d5190db473a278a9" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00761-of-01024.json.gz": { + "num_bytes": 397706141, + "checksum": "4825f25d6e1d13c70e6e65ce13ccd7b1922344c48ee2806952f3ba1b6e26d3ae" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00762-of-01024.json.gz": { + "num_bytes": 396983663, + "checksum": "25e1645f05d342b5f872ca809b36d516c7336c22035bfa86cf295d0865e08789" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00763-of-01024.json.gz": { + "num_bytes": 396355038, + "checksum": "d4c3a92808f0bfb042423cd4166abc57d20603ef07a0f0912058a718a38f26d0" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00764-of-01024.json.gz": { + "num_bytes": 395434042, + "checksum": "aa4384f587fd64c24fad9a27defb0345eb44cc536b3d45c710017d225c191ded" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00765-of-01024.json.gz": { + "num_bytes": 397204482, + "checksum": "cf419554f6c4f6201ebe92e7a232013e5949910f3d54f5cf3d1d65845685c7ca" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00766-of-01024.json.gz": { + "num_bytes": 396420917, + "checksum": "32076dd8004ebe35f46d6e790fd6330ad1d7df2b7ae3c4ede325b0da73a673ad" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00767-of-01024.json.gz": { + "num_bytes": 396840905, + "checksum": "08e5fd0fc1578a337f3dafdb3c718ade437256119e1968e9f958a8ea9d052c81" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00768-of-01024.json.gz": { + "num_bytes": 398085225, + "checksum": "3579e0756bb6cbf1eddfca27de5cf067a212d683134bc6f8c26a79b7d802bfce" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00769-of-01024.json.gz": { + "num_bytes": 396879117, + "checksum": "0913c93203a084521212e473d08c1d11e8136a8e37f1891330fbce0397bd431b" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00770-of-01024.json.gz": { + "num_bytes": 396386647, + "checksum": "6c12ab51c92b9c92336a6142a1a4e2f7c3725beb7e61dcb004551d13e8d5488e" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00771-of-01024.json.gz": { + "num_bytes": 396279989, + "checksum": "752deaefbf22dd1b1adb36561e8524c1dc555fd105bf3acb78611be9bce72318" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00772-of-01024.json.gz": { + "num_bytes": 397850815, + "checksum": "4f1969284d1f448caf0bff5d05eeb995cf2339801f6a71e01286f4f7f387c564" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00773-of-01024.json.gz": { + "num_bytes": 399466666, + "checksum": "20ba552cd30349bc8a2c0b6a8701d4587a005e7ebdf6e3f2a3bf95462c304447" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00774-of-01024.json.gz": { + "num_bytes": 398051538, + "checksum": "1f66196e8fbf0ebef977f235d2aacb7245f4033b53ecf75ada2f8007465a629d" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00775-of-01024.json.gz": { + "num_bytes": 399284061, + "checksum": "97df92baa605c34ce857d380f1ca42f9e2a0de499ccaa9bab26a5c449451d1ef" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00776-of-01024.json.gz": { + "num_bytes": 396710162, + "checksum": "4b1ec54b82c8e5d969d3000ce547f4c20df16d9cc0b889b2b58c8839e9d8e27f" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00777-of-01024.json.gz": { + "num_bytes": 397265441, + "checksum": "03827ccc3c5bebbd12a04019e9797945c55becabf7f9c1f3fe5353513f5c5a38" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00778-of-01024.json.gz": { + "num_bytes": 396050013, + "checksum": "54aeadf4fe16949b2ee9438feabe979570e7587bb07b3c57e47422f662191936" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00779-of-01024.json.gz": { + "num_bytes": 397124991, + "checksum": "913e268b5474a8b4cf1426f5a0a06c7f437eeabbc35f0126481328b419f85bf6" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00780-of-01024.json.gz": { + "num_bytes": 395196367, + "checksum": "4c1a4f296916c30103a5dacacf8a167e43bb424d085ed3491b19f0ec1985d9f9" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00781-of-01024.json.gz": { + "num_bytes": 396578403, + "checksum": "a54f26c233662299ec8f0ae1bd266879e93cf4676707b0955114a1a80e2fcf61" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00782-of-01024.json.gz": { + "num_bytes": 396142106, + "checksum": "3713c6b725afd833063402e6577bc0ed003a87720f700f9272864c2360bfd260" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00783-of-01024.json.gz": { + "num_bytes": 396470511, + "checksum": "fe9d904a07ffb2581b6734c8dd847435b867d3043ce4b4840b1c54374919d757" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00784-of-01024.json.gz": { + "num_bytes": 398156228, + "checksum": "af762a9ff3eeb7ed4a56f54702911f0c190b97f8efaa02cb89b1626a1c44c9f4" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00785-of-01024.json.gz": { + "num_bytes": 397185035, + "checksum": "6629e1827aab88f55d53de24625f8362daccf910663db8584d959aa44f8043a8" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00786-of-01024.json.gz": { + "num_bytes": 396556703, + "checksum": "ce51603900ea0aad8981fbfa8d05d684bfef5360413dadc6933246c2dc81c413" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00787-of-01024.json.gz": { + "num_bytes": 396214799, + "checksum": "6eed5802b89d63eea115cbfd9e00f6d1b4970bb3600a887b904b548181a4acef" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00788-of-01024.json.gz": { + "num_bytes": 397965162, + "checksum": "eaa948fdaa744576f006bd70d54f129968772a479fb0bd8e946d7605857545d2" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00789-of-01024.json.gz": { + "num_bytes": 396280999, + "checksum": "e0b80ec73507f96310abf070e5cd17d5a67ffb4a337820a8b79a02afe81a0b99" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00790-of-01024.json.gz": { + "num_bytes": 396224660, + "checksum": "2b4a06fb6f68c773da34f8d4c33d7746b6a3206bb242042841e5e007fe3cb6ea" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00791-of-01024.json.gz": { + "num_bytes": 397681975, + "checksum": "1b167c20d0414d970cda74cd357cf07d69abd1d3fb0f57222028b369551d513b" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00792-of-01024.json.gz": { + "num_bytes": 396210611, + "checksum": "ab55128753a1e58d1032b8fd747c48158a721b12e85990627478f22b78e156ff" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00793-of-01024.json.gz": { + "num_bytes": 397534599, + "checksum": "e7476bde08e0065c523d09932cf2cf6ffe8ba023ae0ee435238efb5dd6f93d7c" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00794-of-01024.json.gz": { + "num_bytes": 396536137, + "checksum": "6228922504b2d3ebeef4735abdff06cc786d6533a6c150d50f34042aeeae1544" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00795-of-01024.json.gz": { + "num_bytes": 395235406, + "checksum": "9dae151c15898d7991417596a364e30f00e0ff6280f1505953e6de40c2e228e2" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00796-of-01024.json.gz": { + "num_bytes": 396226178, + "checksum": "1dc8decde490324087fcd06e4b1e17117606f2d61a80d506d89a12cce11ba291" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00797-of-01024.json.gz": { + "num_bytes": 398556774, + "checksum": "a454758e8cffccc88f83517a241f2457e683647949cde6aaf1e217de42f6a52b" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00798-of-01024.json.gz": { + "num_bytes": 396109677, + "checksum": "3daa6b8602517b9873db96522a2852d940d52cdf0fa86f259ac41a9cd688751f" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00799-of-01024.json.gz": { + "num_bytes": 397930210, + "checksum": "09dec669699a437d6fb78b3f2705028fb380b2eaa20ee73b77270216a48b8a95" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00800-of-01024.json.gz": { + "num_bytes": 394545441, + "checksum": "726f99301047519de253e3edbaef5f4a4f95e3850b1b98e01c7864499dad7833" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00801-of-01024.json.gz": { + "num_bytes": 395867151, + "checksum": "a97ef657bd8ea718427ffc686f55fc1786f0834755fce3ea3ae8402d9f75c11b" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00802-of-01024.json.gz": { + "num_bytes": 398573429, + "checksum": "20ee1f30272a0d5db74e8589be12c17173580cc9f14b039b3d33f3197816ef95" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00803-of-01024.json.gz": { + "num_bytes": 398084513, + "checksum": "31d1a8f6965d3a8cb7e28fa8bf2cb9a5609d4a129dbc630a8e2a939f475b2003" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00804-of-01024.json.gz": { + "num_bytes": 397815811, + "checksum": "edb758146d462848bdb113df90fa4b9f451eca6658cbd2cab147c8b0eaf88a70" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00805-of-01024.json.gz": { + "num_bytes": 398641802, + "checksum": "b916bafa7269ad4ed09c58c74dc3f098b529444609dafc57e6e4056aa6496ee9" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00806-of-01024.json.gz": { + "num_bytes": 397993720, + "checksum": "92fcc5881ca81b808c14f8c9960d873be70f857f95fd1e777b1ae1d4c62bbbaa" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00807-of-01024.json.gz": { + "num_bytes": 397743279, + "checksum": "79aca62194176964b66a90dda7631d01acc2a6abea1ba19a90076139e390170a" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00808-of-01024.json.gz": { + "num_bytes": 397076817, + "checksum": "a469391e432dac6967e841d46eaeabe9429849492a3df5e91431777fe9b9f164" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00809-of-01024.json.gz": { + "num_bytes": 395533122, + "checksum": "1278d928e105ea7d9c397ef1da79dcc8791dfad9177727aba098bd451734ce45" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00810-of-01024.json.gz": { + "num_bytes": 397468683, + "checksum": "5c6f3e7550827de9d7028decd82320a55722785394ea4951ee78f3ffadb2d4e0" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00811-of-01024.json.gz": { + "num_bytes": 397348260, + "checksum": "8c1ece72814dd82bf1bb663b76a40c58129c08540195f9b2134eff5837faa366" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00812-of-01024.json.gz": { + "num_bytes": 396753479, + "checksum": "b3770924d0576f7cd1706771c411f0f288277c6c6c922dc7af4017b665109a88" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00813-of-01024.json.gz": { + "num_bytes": 397977743, + "checksum": "864040da6f03f4d2ed2a9eae4daedf304e0d27196f0b522cee4e8fee55f9ea71" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00814-of-01024.json.gz": { + "num_bytes": 396168620, + "checksum": "542986bb3b75ffcfc853af11a80edb6a31e12527d2588f1c5b2119fe35d3f150" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00815-of-01024.json.gz": { + "num_bytes": 397639162, + "checksum": "a617c2f27306ce5de74ab756cbf74707fddeb0aa92277b66d0cd65be230f386a" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00816-of-01024.json.gz": { + "num_bytes": 398296204, + "checksum": "174a2e77e6562384cc4e7459ebf536db5cf4b530e4f1d7714e60d082ac7a19c6" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00817-of-01024.json.gz": { + "num_bytes": 396112543, + "checksum": "95af2c4f32efb4ed2a41cfa38dd2be09d51d4b0dc53ca8763309503f0276d56b" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00818-of-01024.json.gz": { + "num_bytes": 398371592, + "checksum": "67789e3525f2daf6af2551df12a50341c3ef51c89a9c714a8def76209b5b7460" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00819-of-01024.json.gz": { + "num_bytes": 396751420, + "checksum": "07431a263e2bb92c048fadbab74ce1399f76fc57a04d7f9e90cb33aa60a4c5e9" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00820-of-01024.json.gz": { + "num_bytes": 399213859, + "checksum": "83c03df95869973c2ed46c909c0e92e7ecd75317c06b09e447a62b592421d1c7" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00821-of-01024.json.gz": { + "num_bytes": 398408628, + "checksum": "b5cb8c52a8713c5291ccf29c171e9bd9b57a54211392a19e8f31182d1053a032" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00822-of-01024.json.gz": { + "num_bytes": 395429180, + "checksum": "8c47bf7a0d2b9c84d255df0e7da058fba2b4ca6da3c20cbdfe5a686e01cf5c45" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00823-of-01024.json.gz": { + "num_bytes": 395437149, + "checksum": "62818e45f34e70728494c74daa583e30c70aebf91c2f057470039f6d35059691" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00824-of-01024.json.gz": { + "num_bytes": 394503147, + "checksum": "e9fd88994b23531ba26e6859ec1985798a2ab9b300c2fdb1e202ac553ab305b0" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00825-of-01024.json.gz": { + "num_bytes": 398841091, + "checksum": "77ad5a9ac5e3c1d1180981bffbbdbf8a429854001d990258c615e0e16c8a9f6a" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00826-of-01024.json.gz": { + "num_bytes": 397404278, + "checksum": "06a39374c1cda19cc4b034c4877e1fd3bdc84290fdb621fdcdc77f3c5eea9a47" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00827-of-01024.json.gz": { + "num_bytes": 399316947, + "checksum": "fd27a73b130c1cf8256f22212e23799d0dd31281cd29bcf9bb658bcda457b66e" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00828-of-01024.json.gz": { + "num_bytes": 397514415, + "checksum": "3e7d199d05f885e8bba769d21a55a3f2ef2114b66ed738428ceb506fdf272ff2" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00829-of-01024.json.gz": { + "num_bytes": 397251538, + "checksum": "91650563e9520b2d1ec2cd726304b781b4156ffb68bc172635a53f425fa6bb0a" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00830-of-01024.json.gz": { + "num_bytes": 397653118, + "checksum": "893ef017cbf7d46c99d9c69ba74344cfc2800bb23faf93e7400c0c282422945f" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00831-of-01024.json.gz": { + "num_bytes": 397299276, + "checksum": "4eb3c91e52547f3b4af586f5bbdb0cdaf6a345b202a09c6aabff5c5f628b2948" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00832-of-01024.json.gz": { + "num_bytes": 396915924, + "checksum": "9fffd46fc1f1bce010484f2850102e2e153c5695c277efb67f65811630c2493d" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00833-of-01024.json.gz": { + "num_bytes": 397652261, + "checksum": "3b89df9375a906c96eb1e21a6572a07de2f5d875996c01c744933984edb1af1a" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00834-of-01024.json.gz": { + "num_bytes": 396070735, + "checksum": "b758b4cbfdfb799a8615ec9c3678b27dcd9b1d63af4f272879e0dae84cac9d63" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00835-of-01024.json.gz": { + "num_bytes": 398028152, + "checksum": "6e07f1e6a099aa496fef3015514fe5f3cc665c742f8a783389c7da4ce0e0e72d" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00836-of-01024.json.gz": { + "num_bytes": 395941604, + "checksum": "6bef1291a741ea5976749456185a3e3a03c3fcc9ac00370f28672ab39c552db8" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00837-of-01024.json.gz": { + "num_bytes": 398655070, + "checksum": "b0b7e1c826302417630c3e1b1877bf106beefb5a7a11feb9bbf1ac3712714fed" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00838-of-01024.json.gz": { + "num_bytes": 396374435, + "checksum": "3e9bdde8b73397a5fce143e91c92f9e66f46b45edfb30da1cac400b9aa7b2ecc" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00839-of-01024.json.gz": { + "num_bytes": 396388725, + "checksum": "4154322b97c600742660125e6458787e603cf1a44b49267f4d1c569387fd132e" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00840-of-01024.json.gz": { + "num_bytes": 397564603, + "checksum": "f9560028196fc934378389e355101e5e7f8fde9e5c921722704a18b24ebc5804" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00841-of-01024.json.gz": { + "num_bytes": 397001678, + "checksum": "0dad99ac959765280e6bf6d9d1a1468ef9dc9cc781e8f5bb832f7295e4e79f69" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00842-of-01024.json.gz": { + "num_bytes": 397139167, + "checksum": "e81fd683da081349629a0a7ae8ff7813351ed23caf4ef87041b64524034abc83" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00843-of-01024.json.gz": { + "num_bytes": 396044889, + "checksum": "d8e3a5b4148c7e86dea50ee5ba89ef55629d3550fd926c41754e5a26e7e52c36" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00844-of-01024.json.gz": { + "num_bytes": 397365441, + "checksum": "c4d2ffe853b55464961b707b6d0264d6852817077204a0380c906184c077012c" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00845-of-01024.json.gz": { + "num_bytes": 396477802, + "checksum": "7b3c4d435eca57a0fad05c106ec5928750aa01d95047618a3bc84e5342e912c4" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00846-of-01024.json.gz": { + "num_bytes": 395983616, + "checksum": "bdad2ba411291435ac0cdd083e46aa8369499f014a788fa85ed8c419fe9cb2de" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00847-of-01024.json.gz": { + "num_bytes": 397646062, + "checksum": "3f6bddcefcceaa4184161432e4f0b9292ae4fe7dac3079d4191a31a38f48c7bf" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00848-of-01024.json.gz": { + "num_bytes": 395958111, + "checksum": "5ed10d926e5fd1dcbc777df82391eb3ba57276c7303d488d6f3591022d20cc4a" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00849-of-01024.json.gz": { + "num_bytes": 396960036, + "checksum": "ab82adc6f66ab0403cbbb38859009a460e6c8c38c789bc2b2420da8b87096a9d" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00850-of-01024.json.gz": { + "num_bytes": 396603592, + "checksum": "5a6aa59a01504f5655d429dd5cb3ebc39e3994b22cbaeb5b09ceb29a26b94031" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00851-of-01024.json.gz": { + "num_bytes": 396511886, + "checksum": "f1954da7e217d893a0237a0f431dd2a9071723e543bf0f4943ce38fab048a44e" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00852-of-01024.json.gz": { + "num_bytes": 397626831, + "checksum": "f5cdcd7ec4f3c855a1006f9278ed4df50574a3fa7aa1c5a2e255ea5fa1a770cd" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00853-of-01024.json.gz": { + "num_bytes": 395811873, + "checksum": "24b1033da877ebddc09cfe2d3325868448dab9083b5147d6cfc4fa63ab402a94" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00854-of-01024.json.gz": { + "num_bytes": 396513614, + "checksum": "419952e0bc38cce474190c0b9ea581ccbce77da5e045dd60f5ff1fa1d2833d19" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00855-of-01024.json.gz": { + "num_bytes": 396493352, + "checksum": "3d2b529871c625fc9c1c59b9d5cede2a77e609041f1ea044d68ac16e9fa6a30c" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00856-of-01024.json.gz": { + "num_bytes": 396852729, + "checksum": "a3b56e6171fc2b14ebe67f6a71af688ea6135597bb8f8cf83e2fb460727aa5eb" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00857-of-01024.json.gz": { + "num_bytes": 396428653, + "checksum": "de550a5d608bffde45c149bc0d4c1165cbd3b5baab3d3529f006a02aba6d53e7" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00858-of-01024.json.gz": { + "num_bytes": 397039613, + "checksum": "11374c2685676ac2eb3dd0d281b44b512ff1d2968ab320d9c857b44304eb8ab8" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00859-of-01024.json.gz": { + "num_bytes": 396515194, + "checksum": "64879e565e5c467e630566ab75524bb300d58798c814637ffebd15646544cd5e" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00860-of-01024.json.gz": { + "num_bytes": 397764125, + "checksum": "7e22be61b3413c8fca2414087655b7ef7bef2ab5ee373fee74d13c8fb991675b" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00861-of-01024.json.gz": { + "num_bytes": 395314420, + "checksum": "29c451c69c8c05f6eee2741b9ef6c241f551257a45da8342a1d6bb341f80314a" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00862-of-01024.json.gz": { + "num_bytes": 397763845, + "checksum": "679668616899f548fb35da32c3e5f121002670cc3296c0c90f5bf45eb3ea1d79" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00863-of-01024.json.gz": { + "num_bytes": 397356206, + "checksum": "43c5b3af2173d4293396f336ec363aa2f31580b65128f44ca8bb891f2022859c" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00864-of-01024.json.gz": { + "num_bytes": 395463092, + "checksum": "77b7b6299955f4869e5db994fa6b20fe3007cf8cf2b6609442fb1ed49284cee6" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00865-of-01024.json.gz": { + "num_bytes": 396909291, + "checksum": "7eca0e82842b52f99640ab574e4b2446309aba6ac262f980fc6d249a337d06a4" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00866-of-01024.json.gz": { + "num_bytes": 397587651, + "checksum": "931014d99ab2a765ebf90e876694647c265ca5e6bf2b459eb027d6b06643a8ac" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00867-of-01024.json.gz": { + "num_bytes": 395992645, + "checksum": "0976a5389aed40e4bca89cf22382cf121390c75bd755437be474c097c8fee0ed" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00868-of-01024.json.gz": { + "num_bytes": 397789857, + "checksum": "6ffd848d165290a746a21767e79a9f046b70534aaf7b14fc01f9365e4e3f7d93" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00869-of-01024.json.gz": { + "num_bytes": 398124116, + "checksum": "5fb85058bdf40c0ee6cf748cda7483b1b3cfad18c26a90c2150c2a3f30ceeeca" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00870-of-01024.json.gz": { + "num_bytes": 396432487, + "checksum": "89d50aaa3620eac4ad593a403ea637b2ff090361ead05c3aa8c7a3351c66ad65" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00871-of-01024.json.gz": { + "num_bytes": 397484772, + "checksum": "490f4104981a9ab3ef04600a4865b9a2a18239e335d7fb7fff79ec1b7a225318" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00872-of-01024.json.gz": { + "num_bytes": 397240896, + "checksum": "d344994866bc49475f66e9937636afa787e1ff560e3f62dc1a0e4d0220d6ed39" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00873-of-01024.json.gz": { + "num_bytes": 395450398, + "checksum": "5d3b320aab1f7f09450531649666ded1aba8a9bbcf0f47992c43cb40a6d7a929" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00874-of-01024.json.gz": { + "num_bytes": 396365056, + "checksum": "346aae20204537ba2f4a865ca80b5d1c6da1e3a3b78d306d7570a69f185cc4fb" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00875-of-01024.json.gz": { + "num_bytes": 396679348, + "checksum": "ba81f9c1650d30853edbb9886dde84658c254dee5a3ac1062484f7194cd413f6" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00876-of-01024.json.gz": { + "num_bytes": 398278881, + "checksum": "88fb38aad7cadd76c818dbe7a372144dfe17d110f7d2123a80d14686fb43a6dd" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00877-of-01024.json.gz": { + "num_bytes": 397051868, + "checksum": "049e4a62056c98284b35d10a74ad5ef7014265a6dccb99a71f93a409933a685f" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00878-of-01024.json.gz": { + "num_bytes": 396132123, + "checksum": "bb7b97a82bd6d31612de66a03af35d404b15808b925e7fd94bd0a8e9e928b927" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00879-of-01024.json.gz": { + "num_bytes": 396520374, + "checksum": "2a56fed53aa022e6a7956f604d54d99af89a15b6c7fc6b037f94d347f1d15f51" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00880-of-01024.json.gz": { + "num_bytes": 397004524, + "checksum": "1cadef434909d4508a9a6bf40d6a9323256f3089615a5d2963c83040d5f549f8" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00881-of-01024.json.gz": { + "num_bytes": 397336334, + "checksum": "0e36dcd0eb1773eec15ffd0fbbe8951343bb6961dd1838b51e74da2e055db176" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00882-of-01024.json.gz": { + "num_bytes": 394949798, + "checksum": "78c99406cb921c2b8f5b86e4e7eeed24c799678732e5a5450db6b12b7ceeef61" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00883-of-01024.json.gz": { + "num_bytes": 398647721, + "checksum": "f0e7a0a9970c7fdb5f629771e76bb06bf62b79e9cbf5008e866f954dd436401b" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00884-of-01024.json.gz": { + "num_bytes": 396040500, + "checksum": "05272a55eb2840f94a7dcc30a8d09b957511b983b0fc3fa618a8995bc594d055" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00885-of-01024.json.gz": { + "num_bytes": 396460591, + "checksum": "27511aa50410260d261866dc970b897b10a95dd4dfd92b0bc3a5fc41e6c75335" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00886-of-01024.json.gz": { + "num_bytes": 396149133, + "checksum": "e66ba9c7ceca631a4b43ecff1e151524a209368f298ca83624476ee9144cc3cd" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00887-of-01024.json.gz": { + "num_bytes": 397164216, + "checksum": "95e341054bd8a21e7f49e4a5aaa5fbe51517ff631e66e67ff1cdaea6e3178002" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00888-of-01024.json.gz": { + "num_bytes": 398216402, + "checksum": "6fef57de31fa1692d8a4021b317554688657fad3f55dc144e2971d63083e7879" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00889-of-01024.json.gz": { + "num_bytes": 396976936, + "checksum": "36da1bd0eaa27ca6e8510a3c005695fbbd7b0fedf63f077e3787590d4b1af625" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00890-of-01024.json.gz": { + "num_bytes": 396903125, + "checksum": "6bbbe5db2c0938efe5f8afe7b30765f45cedc9fd4209bb7826c489381175bc5e" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00891-of-01024.json.gz": { + "num_bytes": 396404354, + "checksum": "47601b1b1a0a725c32ae0c32364f7ac188b7e8c68d29a2dffbe1a4dbe39393f4" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00892-of-01024.json.gz": { + "num_bytes": 398144052, + "checksum": "a7b6bdafa5a226c22ccdf97c873e4915ed8dd8b59e2820a4dc62f600b4710175" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00893-of-01024.json.gz": { + "num_bytes": 397990484, + "checksum": "12f08cfa1fb4f94a3d7d9584cc3f5ae9fa518cc095e4cb07939d02ecfb7ffd9b" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00894-of-01024.json.gz": { + "num_bytes": 398271782, + "checksum": "004bf46ac7c8d7770b458ec341322f5cef643926aff9255954f08faa1dd43d53" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00895-of-01024.json.gz": { + "num_bytes": 395489909, + "checksum": "3ea14b3dbd7a4c9cb7aad83d1311d335714aaea5b2dd0374debd63c56d02dcbb" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00896-of-01024.json.gz": { + "num_bytes": 397589097, + "checksum": "c0f1c7e54bf7a808f66d2acc9aec79f1ce936ba480f5d1e379c6853714413175" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00897-of-01024.json.gz": { + "num_bytes": 399215096, + "checksum": "20958123acf2d578448a5166f1209b0452db33ed395cfe512015106bf99ad31d" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00898-of-01024.json.gz": { + "num_bytes": 397044516, + "checksum": "46c5145069d861c04b2ac1afe80c4c4453f91869f6cb6a1d9f7b648f1b08942e" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00899-of-01024.json.gz": { + "num_bytes": 397687759, + "checksum": "2a3923d8ff2ce0eab5978a8e0198bc2d1512cfa19c69e673e048b8eaa72f82b6" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00900-of-01024.json.gz": { + "num_bytes": 395192267, + "checksum": "9cc72deeea7fbc0fa3782c41938d66315923dd9f53d89f47c00f85f93e454ce5" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00901-of-01024.json.gz": { + "num_bytes": 397806320, + "checksum": "8cfff74f280636416f523c271f75e5704a570db4cddb8a70d033158868c21347" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00902-of-01024.json.gz": { + "num_bytes": 398450537, + "checksum": "7df8804eb5ecb79177001f9ce3c66f0ad20cccd8151e817816e9342d07c392be" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00903-of-01024.json.gz": { + "num_bytes": 396733151, + "checksum": "89551a52d1e97b4ec3007f8c43191c1ae1475d0ba5b48d20818a12c85b0add74" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00904-of-01024.json.gz": { + "num_bytes": 397497719, + "checksum": "2bcde59dfaa642722969d1401a4ce43a35c57930bb1d664371efece1e2e91c32" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00905-of-01024.json.gz": { + "num_bytes": 395760696, + "checksum": "ec844272b0666a455dfe0cab065e00df44e8da2156a03797100418307c96830c" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00906-of-01024.json.gz": { + "num_bytes": 398496346, + "checksum": "ff68909d470edef08929a91068e1de02841c16a000fbbd17ef042cb76f1fff37" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00907-of-01024.json.gz": { + "num_bytes": 397085405, + "checksum": "a9b26676af61a6a1355225bce5bbcd67aeaf0fb7dc2209f30235b275536baa85" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00908-of-01024.json.gz": { + "num_bytes": 397037103, + "checksum": "e86688677a46103b0b224333faf1b4f89da062e4ec0ee35752c91ff9772697c7" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00909-of-01024.json.gz": { + "num_bytes": 397394775, + "checksum": "93082177607900bfce7fc53f1665a831093bb50caea33e014f327181579c0012" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00910-of-01024.json.gz": { + "num_bytes": 396668466, + "checksum": "dcfe639607c18a309e2c91864a6912dce3851abd62bbed3ba16390899e637327" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00911-of-01024.json.gz": { + "num_bytes": 397926997, + "checksum": "aa995c38d953237b1d6d53be7237958a00ca2dbab4a753c7c4404849fb416d5d" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00912-of-01024.json.gz": { + "num_bytes": 397810240, + "checksum": "e3f17ac285e8c9b04713713a957602a63e176f476d4a67018012e9cf2a3e5a84" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00913-of-01024.json.gz": { + "num_bytes": 397143597, + "checksum": "4082ab833be47cf881693ea4442e3940625e0d2c1117e15234886fdfa779bce3" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00914-of-01024.json.gz": { + "num_bytes": 396398347, + "checksum": "7c62dfd17b21ff64af640e4aca8fea0240998596d11ca551a3ab045d5041fcac" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00915-of-01024.json.gz": { + "num_bytes": 398622100, + "checksum": "69abe67cda4b1613d5f741804ccdb294cd5f457027818d9366db8cf2f5f40871" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00916-of-01024.json.gz": { + "num_bytes": 397387266, + "checksum": "6effa83cbf3345fd7e41e432ef82156bb1334f2cf17589bce313aebee9727131" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00917-of-01024.json.gz": { + "num_bytes": 399730979, + "checksum": "f0d0ff1ae76a84c07647fa1517410533862f1927fa85dbf38017dabf4607bc1f" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00918-of-01024.json.gz": { + "num_bytes": 396895902, + "checksum": "84cc56e725be31047d0b6a025cfacefc462f4a1a546feaa34af95a6f25a4e1a7" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00919-of-01024.json.gz": { + "num_bytes": 395247578, + "checksum": "daa3156989ddaa9a7eba228848697ccf6a385679359ab765881d2293bef107aa" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00920-of-01024.json.gz": { + "num_bytes": 398305242, + "checksum": "2a9e02ef643962f6009e42304b983c87bae7b74c1edcbf8e6808b320ea7ea776" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00921-of-01024.json.gz": { + "num_bytes": 396446011, + "checksum": "f83526ad11d81820fce4231e3303d613dbbe56a8fae878d9442c8d7e98023437" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00922-of-01024.json.gz": { + "num_bytes": 398010331, + "checksum": "e47cb9d7550644ef807c3ea9e19ca4aa1df54eb908b54651bf0e17f0ded9157d" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00923-of-01024.json.gz": { + "num_bytes": 399160018, + "checksum": "470401e5b0777096806113a36dcb92b8d453d6e8f5f4f0b15df2788e382ca03f" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00924-of-01024.json.gz": { + "num_bytes": 396880756, + "checksum": "c86e546c68bf8458951fa723c086d6efa5b210f53cd4fcb2de4b9efc7a71a275" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00925-of-01024.json.gz": { + "num_bytes": 396806561, + "checksum": "5d9b1105c0053dc9530c911046f4da458f41d92c771282d0df8a3a22838feaec" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00926-of-01024.json.gz": { + "num_bytes": 397479994, + "checksum": "c3253305ac4ef226501e4fd4a6acfc6067a76c084ad852eb2a9f5916aa3d51a2" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00927-of-01024.json.gz": { + "num_bytes": 397083225, + "checksum": "8931df0ee597f72ea3592d0a4d236ce655a92cf4e7eb9298145f496246c18c21" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00928-of-01024.json.gz": { + "num_bytes": 398000839, + "checksum": "5e29e75231bdb413dedd1211bd87e9fc3f4ab8bba41999afc1ddcddc16f4599a" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00929-of-01024.json.gz": { + "num_bytes": 397731309, + "checksum": "03f7a9199b7927a6d78a8aa4eed32c250d32dc409e3bb2847d7db948ee63d46c" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00930-of-01024.json.gz": { + "num_bytes": 398133003, + "checksum": "b22a79dc228697394d0ce25b7d31112f9e1a6508cdc4b57af35e84e65167bfeb" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00931-of-01024.json.gz": { + "num_bytes": 396694508, + "checksum": "dbbc65db3d442f9ace85498a3b27bb598c20cea171b3de17d409f9b989c262d5" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00932-of-01024.json.gz": { + "num_bytes": 396255463, + "checksum": "02af4162b084004e99dc6862c88749545593e342a83523597cada140e57a0ab7" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00933-of-01024.json.gz": { + "num_bytes": 399013035, + "checksum": "dc4d3b4f03c36a8f1393ba15195c3f64b128862b812839689fa387e708ffabaa" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00934-of-01024.json.gz": { + "num_bytes": 396593138, + "checksum": "02a5a8e02b2636c9e912a9ef8a79ececde4f4fc92bea74e59791d181bec104cd" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00935-of-01024.json.gz": { + "num_bytes": 396748502, + "checksum": "05d1d6290580d5c74b906ab03fe6773ecaaa1ff3be84dfdef48d1a2e7f5e1120" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00936-of-01024.json.gz": { + "num_bytes": 397737673, + "checksum": "351d3543b1457da9719061948a1b4bdd79be8a0b786ecd6a9a8cc0db49cd2181" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00937-of-01024.json.gz": { + "num_bytes": 395377872, + "checksum": "d431b01bddcf911d7da5bad74a78d0d1527d60d9720f77868ef08e1a65850986" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00938-of-01024.json.gz": { + "num_bytes": 397193715, + "checksum": "bff5e755b174e3608ba72b39898a2bb5e9ca6d3362b70bd66143566aeff52690" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00939-of-01024.json.gz": { + "num_bytes": 398044482, + "checksum": "03facf22c376f03a8078e99d1dcc1c22ed5d7e179de472019cae894f40c7a4ad" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00940-of-01024.json.gz": { + "num_bytes": 398894204, + "checksum": "3d3a2125262ee8ca498cd54db52fe626d010a2a93c000ea2b45f931e491ea9e5" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00941-of-01024.json.gz": { + "num_bytes": 396758197, + "checksum": "b3957de08e7779d8ec23af02a6d709189796314c70a99f46c90d0bfbd14ad561" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00942-of-01024.json.gz": { + "num_bytes": 398181993, + "checksum": "74aec8dec794c79683dfe43d8aece4c1c47c5389aa6d4bea847ac461cb5ba21f" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00943-of-01024.json.gz": { + "num_bytes": 396271547, + "checksum": "231f63d05f81d249f618768c9f712cc31314dacf55a6004902a0e7d0bfb13724" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00944-of-01024.json.gz": { + "num_bytes": 396603419, + "checksum": "d5661730f3ed6cc5bbc5d935a6f1ac7d241b40c52dc83775a421e7a1a672f518" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00945-of-01024.json.gz": { + "num_bytes": 396596660, + "checksum": "3b5aeb0786dddf0b9cabe2ca071283b276822e2861d8688e38f927595c159b02" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00946-of-01024.json.gz": { + "num_bytes": 399900563, + "checksum": "6d5549970af2c6987583477991552e1944b411642782c07d17eb52f91e714a1b" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00947-of-01024.json.gz": { + "num_bytes": 395391489, + "checksum": "f5544ecb42c385cd5d5120c82140e4a36051f6a401d89ce30c8f2fc08cd69804" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00948-of-01024.json.gz": { + "num_bytes": 399257562, + "checksum": "1448cca7f1b9824adcf8437a33d14a7e95b705396611f82e7aba9a69e0a25118" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00949-of-01024.json.gz": { + "num_bytes": 396371965, + "checksum": "a7eb228f1d1ff2744af3d1a1358a94611cd92c25d81edac0e209b9f81c8a0a60" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00950-of-01024.json.gz": { + "num_bytes": 398022110, + "checksum": "8651693d2180e518039da487f638c532c53f6d79a33356922b2d8706aa6a83cc" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00951-of-01024.json.gz": { + "num_bytes": 396224338, + "checksum": "c46bc8aa1621153fbd913b5d0b23a82352a28b36ec997c4df4b92dcc6ef26895" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00952-of-01024.json.gz": { + "num_bytes": 397581207, + "checksum": "02775930e3c420978a9d2785ee0137c3963dba7bc34538b2155eb38dd6ee89a0" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00953-of-01024.json.gz": { + "num_bytes": 397045599, + "checksum": "9d54940cb594de6e0f8593f64293e96375f0a5c56f3569c72720476bcef1f1a5" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00954-of-01024.json.gz": { + "num_bytes": 395457873, + "checksum": "3c12a1c3061164f345d9e402bed28be9af84ef56d5df1b22a3cf9f818ed47ae8" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00955-of-01024.json.gz": { + "num_bytes": 396450938, + "checksum": "45db78bea4fae6cd69d900c581fccda873d2aa9f24ac5e9dfc18b486c15c3788" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00956-of-01024.json.gz": { + "num_bytes": 397120474, + "checksum": "7db7ea23446bd8a66737546c5daa0c2dec7bd5c4743f52eb53685ccbf54d9b17" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00957-of-01024.json.gz": { + "num_bytes": 397403279, + "checksum": "89de2950bc3f7dd4f95d8a0b7cba19e9678bfbc23175bc22d9f9599ec1ad9cd0" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00958-of-01024.json.gz": { + "num_bytes": 396861933, + "checksum": "f325478647cbec9d79bff2266672144147276a82f665d3014c5d2fa9c112c387" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00959-of-01024.json.gz": { + "num_bytes": 398439950, + "checksum": "70d786bb337c012269caf6aeea3bf9604d279d3e4335294c72ca6cb5a9fbd951" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00960-of-01024.json.gz": { + "num_bytes": 395684257, + "checksum": "e1d170b0a4d6954a920ef3923688a7dbf40398609ed2ae04b2635df9ceb07821" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00961-of-01024.json.gz": { + "num_bytes": 397526287, + "checksum": "47b90e3747f35bf67c872d65d843f6dd9bfca15dcb769b31bf3586c6645858bd" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00962-of-01024.json.gz": { + "num_bytes": 397473683, + "checksum": "d0ddb2c104f515144265bd3eed526a65ada46f848183688b420694751b113272" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00963-of-01024.json.gz": { + "num_bytes": 397964876, + "checksum": "74725b631c1699b1166589eaebb66374c031b170eab3ab359230cd4a23a8ae79" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00964-of-01024.json.gz": { + "num_bytes": 396523661, + "checksum": "fa0d49a2cc726628d9a1b5ae2ace52ee90401af8ae15add27c3f4566dd99a79b" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00965-of-01024.json.gz": { + "num_bytes": 399289514, + "checksum": "11fb1878a8b204181f7f776a764f5e9e577d0fe62d4b2e4ce2164ce9fcc30b8f" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00966-of-01024.json.gz": { + "num_bytes": 397411408, + "checksum": "5646014ca3c99f53bd13183187b1e6e8f84cb6c846d6f1f3a3c82edb4accc47e" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00967-of-01024.json.gz": { + "num_bytes": 395095282, + "checksum": "b799b17f36d85235eaf1bed9f4f760a22b75fca736744218e44fae5917a2286c" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00968-of-01024.json.gz": { + "num_bytes": 397189410, + "checksum": "8d9748f5a92a9e0b836fe74b962bd2da04b62a0a2943ea5e440cef19166a5479" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00969-of-01024.json.gz": { + "num_bytes": 395651742, + "checksum": "f42c71219641fa302692698b4944864f27b7f87d4477a86babe23745dad72715" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00970-of-01024.json.gz": { + "num_bytes": 396180197, + "checksum": "383d9586f27579b4a97c5901013b3e025f10dc813047d65158d6621430803aec" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00971-of-01024.json.gz": { + "num_bytes": 396574555, + "checksum": "d2c9700fbac454d3b3a42b2a3c4eb0111eb7cca7cab3d545b0912aba60415c91" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00972-of-01024.json.gz": { + "num_bytes": 399639122, + "checksum": "5d59e643bf20156a28e5e9dfcd811c5a6c3779e1875f375db09a0fa1871dcc90" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00973-of-01024.json.gz": { + "num_bytes": 395456709, + "checksum": "8b22e82588e30f30f664895b9716cbb0cf38d5ff4331d3be31ab25663c634a00" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00974-of-01024.json.gz": { + "num_bytes": 396693438, + "checksum": "5fba4f9d634d968f15d5d4fb29d253646494e3e125aaf1c2f8fab38a7e60180b" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00975-of-01024.json.gz": { + "num_bytes": 395697641, + "checksum": "b4c5fceb9fa2397a9b7c75249bd3386b8dbf999d5b52521051a86e067d698448" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00976-of-01024.json.gz": { + "num_bytes": 397172005, + "checksum": "093aa01a944a222828656d31dacd8ecd57a24a51d361a8742514bb6af009dce9" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00977-of-01024.json.gz": { + "num_bytes": 396182407, + "checksum": "1beef6e248c00abee5f8952641b12d3f5b12d58adc05c8d461c0a073a6ca9b39" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00978-of-01024.json.gz": { + "num_bytes": 396180428, + "checksum": "0f2bb125af300de2c9fe347899673a4bd2842ba8298146bfe94c9eddc41893cf" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00979-of-01024.json.gz": { + "num_bytes": 396479117, + "checksum": "1fe9d0e54b9be79722e6483e386801263ca51d6e9ad925dabbb58a38c4df877e" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00980-of-01024.json.gz": { + "num_bytes": 395119279, + "checksum": "0f262ff2d4701497f6fd6d4f9d3cb1aa3a730ad6bef1961d890a3b0cb4747ee8" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00981-of-01024.json.gz": { + "num_bytes": 398285798, + "checksum": "a295b85e63c176cecd9f5222ba417eeda307e41847eb38c61dec9b83101a8256" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00982-of-01024.json.gz": { + "num_bytes": 397811687, + "checksum": "2a3a0e0f454dd72a68ed1dd71c508a9b24fb2349ffdfc588cbfcef728cbaff05" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00983-of-01024.json.gz": { + "num_bytes": 397069906, + "checksum": "5b4256392755c4dd79cd37cd6ede645a9a549c4436acd27495e974ebe1d80bc7" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00984-of-01024.json.gz": { + "num_bytes": 397670152, + "checksum": "68d4f5dbb3fa349a6811edce8056eb297e771cb9c9939c3a84d30c6ba3ad9dc2" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00985-of-01024.json.gz": { + "num_bytes": 397949975, + "checksum": "6ba478b8a1ebf3b1dd67ed7b4a055cc9cc3c01bc90c1852aea8f5a99f6c07e69" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00986-of-01024.json.gz": { + "num_bytes": 397730984, + "checksum": "a39a23589cc434e573613e3ead44f33adb005c2c13cea8b33601647c97300fce" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00987-of-01024.json.gz": { + "num_bytes": 399173506, + "checksum": "eab46d9d0a0cf05dc5ba475017d98f02f1cfd756c8e707d9823a0463713ebf23" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00988-of-01024.json.gz": { + "num_bytes": 398674037, + "checksum": "88749d380aac85314df66448542b696e9ae6f61f1b27dc395556737f59ad9024" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00989-of-01024.json.gz": { + "num_bytes": 395313344, + "checksum": "bc565b662396e3ab4e108635e01873014515663bd5216926a59ae80f6cd4273b" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00990-of-01024.json.gz": { + "num_bytes": 398567254, + "checksum": "e9b9bd97a30ccac353a2386babbd01c3a3bbede8c07bc28d17aecc7ef5af6330" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00991-of-01024.json.gz": { + "num_bytes": 396958611, + "checksum": "505ab5458d5e52d656048284fd22cc0fcd16e49ba19331669239be37645cb04e" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00992-of-01024.json.gz": { + "num_bytes": 396102263, + "checksum": "59ac5b2b04f224be04a4ceac6a16e29a33681f19cd40cbce3d3e8eb961b9f33f" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00993-of-01024.json.gz": { + "num_bytes": 396935362, + "checksum": "c804f2311de9f7ae5691280e16261b9f8385ef9a71929b2111dfade532b6bdd7" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00994-of-01024.json.gz": { + "num_bytes": 398832432, + "checksum": "594727bdc3756e678bd4d156216712ed6c8fc98d3f8e9594cfbed10b2e414554" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00995-of-01024.json.gz": { + "num_bytes": 396699737, + "checksum": "bb3c73c6d48aebf9c60cde56944faa5bb6727db4cc48ae23d67650742462c42d" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00996-of-01024.json.gz": { + "num_bytes": 398059244, + "checksum": "ac1a7e6e2c2a5468c704f5a2318b5617dd4ce140b98271e2034e00015db6cd76" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00997-of-01024.json.gz": { + "num_bytes": 397439167, + "checksum": "ce9664b29c86c05d3541aee377acdca7a32ef8f0220e0b4b6bf18276b692529f" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00998-of-01024.json.gz": { + "num_bytes": 397383159, + "checksum": "1b4db1b59255f106dd2af7510112eef6d6b611d9f9e000a0e585b623fdb8ae98" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00999-of-01024.json.gz": { + "num_bytes": 396339114, + "checksum": "ee5e1508704b03f0a9cb3c4bfb578c08fb83a4d20760e3b40f101c58cbbb3ec7" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.01000-of-01024.json.gz": { + "num_bytes": 395172166, + "checksum": "f8cbf0bd9c2b90e588942048848fbfa1a20cf775364cb9c84b4d5dd7cf19e603" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.01001-of-01024.json.gz": { + "num_bytes": 396629363, + "checksum": "7cad3f9a28e5988ef91073c48e9d85ea7030289690f817545cfa9f1165dd33d9" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.01002-of-01024.json.gz": { + "num_bytes": 396507390, + "checksum": "b4ae1017913509855d6d8d4413ff3de4a8d519d91f354b6e5b5267219d20658b" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.01003-of-01024.json.gz": { + "num_bytes": 397652598, + "checksum": "0c115446c159d27e6e1354173ebec29e6dff5f38c4d2ddb46c07c450523309c9" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.01004-of-01024.json.gz": { + "num_bytes": 397408971, + "checksum": "f0b559a832a9ee50225fe1417d936d6b898026d80a105b976deaeae75f9e30a0" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.01005-of-01024.json.gz": { + "num_bytes": 397753911, + "checksum": "e001c9285ade7de6ac23716b596ddcc733f05bd6abd7e1a67874894c93fbd43a" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.01006-of-01024.json.gz": { + "num_bytes": 397962701, + "checksum": "acf13433824104e4bfc3a8aaf8805eb16712cd97b2dc1d48e7d771bee4bd41c0" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.01007-of-01024.json.gz": { + "num_bytes": 395966285, + "checksum": "4c6069f6a95d036fd3e05a4246db932ad5ab89b9470274f23a17df0b77b9b717" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.01008-of-01024.json.gz": { + "num_bytes": 397075505, + "checksum": "9b3b9c0cd4ee02e18a5d22142183874586da8fd23b4f97033e354f9681d150a2" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.01009-of-01024.json.gz": { + "num_bytes": 396881470, + "checksum": "14d2d7cf2ebf3b2c73bad4a6099fa1d2b1cb341b100976b03232fb664a7d020e" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.01010-of-01024.json.gz": { + "num_bytes": 397471393, + "checksum": "01e6f56bebe0c874d82135f551a6b917759c41af48d127df181267dc9b8f6486" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.01011-of-01024.json.gz": { + "num_bytes": 398092801, + "checksum": "ead5b6b13bd09136fccd9548c224398401bda0ca7ff62ca4db852760760f13d3" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.01012-of-01024.json.gz": { + "num_bytes": 397831436, + "checksum": "daa2d1507f9b56de0c4aa9d86d93259c1e6f73f0cdfd553ce075a16807dbcb56" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.01013-of-01024.json.gz": { + "num_bytes": 395098326, + "checksum": "c2b21a1a56e9879335c72008919e8f7998dcc1e8df2258fdf2196ea86194e3cc" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.01014-of-01024.json.gz": { + "num_bytes": 396164077, + "checksum": "0df125946c83c66c6961eae2aa45ad7eea7038d808281d633ce30686a8245e01" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.01015-of-01024.json.gz": { + "num_bytes": 397895284, + "checksum": "f6f6eee8fc113b7e717654b9305cc5129c3ee1ce9f263b91f0202762f078a526" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.01016-of-01024.json.gz": { + "num_bytes": 397723033, + "checksum": "48426df1f4665d3179251904c96a0e73c041ed5b57885b4dd852809e632685b6" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.01017-of-01024.json.gz": { + "num_bytes": 396761053, + "checksum": "f33cf2d744585e0338b29a5a5638752123b7b59f9ae3b723cf7e7b536f9f80ed" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.01018-of-01024.json.gz": { + "num_bytes": 396562520, + "checksum": "72adb0869cac573282c4bd938cdff556f659540dd4a0a6663711974cb2dc147a" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.01019-of-01024.json.gz": { + "num_bytes": 397564701, + "checksum": "3b64235effaf41ad61698b2c28f4d73ced1b6ec6b6d79e0f52314176fa0feb12" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.01020-of-01024.json.gz": { + "num_bytes": 396053080, + "checksum": "b16b9f815823d176f94388d4c482652ac656aa763ec738ccd8c8a2a3bdefc1e9" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.01021-of-01024.json.gz": { + "num_bytes": 394731398, + "checksum": "f4c0044abadd339055bf13843938eef4c066856757250fc15f77060fc0881ba6" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.01022-of-01024.json.gz": { + "num_bytes": 396548645, + "checksum": "5ecd8432526eda57065e6161f0618a19cd5993c7dfe86575775f1bf01836f750" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.01023-of-01024.json.gz": { + "num_bytes": 396863581, + "checksum": "c6cd29b8f6067152ccd584ded81df1f9cb905515d48815b8a546d104ec7a3565" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-validation.00000-of-00008.json.gz": { + "num_bytes": 50774357, + "checksum": "7cd6c8b1072af3f3ca3fa160d9411960908142743b101f7229223e6658acb42c" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-validation.00001-of-00008.json.gz": { + "num_bytes": 51252663, + "checksum": "d36ef5fc04b24117a19d992de06400e5f290f11786be99be9de68818f7495694" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-validation.00002-of-00008.json.gz": { + "num_bytes": 50860289, + "checksum": "ab8b3dee7c0698c3cc3a74f159d85495b6bb9529600ef9246bec218ae6775e28" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-validation.00003-of-00008.json.gz": { + "num_bytes": 50141661, + "checksum": "54d62c9359000b99713a8a0a0fdfa415f1c09824555526f01dc7217b068542ad" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-validation.00004-of-00008.json.gz": { + "num_bytes": 51141505, + "checksum": "c11e31de558613237533b41354ca29f0635b599a1c9232517dbf4c2cb1197319" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-validation.00005-of-00008.json.gz": { + "num_bytes": 50797157, + "checksum": "20d39c0f52c34a3148c0a235238ed3849576ed895c3a43cb47b0159bf233c7d5" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-validation.00006-of-00008.json.gz": { + "num_bytes": 50158887, + "checksum": "754a2b7f134bf45f17db7450d5c0eaf2b8824e4a6072be7b20db434f9cb7968f" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-validation.00007-of-00008.json.gz": { + "num_bytes": 50232244, + "checksum": "f90c1d79c51ee1a009dc05930fc40e9ee4c3840ca2412cc129855156aaddc279" + } + }, + "download_size": 407016751197, + "post_processing_size": null, + "dataset_size": 2060282008734, + "size_in_bytes": 2467298759931 + }, + "realnewslike": { + "description": "A colossal, cleaned version of Common Crawl's web crawl corpus.\n\nBased on Common Crawl dataset: \"https://commoncrawl.org\".\n\nThis is the processed version of Google's C4 dataset by AllenAI.\n\n", + "citation": "\n@article{2019t5,\n author = {Colin Raffel and Noam Shazeer and Adam Roberts and Katherine Lee and Sharan Narang and Michael Matena and Yanqi Zhou and Wei Li and Peter J. Liu},\n title = {Exploring the Limits of Transfer Learning with a Unified Text-to-Text Transformer},\n journal = {arXiv e-prints},\n year = {2019},\n archivePrefix = {arXiv},\n eprint = {1910.10683},\n}\n", + "homepage": "https://github.com/allenai/allennlp/discussions/5056", + "license": "", + "features": { + "text": { + "dtype": "string", + "id": null, + "_type": "Value" + }, + "timestamp": { + "dtype": "string", + "id": null, + "_type": "Value" + }, + "url": { + "dtype": "string", + "id": null, + "_type": "Value" + } + }, + "post_processed": null, + "supervised_keys": null, + "task_templates": null, + "builder_name": "c4", + "config_name": "realnewslike", + "version": "0.0.0", + "splits": { + "train": { + "name": "train", + "num_bytes": 38165657946, + "num_examples": 13799838, + "dataset_name": "c4" + }, + "validation": { + "name": "validation", + "num_bytes": 37875873, + "num_examples": 13863, + "dataset_name": "c4" + } + }, + "download_checksums": { + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00000-of-00512.json.gz": { + "num_bytes": 30085821, + "checksum": "6666a680b0a34eb8756dcb5fd2b12f0078237f3502e8a513bd3e5b71bb92be00" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00001-of-00512.json.gz": { + "num_bytes": 30065900, + "checksum": "61c3f9ab763067f76d9bea349d86efb97af7539d481b5d2807f362204971c327" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00002-of-00512.json.gz": { + "num_bytes": 30028880, + "checksum": "3aa4405d957ed42d10d643efe7c0f51b05e8f29cf4ad8783448083c1cd3f2a24" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00003-of-00512.json.gz": { + "num_bytes": 30136880, + "checksum": "f6eb49e4c0d691e67fe96ddeb3f8370c5e63a7297a31a8da0c58f5cb3a9f6061" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00004-of-00512.json.gz": { + "num_bytes": 30110499, + "checksum": "6e0908780f555f4b74c6a5055e2c9708333a8466f0b8723a8ea38cc04828ce44" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00005-of-00512.json.gz": { + "num_bytes": 30097927, + "checksum": "a333562df3fcd4c5ccf51b4c00e11f6619ac4a28a878383aefad277bd30131a6" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00006-of-00512.json.gz": { + "num_bytes": 30013820, + "checksum": "7c436cd0993077187988239cf74c3e64de440dacad62ba4b02bd4ac0a8d219b6" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00007-of-00512.json.gz": { + "num_bytes": 30557005, + "checksum": "dc9e43681c404fef1741e9608295b8dfae0953473993f3fc44fb83af07a6b82b" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00008-of-00512.json.gz": { + "num_bytes": 30369535, + "checksum": "8de7a4005acdb60436b4e5d7274084e28df3aee31a5457c6837452094544c541" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00009-of-00512.json.gz": { + "num_bytes": 30033048, + "checksum": "32310a6c74cbee1dbb8b196e0cfad41f79e88e48d8f04c88692d42506113b903" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00010-of-00512.json.gz": { + "num_bytes": 29948345, + "checksum": "b7df217de849e26ecce5ed7a35b6e6238fcc1c08e969023f209307842dd496c0" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00011-of-00512.json.gz": { + "num_bytes": 30558885, + "checksum": "82e5428aaeecf27141a7105e48b78dc02516ae6ebc3d6cd4ef13963316279e1f" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00012-of-00512.json.gz": { + "num_bytes": 29888513, + "checksum": "f3d7e496b7c85ed7d020c8f8a24a0b27f9b2535abdb22b45c08441a29398c44c" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00013-of-00512.json.gz": { + "num_bytes": 29936292, + "checksum": "bf04d82f0cdddc09ce4aecd9f71910b9858badaf6456253d43d89e6a8c56cba7" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00014-of-00512.json.gz": { + "num_bytes": 30169338, + "checksum": "15b4611513154de0dfc1c9d470326fd053adf70de814ecfe8ba7ccee66de947e" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00015-of-00512.json.gz": { + "num_bytes": 30071363, + "checksum": "887bdea83bdefc50786c93e8014d1d49999f8090ff15168598c884cd0724fec2" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00016-of-00512.json.gz": { + "num_bytes": 30451660, + "checksum": "288ad0d553d54052354be506f87878fa7c54b0fa65811c6e456b3262e1d117e1" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00017-of-00512.json.gz": { + "num_bytes": 29940254, + "checksum": "b13ad58ae9f38598cb9d560e3ab34c1d0200db73fe86da12230e50086b532463" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00018-of-00512.json.gz": { + "num_bytes": 30282186, + "checksum": "5a67e71955ab2d8f6531bd3949cd8ab71f4ff91863ea5a6ec3e7b33c31a05dd6" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00019-of-00512.json.gz": { + "num_bytes": 30373907, + "checksum": "a70682315a0cfe0af815c7b2abbcd63310fabbc33ad6e19daad19f1f51506955" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00020-of-00512.json.gz": { + "num_bytes": 30104199, + "checksum": "980e544ce130a06e9e99ec906342eb0ab8aeaa96ac26eca01c56ebb463f5d688" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00021-of-00512.json.gz": { + "num_bytes": 29733696, + "checksum": "a69729b8f3ccb9db12476a31917783c1c6e036e7bbbb4089f430362aef71f467" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00022-of-00512.json.gz": { + "num_bytes": 30012894, + "checksum": "589e698fe450e22cba47813a5a28da5393e79702a528f6a8469f72f6d630caad" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00023-of-00512.json.gz": { + "num_bytes": 30024851, + "checksum": "2a7b036c38fb4d2df6535631018c23d001931e5bf8d8a815fd5b2f9343ec4529" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00024-of-00512.json.gz": { + "num_bytes": 29906809, + "checksum": "7e512306cb6ebb0b0c3e96ceb16dade9e1e1f484e754bebd0078e7f545fc5b6a" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00025-of-00512.json.gz": { + "num_bytes": 30332268, + "checksum": "b636b91fcd9a91ce05b8cbeea6f591a0e916175ab23b0cfaf688171c8a98ae8c" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00026-of-00512.json.gz": { + "num_bytes": 30288490, + "checksum": "9e2f8e2a37dcfe66873cc5355740448ef75a1de2deeb2d8c047c3c3a7ee485c0" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00027-of-00512.json.gz": { + "num_bytes": 29897688, + "checksum": "882616d1e8ca66c0b6e7aa2ccb18d9239021603ab1b9486638a9a3447ddebe0b" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00028-of-00512.json.gz": { + "num_bytes": 30201690, + "checksum": "0312b12f50c64fbe7b894a28e0940089ad57af95df8116cd7d43c0435ec2e79b" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00029-of-00512.json.gz": { + "num_bytes": 30237920, + "checksum": "1e8677140186b219d32e764889dcc344ccac9db51685363324d1bc13ddef2bb7" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00030-of-00512.json.gz": { + "num_bytes": 30048903, + "checksum": "43558e81c291cbf53a5b6a016aecb0e07e26a98b8fb32f4a000037b281afa363" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00031-of-00512.json.gz": { + "num_bytes": 30294528, + "checksum": "c33ae8a2fad7e5264d093fbe89ed1611357110a4f0f26dd5a93a4dc15560f205" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00032-of-00512.json.gz": { + "num_bytes": 29868168, + "checksum": "5dc2a8f96db8da87607efc0b708e6a2172530f0c9b43665dc01286109b5c55bc" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00033-of-00512.json.gz": { + "num_bytes": 30105916, + "checksum": "c4cdc2b39a86eff251f903d7f3d39605b721615aeffa6a2753f3588b7dbef6c4" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00034-of-00512.json.gz": { + "num_bytes": 30126174, + "checksum": "6d874182112b0881dc929c0182a30ec4f9f1633372a2b822200a7b1faaf4f1bf" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00035-of-00512.json.gz": { + "num_bytes": 30084101, + "checksum": "5bea17f0cd4dd888f5d8a2d4092138e4777d80493a1f410d618d4cedf353b914" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00036-of-00512.json.gz": { + "num_bytes": 30095974, + "checksum": "6e7f42f3012d8ca7500c7e2ec82d27c26b3cd8bb5b8b66a7fc8355d77284f433" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00037-of-00512.json.gz": { + "num_bytes": 30239345, + "checksum": "54ee45bf25152060679bab3e5fc6f5cb5a3add6acd2664cb152f88c223f83239" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00038-of-00512.json.gz": { + "num_bytes": 30247683, + "checksum": "f738a2f0f156f7bd897d9d822748d4192a5fe46b566c7288ed5b840c4ffeda64" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00039-of-00512.json.gz": { + "num_bytes": 30057005, + "checksum": "60235900d69579334660c153c4fe384c08f14f4e729a06a1e8247e8b4ab8a213" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00040-of-00512.json.gz": { + "num_bytes": 30185136, + "checksum": "5a059d64fd6a1b42a2faeb4088db327c47f9e8328737ab74a0e0457f84433374" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00041-of-00512.json.gz": { + "num_bytes": 30314653, + "checksum": "2cfdc460c8dd0fb4766191ef2aec0af856af7c95d11eb3f1d731f63b71db4daa" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00042-of-00512.json.gz": { + "num_bytes": 30123256, + "checksum": "64e59b8ebde3c12b0a1d218a302252b96aeb5bb4976927463101a9509579ec22" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00043-of-00512.json.gz": { + "num_bytes": 30057043, + "checksum": "edd200b97394f15f9cf0a6289406a83b42c3d6f961456f031f5814db4f6d482a" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00044-of-00512.json.gz": { + "num_bytes": 30029900, + "checksum": "1b2980f21ee5cffb271591adc8eaa414438841426442f194b5f4b703356f4e5e" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00045-of-00512.json.gz": { + "num_bytes": 30367170, + "checksum": "83967210891345b831956722e8dcd29cf55fb17b786c85c2dd2778528ab4d1c2" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00046-of-00512.json.gz": { + "num_bytes": 30105866, + "checksum": "6921ac4854e2eacaeb4be07669faab85f2bab33f744c7efae1ce17be25176bb5" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00047-of-00512.json.gz": { + "num_bytes": 29957618, + "checksum": "e8eba2ba9f51e76a06a2df43b6b120c47b6e41f61e46a2e3331518ebb2d0c84b" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00048-of-00512.json.gz": { + "num_bytes": 30329887, + "checksum": "6af9c44a53d7eb9df9d86ee4d895fb9f7f2b9b3863fd30aae325e79fb792a10c" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00049-of-00512.json.gz": { + "num_bytes": 30116207, + "checksum": "57dc1e94f73b55e0be5690b01d61188a62186ea9f5f85b556ecef3bcaa36fb92" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00050-of-00512.json.gz": { + "num_bytes": 30236341, + "checksum": "eb75bdf0e63e798838b3d7abfc6a3bfab5de2ba39af833c38048dfe39c1175b1" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00051-of-00512.json.gz": { + "num_bytes": 30357091, + "checksum": "f48b1f5e07311ca9d69787019a56ad849932e6868d1f7778681cf7e4cc9fc562" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00052-of-00512.json.gz": { + "num_bytes": 29944959, + "checksum": "debf9490c057f11e404898b4a57cb424c1eb523fa90bb7899b1317f970481638" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00053-of-00512.json.gz": { + "num_bytes": 30240416, + "checksum": "9e847a5c6eb80e5c045fbb405729c695911674bd8d29b1d0be0791303d02f41d" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00054-of-00512.json.gz": { + "num_bytes": 30174556, + "checksum": "65a80db1cdde9153e08277ad2d9074dfba1682c0f771fbb9f4aa8f88ca557f43" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00055-of-00512.json.gz": { + "num_bytes": 30134394, + "checksum": "beb8d280d322520ded21aec92ae087867d0bce64aac4e243a127a88f143ff578" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00056-of-00512.json.gz": { + "num_bytes": 29891026, + "checksum": "82fceaec35a2456487a59ae652d72f41a940d2d6bafdc4f05a6e02bcd7ed4dc9" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00057-of-00512.json.gz": { + "num_bytes": 29920525, + "checksum": "e4fd55ba5fb2825ef4209aec87706ecdd3db040242c6aacfc82f350765fbeff8" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00058-of-00512.json.gz": { + "num_bytes": 30060421, + "checksum": "3cfc894a1853e3d1f2daa314873b7919fa52b7208b590637f8face6536305770" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00059-of-00512.json.gz": { + "num_bytes": 30038488, + "checksum": "4f06ab7b5ce8e8c696445db4a3e32896b6396e3f67d7414a593e7398d752e564" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00060-of-00512.json.gz": { + "num_bytes": 30129718, + "checksum": "7923385ee0c6801073feb10437ee3c59e5f5dfe82c2311ad8c4ec670dcc0ec87" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00061-of-00512.json.gz": { + "num_bytes": 30130505, + "checksum": "5cd682e148b8488775622098214fc2009ef9c95355f46341bd78434f1b560fa2" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00062-of-00512.json.gz": { + "num_bytes": 29968130, + "checksum": "53562fc23501f3a1d11c8ae6a59e719d6f4e67db8b8ea1d55e2b1b80849afd08" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00063-of-00512.json.gz": { + "num_bytes": 30116532, + "checksum": "008cc5c0cb7d60e84ffdfe2132f6bb49aafbb31083fd026067b3859326ca64fb" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00064-of-00512.json.gz": { + "num_bytes": 30236194, + "checksum": "8f9eee169071e80c94c248f1c37b7fa631bd75a7f6e401f6a963aecd8815910b" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00065-of-00512.json.gz": { + "num_bytes": 30077312, + "checksum": "8c5e18ea3575cd350e98d062ef88d3fd1df068e4bd410be8732723bda03656c0" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00066-of-00512.json.gz": { + "num_bytes": 29920862, + "checksum": "e377b8112dc6ff6834607c27b927636429e887f4ab8edc0824363941b7bb311d" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00067-of-00512.json.gz": { + "num_bytes": 30278223, + "checksum": "ec2c2ac74cc3f4f814d645410cccda266151949dd36aae518b8082b948b47edb" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00068-of-00512.json.gz": { + "num_bytes": 29940464, + "checksum": "ddfc16a17cabf48a2c59fa8ef25ccd12d899d3462d08b45f2a301567ccc105c4" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00069-of-00512.json.gz": { + "num_bytes": 29903118, + "checksum": "66d9d1791cda56607b2561199503cef216df86b28d4519d5862905671a4ec4c5" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00070-of-00512.json.gz": { + "num_bytes": 30082323, + "checksum": "8072d3bd5e19c005493c0332b73ca5be253397f54be90be1bb7b2ef8df7ad117" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00071-of-00512.json.gz": { + "num_bytes": 30128276, + "checksum": "b7c68af5a6dcac3fbb3dcbe12123d1045a79baf657a8b3bdada60c1a97404c48" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00072-of-00512.json.gz": { + "num_bytes": 30458419, + "checksum": "cfe5c6ae2ad1531271b0039042e033bdd7caf9604bfa219980ca27513cea755f" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00073-of-00512.json.gz": { + "num_bytes": 30366974, + "checksum": "a132f5e85376b0d0a06c6ae6af9c226dcbc98394461578c4fbc6cd439ba6e721" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00074-of-00512.json.gz": { + "num_bytes": 29987779, + "checksum": "f905e808b50908a7d2a7f0944e7e6c01ffd97ec16e5f0b6ed7169a60d66b0100" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00075-of-00512.json.gz": { + "num_bytes": 30070204, + "checksum": "b57458683803936f6bc03b06fc26be9d1a09ba09517b5c1518676f468e404595" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00076-of-00512.json.gz": { + "num_bytes": 30129238, + "checksum": "81e88ec53e39d6191e40e5852564f592b745abf99c71ff78302292632f636792" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00077-of-00512.json.gz": { + "num_bytes": 30051399, + "checksum": "218b0f6e219e42113e35d99458861f8511266dee6c17d9e2780a17af8877f822" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00078-of-00512.json.gz": { + "num_bytes": 30144230, + "checksum": "c0a337619559362e0e1cd0fe87c9ced5c987313a7f3cb65eb44f8b861c41c616" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00079-of-00512.json.gz": { + "num_bytes": 30544297, + "checksum": "27e257efda6adbce01585b3b6cdeefa95d31f607012fed5dd4310bfb5a790ba7" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00080-of-00512.json.gz": { + "num_bytes": 30188866, + "checksum": "26411f1a0a7b299d0bf6cf78db04b0bcc617894cd87d59e54614f3258dd393ee" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00081-of-00512.json.gz": { + "num_bytes": 30418881, + "checksum": "87a659f6b24560a754ccbfb6aee019484e48e3ddc7955a6c7a18aa9098952cfe" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00082-of-00512.json.gz": { + "num_bytes": 30086460, + "checksum": "708fe5108042b957688817625c84059c11700b18ddcea3814b86b6c8c66af8a5" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00083-of-00512.json.gz": { + "num_bytes": 30138639, + "checksum": "8d8681519538afdb7622b677ca5d3ae2a643382bae9639e3ad90c82d36477653" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00084-of-00512.json.gz": { + "num_bytes": 30228150, + "checksum": "db708760b9d45e0b20c8dde9b0008f01761d9bb0f37a194845b4d097a60e477c" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00085-of-00512.json.gz": { + "num_bytes": 30004564, + "checksum": "19ba55c7cbc44ae30a6497373fc15b548e5c45667f790c392857f6fdaa7e2bf6" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00086-of-00512.json.gz": { + "num_bytes": 29696360, + "checksum": "4cb07dd259a084818f9a79a4fe4fb7b24ea1adda0cd4fd405ba003e7bd481f12" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00087-of-00512.json.gz": { + "num_bytes": 29927300, + "checksum": "7c3c07dbc9c57881a3c1abab85a927f1ba609c58da9dcec22d7415079cd336b6" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00088-of-00512.json.gz": { + "num_bytes": 30038333, + "checksum": "59158c87d7e9e5011516f98dec1313758072ca6685c7ad9df5ee4a075d9ff8a2" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00089-of-00512.json.gz": { + "num_bytes": 30223506, + "checksum": "d3f39f7e90b4a82257779290a3f2de5619049d69b2169577f1e3c81791d85419" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00090-of-00512.json.gz": { + "num_bytes": 30266969, + "checksum": "88ed3237aadff809cec186fa378e176774d3f32aef1a6d8bfdbc530f64e8aed4" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00091-of-00512.json.gz": { + "num_bytes": 29885840, + "checksum": "b9a247993a8eec31b3f853d1329ae79da29397dd27eb4acdc196b71c091335e3" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00092-of-00512.json.gz": { + "num_bytes": 29942337, + "checksum": "3d83cc54c06cad8effdb7a38ed6666b5d912e6fffcf4c82471af064b0aabe05e" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00093-of-00512.json.gz": { + "num_bytes": 30129376, + "checksum": "d72ed9855fa86ceb4089435da3d78e8d4151b92185f828329b534d1adf3821db" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00094-of-00512.json.gz": { + "num_bytes": 29613450, + "checksum": "f61f74aa65a81616b97cbc34a8be1b563f83f69709642b8156eb76cdda02103f" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00095-of-00512.json.gz": { + "num_bytes": 30469526, + "checksum": "926d1ba2e4b191e75b0bce0cbe4c15f95f244445ec03a6095c009c34e36f897e" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00096-of-00512.json.gz": { + "num_bytes": 30126036, + "checksum": "e74818ad94e408498644dc71f1ed967f356f539418222f1dfea467a21c99badc" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00097-of-00512.json.gz": { + "num_bytes": 30374980, + "checksum": "d9cc8827ee38bddd1a31e48b2b0064a567520e3c0f2e1be745acef57d267e4d5" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00098-of-00512.json.gz": { + "num_bytes": 29928579, + "checksum": "090ad37fd9eaeb53308599f2da1053b19b1c6478adaea5a8a1c35d6c35340111" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00099-of-00512.json.gz": { + "num_bytes": 29901456, + "checksum": "c0e7d9a7cbc3b9b940077508441e471a1eb70e822479fcad726b900e6c196382" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00100-of-00512.json.gz": { + "num_bytes": 30033459, + "checksum": "b62033de618191de3200205e6e40725baf045e403060d10417211d47854d6bb0" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00101-of-00512.json.gz": { + "num_bytes": 30280468, + "checksum": "8726d092785856ec690dcd8a9edcd968cd04af1cfafe8a83192e3c0782f02b4a" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00102-of-00512.json.gz": { + "num_bytes": 29805195, + "checksum": "248edf4dd6c9a1137c7b45ab0b5a05a5fc93fd14cec17a5da4d758b9f7b359df" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00103-of-00512.json.gz": { + "num_bytes": 29995494, + "checksum": "d66b75c3f08a0db141d2c0162eb3dbc351e656ba1ba480e77eda051435d1390f" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00104-of-00512.json.gz": { + "num_bytes": 30318447, + "checksum": "09bd2068c20d33783f39322c95756fd3dbd0da91f4380fae3822cb33b7d06779" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00105-of-00512.json.gz": { + "num_bytes": 30209523, + "checksum": "0a399ecb1116890e1a0189cd2842d64d8ed53213b1623ae38229a6ac4f5c1c76" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00106-of-00512.json.gz": { + "num_bytes": 30476739, + "checksum": "540f682a7c977d20f920b5af1ec7e40c14a0d54f1718b43271e22dece9cdce16" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00107-of-00512.json.gz": { + "num_bytes": 30203291, + "checksum": "0dd51deb74ab391c54b20862f7df561f74d00be2ee4fc13987f91771870c099b" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00108-of-00512.json.gz": { + "num_bytes": 30265100, + "checksum": "172b09a108b154014077a415f644cd16db6a66f178bf780c120a6c4fecc3c0a8" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00109-of-00512.json.gz": { + "num_bytes": 30342649, + "checksum": "214a8f147f2d77ec0f3889b0a2d782e5d44230878359e695e9523561e6723a1d" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00110-of-00512.json.gz": { + "num_bytes": 30152418, + "checksum": "dc0d34ce7918b80ecef3528ec2b063edf7b12223c453ac7fb9d39232fecd81d7" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00111-of-00512.json.gz": { + "num_bytes": 30160329, + "checksum": "d0594cb69d26f0e853575d86f92b1aa233b5bb236804a2f496a792fa031014ee" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00112-of-00512.json.gz": { + "num_bytes": 30428351, + "checksum": "2b0542d973bab88e696fb9efbe042167600da397d776ef65344dce868bbcb0b9" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00113-of-00512.json.gz": { + "num_bytes": 30200133, + "checksum": "10dcb929692795fefcf4623040191d9cb6199fbb3b164648b62b9867e8392379" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00114-of-00512.json.gz": { + "num_bytes": 30205273, + "checksum": "f16631d5bcbbe133a01675286ca7667400ecc7e6df13d728015381d21ec71cfc" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00115-of-00512.json.gz": { + "num_bytes": 30164849, + "checksum": "bed27819db4bb7e02cb42cdda18acd232659a2eaa43eed910ba26d686cb3f837" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00116-of-00512.json.gz": { + "num_bytes": 30117752, + "checksum": "4eb4bec7adac3c2f431d356212f8a9d47136f0011f5f9e71dd29d82b1b823e2a" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00117-of-00512.json.gz": { + "num_bytes": 30062588, + "checksum": "79639624734885b3051b10f052f5486d7124bbc4bcd18d99348f3683ee2fc54f" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00118-of-00512.json.gz": { + "num_bytes": 30125828, + "checksum": "e922a4a5332a4182ddcf6ac8ba910024fe4fa878b524f7368b27373f75bbfe44" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00119-of-00512.json.gz": { + "num_bytes": 30156741, + "checksum": "a44aba8779b99ace2f212789389af058d12dfb0706221b296676d5e10528dd78" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00120-of-00512.json.gz": { + "num_bytes": 30489925, + "checksum": "82bec41bbea7bc5ddb67b3bccea51122da7d0922768f8bda7a0c9d489bd20cdb" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00121-of-00512.json.gz": { + "num_bytes": 29606989, + "checksum": "b49238f5b75aaf876657826cfbd4346d250f564a86bdb010aa1e85b44a969229" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00122-of-00512.json.gz": { + "num_bytes": 29770557, + "checksum": "0803ccbd505db47cd09b20d86cc6ad459c7a8d1c583a5ee756b0397369d8b6fc" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00123-of-00512.json.gz": { + "num_bytes": 30248121, + "checksum": "d73a1bf285a0355bd61a25891cd8c5fd9da66535ec515dc7e1602a769b994727" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00124-of-00512.json.gz": { + "num_bytes": 30131013, + "checksum": "65d2dcc7e63a28e1911717d149b907d0c74fda6e36db2840353a0290f7880324" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00125-of-00512.json.gz": { + "num_bytes": 30348971, + "checksum": "5dee3c7afe0364ccb8e36647d01e78ffe61690f29f29aa033efac9a0413c2a47" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00126-of-00512.json.gz": { + "num_bytes": 30370074, + "checksum": "1dc04b3755291842711623d1d6cf042e2d66987103a0c708f01c9136a8c42db6" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00127-of-00512.json.gz": { + "num_bytes": 30320846, + "checksum": "e31a27ba25bdf13e6f929fd38d53409dd3f50be78ad955b69b1956709de5aedb" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00128-of-00512.json.gz": { + "num_bytes": 30076235, + "checksum": "122ee9d293428a7a823c17b3a432b5b2198fa2a68bbb246b97e981bd09f78f0c" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00129-of-00512.json.gz": { + "num_bytes": 30569486, + "checksum": "918bf43ce3ab54d535dd02cbcd09f1081890be3287e23fd81bfa032beec61ebc" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00130-of-00512.json.gz": { + "num_bytes": 30280169, + "checksum": "ab0a53e8c10dfdd139281175b5fcfe3090fa238fcb383e27b1dcdfdbbe8a879c" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00131-of-00512.json.gz": { + "num_bytes": 30338899, + "checksum": "e54771e12a6f3583c3accf9bcc01b598819231f367e7f80cbd44cf6683c5c852" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00132-of-00512.json.gz": { + "num_bytes": 29969011, + "checksum": "f69d7052ca7657fdebe547a6e196b109285d5d4e4f1a68f3900a37ba6fecc22f" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00133-of-00512.json.gz": { + "num_bytes": 30179558, + "checksum": "cf2130dedafd8f47e97661a5b1555813433e3f7293b5c5cb222cf551d90a0604" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00134-of-00512.json.gz": { + "num_bytes": 30080257, + "checksum": "1a32902fc21633ae8d41e4e5518804f4c719dc8729b866ebc32d3c36fdadbc10" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00135-of-00512.json.gz": { + "num_bytes": 30284972, + "checksum": "6e3a78e7a530d91ee4578caf462a4c685a5f221f0cd8eb9639c9067e2b655a7f" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00136-of-00512.json.gz": { + "num_bytes": 30130265, + "checksum": "defc57340cbaa5f325994a91b5134789c84a76a4ca7b9fdbf993b0e634735f05" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00137-of-00512.json.gz": { + "num_bytes": 30146793, + "checksum": "7ce5035f452eb2e1adeff36d0c6d6d65c245d139a86ef48bbe10c5275975183b" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00138-of-00512.json.gz": { + "num_bytes": 30180265, + "checksum": "298849a53a8ea0e68d01cc137195bc36d686077bed722e1198337a1dee3c51cf" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00139-of-00512.json.gz": { + "num_bytes": 30398387, + "checksum": "ef2ac4b8f195141a79a357d934d5d97bd4d2c64027ec7509b5873a4ae32fcb9d" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00140-of-00512.json.gz": { + "num_bytes": 29652990, + "checksum": "290f1c99b696e345aaa6ac6d5a882a87dcf5d3939b08ba859a359d2459498785" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00141-of-00512.json.gz": { + "num_bytes": 30083642, + "checksum": "fb6a38388a25261d86fbd8ffea63e06bcbcbd6846a4eb6f13fd09d7fe5a1fbc3" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00142-of-00512.json.gz": { + "num_bytes": 30131064, + "checksum": "b61ccf6166ea4b777629bdc07d543f299bf7569deab18228ec5bb9edc8cd3eb5" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00143-of-00512.json.gz": { + "num_bytes": 30244435, + "checksum": "22812c50efdfcf2c0fdcf593639dfea09ffee8068321c30effc669c8234d4f3b" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00144-of-00512.json.gz": { + "num_bytes": 29725094, + "checksum": "79cfa65a3115193629d16606643d90dcf27d3108c320cc9e364ba19fdb9fb1d6" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00145-of-00512.json.gz": { + "num_bytes": 30335033, + "checksum": "e836f0bc9acba85fd1721d19cc24054e97defb0d12678bdc0d086f40deb9b1a6" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00146-of-00512.json.gz": { + "num_bytes": 29905680, + "checksum": "bf684871a235078390d6c6bb03fc2d5bbffec2b095806df652a19baf5e67135d" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00147-of-00512.json.gz": { + "num_bytes": 29852459, + "checksum": "0e716de5b3b09ec287b039be0f0dd6edd7d541aa6d3f9d2be18768e1cd5f4cd8" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00148-of-00512.json.gz": { + "num_bytes": 30364788, + "checksum": "4cef624e6b7c2b73dbfb47227e31681223a5a9369c4b7daef8606b796f010dd1" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00149-of-00512.json.gz": { + "num_bytes": 30096278, + "checksum": "fb448ccc7412f5ca8667004a70f3dd6e1b5e6cb7f6facc06564bd22b1d815593" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00150-of-00512.json.gz": { + "num_bytes": 29776995, + "checksum": "1e14268cf723bc7336b33896537643d21dbefc1f05ffd5201feb5fb1130f9683" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00151-of-00512.json.gz": { + "num_bytes": 30205172, + "checksum": "797224cf74063fbcaec741535278ccce141e6dbbdd69a2191d07f89816ab14fa" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00152-of-00512.json.gz": { + "num_bytes": 29845034, + "checksum": "77eeb2353f544c714deea68d4a781b498c40d7c1e27db3aade4987b381ca29c0" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00153-of-00512.json.gz": { + "num_bytes": 30258796, + "checksum": "0fc581e92e70dda031d72a4aa0bbd65b1e9b28884f0ef5dd5e895cbecb270609" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00154-of-00512.json.gz": { + "num_bytes": 30249734, + "checksum": "ba10dd0a24bded170541e23078264b82b35bc99e402db594e2335e31905ededf" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00155-of-00512.json.gz": { + "num_bytes": 30198742, + "checksum": "fe285ac893126062bcbc20df75a9f65c57d3a7391354fa7e62b7f6a7122d6e77" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00156-of-00512.json.gz": { + "num_bytes": 30168323, + "checksum": "d21826b71bc85dbc496dd947ae9ee79d62885cffb3fa7c47409feee6ab247f17" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00157-of-00512.json.gz": { + "num_bytes": 30241978, + "checksum": "fc41765301b62849eda0b7b08f792e45f03db458fb92063af70c43d7cd0d0bb6" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00158-of-00512.json.gz": { + "num_bytes": 29959715, + "checksum": "1eded3ce0bc099c7e198e9277719d578c3fb6c425bb2110cb0ca6ce469d1d19f" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00159-of-00512.json.gz": { + "num_bytes": 30109595, + "checksum": "eccaab5b694c2f0017fe1d423637872d5587f6deb316796f7c0ff5517fa28178" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00160-of-00512.json.gz": { + "num_bytes": 30201741, + "checksum": "4ceee71372da6112101665f5bbf942a85f065feaab924c6e3f83498169bbe255" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00161-of-00512.json.gz": { + "num_bytes": 30176266, + "checksum": "6ed829daaad190b2d50b626d840edb750a063afad95315ffe7604a193183a489" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00162-of-00512.json.gz": { + "num_bytes": 30018118, + "checksum": "dcf8509a55213425a41706e5209ad411afb715fb9cd8c1a8b8edca23fab7d6cd" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00163-of-00512.json.gz": { + "num_bytes": 30236016, + "checksum": "d93cfaabcc7197637f233896b5799527f27d5b2dc60f0f0411ee51f05f09c500" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00164-of-00512.json.gz": { + "num_bytes": 30150055, + "checksum": "cc7de5ed3c774ff1dc350fbb5167dc1610c4f9a0dbc7c5d60ed4cf08aaf23ce3" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00165-of-00512.json.gz": { + "num_bytes": 30348056, + "checksum": "b41c4a3b7b4e96262fe5c87d06fbeb000dc48cc1d304a475bb4f4e1af84a9afb" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00166-of-00512.json.gz": { + "num_bytes": 30015834, + "checksum": "0a0821b7628b9b019995a9f34223e2960ded84331ce1bb55089838becb8a170a" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00167-of-00512.json.gz": { + "num_bytes": 30282254, + "checksum": "1285af56d024efe2166fa892878d471948e1d4c996922c7673e3c0f7f0f76bef" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00168-of-00512.json.gz": { + "num_bytes": 29815124, + "checksum": "29ec54ed647725ca3b9aec3bae341151a8e2b708cf21cd87b4389329298442b8" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00169-of-00512.json.gz": { + "num_bytes": 30346843, + "checksum": "1791e3f8371a63f9f849b7bf430e70d3f4011dbdef572c166cc5d49d06162fd7" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00170-of-00512.json.gz": { + "num_bytes": 30175685, + "checksum": "de8f82986addfc64b88fd3041d7ee6fdb64e6f770758146dc4c9309df348e965" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00171-of-00512.json.gz": { + "num_bytes": 30145505, + "checksum": "0dda47f679666862de6343e1109ed92866a42e8fa129ee69e9f0b73f18b6aecb" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00172-of-00512.json.gz": { + "num_bytes": 30009998, + "checksum": "2990dae6c16b7d60652439bed8b80ee4cf93972f33d8511d3d6aabaddfeca5cd" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00173-of-00512.json.gz": { + "num_bytes": 30062185, + "checksum": "e154a969bba2bf9430e0c8307561de78599fd2bd527cb1f15bbaf8f8e88cdf23" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00174-of-00512.json.gz": { + "num_bytes": 30055129, + "checksum": "e714ae153e8a927c88fe577d4c27017985d3ed7f3d0f5470f9a5f25c2e901a9c" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00175-of-00512.json.gz": { + "num_bytes": 30091082, + "checksum": "5f47c663d1e15d94fb0057d303048be990c713f3285ada2c6233137b1d84d60f" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00176-of-00512.json.gz": { + "num_bytes": 30235767, + "checksum": "20b05e4e99e5a05f6a4c29b304803b895bb8816caea6203643723ca587d66128" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00177-of-00512.json.gz": { + "num_bytes": 30071950, + "checksum": "29294e4b224df4695c9342c6f23d5495de9a0ca6a1be7217aa2211506e8ac7bc" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00178-of-00512.json.gz": { + "num_bytes": 29932121, + "checksum": "6022ed3b2ceef02324e40d3c7407622c95ead2cd3d3c41ab15ff9dd218265673" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00179-of-00512.json.gz": { + "num_bytes": 30119251, + "checksum": "42fa0aa883d9db4303a4981e4e308b2432b031fbccc98c3e1994ec775ba8023e" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00180-of-00512.json.gz": { + "num_bytes": 30175456, + "checksum": "6fb2ebd61524846f6b1f746f9c6356045623beb4b685fe265a23446037c9cd9f" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00181-of-00512.json.gz": { + "num_bytes": 30029564, + "checksum": "b779d721bb135fceaeddebb0dad1bdb43c9067a5e8595b3d544dfa7a084eb9f4" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00182-of-00512.json.gz": { + "num_bytes": 30437016, + "checksum": "b388fc0e862d7f6bb5b879ff7c69c301038faf5b542f6b40cbea4e2096a41e6a" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00183-of-00512.json.gz": { + "num_bytes": 29994048, + "checksum": "8208eeca7bc76f8b1786c95939d321ca0c7ae190b1f12dae86738810e412aa8b" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00184-of-00512.json.gz": { + "num_bytes": 30338616, + "checksum": "49859e75d999f65de99f9236e649a81989360f0328ba684671057b0dd7cf5e79" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00185-of-00512.json.gz": { + "num_bytes": 30088874, + "checksum": "ff6d32fdd471d3076a9367c175baab84a5d699ccd6dcfe00c755f0b714ca6074" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00186-of-00512.json.gz": { + "num_bytes": 30193681, + "checksum": "82508ed104fc57de3062258eaea57854ab9e1934437a88dc0d8a9921f3641bbc" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00187-of-00512.json.gz": { + "num_bytes": 30171163, + "checksum": "409d6576b25ad27455c755e5484e3f51d5d9788962efabe1c32e06bb3febacab" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00188-of-00512.json.gz": { + "num_bytes": 30060432, + "checksum": "fae94de96fa2962ef51e2ea90a5f760a5cee5de249bfd9f56d7c7b4e5c20f6de" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00189-of-00512.json.gz": { + "num_bytes": 30180741, + "checksum": "25293d5cba09980086f380d9e9ab44543adbbdcd05ed08601248b3a2b16d118c" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00190-of-00512.json.gz": { + "num_bytes": 30207152, + "checksum": "ccfee160de15df5d88f0ff5a898a0c5b2d0ef4ebd6e6832715a9ef8a9904f88f" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00191-of-00512.json.gz": { + "num_bytes": 30143987, + "checksum": "4c579619e465d9d97451801147202826a3855e772ea6dc4e9968e43ce2b8c05d" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00192-of-00512.json.gz": { + "num_bytes": 30072097, + "checksum": "9c32ecb6d4ec9feb27c5b642879b464e68ca8804db161219503f624e7ca1166f" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00193-of-00512.json.gz": { + "num_bytes": 30172886, + "checksum": "8442ddc3843c72aa169ca67801ff865ff85e4183beb38faa664f4f1d1c22a5d8" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00194-of-00512.json.gz": { + "num_bytes": 30037105, + "checksum": "2942ecacb22cb9a2953c68f21ddf3368cd47ab1f2b2d8e1f5c76b1c849b28d91" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00195-of-00512.json.gz": { + "num_bytes": 30014854, + "checksum": "9e5c6815a5734403a7062bb27b2565d433a3520a401c836ac3f16e743a1dd949" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00196-of-00512.json.gz": { + "num_bytes": 30020510, + "checksum": "792712f0073c158b5f96f7a99d97970fca3819b69739d34d7d2b7f4b8b407b7f" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00197-of-00512.json.gz": { + "num_bytes": 30072566, + "checksum": "3ece37e2d0d0b26fbd839b5d3facdfd70844945a06867fb68b141f6b1378462b" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00198-of-00512.json.gz": { + "num_bytes": 30036679, + "checksum": "c3f37a9b89987dde4578b394b5c3916c2d4fd87e0902309b4c81af19b1d2d5ea" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00199-of-00512.json.gz": { + "num_bytes": 30195178, + "checksum": "ae01bb5515097a083afd498d8530e788d99671e7cf802c4402957d6252b2ec77" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00200-of-00512.json.gz": { + "num_bytes": 30064374, + "checksum": "2399d4869f3a8bb4a9adced5ec548a9a3fde1d4fbc4e3abd9a0a3b495fb9a8ef" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00201-of-00512.json.gz": { + "num_bytes": 30136711, + "checksum": "5c922040697bad8d7807d79f34f2b667eea63ceefba89b2d413fcd4d66497607" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00202-of-00512.json.gz": { + "num_bytes": 29962983, + "checksum": "e4df518d612a8614de73d5944a31d22ad06ec9ecd26fb52e500df71fe363c1be" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00203-of-00512.json.gz": { + "num_bytes": 30178998, + "checksum": "e84a98a176451fc82d940a64cdec821e320a648780edba6466b74a1966eca47e" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00204-of-00512.json.gz": { + "num_bytes": 29988832, + "checksum": "c6dc56388bc7c57cbdee8280895ab80da7b4d49c9a0101a685229c50cad2e2e1" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00205-of-00512.json.gz": { + "num_bytes": 30229414, + "checksum": "e7e5175b6a7372377ba3a0db439911e189db459787d48588183ac1a0198c5fa7" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00206-of-00512.json.gz": { + "num_bytes": 29914929, + "checksum": "eb263433133660ebe219cd5817dea3b546ef2fba0e15396b2768d7091117cdea" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00207-of-00512.json.gz": { + "num_bytes": 29912800, + "checksum": "7f8a5f62ba5912b64af5b02bd987b4d81727223ef8eff110022e89d01961366f" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00208-of-00512.json.gz": { + "num_bytes": 29900590, + "checksum": "bc2af142244601bb7a96859dfd9885196940e675ca217cfc7c73ac9c614ea938" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00209-of-00512.json.gz": { + "num_bytes": 30242768, + "checksum": "fa51a4337faecfc790ca925802f87f10761552e16578b880ced80497f62bba60" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00210-of-00512.json.gz": { + "num_bytes": 30039857, + "checksum": "3adf7482ec6a3ad106c8edca3645a94032c33f84fcd26bd9876f2b8a1f6b5722" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00211-of-00512.json.gz": { + "num_bytes": 29846856, + "checksum": "8e931aaa9c1f069c0eca0b4605277610df9d2d0c07a0dbe6191fb7081b0e642a" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00212-of-00512.json.gz": { + "num_bytes": 30022172, + "checksum": "21c8bba1c83544c27977b22b077fd77f8df9cd06bc4eb5e9e9a532c511498d36" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00213-of-00512.json.gz": { + "num_bytes": 29877918, + "checksum": "b64ebaa088df5c6230e69f207267a038705c38f4d327970e9117979e1c13d1ed" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00214-of-00512.json.gz": { + "num_bytes": 29906552, + "checksum": "55d833a2b78ad564e6532d1acd14511e8b48d703030e3bbc92d7c835c1ed38c7" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00215-of-00512.json.gz": { + "num_bytes": 30075441, + "checksum": "999c77c136d3df83601e33c823f389b133f33c4c0b03736ceace617b526cb293" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00216-of-00512.json.gz": { + "num_bytes": 30507152, + "checksum": "0b23d4e57eaa101c78bab46151add537668d2722bf0c50470c1b434ec3389ae1" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00217-of-00512.json.gz": { + "num_bytes": 30044236, + "checksum": "6abacfd53e231a38c714d436018cef9a58f53320026c2ebb27d6caf08f02d7ac" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00218-of-00512.json.gz": { + "num_bytes": 30047926, + "checksum": "01120ef69493d84c44d112a41c69a851edaf89232679366e812f240fd26a0e47" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00219-of-00512.json.gz": { + "num_bytes": 30349211, + "checksum": "c4fc219559f0f076f634fc6812d4b13c229908c1ae45c3b74c059fb3b8124f63" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00220-of-00512.json.gz": { + "num_bytes": 30063445, + "checksum": "11f712439d54ef062cfa1225328fc4faaef5f6c9c0b0d87a0a81d25a71350e28" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00221-of-00512.json.gz": { + "num_bytes": 30115660, + "checksum": "9a344857ef4f9d141b57df38e25f717153b773436d72c23e10289ffe67c315eb" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00222-of-00512.json.gz": { + "num_bytes": 30134562, + "checksum": "227cd1847a948e388b404b5cda9289f05510d4e22f0ae5ec4d5a87a8f7f98a45" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00223-of-00512.json.gz": { + "num_bytes": 30120819, + "checksum": "e0029aa6b612a98f76e37d82107fcb90f2b57ae8d52beea172b5153b76334f20" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00224-of-00512.json.gz": { + "num_bytes": 30371365, + "checksum": "1ce5242d163ca12dbb22655eb841bf80750b552353af4f84973285d823d0add5" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00225-of-00512.json.gz": { + "num_bytes": 30319212, + "checksum": "71cb82bb95107a7e0b7777a5fcaa0f76b465ba828ac47401babcf7289eeb2335" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00226-of-00512.json.gz": { + "num_bytes": 30020940, + "checksum": "b7b8d98ade41f52ece23e896bdc4c19ad034a92ba18adb5fac85c7271afbfa65" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00227-of-00512.json.gz": { + "num_bytes": 30109958, + "checksum": "b2ec382f44caf4e8e46fef2faf6bd2e4000420e6da2eb12a5d9f6e7efb4e1564" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00228-of-00512.json.gz": { + "num_bytes": 29940895, + "checksum": "ff86264683d0fdf9d689aa30e7889c4ceed21098b7c60a220db92d396614cb1d" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00229-of-00512.json.gz": { + "num_bytes": 30080588, + "checksum": "3a5502cedd61501055eb16adb6ef861c75880524c5468a69cd346bc03e98e219" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00230-of-00512.json.gz": { + "num_bytes": 30376399, + "checksum": "6d3a4171a1febe9149f6900e3cca5a38046ca9d59214b548a4ef9de7de754bbd" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00231-of-00512.json.gz": { + "num_bytes": 30031670, + "checksum": "a2c8d9bb3eb260d5d8a7dcafc4703540332e2896e5127372d380d7efbd567a3a" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00232-of-00512.json.gz": { + "num_bytes": 30132612, + "checksum": "c9dec917eff4d72c684d6f8373ca66839061e29d25f0aa5fd6fb7de5c30df469" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00233-of-00512.json.gz": { + "num_bytes": 30178285, + "checksum": "1eb83b8eb7e72b2b3e55420436bb17521b989d0627da46f8cc61fe9f420fd464" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00234-of-00512.json.gz": { + "num_bytes": 29991258, + "checksum": "5e14e2a9e8c0aba73feb9134c694e99baf57357bb524877322ff5181eedef1f2" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00235-of-00512.json.gz": { + "num_bytes": 30045172, + "checksum": "50a118a072498b5338802cceacb97a9aa9242252e8d76d305cf5f0d928fd4af6" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00236-of-00512.json.gz": { + "num_bytes": 30403542, + "checksum": "7d7605576975232579e422a1b72625ad6f9d714d27770725dc7b99ba258e1985" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00237-of-00512.json.gz": { + "num_bytes": 30242989, + "checksum": "22d152fa02c5a959e978ea4887dd873dfef7267af0a577b4d796ff0cb52d5c56" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00238-of-00512.json.gz": { + "num_bytes": 30214634, + "checksum": "6d0af6f396fa21867e899a7678c633e47bfe79bcbda29b8072c5d32ab20a9aa3" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00239-of-00512.json.gz": { + "num_bytes": 30255546, + "checksum": "d35a93632638b6283053b121f0f30d47ea20b2747d871c3dd0beb13f4ffbcad9" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00240-of-00512.json.gz": { + "num_bytes": 30347604, + "checksum": "fd052d532fcfe811d96f8433f79a684f68f76ec42bd959c76ae3b63aec0b2c3e" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00241-of-00512.json.gz": { + "num_bytes": 30135691, + "checksum": "12c80c41dc4d6313bce4a171999ecda93ffc59f2c70cca363bce214cd12dc9f7" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00242-of-00512.json.gz": { + "num_bytes": 30229834, + "checksum": "fca5b81914ac0c5fe0b0c1a554a1e62c64af5c98740df1f8ce8f48f2a62b6a48" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00243-of-00512.json.gz": { + "num_bytes": 30053753, + "checksum": "ba41c505579524e9d244354a70060c9a0131007e0b129f03e628bb7b7b512ca9" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00244-of-00512.json.gz": { + "num_bytes": 30216889, + "checksum": "54a391c1d2de7627e739f3cd94eeccd50a80d56a40606f7c5392f6098df456cf" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00245-of-00512.json.gz": { + "num_bytes": 29887569, + "checksum": "c3263ea7e16e0036961dad28fef57ce4f0495219e59b4e800af82b67b3c6c506" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00246-of-00512.json.gz": { + "num_bytes": 29906815, + "checksum": "a3dcc92aed81708434edee84397010eae4ffeaa38b39aaf3919256f72deee625" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00247-of-00512.json.gz": { + "num_bytes": 30074896, + "checksum": "019e983a95908651bfae83e37bda5200b3888b03ab235fc8db2d5b16742f028f" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00248-of-00512.json.gz": { + "num_bytes": 30108081, + "checksum": "6f68835ec02cf899f8f44a795b1e3117956ff5bb6c8946435d9861ae7a112df3" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00249-of-00512.json.gz": { + "num_bytes": 29957882, + "checksum": "9bed6b7f56d93fa3973d4f177dde0973fa0eb6fe17d8d85279d865531613f963" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00250-of-00512.json.gz": { + "num_bytes": 29822284, + "checksum": "1848bef8d11360df55a576c64147e519327b1178f77d3ec14ab9522b33b1c423" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00251-of-00512.json.gz": { + "num_bytes": 29956462, + "checksum": "425f69c361a8671cf571df577ac0cfafb4894de494360084b7cbe9cb8869bc3f" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00252-of-00512.json.gz": { + "num_bytes": 29733712, + "checksum": "7198e831e75eff1e116513f9cbe098c071f051c545b41d1943211a1d996a3c67" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00253-of-00512.json.gz": { + "num_bytes": 30450662, + "checksum": "0452804e723c919bd3c84217bb1dfc8764112fd70c5581f84520df7592f28ae9" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00254-of-00512.json.gz": { + "num_bytes": 29944765, + "checksum": "dbbff2253d70094537de481344e5706315271fdfce7ebaddc8d277ed05ddfe24" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00255-of-00512.json.gz": { + "num_bytes": 30321363, + "checksum": "79173dd85d535cee71afb52f7775bbf7289509bc555efe21a8700d36f7e5da25" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00256-of-00512.json.gz": { + "num_bytes": 29982818, + "checksum": "bacd191568e72da06c564fc7476225ce83440de6aea6c85ebe7f5279f1c15846" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00257-of-00512.json.gz": { + "num_bytes": 30338592, + "checksum": "998287203665559c27a66e889611ed716b7a389e403b2e857086f548b2c47b39" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00258-of-00512.json.gz": { + "num_bytes": 29911193, + "checksum": "ed9829f41a71cc187d0ddfeafc9cbde8e362b52914c988708a1a5ffbd3c152af" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00259-of-00512.json.gz": { + "num_bytes": 30227794, + "checksum": "2fe86814499a3379601a179acca1d440b3c79467827ce9ef9787e1ab311904e0" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00260-of-00512.json.gz": { + "num_bytes": 30206902, + "checksum": "c4efdad05d3f5e9f27884399ab0ec82081c26486e87f0ed5408a9eb80b223daf" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00261-of-00512.json.gz": { + "num_bytes": 30035514, + "checksum": "e47675a956a626a32b1870c61e6f98c3cfe9cc571901cf477abae982b4e63c96" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00262-of-00512.json.gz": { + "num_bytes": 30406718, + "checksum": "ae19c1389e26562322f745bafbd7839e7a95b3169743d48baa7ae7f2db2a0b5e" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00263-of-00512.json.gz": { + "num_bytes": 30266531, + "checksum": "289c9fee87f12ea22ad5329f80cb379e5e9c22c5cb6639077748958228c62bf7" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00264-of-00512.json.gz": { + "num_bytes": 30100823, + "checksum": "7c65dd5d90c6df49ca2dcbfdbf1b9fbb0789cb32043795942d88c5f2d7a99869" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00265-of-00512.json.gz": { + "num_bytes": 29957109, + "checksum": "e3a1b501b2cc3f5f2667ef179d7876db602daedefd0cd741c0898679b24984e6" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00266-of-00512.json.gz": { + "num_bytes": 30196603, + "checksum": "9337dd8240f168da5f6a8b57c5c169a2a400a9a160eccc8a6e44e7b32004ff19" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00267-of-00512.json.gz": { + "num_bytes": 30304605, + "checksum": "513eea4e78c399cc045e25f13bb5f77ddb6c9b606522bed8216945c529894e8a" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00268-of-00512.json.gz": { + "num_bytes": 30312562, + "checksum": "0503c5bf6848213c5fcb81a5c94307fc010d910a8989e104ad5fedca58c76f7e" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00269-of-00512.json.gz": { + "num_bytes": 30045257, + "checksum": "59bd3011d12d7d70b5fd64bc2dd2016b1a9ca6f0d210dbb3e6c202bbbf74ced5" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00270-of-00512.json.gz": { + "num_bytes": 30027628, + "checksum": "8d3ecf4c61acafc49b624d08b6aa31340643e030f6c2248f689e8a17d355359e" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00271-of-00512.json.gz": { + "num_bytes": 30014730, + "checksum": "b2e4820a0a7287786f802b3b40602c8ca77c7813b5f50db8a336b89b89bbdf37" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00272-of-00512.json.gz": { + "num_bytes": 30145705, + "checksum": "20c73e4a9056a5201621a4799b86c323c5136af43caa63a74298a5c3bee890a6" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00273-of-00512.json.gz": { + "num_bytes": 30165945, + "checksum": "8f07a91b6b40444635d869b94558fa68e3593626808bc6122d4e17403cf76101" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00274-of-00512.json.gz": { + "num_bytes": 30097947, + "checksum": "9530522c841d8f09ccb89f4f0238f7b9048c211e85b27449fb3c09d3bd2bab7b" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00275-of-00512.json.gz": { + "num_bytes": 30296359, + "checksum": "51a358db81805a20df4f920baacf3adea05209282f800fbedfc7fa49638a072e" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00276-of-00512.json.gz": { + "num_bytes": 30311407, + "checksum": "a51253cf73fb200053eb5fd5eca398a7a070fcaa27fc99b23389d09eef7fe5ba" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00277-of-00512.json.gz": { + "num_bytes": 30372345, + "checksum": "cc4f6d9040d8c4909d4ea5b661a7e54ba4775ff1c7c55db1ff686a56d428e2a5" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00278-of-00512.json.gz": { + "num_bytes": 30379507, + "checksum": "1052defa657524e1211e67d775a32243b164eda431c4c6ed351f0c6727f21b16" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00279-of-00512.json.gz": { + "num_bytes": 30195406, + "checksum": "6f4fdc92c516ad779fd521afba7d8d5bcd40672e63028f43f70fff4d7605f5ba" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00280-of-00512.json.gz": { + "num_bytes": 29902057, + "checksum": "c26f89efd0977465f45fe321036d88e2d6ca3ee1edc4bafe4b40ad1895cfc0e3" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00281-of-00512.json.gz": { + "num_bytes": 29779702, + "checksum": "094139d741b7a47faaaaf50093ab4edbef6ad1943985c6f453ce45a67a95b190" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00282-of-00512.json.gz": { + "num_bytes": 30063500, + "checksum": "280d69bfc795f1502a9e744d53d1a189051a1e771042721f8e6f74f6559e25a7" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00283-of-00512.json.gz": { + "num_bytes": 29956350, + "checksum": "505e49b7eeab46c77a324959eeff103f8899da1efc4d0fef5c0e6c6f8879a721" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00284-of-00512.json.gz": { + "num_bytes": 30146285, + "checksum": "9b075f2cfdb9a90fcdc7f779a52b0c5dad36385214844d4fd9df1e528ae78b6a" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00285-of-00512.json.gz": { + "num_bytes": 30160056, + "checksum": "d9b9f3cbb9ce2a0a0a1a2f7ce91e98621d48a7a900c278aeef437dc6c0a7cdf0" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00286-of-00512.json.gz": { + "num_bytes": 29844025, + "checksum": "6de9ff1013484662305e414725be2d0a4a1873a941250b95b80b5dea8919cf95" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00287-of-00512.json.gz": { + "num_bytes": 30089218, + "checksum": "444ff132c4a5330653b7319d34b2c7f4ae3b960d8b510cbd7389e3881f65ac5d" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00288-of-00512.json.gz": { + "num_bytes": 30092170, + "checksum": "46dc5b3b84e4387ad718fdf96b751354d7048e898ec664e0d3bdfc21ee841ec2" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00289-of-00512.json.gz": { + "num_bytes": 30365397, + "checksum": "b42e35746112198143ac18509e4f0148772db75e19f5eea9ed0d7e2849dbba48" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00290-of-00512.json.gz": { + "num_bytes": 30275920, + "checksum": "25d99877235c4b9dacd5d1dd7e9d16bba76cdf6cb1725fa617209142873dca0f" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00291-of-00512.json.gz": { + "num_bytes": 30125784, + "checksum": "51da68b6f2751a83e2534c342b6e9d69c419fb606b44c42b872d69f5f726df3c" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00292-of-00512.json.gz": { + "num_bytes": 30201021, + "checksum": "1e0a42b5e7ea7049c3c86b96d37c5d1c36f3ba2e2dab02145a897ef056fa6a87" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00293-of-00512.json.gz": { + "num_bytes": 30124224, + "checksum": "8c744f5c6eb92c0de70649cd773c0ad147bc7a1487b2ae7f1107bce9d19da601" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00294-of-00512.json.gz": { + "num_bytes": 30074708, + "checksum": "b3cfa4c4408c1a9f39b48e18a62e112ec3c132b226efe0850f9e58e2a517aa97" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00295-of-00512.json.gz": { + "num_bytes": 29990007, + "checksum": "012f63e147d22e34249e930975a2d8958a8d0b17350a9f6e368d702189b40d5b" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00296-of-00512.json.gz": { + "num_bytes": 30093755, + "checksum": "5573859cc485ae4535b83fd408dcc6a82f644832c93e6125db9a16dd6ded338f" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00297-of-00512.json.gz": { + "num_bytes": 30078472, + "checksum": "25e694485171ba1347ccbd7916c1b87a0d46acfd13795a8aabb1cb57b5eb1221" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00298-of-00512.json.gz": { + "num_bytes": 30327122, + "checksum": "6d6832cb3b1c86b6392bc9ca52f69a0bb16bf71c3c7664d9fe668ee259a40a30" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00299-of-00512.json.gz": { + "num_bytes": 30214180, + "checksum": "9f3c3d87a525874ea117e36e0b30d7f5cc6c64564506808058a0788d74943634" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00300-of-00512.json.gz": { + "num_bytes": 29895171, + "checksum": "e99d296965da2f731ea660889ce834cd1d21edf427298bab3a059ff3ebc64a2d" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00301-of-00512.json.gz": { + "num_bytes": 30131063, + "checksum": "e5eeb0f237cf986134c946bb3c2a4b5483fb9c88b3c2b16b9db26135043036d6" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00302-of-00512.json.gz": { + "num_bytes": 30184609, + "checksum": "4ac9bf5ca6fac7f7293238852424340326347ceaa6f5dfa6fddef8003421bebd" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00303-of-00512.json.gz": { + "num_bytes": 29956412, + "checksum": "559019fe1ef1f7e77ac53ad98b3556965ebc524ecb80bbc3f26255d5ae6e3609" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00304-of-00512.json.gz": { + "num_bytes": 29974071, + "checksum": "3c54edc4b6a7e34048cbbadb55cb3b16496a4e6e7334b4ede4e1368daf4c5301" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00305-of-00512.json.gz": { + "num_bytes": 30338106, + "checksum": "1c91c0c5bcc2bec0a698318ad6f576a06db7885c20ed7f36782427b80580a75a" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00306-of-00512.json.gz": { + "num_bytes": 30178986, + "checksum": "fff99f2758c2de57ccbfbfc6388f67e624d00d4a6cccb5820a7a8f5fcf02d386" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00307-of-00512.json.gz": { + "num_bytes": 29493455, + "checksum": "5d08c6e3909e21bed456ff9d06c983f14d3a277cb399a91047a692184f87c4c3" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00308-of-00512.json.gz": { + "num_bytes": 30228844, + "checksum": "04bffac195e24383d06b0ab9ebf019959a4e7abe8e8e6a0cdfbf0a8e7c23c899" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00309-of-00512.json.gz": { + "num_bytes": 30351688, + "checksum": "3ce14d5104d1318c6a16d042735f0a71f4452897de60d17408181ec5b135bbb2" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00310-of-00512.json.gz": { + "num_bytes": 29993012, + "checksum": "afad2f39bf4cb932e50d9a0be93940b423e7abcc3d67dac15b1939e4e40f4ce4" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00311-of-00512.json.gz": { + "num_bytes": 30448951, + "checksum": "a049c31ef6304084d33cb7bdd2e21ada0c60b40b1002b2369e60d36a5098c4b0" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00312-of-00512.json.gz": { + "num_bytes": 30034189, + "checksum": "557d1e88400a6d1d8ee4d717a959239edacbdd3e18d8cd20c5c85b77174dc302" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00313-of-00512.json.gz": { + "num_bytes": 30066486, + "checksum": "e4823ea1e9a59d5db84564a5b90c28fd8058450f238c60ad689ffd6b673d65f8" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00314-of-00512.json.gz": { + "num_bytes": 30397706, + "checksum": "1b4c0653e7ccf7fda0a53d8cbd5ddd57322ac83822e9d05bbdb9eb8ac979cf50" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00315-of-00512.json.gz": { + "num_bytes": 30219107, + "checksum": "9c364c9cab4ff7acdd1818b13de2f36713df8fa6c504ba15cdf47fe8e3c30206" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00316-of-00512.json.gz": { + "num_bytes": 30098661, + "checksum": "84dd8a8739b5abc39d8180f0894b1fbf2930d6d333d7c86b646f40763327397c" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00317-of-00512.json.gz": { + "num_bytes": 30178992, + "checksum": "16e4791b4e5ab3719dacf79fedb0b88ed54346372874c37ccb71d86bc419edc3" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00318-of-00512.json.gz": { + "num_bytes": 30022982, + "checksum": "98345a826aab12bdaf5e639205d5dcdc1da8fecd7cafc1982df89ac8d4df7ebf" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00319-of-00512.json.gz": { + "num_bytes": 30360409, + "checksum": "d53a39019a1627b42ae6bff68e283d37d0bb5f48b328c2c5cdcc1a3897f4e992" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00320-of-00512.json.gz": { + "num_bytes": 30347267, + "checksum": "c343a0eedf58484055e58762802ae8cc05f2cdb0b923785c493d056a2cbdb015" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00321-of-00512.json.gz": { + "num_bytes": 29967877, + "checksum": "cc5795d254ad749ccfe613034927bdf95529545ae1f277b694dd24a5996aca83" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00322-of-00512.json.gz": { + "num_bytes": 29885538, + "checksum": "d5eaaa1eea983bd37ed34651e6c16b746ff7c92e48038b234149fa6d04d3d866" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00323-of-00512.json.gz": { + "num_bytes": 30308848, + "checksum": "a42cfaef5e088fd6b24dfc121084a6cd038f5b0bfaecb9f33997ab22a97fb155" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00324-of-00512.json.gz": { + "num_bytes": 30351634, + "checksum": "0e2e6933f93466e9c8fe966f7770fe4c34caf182c713dad3206f4132eed1d41d" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00325-of-00512.json.gz": { + "num_bytes": 30077168, + "checksum": "77cdbf7040ce7f38d735fef41813ce63aaa16fcd87fce80e6ca6bd56d350c369" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00326-of-00512.json.gz": { + "num_bytes": 30031750, + "checksum": "8d994c2dc1b766e3270dce3f0b8f6f8fe22d5c1e0e9780e1bfed52c1292b8641" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00327-of-00512.json.gz": { + "num_bytes": 29845765, + "checksum": "f6279e351d016769d6fb5482d01a15ba054d5fe6f9f1c4e92c0663cef0083002" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00328-of-00512.json.gz": { + "num_bytes": 30253188, + "checksum": "2ea84aafd94d1843a2cc4428279dbb079c6ae0aae6c00f90ee4b5ace3c827afd" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00329-of-00512.json.gz": { + "num_bytes": 30124922, + "checksum": "49e3d91126d53eada7bbd87bfe9eaae74f059c69cd70a3a3b8101f49c1aca154" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00330-of-00512.json.gz": { + "num_bytes": 30026414, + "checksum": "07442fc4f7fb1732362293bc15a6754d70ecf4743392cf89c4497b3cd96269fd" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00331-of-00512.json.gz": { + "num_bytes": 29961847, + "checksum": "f437c6f5f758a5d32c8fc949037060259162864c29aeaabf37032e79f5a1cf0b" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00332-of-00512.json.gz": { + "num_bytes": 30167166, + "checksum": "96018497eb6dec020436c1333ff81980a64fb615997855fdd8cf35fe3f658db6" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00333-of-00512.json.gz": { + "num_bytes": 30192963, + "checksum": "1c12ea6b9031049dbc84e4da6b5fdedf480e989385d758c88322c415a1cabbb0" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00334-of-00512.json.gz": { + "num_bytes": 29847008, + "checksum": "c269285f15f626b4b15a7d1705ffa08e3f4d49ce13de8174b72f9f6276a1c6af" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00335-of-00512.json.gz": { + "num_bytes": 30262244, + "checksum": "179ee564e6fc644d9ee139bdb02d470a1172221b0f6e510ee5935683500f8257" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00336-of-00512.json.gz": { + "num_bytes": 30262910, + "checksum": "317933afdd8dc8a3a355e44ee3d84bbab12a2f30c98ea1172dde7074ed4c0557" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00337-of-00512.json.gz": { + "num_bytes": 30155329, + "checksum": "c5b850399252ec41b0fd9cb2da87ce25e5a44df9f44c6ed9d8c559a5729e5a0f" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00338-of-00512.json.gz": { + "num_bytes": 29952961, + "checksum": "48083123ba97a6212e0501799bd01936f0795bdd4d9c2710b9aa67d54b29037e" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00339-of-00512.json.gz": { + "num_bytes": 30403399, + "checksum": "313b60f985dcf591f34d351b758eedace655b6c6d3946dd2ddc55f34a9a97ae9" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00340-of-00512.json.gz": { + "num_bytes": 29917484, + "checksum": "2c72290f3bd51dea2a2877d68a968dc2b75dadf99ab3cc2230e41be45f3515d3" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00341-of-00512.json.gz": { + "num_bytes": 29905522, + "checksum": "1acd83a0da4a7a4912b589dbeb68b37396d0454371b2b71af4ae18b854d482ce" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00342-of-00512.json.gz": { + "num_bytes": 30022369, + "checksum": "8756be42335bba12d06de63e247659f8d603a092ff342360dfed645aec135c47" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00343-of-00512.json.gz": { + "num_bytes": 30229313, + "checksum": "863e29987a3ccfa08e14ae987c81367a53b9fe08795184db086117a9555e058b" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00344-of-00512.json.gz": { + "num_bytes": 29924335, + "checksum": "aa9003a7cc3527fb658fd807c78890587a8b35634a1f0838bc221a6374205d20" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00345-of-00512.json.gz": { + "num_bytes": 30229482, + "checksum": "a7e88b015bcf7761217e9b3ffd413f13cac48f6afe083353436de6cbd0d0018d" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00346-of-00512.json.gz": { + "num_bytes": 30029147, + "checksum": "b862ea62ac032c203c0038c061a44edabe4644be03b876ec7322e96762374940" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00347-of-00512.json.gz": { + "num_bytes": 29808182, + "checksum": "62915b86cbbf61a76f73d05509a8e839aae0b965134ef79022377625df7ef741" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00348-of-00512.json.gz": { + "num_bytes": 30091116, + "checksum": "6c384c2c6bc8340b88e085f8bbc2616be68c96fa7b8b88306b4500367d053a49" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00349-of-00512.json.gz": { + "num_bytes": 29867618, + "checksum": "bfb19508ecf8bd4d9a8847f0edab5acde6896182c27da706a6f2863bec43c152" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00350-of-00512.json.gz": { + "num_bytes": 29723106, + "checksum": "a645c62c94de9018175f15a0b38aa8bd2484601ee189b7c27d589288eb5af97e" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00351-of-00512.json.gz": { + "num_bytes": 30047620, + "checksum": "991061a23834e6bb3dc0595cf0e8328e07746d10fbf7a7ba397c1410cb66175a" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00352-of-00512.json.gz": { + "num_bytes": 29808328, + "checksum": "6c8e377a6cc82e81d66e2be3d23c1cdd42480015a68a1db458d542b7ff64ab7d" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00353-of-00512.json.gz": { + "num_bytes": 30040117, + "checksum": "ead6f32d98a91c47fb9c21334143f02181efb0b831705baeebb9820d069598fe" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00354-of-00512.json.gz": { + "num_bytes": 29953984, + "checksum": "ba349e503d017abbc1c83da2314c0a4892a9f3e5e480173812578f44d9b5904c" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00355-of-00512.json.gz": { + "num_bytes": 30179912, + "checksum": "2bfeab794bbe0432db52cc595d25864b17fdb0744a80d6d907f6f2ffc5c56b81" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00356-of-00512.json.gz": { + "num_bytes": 30312163, + "checksum": "d0dec696d28c601d3a1f75b0b6e6e711e00809f0d5ea915f63cb6d9b7adcc597" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00357-of-00512.json.gz": { + "num_bytes": 29931515, + "checksum": "d43c75371e32d0c1e65f43acc00aac3ca43762d4c6eb6bb61759ac5fca593a99" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00358-of-00512.json.gz": { + "num_bytes": 29739788, + "checksum": "96fef1b4a5d6a080ff5d4a10bc90911dcb2ddecb4be91d0c9620e6d2484e3ee3" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00359-of-00512.json.gz": { + "num_bytes": 29913841, + "checksum": "05b065d2d13b787ddee4707be7e2be46173c23794b9e8c773d0da743f435db17" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00360-of-00512.json.gz": { + "num_bytes": 29805295, + "checksum": "826104b9f4c2634d128f15564bd4990057dfbbb4066f2a082039d243bab56935" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00361-of-00512.json.gz": { + "num_bytes": 29839676, + "checksum": "ee5ba4cb14ecee0c857828a866615c6bfe45f67b158173dcac44146a02d97738" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00362-of-00512.json.gz": { + "num_bytes": 30154783, + "checksum": "d67b49e6fa5dc293fbd3057b7ca0beb7e0bd1ff692cdad7f2dfb7abadc1f4599" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00363-of-00512.json.gz": { + "num_bytes": 30126118, + "checksum": "6940704da6cde5822d48dc806280b8d57e0593ba299731e68ca9c2a4f7cf65bd" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00364-of-00512.json.gz": { + "num_bytes": 30184894, + "checksum": "e740b4a0240e691f16a423fd658aa3c7539986695418af3b5a171a48524db74f" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00365-of-00512.json.gz": { + "num_bytes": 30386766, + "checksum": "5a6a9461ef9ca579a849f6bef4d6225504a885aa797d3b2236ed8df6f5ea72ee" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00366-of-00512.json.gz": { + "num_bytes": 30208411, + "checksum": "8e0ce2447dfadaa4d41b991a2ce1be63b409e58e88944594dc8591bf9ab41403" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00367-of-00512.json.gz": { + "num_bytes": 30266003, + "checksum": "04ea00b46a583edea7740d74d719ef7f303b7f3873365b9ff4e94f08ef80832a" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00368-of-00512.json.gz": { + "num_bytes": 29993752, + "checksum": "38b1a55dd4ff1b504d2dbc0b2ad54fe43ab16c8bdba55bd97f4a55dafa8c83dd" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00369-of-00512.json.gz": { + "num_bytes": 29833222, + "checksum": "a25c405918920ed00edf5f3007cb8895b59fb67618dfea266b048273303b9592" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00370-of-00512.json.gz": { + "num_bytes": 29988999, + "checksum": "2812e6d9865d77ca8ac2d1499ba86be1ceed868a1da2bd13fbd0967058a3516c" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00371-of-00512.json.gz": { + "num_bytes": 29866636, + "checksum": "ecd1d3bdc41c3f41f8c9d3a63c75766c173f70ff117af748a08c221ca4273b18" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00372-of-00512.json.gz": { + "num_bytes": 30296883, + "checksum": "723d2c5ebbdd95ab84c53e458d81944b6907d08c7aec67300f012880624d0010" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00373-of-00512.json.gz": { + "num_bytes": 30310322, + "checksum": "ae45d088521f2faf9852cb169962176e84bbb81d5ba157d4228d348f7fcf60f4" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00374-of-00512.json.gz": { + "num_bytes": 30340527, + "checksum": "9b09c9e1b424fd05540b720c5a85f71eea43d743dc4ebb318e839125ccac9383" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00375-of-00512.json.gz": { + "num_bytes": 30193692, + "checksum": "c3ca4bb179cadf872f25f1cdb5c3667933bb8dfb7af21068a24b1b09c961dfa8" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00376-of-00512.json.gz": { + "num_bytes": 30184130, + "checksum": "5d801f4bc20c4c6d8821ccfff06cb5dfe4214e571734feacbea3325462afa280" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00377-of-00512.json.gz": { + "num_bytes": 30259301, + "checksum": "ebf08508c24e29a8a14b72248f090d765b02ee7a31296811d0391f2a2e73c046" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00378-of-00512.json.gz": { + "num_bytes": 29650049, + "checksum": "c13e994e68b938ca069d2d412e7891cbaf2ee205d65b1c17c6acfea01adce157" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00379-of-00512.json.gz": { + "num_bytes": 30265211, + "checksum": "667da6f0650dd684aa50bc691b5783968ae8cab847dea14fc8d8bfe203e351f4" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00380-of-00512.json.gz": { + "num_bytes": 30429631, + "checksum": "7cf0e9ae00bec72f571d152730107efdd944176818600517fb2d0412a859d366" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00381-of-00512.json.gz": { + "num_bytes": 29889471, + "checksum": "f781b3128e92c54365be7771695555378067a65fb922e04062ab6f3f092ec827" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00382-of-00512.json.gz": { + "num_bytes": 30029894, + "checksum": "2d133def2bc4b840312ebe5c466c9f22729b67aa4c2a41dda2e6a9a55ddcddbb" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00383-of-00512.json.gz": { + "num_bytes": 30249255, + "checksum": "e8610abf7e2bd70b1067a1b2dbf392ac32be156945502629228969974d3899b2" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00384-of-00512.json.gz": { + "num_bytes": 30362665, + "checksum": "f217071bd0c1b1bddb3342c85064d7ebb54bcde2512997636f0638a0b3641588" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00385-of-00512.json.gz": { + "num_bytes": 30080234, + "checksum": "2db4b15c7391b6e6d3791721ee574d09101df597110feebc59e4f0aff4df6c26" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00386-of-00512.json.gz": { + "num_bytes": 29897704, + "checksum": "035daed74487c5262b8cfbefdfaefd17f2834c7b4a1d293934d755e059b58f5b" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00387-of-00512.json.gz": { + "num_bytes": 30072139, + "checksum": "73013fbd06eaf94a7c8a0f0de420f83bed56655fb2d4e5d93972e8ca1847d130" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00388-of-00512.json.gz": { + "num_bytes": 30123843, + "checksum": "5db846c3d0b36774ce771ddfa8c53a915767926a2ad48222256d839326336f19" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00389-of-00512.json.gz": { + "num_bytes": 30278955, + "checksum": "9e4c590e67b2fbd357af955e39864ffe73dda201d76759935fda80b10b463500" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00390-of-00512.json.gz": { + "num_bytes": 30013591, + "checksum": "90974ba6eff489e0f4f52187b6241120740c782945e86525cb5d1e551a54e322" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00391-of-00512.json.gz": { + "num_bytes": 29925212, + "checksum": "10fcd62813434e2557b5861fd8604f534952561065bee9dc525b1cd3f5b2730f" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00392-of-00512.json.gz": { + "num_bytes": 30016498, + "checksum": "da88b36bd3f15551d8fad115a86f111cc5c3d9a3c6fa9497214aabec7bcd6aad" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00393-of-00512.json.gz": { + "num_bytes": 30061083, + "checksum": "1ed9881020f240e1277e6513bc2abf24ea48e9cb0046d7e87a6d3669c8b42a0f" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00394-of-00512.json.gz": { + "num_bytes": 30043459, + "checksum": "a35c3de1b0c982df8471705574e6eb7cc730fff122ff17d1381f2c7b9f20d6bd" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00395-of-00512.json.gz": { + "num_bytes": 29921106, + "checksum": "f4cf52f8d6a1288773cc366469df140f885b233fb6aa1cb75387a450d88ec94f" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00396-of-00512.json.gz": { + "num_bytes": 30024980, + "checksum": "5ebe04e54e4242d52aacb4c2e107dd10e609d5a7a6ff0425d9952bed98ef4921" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00397-of-00512.json.gz": { + "num_bytes": 30096825, + "checksum": "3ac381004d8257aa50fb28f0fd2171abbb93ad825c3f43422b9dbec6e1c6f31b" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00398-of-00512.json.gz": { + "num_bytes": 30059739, + "checksum": "40c38af325f4d01ae7c74aa9cd8f8d1c96c6af851175f80d3c50d85c5f5d3585" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00399-of-00512.json.gz": { + "num_bytes": 30049826, + "checksum": "2ba0109b2d5b88422250bcbd2494cc6e11528710f38fa6e83a1f699b840b68a7" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00400-of-00512.json.gz": { + "num_bytes": 29953506, + "checksum": "010610ba3af3dbfbcf2fac93136b7066fc58eb914dce9ae999722d0cfec4d331" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00401-of-00512.json.gz": { + "num_bytes": 30271141, + "checksum": "29587bb4be2c367f6479705b5c3c28716affeefc857ac1f77e4c33e55264def0" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00402-of-00512.json.gz": { + "num_bytes": 29861236, + "checksum": "8e399149c335ec599f881fada448c9b4be22326357153c74b0de627078f1d43c" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00403-of-00512.json.gz": { + "num_bytes": 30175831, + "checksum": "0d2800836914a1e2ef4a1aaea6e70d19699fc2555582ec670223177cac05a4fa" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00404-of-00512.json.gz": { + "num_bytes": 30097682, + "checksum": "f9665e9199978b123feb962ce347b30cc1520626c32dfef0ca3cd8895a45e445" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00405-of-00512.json.gz": { + "num_bytes": 29810961, + "checksum": "8ea29cf9f7774a16a4c2aaeff1b6353de2951073676a9c411f19b0a5fb755b07" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00406-of-00512.json.gz": { + "num_bytes": 29963498, + "checksum": "90b10c91f6e0006576ec9b426c424e50fc1726c25ae8eb91bf91bb9001ade2e8" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00407-of-00512.json.gz": { + "num_bytes": 30089554, + "checksum": "cfa905514e4f19c4eb82e438f5eb987731004476f026f4bebbeeafbe519ec85f" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00408-of-00512.json.gz": { + "num_bytes": 30148002, + "checksum": "dddada59e2ef306cdf83b7c9ce3c912792237852053a4ea683224438a242c5ff" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00409-of-00512.json.gz": { + "num_bytes": 29989174, + "checksum": "907667ac304b6cca7100a9606e915c003fee43f1640d5b01405beb16eac4c379" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00410-of-00512.json.gz": { + "num_bytes": 30519580, + "checksum": "acd5cd2ecc46927046c81c9bb3459dd72a98e346ebb59c13c0db08fbb60961a0" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00411-of-00512.json.gz": { + "num_bytes": 30408107, + "checksum": "6a9c2d42717f853cd4a76fc5275e95e2a584b7465c6059f586f6a06417048a42" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00412-of-00512.json.gz": { + "num_bytes": 29699198, + "checksum": "29e76bdab47496ed61a102edd3c61c20e60ab52abeb8e6068f7aa4ad1868f4fc" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00413-of-00512.json.gz": { + "num_bytes": 30065457, + "checksum": "b4a33941d0b994b82e3be351542cb4a832742e050ebbd71481e7ba34c8dcbc3b" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00414-of-00512.json.gz": { + "num_bytes": 30342960, + "checksum": "4ba7edb3c77a45f0e4cb7e969053db6f44ce8c0a8ef262582512814b1161d9ad" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00415-of-00512.json.gz": { + "num_bytes": 30201576, + "checksum": "25cb4eb4bdf3cd1b29289a23696be8bd41c5f577294e94607bea7b91252a04fd" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00416-of-00512.json.gz": { + "num_bytes": 30021170, + "checksum": "60472bd2a2896bfb57baabb583fc6cdd402a1d776f6a4c9bb58ed556e67cd76f" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00417-of-00512.json.gz": { + "num_bytes": 30237505, + "checksum": "aea8fd33c2acf1cef890549b1f88b18a2eeb37f6d4dd22b552f735811ad0b8a1" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00418-of-00512.json.gz": { + "num_bytes": 29999334, + "checksum": "93583d771ce7f0e1d044de2919a3ffdd48b7b7dab0cd3b6dc459200dd53d8762" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00419-of-00512.json.gz": { + "num_bytes": 30194801, + "checksum": "cd36e129487272742f3e60ab6512dd79b3d1ce3c22490d2e47c00c2ae595cfc6" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00420-of-00512.json.gz": { + "num_bytes": 29903898, + "checksum": "6f18a5ffc7efe5f555b02d3a31ed43714e09e73f7462206220d70450f47cd6f6" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00421-of-00512.json.gz": { + "num_bytes": 30015573, + "checksum": "cfacef2cffd953425eaf4d7b2b6cf5d2637bf5d58c6ed2bd0002442795c7d36c" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00422-of-00512.json.gz": { + "num_bytes": 29966521, + "checksum": "14f646b15948cf586ec1abd4bf4bf45bf180913e4d09049fa779bc7a196e455e" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00423-of-00512.json.gz": { + "num_bytes": 29972805, + "checksum": "ad7d4ab443c7a8122976570891a225a44ff86d2299d70706066633a6204eb0de" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00424-of-00512.json.gz": { + "num_bytes": 30317886, + "checksum": "37c8bf3b535ea4053aa2424c846e3449f9eb27d5ff999e1e93b6cee0aa975333" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00425-of-00512.json.gz": { + "num_bytes": 30059310, + "checksum": "674ca5eaf6a88f76881c8a1c48e1e0f93794785ee5ea17fb70f49228d7f39614" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00426-of-00512.json.gz": { + "num_bytes": 30182498, + "checksum": "988d08cd18162d9a309155d2e75cd4980f76ab4c73ef8286edae94ca4628ebcf" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00427-of-00512.json.gz": { + "num_bytes": 30253874, + "checksum": "aa8c08a684ea0bbfda9297aea07429172a2fa4a161268b964421796173275b35" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00428-of-00512.json.gz": { + "num_bytes": 30055421, + "checksum": "b1ed26e826bee7fcbc31cf1c368c9a63eeedbea1c2fd0fb07370b461a03d1a7f" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00429-of-00512.json.gz": { + "num_bytes": 29830674, + "checksum": "3efdc67ad7a108416dae47886e542da5c2ab1cd7e1aedd25c1c5d4e0607572f6" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00430-of-00512.json.gz": { + "num_bytes": 29938000, + "checksum": "3221ef5e4c28d44c1da4fa04689f318217991c07aff4fdee5e1091fe8e1162ac" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00431-of-00512.json.gz": { + "num_bytes": 29829687, + "checksum": "225f4e22df1b45a7dc9fef2f5a44da8f8ee25608cbe34195e21b49c8cd10f3ed" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00432-of-00512.json.gz": { + "num_bytes": 30006209, + "checksum": "9fc53637db7b16c8cf6f824adf21d4602efab715ad78eab62c4be7981a8bbc1d" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00433-of-00512.json.gz": { + "num_bytes": 30656456, + "checksum": "6bf7b701dc18f68d0facd7cdea49a26cdcfdd7829d5346eefe555485cfa7f336" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00434-of-00512.json.gz": { + "num_bytes": 30138891, + "checksum": "793532f72aa41c1dd7c549e9597fe8e73796c53eb5fe410a73de418ec446d686" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00435-of-00512.json.gz": { + "num_bytes": 30430276, + "checksum": "0d13d345ad12999fb4e7a9675e08bb1c90980fd193ed8530e4258e07bd6ea754" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00436-of-00512.json.gz": { + "num_bytes": 30173309, + "checksum": "fbce5fadb4b49bf833f77337929d873b2b25c3b564f7622f3672dde7a044e5d0" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00437-of-00512.json.gz": { + "num_bytes": 30142240, + "checksum": "76c34800a3223f5fe0f1960f3d3c9dd9ecdc2e652493d71ef245415b5027c902" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00438-of-00512.json.gz": { + "num_bytes": 29979673, + "checksum": "4784c3787d24b9d46ad7c835683c6506c2e55c84835391e2aca0355f032a1888" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00439-of-00512.json.gz": { + "num_bytes": 30169105, + "checksum": "5012d03e637769d7494bd3cef0a8dfc8b38c995e0d5780089c15d6b1495b3a8e" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00440-of-00512.json.gz": { + "num_bytes": 30107004, + "checksum": "529beaf4ad0251e35be574b1f623571526ec91a588ebd7df43e9d1cb99445f53" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00441-of-00512.json.gz": { + "num_bytes": 30324563, + "checksum": "f5e5fbf5e329f5bb0e83f758b8fc76516d65c3f91ad97e328187eaea83e4b667" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00442-of-00512.json.gz": { + "num_bytes": 30335681, + "checksum": "b8a26ed60f87a87347886b4467aa576ec5e8c106931589a1aa821b99fdabdb54" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00443-of-00512.json.gz": { + "num_bytes": 30155655, + "checksum": "e27bfb813fd6aba96ada81b095a559f0b7847cd25f7f8973663b19cdc5b8985a" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00444-of-00512.json.gz": { + "num_bytes": 30340540, + "checksum": "705dec13ba2824d45e801bc2cf3e709d6492b1ff6de2f9ddefb5a57dbdada4ca" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00445-of-00512.json.gz": { + "num_bytes": 30248960, + "checksum": "09a6b83910369cf269c4f095607fb2f0ac0ec7e25b501f577fe13920a8573ee0" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00446-of-00512.json.gz": { + "num_bytes": 30316703, + "checksum": "8f88b794c08bb492f50073337a30aafac0d05819505b507ab283dba0cf17d125" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00447-of-00512.json.gz": { + "num_bytes": 30184407, + "checksum": "38c819df823197bea6d647c3f78bcc15024aabba814cae322c1663c45fa8382e" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00448-of-00512.json.gz": { + "num_bytes": 30238484, + "checksum": "8c0abfb8dca37a179b01dadd2227206cbe6e5b916d0111c0b00d2edc3951c7f6" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00449-of-00512.json.gz": { + "num_bytes": 30143151, + "checksum": "9731e9644e5615d5d5ebdbacc6efa6382df856c8763b7485c9a5838864c1332f" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00450-of-00512.json.gz": { + "num_bytes": 30122606, + "checksum": "3b746f616f21c91277cde8e6d0d7f792ead7874de7ecdf11830a4a56db3dc799" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00451-of-00512.json.gz": { + "num_bytes": 30128179, + "checksum": "d6cadfc64ee39c9beb93f0bf8c169ca9d9053e0f76e1c9697841438e20dddef3" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00452-of-00512.json.gz": { + "num_bytes": 29979326, + "checksum": "42de19ffc3ec821fbf5ff686d1b36d189ad9ee5c4553a2ff0d003ee1a754c9c8" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00453-of-00512.json.gz": { + "num_bytes": 30118272, + "checksum": "22f9b2d3a9f089f1015f74d1ca0aca8f2a4970595326d964817177cbe6859271" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00454-of-00512.json.gz": { + "num_bytes": 30018294, + "checksum": "17c16895edccbb8b40fcc52cbafc0c15957020eb530e071dcce34544d5958bd1" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00455-of-00512.json.gz": { + "num_bytes": 30155903, + "checksum": "8b9d49837b309c3389d03dd3bbae92395bf7086134fbc69d28d9fff60a90d4a3" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00456-of-00512.json.gz": { + "num_bytes": 30282104, + "checksum": "ab63fd2efb0cc883d303241b3488a8135a196db7edc844458cfc1483898ceb3b" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00457-of-00512.json.gz": { + "num_bytes": 29920723, + "checksum": "dbde2eeef90144b209ef5afa6d5165ad638ae57d919926a379a10fccf6850a61" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00458-of-00512.json.gz": { + "num_bytes": 30163167, + "checksum": "800307106f5861e0bc246bcaae214e6dadeee849905cac184ecfe6d0b560fa68" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00459-of-00512.json.gz": { + "num_bytes": 30248893, + "checksum": "3e78d327a9463929f33311e18116f5d1d2ae4926f7a600378875ba854cf5ee47" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00460-of-00512.json.gz": { + "num_bytes": 29840067, + "checksum": "047568a5dad00b04ca1ea4aa262c7a4af9b61e87bc4ea02ffd5c6c8c049bf8a5" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00461-of-00512.json.gz": { + "num_bytes": 30179062, + "checksum": "ed8abe7b465bc19150b831632cb7afa298d6cb4beb9b6043a35a0f8afb5f730d" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00462-of-00512.json.gz": { + "num_bytes": 30266398, + "checksum": "d7b74f5c1c1f7bb489700adcfb7e48400c4fcca7669e2d56396d9fabb5a63b91" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00463-of-00512.json.gz": { + "num_bytes": 30158800, + "checksum": "224815aee29f6d04ddbc7457c84338eef9b127a767e7b50ed77283ff166d4f93" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00464-of-00512.json.gz": { + "num_bytes": 30393915, + "checksum": "0dd019fd2c19936ce2e6410b65872f630131c5da7543c8e66fa87547fd1a2209" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00465-of-00512.json.gz": { + "num_bytes": 30148939, + "checksum": "6d74dc9d74d28c2b8ba8d43ba3d594af0cb176cfa7bf738f3933be2a9c37bb85" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00466-of-00512.json.gz": { + "num_bytes": 30268228, + "checksum": "0e201327066f28c19b082fe35e4fb3bd76c8fd2d32236d1d6e2309489152aa66" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00467-of-00512.json.gz": { + "num_bytes": 30121937, + "checksum": "7352e5a9ee66dcbeed2c9e1fbe6c9355f0e5dd1b30b592a9fd5690958945e5a9" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00468-of-00512.json.gz": { + "num_bytes": 30004669, + "checksum": "53876848336ac57c082c9d5735bc1717f69ef38688b221d5e5ab9cd9cb4ec620" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00469-of-00512.json.gz": { + "num_bytes": 30049860, + "checksum": "a5a720b38f106dd5d2a2b7647748b52b4531ac12294e3b0d8dbc92062639c0c3" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00470-of-00512.json.gz": { + "num_bytes": 29961380, + "checksum": "9611764fc4f84b92e86fa6f9ea41464f6c26b07d1c51241b627a3d155e99d163" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00471-of-00512.json.gz": { + "num_bytes": 30449164, + "checksum": "db508df549d518c3e8b99b2f0098ea93fead1e632f53d8ae2cebff1d3476577c" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00472-of-00512.json.gz": { + "num_bytes": 30312620, + "checksum": "1993b5e292c6c60a3373aabe896f1a57afaad73fdce0ec60e30696368f7c0afa" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00473-of-00512.json.gz": { + "num_bytes": 30406764, + "checksum": "913045c61fb5a145379d9fe08c91ea63092b197400c0c87bfa65af91720b563c" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00474-of-00512.json.gz": { + "num_bytes": 30078563, + "checksum": "c495119e150b083d709ca915abd760683793361ebf3e079b04efc9b7e1900379" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00475-of-00512.json.gz": { + "num_bytes": 29860761, + "checksum": "50bb5f40d2e91ab136aa63063fff860529c8961f2a38500a645b10339751589e" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00476-of-00512.json.gz": { + "num_bytes": 30199778, + "checksum": "c969cfbb7ed7716f665b336b2ed9f7b10b532c7adc6d8a347964831a39cfef0e" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00477-of-00512.json.gz": { + "num_bytes": 30130742, + "checksum": "54c8b89102cf882eda5208544a6c5d317c1defa8d997f9450ebd576e58f91830" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00478-of-00512.json.gz": { + "num_bytes": 29901444, + "checksum": "f669299d794ecc0523c64ad31af8fcce5cf3f880e87fd73f4c3f434425e9b238" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00479-of-00512.json.gz": { + "num_bytes": 30587214, + "checksum": "25d0fbd9027deaf140650f0b82a2316c37939f199fe7633b9f643684404f2029" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00480-of-00512.json.gz": { + "num_bytes": 30145237, + "checksum": "68a29728290e1199ce8d1ac060365bc443ea67c24292b2b04f1b4ca44ca7238d" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00481-of-00512.json.gz": { + "num_bytes": 30204159, + "checksum": "1605034b89e33f6794c901adac1eb200bb489f76b9bae6bc56b01e9f6ab4c254" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00482-of-00512.json.gz": { + "num_bytes": 30430794, + "checksum": "2dce9df095e89ea6645fb599f518612511a62b6c475808ad004c32968b19bae8" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00483-of-00512.json.gz": { + "num_bytes": 30102412, + "checksum": "c7c626977521b0d1f5bcc02c484b3eb4f517ba71006a4802df08a0f4cfb8ea9e" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00484-of-00512.json.gz": { + "num_bytes": 30171871, + "checksum": "519ed997f1f1f1de7864b0bddf202b25e25bed349f63593a88337262d7705968" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00485-of-00512.json.gz": { + "num_bytes": 30049539, + "checksum": "8d2314fd3239ba3dfa99962c1d0a38e05edf9194e1faebae88f6b19ecab8fbf7" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00486-of-00512.json.gz": { + "num_bytes": 29949995, + "checksum": "a7521e09cbe77098c23172427bfb931dd50f0c9d58b034fd1621687849a8d379" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00487-of-00512.json.gz": { + "num_bytes": 30345072, + "checksum": "ebc6254a4d241afb886b8df20819301121fcb234a32a1dd4ee8ae49571081f92" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00488-of-00512.json.gz": { + "num_bytes": 30300622, + "checksum": "509bba28ddf770d38554a2e846f2ce0d2af59e3662a6d6ec4dddb75fb509f8d5" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00489-of-00512.json.gz": { + "num_bytes": 29949909, + "checksum": "996e61f8e674b0a016a568630ee13a7473f99a919437c225a4198d232861e628" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00490-of-00512.json.gz": { + "num_bytes": 29995429, + "checksum": "9730024ad352eb12f74ac446ed32b9c57898658954be5dd639184fc5264527cb" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00491-of-00512.json.gz": { + "num_bytes": 30293919, + "checksum": "65b2a7de3284e892441b0fe8e850d89de842355d78fa9944358b1ee5912a948f" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00492-of-00512.json.gz": { + "num_bytes": 30115831, + "checksum": "26b535c3175bb86ef721593f81d9cf006d4c3749f156c63ccd2a2c04e1201236" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00493-of-00512.json.gz": { + "num_bytes": 30187809, + "checksum": "a0918223c5523da20bd8230de1985b0a3cbb1e239af3d62a83d720a3a528c567" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00494-of-00512.json.gz": { + "num_bytes": 30149878, + "checksum": "6e9a5e329f834e41b4a8a9a6809df3243e5bffc580327912288ad7f790b43ab7" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00495-of-00512.json.gz": { + "num_bytes": 29711944, + "checksum": "3b9ba9d667e1241692ff9a654a68e98e8e94e32244a9419b2542137b63fb4705" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00496-of-00512.json.gz": { + "num_bytes": 30114815, + "checksum": "24b78cc36bb0abc67c998320e7029b6e7bbbee267a367eb538f23956c13f27a9" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00497-of-00512.json.gz": { + "num_bytes": 30048480, + "checksum": "29c3606acf298498fc3498bd769544e2879afbd0d5c46cee298cb25058694aac" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00498-of-00512.json.gz": { + "num_bytes": 29934973, + "checksum": "8afaffea92dfad745be8aa8cd3de0ee97cbcc26fbad6c71d56683aef6a27055f" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00499-of-00512.json.gz": { + "num_bytes": 29796509, + "checksum": "9cbbd8f6d8fe92207c4cb2f0422284726deca1bde7f30cb01cce7fcd4665b380" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00500-of-00512.json.gz": { + "num_bytes": 30221736, + "checksum": "902904aa9fadaecbe698402a27b4e68b00813e67b79f84d4c696cd9c72f08f55" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00501-of-00512.json.gz": { + "num_bytes": 30108320, + "checksum": "76e848f8dbc082158fc5d3a2f7c10cd6e03585667c00efc639f2c6f47d44aeb2" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00502-of-00512.json.gz": { + "num_bytes": 30381907, + "checksum": "885bbc9788235abf33728737f72f267e60d1f5d4a77493cae76f161651d89579" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00503-of-00512.json.gz": { + "num_bytes": 29983805, + "checksum": "5134934392b13e3f84dd32dcb1c59f4d5416d6dfd925bf896f3eb61881d82136" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00504-of-00512.json.gz": { + "num_bytes": 30041413, + "checksum": "4978245a7f545d676bad6edfdfe60ffdad94de47af0fb10649fa39e9b068939e" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00505-of-00512.json.gz": { + "num_bytes": 30021620, + "checksum": "64933c28ea3f608326f1c6ef56170886767f1ab4f9ecbc4bf3263c7043901fce" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00506-of-00512.json.gz": { + "num_bytes": 30260343, + "checksum": "84667dbe68ecf1f9bbdaba0e73eca6fe0444f6594a1e9a4b46e9812ae7bce7d0" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00507-of-00512.json.gz": { + "num_bytes": 30173739, + "checksum": "dd6d44e4f344f3ab1cd61bacced7b5f1429cf6823fc9282452a539012bda028a" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00508-of-00512.json.gz": { + "num_bytes": 29903443, + "checksum": "4afc46096ac2697867c3a75896c5ceb36617c4c21a749dded58a1ea4565e41df" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00509-of-00512.json.gz": { + "num_bytes": 29862664, + "checksum": "74a720dc16b389e8122d61aa94bc12a5bc4253ca6f39679781c938e2eb556878" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00510-of-00512.json.gz": { + "num_bytes": 29744368, + "checksum": "6a302049e7a1668c5fb2e4b5afca518fa53ba1a9dc717015ecb5768e85ec4139" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00511-of-00512.json.gz": { + "num_bytes": 29896714, + "checksum": "48b89e909c0e33fd59c9623f8517cdfa90fa35a4641f999c6f68e1cc9f2a309f" + }, + "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-validation.00000-of-00001.json.gz": { + "num_bytes": 15284943, + "checksum": "42ac859dc1c4d48d165ec602909403e2066ce1d4854149ed70b9ec9cc96dc65f" + } + }, + "download_size": 15435025687, + "post_processing_size": null, + "dataset_size": 76369191765, + "size_in_bytes": 91804217452 + } +} \ No newline at end of file From 7923d9f6eb8b8df7208a330195218b8fd3d28295 Mon Sep 17 00:00:00 2001 From: Quentin Lhoest Date: Thu, 1 Jul 2021 15:01:35 +0200 Subject: [PATCH 09/19] infos --- datasets/c4/dataset_infos.json | 10470 +------------------------------ 1 file changed, 1 insertion(+), 10469 deletions(-) diff --git a/datasets/c4/dataset_infos.json b/datasets/c4/dataset_infos.json index 86514075daa..60e8bdac218 100644 --- a/datasets/c4/dataset_infos.json +++ b/datasets/c4/dataset_infos.json @@ -1,10469 +1 @@ -{ - "en": { - "description": "A colossal, cleaned version of Common Crawl's web crawl corpus.\n\nBased on Common Crawl dataset: \"https://commoncrawl.org\".\n\nThis is the processed version of Google's C4 dataset by AllenAI.\n\n", - "citation": "\n@article{2019t5,\n author = {Colin Raffel and Noam Shazeer and Adam Roberts and Katherine Lee and Sharan Narang and Michael Matena and Yanqi Zhou and Wei Li and Peter J. Liu},\n title = {Exploring the Limits of Transfer Learning with a Unified Text-to-Text Transformer},\n journal = {arXiv e-prints},\n year = {2019},\n archivePrefix = {arXiv},\n eprint = {1910.10683},\n}\n", - "homepage": "https://github.com/allenai/allennlp/discussions/5056", - "license": "", - "features": { - "text": { - "dtype": "string", - "id": null, - "_type": "Value" - }, - "timestamp": { - "dtype": "string", - "id": null, - "_type": "Value" - }, - "url": { - "dtype": "string", - "id": null, - "_type": "Value" - } - }, - "post_processed": null, - "supervised_keys": null, - "task_templates": null, - "builder_name": "c4", - "config_name": "en", - "version": { - "version_str": "0.0.0", - "description": null, - "major": 0, - "minor": 0, - "patch": 0 - }, - "splits": { - "train": { - "name": "train", - "num_bytes": 828589180707, - "num_examples": 364868892, - "dataset_name": "c4" - }, - "validation": { - "name": "validation", - "num_bytes": 825767266, - "num_examples": 364608, - "dataset_name": "c4" - } - }, - "download_checksums": { - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00000-of-01024.json.gz": { - "num_bytes": 319308785, - "checksum": "8ef8d75b0e045dec4aa5123a671b4564466b0707086a7ed1ba8721626dfffbc9" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00001-of-01024.json.gz": { - "num_bytes": 318039285, - "checksum": "b945059cd1a343cabe311881b7840a6f0363f570e745a0eff0e687e266f6b55d" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00002-of-01024.json.gz": { - "num_bytes": 319748667, - "checksum": "2967dc7e587ced6ecb9ba617ad2d4c44901467969de5bf5b0f5a9e5b70555d75" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00003-of-01024.json.gz": { - "num_bytes": 318564193, - "checksum": "b79d9abef5741578929be0d59db9ca652a8276207ef18a944b7a5f11fef5beb6" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00004-of-01024.json.gz": { - "num_bytes": 318579884, - "checksum": "cd9f98eac2bc6062f55d9a36bd744cc924a78ea2fd998830e0034e4456f5d014" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00005-of-01024.json.gz": { - "num_bytes": 318003681, - "checksum": "8ac5907a54dbc7ab9c14624448c7c3f6afed33af9d0a855f1eae955e62e255b9" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00006-of-01024.json.gz": { - "num_bytes": 318495137, - "checksum": "8fd9b9a4b74c9414466b245ebda7db041e7bd8603971de51b5db782bd758aac7" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00007-of-01024.json.gz": { - "num_bytes": 318417273, - "checksum": "41dd377a1ba6b72eab0260c39c626fe45ab6b649d42d57b311d3ba21a0337cd0" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00008-of-01024.json.gz": { - "num_bytes": 318131845, - "checksum": "64da652c235f089a0b52f6db5883ef5f1e9c31edc4c950332b34dd12439c99a5" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00009-of-01024.json.gz": { - "num_bytes": 318185592, - "checksum": "807a548efbb10153c9eff0df5733a97a1b51ab1743242530de1b02a8ea17ace7" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00010-of-01024.json.gz": { - "num_bytes": 319045292, - "checksum": "3bd0f6f664069c3bd964ce48ceae60ba47b55b54745a4b00c207bdb3a1926b17" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00011-of-01024.json.gz": { - "num_bytes": 319686980, - "checksum": "5baa0c010083459ba58e34b4e93bb758caa878f7db6fba0528921329fa1a6cc5" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00012-of-01024.json.gz": { - "num_bytes": 320119088, - "checksum": "fdee7442c06856e2c4b7665cc51978e9011b5e0a2112c30dd15bc9e53818842d" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00013-of-01024.json.gz": { - "num_bytes": 319474856, - "checksum": "a4ab3b24087781c3577945492525696e182ffd7ca5265b958f49803a02867ecf" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00014-of-01024.json.gz": { - "num_bytes": 319693210, - "checksum": "62215b2451e71b117018ef73570c944aff890624b384c538950b64c37f184c49" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00015-of-01024.json.gz": { - "num_bytes": 318427305, - "checksum": "9893c9f413a1223e7b535527829bcd6df3219929fb1abf8f2a114dd8f6ea0919" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00016-of-01024.json.gz": { - "num_bytes": 318785714, - "checksum": "bd0ade8b8a57348952ca31c39efdab538f54c852941a225ccd13d0a7170724e3" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00017-of-01024.json.gz": { - "num_bytes": 320134331, - "checksum": "4132cfff3f5126d9e783191a5ccc34e5d85938bebf0b8489657805277a227202" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00018-of-01024.json.gz": { - "num_bytes": 318653930, - "checksum": "4675ab1d77da3d676d9743dca15bfce8478498f7738f79816a25ed790d28fa46" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00019-of-01024.json.gz": { - "num_bytes": 319468974, - "checksum": "1d2f3a6aeb0f6c159295f283d302794cd3eb944cff3fe68691997bb2dc4c7780" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00020-of-01024.json.gz": { - "num_bytes": 319109754, - "checksum": "b5f26d832a0ec9b0489a27169d94496f5ea33c7fb046868c565c7b5a2407221b" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00021-of-01024.json.gz": { - "num_bytes": 318514423, - "checksum": "428da5a8d4585de16f6b3f30865a5ca7a8d1ddcd3b6002dcc1283368b0c3d60a" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00022-of-01024.json.gz": { - "num_bytes": 318715623, - "checksum": "9bc4812ba5e08c0b2d83cd3804129ba3d77cf84ba3d8828159788ee02e155a51" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00023-of-01024.json.gz": { - "num_bytes": 319874293, - "checksum": "38843ab4f5c60ed2b9ec0cdc65074eaca454014d5702edd809a266190689d2c3" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00024-of-01024.json.gz": { - "num_bytes": 318105764, - "checksum": "4fa0c7ec94445ea57dcecda7864b1346275e711c9820c2c39dbb9fdb95c97674" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00025-of-01024.json.gz": { - "num_bytes": 319122521, - "checksum": "0758514fa2e2c133c995c00d5f4abfc14b66582a4eedd0e721bdd95c4632a755" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00026-of-01024.json.gz": { - "num_bytes": 318116783, - "checksum": "56a73b9a556d6794d9c706e1b1c7e729fa13b711ddc25dd403b110eb5ed857f1" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00027-of-01024.json.gz": { - "num_bytes": 320171191, - "checksum": "fea1eabb734cda33d72f3d959234a240080b4fd42cc70494814a8429b087f9e1" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00028-of-01024.json.gz": { - "num_bytes": 319047090, - "checksum": "47d1c385952d6c18c431a7294339a030c213b8832f970ac987965b621c8181a1" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00029-of-01024.json.gz": { - "num_bytes": 318705639, - "checksum": "3c744d3dd915ceef3a93fd18c3ff5b117fb5118d1ced2089979b6cafc81c4525" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00030-of-01024.json.gz": { - "num_bytes": 318327902, - "checksum": "7f6959020242fdc841adfc10c102bbe79e2ef8502a09dac8451e0cec6f2add16" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00031-of-01024.json.gz": { - "num_bytes": 318990600, - "checksum": "e56f29011594c765192c34298558e7227a829313196748f9a16ec34ecdb76d23" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00032-of-01024.json.gz": { - "num_bytes": 320451482, - "checksum": "9ea843dfd85e449439f3106d657762daff8f326730fefb342455c43cb48144e3" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00033-of-01024.json.gz": { - "num_bytes": 319878207, - "checksum": "2633cdb7b058f126173608897f69add614659b0b21cf54ecc8a2f4a79bc16073" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00034-of-01024.json.gz": { - "num_bytes": 318701510, - "checksum": "853c4b9ff2d79621ed27a6be826dae198af609d9f9dbd1c2773b778241cf6137" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00035-of-01024.json.gz": { - "num_bytes": 318529104, - "checksum": "fb50dac3f35cb71472464f511e6b8aee72ded10b3b6896d0d1f74a18ded2b8d3" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00036-of-01024.json.gz": { - "num_bytes": 318849657, - "checksum": "5cef5cfd50cfafd58feb452b85324a3d8198fca48789f0ce69227755e72d8e53" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00037-of-01024.json.gz": { - "num_bytes": 319621215, - "checksum": "f0b67abf30e2d58d291aa9bcc9c8a03668afe819549802e4e591a261c171d970" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00038-of-01024.json.gz": { - "num_bytes": 318135467, - "checksum": "991bad578a83294d34a1b11649af07339aa8cb26d49330afa9fcbca0b87942c6" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00039-of-01024.json.gz": { - "num_bytes": 320131759, - "checksum": "abbbc21f81555e94484e6afe1975e13f67af19a820cd6f8d090c987a250bd4fd" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00040-of-01024.json.gz": { - "num_bytes": 320214476, - "checksum": "48020d2656709899abd2572b3424c0455df3c1089a69fe26b776aeb24f0da0ec" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00041-of-01024.json.gz": { - "num_bytes": 319581259, - "checksum": "db6fb8db7162ac87ea002c153ef0c54322f24c8f7ec263cfa290ac8c3683b194" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00042-of-01024.json.gz": { - "num_bytes": 318100985, - "checksum": "d499cba2383b16bb0f26b98416211eabf2599641ecd6708a5ef487692ca9e791" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00043-of-01024.json.gz": { - "num_bytes": 317803029, - "checksum": "dc6f1ccc3fcce79b16c5157f7125942e351d74744efc593f8372f8a408720340" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00044-of-01024.json.gz": { - "num_bytes": 318837063, - "checksum": "6170fced793461bd687640a658a085d02f971c2e609f6ff33b90df944fb56409" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00045-of-01024.json.gz": { - "num_bytes": 319659188, - "checksum": "b2f79e8600815578ec326cfc6c5242c2827cedbfac51772fdcf15ef5d027aa38" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00046-of-01024.json.gz": { - "num_bytes": 318771753, - "checksum": "e4b4a3e53ee66c280a5e7ee33602ea0e910903748db8c2adbbec4b48bab1580e" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00047-of-01024.json.gz": { - "num_bytes": 318088661, - "checksum": "bf8597fc359d8e9c721fd1d98b8ff3db5c011afd0fec9640670f31c7a7dddb79" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00048-of-01024.json.gz": { - "num_bytes": 317777133, - "checksum": "369db8e9646b8229a23044a7257c2face97b8e05738f0413b581892876f268e1" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00049-of-01024.json.gz": { - "num_bytes": 319329891, - "checksum": "5cb2aa0432984b355b0ec6aad92f926b2fb75aea2a0e08b97f4c6a62838e6cc8" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00050-of-01024.json.gz": { - "num_bytes": 318172322, - "checksum": "11a7cc48539ac97eaec87beacef9d9bbb71fc875a0bff0c9ff096044bff46a44" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00051-of-01024.json.gz": { - "num_bytes": 318704544, - "checksum": "ac2beee992c2b1ae8b1f162054e843e2b971bbd7cec45a0a7a7b7795fcdc7c26" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00052-of-01024.json.gz": { - "num_bytes": 320806303, - "checksum": "3a591fe9993c3d98a9e7949e98ca215ce164cd313fe53f3ce762c91b5fec7c53" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00053-of-01024.json.gz": { - "num_bytes": 320565764, - "checksum": "60e67c8e6f3bfdf8b490ecfe62c79a13c5d04d393fbac712a6cda49fd78e883b" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00054-of-01024.json.gz": { - "num_bytes": 320425170, - "checksum": "d69305c853e9e516f5fd4e2a9afb1939d829925f71102d8aa09387ded5d000df" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00055-of-01024.json.gz": { - "num_bytes": 318713224, - "checksum": "e01737df8097a1526d6c31d37d7aeb1b92c0a7253b39f6964fcc897bf0eba9fd" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00056-of-01024.json.gz": { - "num_bytes": 319441227, - "checksum": "fe516c8c0a9e59f9f035ac5fdd13e973d25dd6635eee05d648740d3e8c1fc742" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00057-of-01024.json.gz": { - "num_bytes": 319821142, - "checksum": "7e058ed9072e968e9c8b92f9b50dab318515873cca6c617b544dacab5a2f018e" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00058-of-01024.json.gz": { - "num_bytes": 318643105, - "checksum": "3479dc5a5b111b7f45f87e5a91c433907af97dbe15b9db1637bad666dcbdec40" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00059-of-01024.json.gz": { - "num_bytes": 318053548, - "checksum": "8208b0943f59b5914fa13d29108ede31a8d8d34bc6d603a2278ab8b80d28b1d0" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00060-of-01024.json.gz": { - "num_bytes": 317935826, - "checksum": "71324b62706aabd6faee682205cdedcd10dad289579b534d0e53f8d9b92bf2c0" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00061-of-01024.json.gz": { - "num_bytes": 318870698, - "checksum": "cdf0abc5804f0991871de48b249e30b666cb96f2254762a570c39904c5780f8e" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00062-of-01024.json.gz": { - "num_bytes": 318945246, - "checksum": "5ac676e16108446bd2980f9601c787eb754811a68e92ab6403c333820a6b9622" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00063-of-01024.json.gz": { - "num_bytes": 318827790, - "checksum": "a26f7cfe123cfdf3db7687996d0163212e70ff7635872b0754c03cbd5c31213a" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00064-of-01024.json.gz": { - "num_bytes": 318914155, - "checksum": "858a145617a5902ab02bc77e47ee2f036a6211384c4f2285767c7558eb93e245" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00065-of-01024.json.gz": { - "num_bytes": 319794084, - "checksum": "52742215df5aaca43bed5405a397571efe7c22107ee2caa8c05e3ed229796efa" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00066-of-01024.json.gz": { - "num_bytes": 320294453, - "checksum": "5b11cd54de0e95a75e53e4e32f72912cb01053d3fb609de6b7a45afafab414d0" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00067-of-01024.json.gz": { - "num_bytes": 319468309, - "checksum": "4c6c69b3eba9bcd6786d7dce893340f2d7093012ead04f3539352beccd2794ef" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00068-of-01024.json.gz": { - "num_bytes": 318800742, - "checksum": "ce94afc3c612e9de423a412147505ad7757216100becba2677bf5eaf443c4b6f" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00069-of-01024.json.gz": { - "num_bytes": 319416585, - "checksum": "ff3084a3e5a3960425a5c605274684c42fa638f99045527f77e74d165e52b6ea" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00070-of-01024.json.gz": { - "num_bytes": 319165846, - "checksum": "04c368b05f0ea42b3a51ed9bc0e817894f205c0ecd74084da015158d509ff2a3" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00071-of-01024.json.gz": { - "num_bytes": 318017381, - "checksum": "e8320e9982fa377b07c5b3e8a4451ac143b05ab7a4a03f748034b37fb998bfb0" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00072-of-01024.json.gz": { - "num_bytes": 318874499, - "checksum": "920f8d5ef2cae6bdbd52f724d0952e04146ff29f4aaec4dbf10bef7b66a98f40" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00073-of-01024.json.gz": { - "num_bytes": 317890112, - "checksum": "06a41bdb7bf0d52e2fe8e71f594de8d36d77880639ffdfb41e883237f76e8a0f" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00074-of-01024.json.gz": { - "num_bytes": 319201956, - "checksum": "e0267d6782d30f1619a82c49c20be1c8b5424e653c093e4652a5c8ed117c6533" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00075-of-01024.json.gz": { - "num_bytes": 320575937, - "checksum": "42108758abc3c3197e7dca8293eed3800f3e79ceae80d3208d90c7a9fd205594" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00076-of-01024.json.gz": { - "num_bytes": 320070510, - "checksum": "c904b6e6041e23edeb1d88b7b69f07a339b7ff9835d0c22e0b6c354519369842" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00077-of-01024.json.gz": { - "num_bytes": 319042024, - "checksum": "1eb2b70ad4d12b7587eeb1ce86477817ad992c08fecafe5ccafc26af6b5657f7" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00078-of-01024.json.gz": { - "num_bytes": 319997520, - "checksum": "070370654960e02f766c10321546b280e9933531b796c252a94999d645f360b2" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00079-of-01024.json.gz": { - "num_bytes": 320736487, - "checksum": "3aa4f007660706563030b590cef9be992c18ba7ec1876210bc92665ec42c4be2" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00080-of-01024.json.gz": { - "num_bytes": 320082337, - "checksum": "3b54eaf407bb593c2b16df99690446f26497530d21cf433a7d525e0eaebe9c3f" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00081-of-01024.json.gz": { - "num_bytes": 318008114, - "checksum": "d01975cdbd4360331b1a0f55e9b7e731d7d9fc70c7cdd0f33f1c772eff7aa03b" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00082-of-01024.json.gz": { - "num_bytes": 317829809, - "checksum": "2a65dd37027fae03819ea5a5f6c3b16d921706ad758442881dc1d15b08bc5048" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00083-of-01024.json.gz": { - "num_bytes": 319265318, - "checksum": "e14cf18c687f7eb304df6abef7235e263a5736c799d742524205dead2abfb043" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00084-of-01024.json.gz": { - "num_bytes": 319166958, - "checksum": "1dc3fa8702a4477e3a3128440b68d4cc17e6d2ce7f3c53da28d50a57b8332020" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00085-of-01024.json.gz": { - "num_bytes": 320338078, - "checksum": "0222db7b1ae14c9b10aacdb05d055d1432b6d035e3937df5640facd242c52aea" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00086-of-01024.json.gz": { - "num_bytes": 318941314, - "checksum": "55ddf7a27dc91bf8d932a5efec4aa458122ee337f2cb050e2c4b0ae8e770f3a9" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00087-of-01024.json.gz": { - "num_bytes": 319218368, - "checksum": "c61552d76bedbfa750c599a674d6732fb224c8a1e6c6583fca7ccabb20532920" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00088-of-01024.json.gz": { - "num_bytes": 318974308, - "checksum": "693fae3d50068ec39ad27a14335372c3e1530138cc65931edac5268dd62b7e96" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00089-of-01024.json.gz": { - "num_bytes": 318781044, - "checksum": "2d90b9318432a2313dfaec542c8b91431505035cca7416a63e3197ab26ad6e75" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00090-of-01024.json.gz": { - "num_bytes": 318569651, - "checksum": "ee674beda8ed39395e69c899f666990c5190dfad5494867e51fa727e4d38d86a" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00091-of-01024.json.gz": { - "num_bytes": 319683433, - "checksum": "add2489350310ce500dde6637518c747c156f95f079a34367842bf875a8fdf5b" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00092-of-01024.json.gz": { - "num_bytes": 318734793, - "checksum": "5cfd4f25e9effaa2f7381bfcf49f9263e10619811aeaa32a77d3fdfc13517006" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00093-of-01024.json.gz": { - "num_bytes": 319161014, - "checksum": "bed8774909bba5ac656ebaad6e5cacca9e5ea12c80a41fd5689e6798c74f3c89" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00094-of-01024.json.gz": { - "num_bytes": 320143246, - "checksum": "96abe370925f6962b4e75da530b5234eec21fab820d6cb02ae59b6070ab63859" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00095-of-01024.json.gz": { - "num_bytes": 319707377, - "checksum": "37b68cd632e8f86f364fd61c9581f48ad7602122b7f33c55103ac5bd727f015d" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00096-of-01024.json.gz": { - "num_bytes": 320159279, - "checksum": "fb93c7467f0361c1d4b186d5e25f4bce4f237adb33b4e0ef56f57831b4f97f81" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00097-of-01024.json.gz": { - "num_bytes": 319841818, - "checksum": "7f4d4a9536e37a0c2b9a1806fcb472784ff4d3840aa57e9603e74233b877fbac" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00098-of-01024.json.gz": { - "num_bytes": 321001731, - "checksum": "239b9fefebe3815c8d785bd48086013d1a6dcd76c142786502c674d2d874fb11" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00099-of-01024.json.gz": { - "num_bytes": 319475885, - "checksum": "0a610d25a547839b8b6dfc2fd964e3ca64b23f0edc52d311c89dcb5e8a44a2c5" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00100-of-01024.json.gz": { - "num_bytes": 319515329, - "checksum": "f24d17cbd27296a15f51b9edc713c74a6997bbe82267403fdb6282404c2f4e6d" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00101-of-01024.json.gz": { - "num_bytes": 318803422, - "checksum": "54b8b0c72ffa325abce3dd15bdcd0856b5594500c37f4bc6a6327721ba91e4bc" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00102-of-01024.json.gz": { - "num_bytes": 320934688, - "checksum": "24b99b4afa3b631a718a487d679026c91e2c936132df01df969e3173b49e091f" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00103-of-01024.json.gz": { - "num_bytes": 319835920, - "checksum": "a2c68654ba81fa55bc24beb4319c8905f7b532fcb6793a6a311344d4f98a82b9" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00104-of-01024.json.gz": { - "num_bytes": 319402378, - "checksum": "27764d82793e35b8a7be3a3fb0470d018243a89283b5501c0b76056de1879389" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00105-of-01024.json.gz": { - "num_bytes": 320100928, - "checksum": "3bb2499337ebe52b63a5f20ec6ca6283971937962439699bd5e483cf80fed02a" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00106-of-01024.json.gz": { - "num_bytes": 318707110, - "checksum": "83510312aa188431a8dda8746903d70cfc7ffdf5437e44c1f74b7670b78bd52b" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00107-of-01024.json.gz": { - "num_bytes": 319904239, - "checksum": "40d42c39dea8e4898efba1886aa3be67742501f7a51d5bc635b03a2c6c2bd63e" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00108-of-01024.json.gz": { - "num_bytes": 320050265, - "checksum": "88ce3ddae88e8024e76614a1b701c157f66fe39c6f0852a4869c5063876f6e87" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00109-of-01024.json.gz": { - "num_bytes": 318053254, - "checksum": "865a124b663037f36a5738f25c82f8bea2ab54d4bbf8255ca0d1d00d76f8b250" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00110-of-01024.json.gz": { - "num_bytes": 319794699, - "checksum": "b17e210c8ceef98219ee12eba5dddd2001ded0d417c93955743c238360d96e76" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00111-of-01024.json.gz": { - "num_bytes": 318761540, - "checksum": "05be318a057bb33bf9d7faca58569cdb0880fe8eeb0fc3f57f5999d5f2af55fd" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00112-of-01024.json.gz": { - "num_bytes": 319121509, - "checksum": "858dce8e43b06a0c1e26ab3e4f109814b6cc50c6b0e4d146ec79fda001ad471d" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00113-of-01024.json.gz": { - "num_bytes": 317916736, - "checksum": "2e3968e48cb15a3326457d5a6ad49838d20d38c8138c529eee51f94e6bf269e4" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00114-of-01024.json.gz": { - "num_bytes": 319319540, - "checksum": "b72dc8207d93848f4fcb265b3e618d0eb8649445f7b9187c5165f4adec3e0708" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00115-of-01024.json.gz": { - "num_bytes": 318863372, - "checksum": "85ef0bf3cb12bc2fede4158853ed2259dff5d25adf99b43e8c35d7e0b9d4fdd3" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00116-of-01024.json.gz": { - "num_bytes": 318898370, - "checksum": "a0c82c8b48e086be7396338cdda0fed52e8c4753f04fd086b9472c1bedfb150c" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00117-of-01024.json.gz": { - "num_bytes": 318153138, - "checksum": "531d5d03fd8099806d92fbff2a48a0d68dcf46325e732e698e9c142902d152f5" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00118-of-01024.json.gz": { - "num_bytes": 318966511, - "checksum": "24b1c5ebbd07d50043be0d5d5c5427e042bdc53280825260226a2823e9b7546b" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00119-of-01024.json.gz": { - "num_bytes": 318733748, - "checksum": "ce1fb1192b770e625430798aee94c93bd748ed474ff815a7f95cadebb826161a" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00120-of-01024.json.gz": { - "num_bytes": 319672996, - "checksum": "4c2a6874921ac4a626a9c8ac4c6e91dae58f1f5b52e79124b3abf254b7433119" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00121-of-01024.json.gz": { - "num_bytes": 318779046, - "checksum": "029d3ab92f3e1724e3708790148e63b4c211d2ddfd04e3d194b24145e97c922a" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00122-of-01024.json.gz": { - "num_bytes": 320861175, - "checksum": "4bb595140e5cf92147f99b58d236634ddfafbc0b160b4c88b337255482611ced" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00123-of-01024.json.gz": { - "num_bytes": 318338141, - "checksum": "d508261be287fa3d27e5f44524e22870269054213b61011ee8a6728a77910cc0" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00124-of-01024.json.gz": { - "num_bytes": 317655056, - "checksum": "7612cb9fdd9f4b3a4f8958087ace120d4a73cf26bd16289bb20fc871f5744f2c" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00125-of-01024.json.gz": { - "num_bytes": 317524610, - "checksum": "049ebe4971811bb1fdcfd10cc264b2074b3ace18536340644e718dcc3cf3affb" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00126-of-01024.json.gz": { - "num_bytes": 317902192, - "checksum": "d97bddf003b8f647c587fe9a9a9aed75ea604478e0b550d501ad7f07b6061b86" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00127-of-01024.json.gz": { - "num_bytes": 319243191, - "checksum": "6da4c882f88816a452af54ed217f84d6e4601c11a8e33bd47c49c0a1ea04f49a" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00128-of-01024.json.gz": { - "num_bytes": 318045852, - "checksum": "ea43f63e6ef3bb5723ce75bb51f7183a525d8ccb00c93f49aaf2d9b560f7bdbb" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00129-of-01024.json.gz": { - "num_bytes": 318436174, - "checksum": "72ceb525367d6e8d1c0fca94d99d4fe5353ead08a5d52bf00e30e3b596fa90a2" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00130-of-01024.json.gz": { - "num_bytes": 319017217, - "checksum": "92f1b2687bee78441eeb4e05bbec2a491469b23c3aad0d951fbbe35a3c27998a" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00131-of-01024.json.gz": { - "num_bytes": 319237739, - "checksum": "0fd07585a82b7d71ddabbc315195c84e2fa78a8319de7dea971cfcc9b38707b7" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00132-of-01024.json.gz": { - "num_bytes": 318123742, - "checksum": "c9f5604ca28ea2a9ae5267db50f6e3d1e576841abe840134b3817f370c057073" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00133-of-01024.json.gz": { - "num_bytes": 319009751, - "checksum": "7ec982de577e0eeff57dc60346ce35a7b35b3c4f037987316cfc071b0ed58a87" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00134-of-01024.json.gz": { - "num_bytes": 319750057, - "checksum": "2619d265d76d82f6b84e2686371e5b6d6c08058cbd5765dd2906af9f549af092" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00135-of-01024.json.gz": { - "num_bytes": 319068231, - "checksum": "5e1bf5b09f2cd132a7747116442d6f26ce0002eaeb9f56fb02bc00e3abee8716" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00136-of-01024.json.gz": { - "num_bytes": 317800994, - "checksum": "80ebbf64fbd91215da553e3a8d9442380cee6c3b09fbbf8353a0817993d15862" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00137-of-01024.json.gz": { - "num_bytes": 318954070, - "checksum": "3b5d2ccafe526a19c52ac0fee50109b6a95ac3c8f7f2272a9a0302c4219e82f7" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00138-of-01024.json.gz": { - "num_bytes": 318452853, - "checksum": "2dd88569a62003383a3bf70d68143f16f234535469bdc8ab01a8764f6babb5fb" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00139-of-01024.json.gz": { - "num_bytes": 320013821, - "checksum": "f32ca62f6a9d2c8a72901e6f2c08880c2d1907f52beb4e8fdc30f4c02c7ad10b" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00140-of-01024.json.gz": { - "num_bytes": 319510423, - "checksum": "7799838d8019d7cd71a505951f155bdfb862b4a3b3b77e182c706a624617169d" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00141-of-01024.json.gz": { - "num_bytes": 318339814, - "checksum": "1601f6dbcbf4e7f1db119b232e862f3c9fe29e9abe5827177458079299ed511e" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00142-of-01024.json.gz": { - "num_bytes": 318438444, - "checksum": "71d891be156e1b608733a3abe8f8dab7a6213c02931117b99889bc3fe8329d38" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00143-of-01024.json.gz": { - "num_bytes": 319413540, - "checksum": "88fb2e7c3d426a6bb5775041658c07005a469306af0d97df7d68f148b64cbfe8" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00144-of-01024.json.gz": { - "num_bytes": 319901095, - "checksum": "2734ff57f4265653b0b1f292f513017ba791c3091cf8ac0bbf6d75d0074e3386" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00145-of-01024.json.gz": { - "num_bytes": 318500183, - "checksum": "da2e6747f7230af5941c6bee262a606b4f7792da359dbf7516d82d8301cdf90f" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00146-of-01024.json.gz": { - "num_bytes": 319315120, - "checksum": "6daac97153d51addc8b1e43b686e3d641666df3a106270a141d734079db2ad35" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00147-of-01024.json.gz": { - "num_bytes": 320621434, - "checksum": "fb2584e0ce366ad30c8110591484b84798e9f06e8a27cd864e7800b8d5e2d225" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00148-of-01024.json.gz": { - "num_bytes": 318269045, - "checksum": "1c963c0ceb6cd776822352b186ae7e3d829ef334efcba0fbdd9182dde4deed05" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00149-of-01024.json.gz": { - "num_bytes": 318576426, - "checksum": "6a21397e0104c7fe0fcd9f1d43a8e546000596d896a95eb9b6c4ab92235e6a49" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00150-of-01024.json.gz": { - "num_bytes": 318447048, - "checksum": "075b113a73e6e21d7cac49391ee559ee8aaa2bb3338f709017077a4007a7bbb5" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00151-of-01024.json.gz": { - "num_bytes": 315388730, - "checksum": "bd47e3ac0209676d8a32490eb20ca8c07ca3c45c2beb88dae18b5c8d925f349a" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00152-of-01024.json.gz": { - "num_bytes": 319701880, - "checksum": "241d9cf003f49d95168ebdeccd8209230507d4dfd0d170fa1b57d2355240a95d" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00153-of-01024.json.gz": { - "num_bytes": 318370254, - "checksum": "3aa86900a749224dfed8a67960c166e43c3b9ef3ac7b49d28129b496c7193e30" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00154-of-01024.json.gz": { - "num_bytes": 320064875, - "checksum": "3160c723cea6717fa9f5a9eb627d76107040d084a64106973099fa0e8de48758" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00155-of-01024.json.gz": { - "num_bytes": 318089754, - "checksum": "5b6e76a85bb1093eaba698864a54a938329b04494f9f72c3c3bbb155174da5e4" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00156-of-01024.json.gz": { - "num_bytes": 320049467, - "checksum": "cc013e8aa7c1cf7fc28ebecc64d893d03b092a09d725b5e626851de0b311c814" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00157-of-01024.json.gz": { - "num_bytes": 319931950, - "checksum": "2a27b4c29455bcd813a84aa3a54100d16cb6bfed25171aa3c552ea452ae569e2" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00158-of-01024.json.gz": { - "num_bytes": 319963615, - "checksum": "e477f769ea1513cf607932a29d793fdf1722cdea757e00c814dad594329cfac7" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00159-of-01024.json.gz": { - "num_bytes": 319000491, - "checksum": "ff5d09415753c2aa4b51196e8f4bd6c77ba100ab281314aede118f501565cea2" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00160-of-01024.json.gz": { - "num_bytes": 319069618, - "checksum": "e08c35aef8a20dccad80f6bb1579d6d2ce80113c8bf8459730c69fb7048c3cc9" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00161-of-01024.json.gz": { - "num_bytes": 318750642, - "checksum": "13eef84873b58e29894f9bf68a4de72a530c1bfc80a5654262fe71420292b8ad" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00162-of-01024.json.gz": { - "num_bytes": 319847814, - "checksum": "a8579c6bcc906fe018881a8474724576c3d0f7f1787f1568b79e5accbd9f962c" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00163-of-01024.json.gz": { - "num_bytes": 320370365, - "checksum": "b97a74837ab9f659c13dcb4deb53c600584beb9e5ceed29e99974c4953f644c9" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00164-of-01024.json.gz": { - "num_bytes": 319894618, - "checksum": "9b63afffa2b84c91b749991ddb384399f1d408bd7b6b643e7329e49531ce9a53" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00165-of-01024.json.gz": { - "num_bytes": 320166197, - "checksum": "5b2414477dc4e2b080b34f3b98672bfe3de6028e7ad83c323a7dd1ee08c05a0b" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00166-of-01024.json.gz": { - "num_bytes": 319612575, - "checksum": "2cda682db53000c14fcb5d251bae4f50c8c4159348f8594c3ef020260f277a99" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00167-of-01024.json.gz": { - "num_bytes": 319183884, - "checksum": "5c406d7a8a404436039fde7c2019f0174ff8855caff319fa62bb7960d341b41a" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00168-of-01024.json.gz": { - "num_bytes": 319396348, - "checksum": "df6a422d57a2e1443d10d61b13ab2c5227734195c82b43e1ead2db723cdea293" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00169-of-01024.json.gz": { - "num_bytes": 319452933, - "checksum": "81c81138e7163072e3779dd10ea8af7dff12b705fa008665298e08cfc2699f03" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00170-of-01024.json.gz": { - "num_bytes": 317748609, - "checksum": "6586ae8862b8ac925f424afb6ba779e95a147323fb83fc8c4bb0813877b17718" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00171-of-01024.json.gz": { - "num_bytes": 319052376, - "checksum": "8b3cd21d8ffbe963ce935ef9e0b6efc45f4d5abab703fdfed19a1309b700dca8" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00172-of-01024.json.gz": { - "num_bytes": 319068859, - "checksum": "a42f5f5a10bfc84d51dd0855166959462faccd6a182af4c5d2115ff9995f5324" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00173-of-01024.json.gz": { - "num_bytes": 319142377, - "checksum": "e26514c5d6cea27c0cf7fcc1daadfa6f218ef9e62039c6d6fccfc31660c0c96f" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00174-of-01024.json.gz": { - "num_bytes": 319134484, - "checksum": "75349aa8c734ed894965500eab2fdf59657a63e40e5a53e822ef1e5a12838a02" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00175-of-01024.json.gz": { - "num_bytes": 318330467, - "checksum": "a3d0d14b28a5a3cc559d6d89e2ec09e49e92aa189e44e68dbb4ea47978e1eca1" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00176-of-01024.json.gz": { - "num_bytes": 318584643, - "checksum": "dd68b42e5bfc656b71fe5701bacb929edae84055131f1dd65bbf3f3ad734e57d" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00177-of-01024.json.gz": { - "num_bytes": 319275087, - "checksum": "05a8ff159006241cf938ef27b292f65906158ac25ac28919aa6761eaa634052f" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00178-of-01024.json.gz": { - "num_bytes": 318490550, - "checksum": "a3aa38083c85baada29b207240bcca1a0d562a93971b420428d039092e58bd31" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00179-of-01024.json.gz": { - "num_bytes": 319083249, - "checksum": "12858fecd1dec728eba2c8c4311b17e4f2ac1fdb27c23e9adcd9258c5c4fc777" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00180-of-01024.json.gz": { - "num_bytes": 319752094, - "checksum": "67e968cb8d3ebec2f68eddfc539ea7402aa72c9274034494a43ea7d207b69a88" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00181-of-01024.json.gz": { - "num_bytes": 320476195, - "checksum": "c1bd59eb7ca799e31bf037dc7c087c1ad94e4f88a4f12427c454510d97e1c803" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00182-of-01024.json.gz": { - "num_bytes": 318538551, - "checksum": "dbe7205a1919dca9d6936158d5653a20d239f2e547ec73280956da4f8c609220" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00183-of-01024.json.gz": { - "num_bytes": 319620265, - "checksum": "46f9e603e04040b59df8da6ee01d1c30588aa7233a00526d6f0fd84c4172ba93" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00184-of-01024.json.gz": { - "num_bytes": 318301621, - "checksum": "880a02eabae231da388a5782a7194eef0d0211c2d1314db0c56d740647a114c9" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00185-of-01024.json.gz": { - "num_bytes": 320515340, - "checksum": "f522147aed30ebb3ab352c92a9dd24cd2e8b93df1d4c4a6284d89ceaa2858509" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00186-of-01024.json.gz": { - "num_bytes": 318374733, - "checksum": "5005f1c42038769e225a626a88c10bd4f6af98dcc14deed475954b00c088bc53" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00187-of-01024.json.gz": { - "num_bytes": 319116182, - "checksum": "cbd7e0f486c6dac13090cd344337da1c336973e7ec75e32b0bd5b18b98f24bf8" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00188-of-01024.json.gz": { - "num_bytes": 318981305, - "checksum": "064ce8c30b7a960b20720c133c3dd3281d27752a66def44d5133ff8f1b8279e9" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00189-of-01024.json.gz": { - "num_bytes": 317036462, - "checksum": "acc052da4501691fdd28f269c633ed826840f2634be49b5e2c5e1273de0cb4a8" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00190-of-01024.json.gz": { - "num_bytes": 318061662, - "checksum": "5a436e97c59b8636ca5081b71ca6fe8f8a3a99dd3f426c79edb2bf53345ee810" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00191-of-01024.json.gz": { - "num_bytes": 318556228, - "checksum": "2eebc89381ff78ae63f311c98b07853cefcc42fbcc210995095d568a6ff70ead" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00192-of-01024.json.gz": { - "num_bytes": 317987733, - "checksum": "99de46c4702c06a2303262b185b92fad82e12e189c923d5b76d9d8f96faabfa5" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00193-of-01024.json.gz": { - "num_bytes": 320294532, - "checksum": "bccb7d8fc34d6cd6eb41e2a1c6234596b00a5517fdca7c47562fdee0e675377c" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00194-of-01024.json.gz": { - "num_bytes": 320852679, - "checksum": "bb1e7768a57145fdbca7957ed964648d1deab5edc5dfad4722a81ad411c5e0f9" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00195-of-01024.json.gz": { - "num_bytes": 319016077, - "checksum": "ac520468a5bd933dbac1aa5f7f21ba276bdce15abf99963ef9d73af294e81e70" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00196-of-01024.json.gz": { - "num_bytes": 319289881, - "checksum": "9eec5740115ab52ce98ac9efbed4fa1c5c06787fe93b4b28f6a1e4df06272870" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00197-of-01024.json.gz": { - "num_bytes": 320180232, - "checksum": "07a03763b84b4a86b4f71d725927d62c40925823ee454122a00fdb625ddb3a22" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00198-of-01024.json.gz": { - "num_bytes": 320004709, - "checksum": "a1b250b01289fdaf6dcd997ef31c59c580f81f961aa0fd88ae0d175bd07c02ab" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00199-of-01024.json.gz": { - "num_bytes": 321006991, - "checksum": "650e57c3dbbf4ed929da8c6c5d78f35fbac4644722a84d98f93342a8d33b2140" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00200-of-01024.json.gz": { - "num_bytes": 317913111, - "checksum": "42caf6dee42bd73d9e4bf0c7bb16383caa936b2e0a913489b9f0aef57b6004cb" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00201-of-01024.json.gz": { - "num_bytes": 317897148, - "checksum": "990974a82de2b1c27465f6d097d7a5718c5ff334271e722ab3736e7aa5b89d4b" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00202-of-01024.json.gz": { - "num_bytes": 319510250, - "checksum": "8467066f2417af774363d4984a37968a0189adfe3a581723eab15004930e621a" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00203-of-01024.json.gz": { - "num_bytes": 319762388, - "checksum": "4e7e20980dea2d5e77f380b24580f0df9319a0d1d73ec319e17d8cbe044e53de" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00204-of-01024.json.gz": { - "num_bytes": 317418128, - "checksum": "2c027c5225ea7ce3c31f5f32dda12b7c892c6fdc9c52da6d0af749171cdce738" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00205-of-01024.json.gz": { - "num_bytes": 320157174, - "checksum": "d953e79c60be0e2c3b072c2186a845a351392ef395fa95135f47e6b8491c6f88" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00206-of-01024.json.gz": { - "num_bytes": 320459080, - "checksum": "bc70c34931942ca143f7eb555e86458afcc36110aa9559151f31d781969d4458" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00207-of-01024.json.gz": { - "num_bytes": 317361718, - "checksum": "fad5ebd7a81bb737e12e9d4c803aea1a9e905d43a3fa87cace32a64eef01e8e3" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00208-of-01024.json.gz": { - "num_bytes": 319976693, - "checksum": "21381c727d945d8d3b4a275e3622bce64b07ed87d7f2371ac28b5d2023359cae" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00209-of-01024.json.gz": { - "num_bytes": 319550585, - "checksum": "8b74e5f1780c4bf12936ac3a86be7a3d11287866522da8275aa4232c1e3d8898" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00210-of-01024.json.gz": { - "num_bytes": 319574289, - "checksum": "1594bd49cde9641b49a1ad9373a53e10d65440000363f7532a7d326d17c44236" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00211-of-01024.json.gz": { - "num_bytes": 320615302, - "checksum": "5b6f7eddfa3a9ffb0d6668d10f398b1d86482b64daa9817ca0af549433071244" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00212-of-01024.json.gz": { - "num_bytes": 319395225, - "checksum": "db58fa453269c794fedb595c6193dea5a85c72ff8b2d43e77c9bb371b8c86b78" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00213-of-01024.json.gz": { - "num_bytes": 320131797, - "checksum": "1d21d19b5e36820559590b339c049be29f27505ab4e88572edbdb84b649e0b66" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00214-of-01024.json.gz": { - "num_bytes": 320153141, - "checksum": "55c9b4ff1cd8cc88738196f867aba620dec3c8b27b9a485c7e75d3129d76e9c7" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00215-of-01024.json.gz": { - "num_bytes": 320525443, - "checksum": "dfe9f44676c1abf0e2875924c094c0d788f8a0172d641d5f810258e948e37feb" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00216-of-01024.json.gz": { - "num_bytes": 320100146, - "checksum": "57f19f5437b0428d9f40799af14f8bfba8f6c82ebacaea8f6fc7531524a6d4af" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00217-of-01024.json.gz": { - "num_bytes": 320688377, - "checksum": "fad4f3143aa303c9c35165a15c6d90087c204c586fe20b0c0f45cf4238311b70" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00218-of-01024.json.gz": { - "num_bytes": 318896471, - "checksum": "aabd471960d6db1e93e1129410d9138d9d9efa3292af7491b3b6844c2bd3f543" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00219-of-01024.json.gz": { - "num_bytes": 319298204, - "checksum": "f676701589e39802779a0947585638347bb4fe55376a33c6d0afcdc40c5f8938" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00220-of-01024.json.gz": { - "num_bytes": 317757045, - "checksum": "f3d0994379d244054c5e2db366a081caee28d301aa6b0d9431e7d9eb1cb38c30" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00221-of-01024.json.gz": { - "num_bytes": 318568870, - "checksum": "8026854c8a8cc1d16b52a898b9dd8a8df7901dd8cdf285f5d937c4d5d45919f3" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00222-of-01024.json.gz": { - "num_bytes": 319096912, - "checksum": "71f76f898864de3ae60f7c0cdbc68d53cbfa04b2f8493c40d55e1cb56727b275" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00223-of-01024.json.gz": { - "num_bytes": 319350414, - "checksum": "ba01faf3fe41a738c255b5da83daf53a5858144557af6c6f8d6208a049e4245f" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00224-of-01024.json.gz": { - "num_bytes": 319007151, - "checksum": "94200d12c61f7c73a9e3a2bb089a05b017a215348d52018a34e3224578c0da06" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00225-of-01024.json.gz": { - "num_bytes": 319502985, - "checksum": "0b7ce650e555baa546bb329d7f0567a3dc0a7ec9d49149792032a86321a73d6e" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00226-of-01024.json.gz": { - "num_bytes": 317983607, - "checksum": "40cf6d4b3deb05cd97ebed01405d08ae67be6e896736e4f371d15e5404567599" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00227-of-01024.json.gz": { - "num_bytes": 320199564, - "checksum": "e65ee475e3b6682b57bfa3f7b9c1cdabf36a7282fc793865df63dbe6a6a3d1fe" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00228-of-01024.json.gz": { - "num_bytes": 318852183, - "checksum": "8b27f2fbb0233802229fc776cfcb0b6b43af3149d217d0ab00cca0f1286482e4" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00229-of-01024.json.gz": { - "num_bytes": 319407418, - "checksum": "f2d5199a0022134ae127c88f0ac20d1b2b8a88014a774b5432b41085c83ecb5b" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00230-of-01024.json.gz": { - "num_bytes": 320787790, - "checksum": "e1b040895ac6068dd1aa892ec93d733096afc4adda698379006ef89926491255" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00231-of-01024.json.gz": { - "num_bytes": 318220053, - "checksum": "648a6349206c50c17d4e3562fd6fcb0a723b4cb40005890173d5de0c7ecc2ade" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00232-of-01024.json.gz": { - "num_bytes": 319702777, - "checksum": "0a44b7cb4f354e1eede683a697aba4051c1542fd030dd59767065f5f0204554e" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00233-of-01024.json.gz": { - "num_bytes": 319154465, - "checksum": "4070448b7844776db6754bd33791900bf9ac8dbd81e4cd774a3055ada67f6fac" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00234-of-01024.json.gz": { - "num_bytes": 319846160, - "checksum": "b1e8c73078c347fa062ed408e81bbdcb2f714675bab2c082016e822e91ef63a9" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00235-of-01024.json.gz": { - "num_bytes": 317722912, - "checksum": "d8aa694e870157b2b5411f496db46dc71dfeed01a42973a65499596921198abf" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00236-of-01024.json.gz": { - "num_bytes": 318593592, - "checksum": "e0c4ff6c8a12128da88777074d0b097664cf2f2395913c4d82b0eecd501946f1" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00237-of-01024.json.gz": { - "num_bytes": 318902831, - "checksum": "adce772ed699d7e908ae1fe1ddf1d9875305c7875c93cedf1b3ea0bbc21ff922" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00238-of-01024.json.gz": { - "num_bytes": 318696723, - "checksum": "926f9fc42cd248077afec1f4b88603c646fc5ae47c4ee3e9b8a5f6b8b6ff7f46" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00239-of-01024.json.gz": { - "num_bytes": 318321822, - "checksum": "439d756b0ffc97ebecc6c48a7dc90da77de7ada05a6eae929db98057ea15bef1" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00240-of-01024.json.gz": { - "num_bytes": 318992553, - "checksum": "1f57af6ff9477263806c0827c0dd8e494e103b6f54eec2cd5f8f8327b01ee39b" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00241-of-01024.json.gz": { - "num_bytes": 319345185, - "checksum": "493932a44e09f4b311ac5bdb519111fad0982708d4b467688f2b1105316544eb" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00242-of-01024.json.gz": { - "num_bytes": 320108156, - "checksum": "de5603f1b276f1373011c8884f06af017c71b03c5de3b3bb89cd6d550a0d5902" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00243-of-01024.json.gz": { - "num_bytes": 319855563, - "checksum": "7c1b74de8ae3699c567edaa6e2d1a1f1ae82f4810e769c710a23cd2dfc536c60" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00244-of-01024.json.gz": { - "num_bytes": 318966332, - "checksum": "d3ada80bad9fa776374878bc7504138e14c161bc9798ea8114b0d187d4c815f9" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00245-of-01024.json.gz": { - "num_bytes": 319541864, - "checksum": "3fe5f26e32795c49743d1b2497c333be57248c9db2ce12fb93e103d1a9595347" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00246-of-01024.json.gz": { - "num_bytes": 318530369, - "checksum": "a0bdeb2dcb5dfb46f843c4086230ba918f2d3ec125654cb924ea11e7c75cafbd" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00247-of-01024.json.gz": { - "num_bytes": 319496627, - "checksum": "0c4099f832ada6b24ef6c1d15267cd3c179f5b3d79e3d813d944e3ebea908c99" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00248-of-01024.json.gz": { - "num_bytes": 319132981, - "checksum": "608b1cd27ad345f6511fb677c00d56b6e827f288877d68aea1bcad3b02dd040e" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00249-of-01024.json.gz": { - "num_bytes": 318529093, - "checksum": "8fd580be09f913cc3809e3b0e467e2faf657a5db6f71b75aa931043267b9b0f3" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00250-of-01024.json.gz": { - "num_bytes": 318248903, - "checksum": "faeac675c3634b0834939046e60cdfad6a13558d7a6799c5bde25567898d86a0" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00251-of-01024.json.gz": { - "num_bytes": 319184870, - "checksum": "038972e03db75417fc4cb25e54c3aee01e4f022eb0fab202142f539e4d866e28" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00252-of-01024.json.gz": { - "num_bytes": 319631399, - "checksum": "2fda0c2cec4624c6068556e16630c3551ef3110759bed59628913a9debd547a3" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00253-of-01024.json.gz": { - "num_bytes": 318275716, - "checksum": "b5da4bfa564fcc6c49a573b90e679d60c4e222249858f4e58fdb3727a5f279ec" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00254-of-01024.json.gz": { - "num_bytes": 318638865, - "checksum": "279eb2978fe94e1570318a247b82487c04d7494ceed74dccb1d7a5734ea84e5c" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00255-of-01024.json.gz": { - "num_bytes": 319640339, - "checksum": "aa0a1ef845d0df7d81d2588d53f29205a4e3858a0888c1b7d9c83eb2fe1d32a7" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00256-of-01024.json.gz": { - "num_bytes": 320353593, - "checksum": "407133ea3b32a9e004b992a1bccade0440a39d0bfbd12993ea78c6526c0864a8" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00257-of-01024.json.gz": { - "num_bytes": 318165587, - "checksum": "72b7a72b8402b22cb51db44c9e7859460366c7c9d33e16a4c038ad07f7ad8f3f" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00258-of-01024.json.gz": { - "num_bytes": 318003534, - "checksum": "e5f9f2f74b7f9958dc9535f04a8965749ca4bd68005a6efa36f480fb487ca930" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00259-of-01024.json.gz": { - "num_bytes": 318990454, - "checksum": "7cb3c284613537fc6b1a85d7187dfca30b37a7a1a5708094f17486e3184e2d62" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00260-of-01024.json.gz": { - "num_bytes": 319514850, - "checksum": "0067e36b7156196e2451cdf78dc8832352f2481a4740afbef9046104b6810bdc" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00261-of-01024.json.gz": { - "num_bytes": 318747661, - "checksum": "b1e4597420035c355abe15efc576751169e2b5e4c38e073c178346a7202d5ab2" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00262-of-01024.json.gz": { - "num_bytes": 319868329, - "checksum": "374f4b951e545968da45b5055af2aa0b128c1d65d6c854f5b8f7e02d22c352e2" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00263-of-01024.json.gz": { - "num_bytes": 319268788, - "checksum": "7168e635a32859a85a152b29bcd1f699257ee4e340517e218ea9b8dac3922210" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00264-of-01024.json.gz": { - "num_bytes": 319270640, - "checksum": "1da08b65c83e79a0f5b7215e5a4ee58f21383b69f09dd9a3ba95381ba3d56d25" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00265-of-01024.json.gz": { - "num_bytes": 318744354, - "checksum": "0c908e81d59b2099eda038731b387a0ad86fa3d168eb2955413dde9cf29d947b" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00266-of-01024.json.gz": { - "num_bytes": 318518406, - "checksum": "115e375464931638de4af669b7301b6112d18b23835f2db2b092f47545b1a855" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00267-of-01024.json.gz": { - "num_bytes": 318921711, - "checksum": "6d66c715137885a46f2472489b21751284ec8ecfde6dca6be3ec1ee75f6cd5af" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00268-of-01024.json.gz": { - "num_bytes": 317786222, - "checksum": "588865d8f9d3da5a70c958997060ce4792e175c8fc5323f1887787070c8c160f" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00269-of-01024.json.gz": { - "num_bytes": 319004956, - "checksum": "163ec7497602931de2eaffad320704e508e491937a2965e39907a086f640d975" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00270-of-01024.json.gz": { - "num_bytes": 319175186, - "checksum": "794e0e7ceccf28457a8ed5b0724337545661da16feafd0a53e4823b2cb1c92ae" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00271-of-01024.json.gz": { - "num_bytes": 319785821, - "checksum": "9c9ec0348f7d4ffc61e5f19f1f60c8382b33ca2fe4b852567cbc3c16024a4627" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00272-of-01024.json.gz": { - "num_bytes": 318933435, - "checksum": "883d85985237948018b13c20f4d4ee567c6ee36a135b326e8117d73dad4fe37a" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00273-of-01024.json.gz": { - "num_bytes": 318456664, - "checksum": "fdca13067e8e118e538b8de538e164fb5397724045a5b1b02764510c8de90969" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00274-of-01024.json.gz": { - "num_bytes": 318418161, - "checksum": "27556558fe8a91a4aea4800ba9b7e844336a7638c5b96e652fcdb359f631b04f" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00275-of-01024.json.gz": { - "num_bytes": 318437784, - "checksum": "6ad4e6a3e1cee04aee3051a66531e3f4aa97f7bbb7602c6aa5f46a727b319f2b" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00276-of-01024.json.gz": { - "num_bytes": 318470946, - "checksum": "145a4d85ddf1e72fcdb8477dcd2f70a5554d9cd9349e02e058d3e7837204b6ff" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00277-of-01024.json.gz": { - "num_bytes": 319580624, - "checksum": "7116de0dbc5c7f6621f7c107dded9d85788937a87f2d56efca32ae9f25fc6865" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00278-of-01024.json.gz": { - "num_bytes": 319619699, - "checksum": "8dabdf2d26035d30c22204e6f46f292c58f4a4c3b0b77a1826a43341d4282df9" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00279-of-01024.json.gz": { - "num_bytes": 319344020, - "checksum": "c2b7d5bf62be1772c6bb80f597b28d948cf3cdefb10b6df6f777f0ab7d8fb015" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00280-of-01024.json.gz": { - "num_bytes": 318997864, - "checksum": "025457720b0045e7bf01f9b4b847f28ef94af9ca250675efeee73eeb340a3f36" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00281-of-01024.json.gz": { - "num_bytes": 318718146, - "checksum": "2979c0ac06570a9ee437521778c514bd8755193b9f1ae6a5a671ef885243f019" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00282-of-01024.json.gz": { - "num_bytes": 318434530, - "checksum": "a17bca50ec20c364adb899a9073bbe3a1505f81803a58190efc5d4f3f78b58be" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00283-of-01024.json.gz": { - "num_bytes": 319317663, - "checksum": "9034f524fc5c2e246b22e2dee00b47e0c4da0316bc60d0a11d966c28db917f9b" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00284-of-01024.json.gz": { - "num_bytes": 318957832, - "checksum": "f08b96047e711831dfb8a44d90cb712d3e78c98dd28ec6b937ee83949bbef5b0" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00285-of-01024.json.gz": { - "num_bytes": 318643283, - "checksum": "c5df1f2e2dad46d71f8aadf856a5139020da8afc2ee010d53c0372ea09b2362d" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00286-of-01024.json.gz": { - "num_bytes": 318064839, - "checksum": "16f7fd6abcbc69750b8131bca3e38ddc40bd7c86c48122ad2a9a77cb9cfd552e" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00287-of-01024.json.gz": { - "num_bytes": 320328448, - "checksum": "41e82bd357b47a28f28a4a203d5b54263aadb3c9a08899f78302c727c56d8b38" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00288-of-01024.json.gz": { - "num_bytes": 319559271, - "checksum": "970b9df224b58ca50b3023d92f6be0c37dbda479155c29c535e457ef6f2bca0e" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00289-of-01024.json.gz": { - "num_bytes": 318786822, - "checksum": "36a6515e7f516335d3fe057bb6ed9890a2aea033e08edd8588b3168b3445b2f1" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00290-of-01024.json.gz": { - "num_bytes": 320634782, - "checksum": "7d19fc82b9a5aa0e0046cd17cd2c46f356f8a4a7d203d5e03e1f319156f05cb8" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00291-of-01024.json.gz": { - "num_bytes": 318746713, - "checksum": "86d610d4590bca69281348dbfaaec9e704fd6194141c50c71e84aad51ce26b91" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00292-of-01024.json.gz": { - "num_bytes": 320049630, - "checksum": "d045df646213e29d4e7de4ec8915eb3b65bb962f35b0d74abf00889bd5aae8ab" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00293-of-01024.json.gz": { - "num_bytes": 319966146, - "checksum": "c66fff1a64b495211bfdcea650ff76115f8c857b9154c1b869062e702714b9ec" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00294-of-01024.json.gz": { - "num_bytes": 318805332, - "checksum": "ef3d9204ec85a1e65ae48af7924f614403d297a15f232ba41eb0e4fe223e507f" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00295-of-01024.json.gz": { - "num_bytes": 318898465, - "checksum": "2a071fc28b1216f2dc0579528d9b04e597b5cdac9fd14719e312092242da190a" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00296-of-01024.json.gz": { - "num_bytes": 319406630, - "checksum": "ea71e9fd444860d70d3728f7e2213a4bccf3aa31a164c9acfa8df7a0b6619786" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00297-of-01024.json.gz": { - "num_bytes": 320312971, - "checksum": "ddaeba8aad38b7e9727c579cc44f15b3c82d292e2901b47b785e9c8d3d5cdb9d" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00298-of-01024.json.gz": { - "num_bytes": 320660744, - "checksum": "814460ccfda29b45edaee5f44e3c980889aee2ee52e4e5323931ea489fbe938e" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00299-of-01024.json.gz": { - "num_bytes": 319848186, - "checksum": "3b91fe32d3a731a5be3bf778eedfe13e8a7e26ba9eda51c278c5212aa7925681" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00300-of-01024.json.gz": { - "num_bytes": 319647278, - "checksum": "1e0424631f7f354bc63b3e71c5c6516c85343dafd3896acb9560eaf93b672799" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00301-of-01024.json.gz": { - "num_bytes": 319080252, - "checksum": "46c21af013f611729cc06ec033dbae80151987f9098e57fb98e2631f6fe76c8f" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00302-of-01024.json.gz": { - "num_bytes": 320028246, - "checksum": "d1ca8ad6e5bd6cb18db1f1be9154dbc8ba9df7ca02db4c1f8a7df9d40820d8ff" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00303-of-01024.json.gz": { - "num_bytes": 319388787, - "checksum": "bce87161f77464adfb1fc04fc2993211bcec502d7172b86f726daf7096b04f82" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00304-of-01024.json.gz": { - "num_bytes": 318627831, - "checksum": "235b8085cbeb7b13f8e1a5f6d2225a9461b7bcd76e21466a189c2411ff4c4107" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00305-of-01024.json.gz": { - "num_bytes": 318148428, - "checksum": "f13f124e0ea150da13ebeb3390c311b3db54018de0d640579307bbcf2c46068d" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00306-of-01024.json.gz": { - "num_bytes": 319451712, - "checksum": "de5c3fa2cd6a47551ab43268484d017602e2c3e1f66f43f1a1d8f95bac52cad5" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00307-of-01024.json.gz": { - "num_bytes": 319026244, - "checksum": "88769fbf393671db352227a64cb8ba6b4ba60c5bddb4a14294b1ad9a65a750cd" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00308-of-01024.json.gz": { - "num_bytes": 318447454, - "checksum": "555bcfc0ba4db0551ce5ffb18057027ee695af166856125aeb79f7ce013851cc" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00309-of-01024.json.gz": { - "num_bytes": 318147676, - "checksum": "bf28e60a7970c548190cf0f4fe56f27ea55a1ad8313fa353a8013f0a0e7919f1" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00310-of-01024.json.gz": { - "num_bytes": 318930650, - "checksum": "45a68c0ef70ecd10838d604d51fecd26e5199f5372022b9c2af461a71c24c6ef" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00311-of-01024.json.gz": { - "num_bytes": 319955339, - "checksum": "fb3c4e93166f1cb2ccc8a7b68da0246f0827d3a81bb5614c8c84f1c01c6d53c7" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00312-of-01024.json.gz": { - "num_bytes": 318554567, - "checksum": "0dce2ac88ba7ac5340d551add9fe7b1a30772a6cc082347c536427b48daca598" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00313-of-01024.json.gz": { - "num_bytes": 318978931, - "checksum": "c5f99dab085fb705769a514626c9af8a26cf846fdaee4b403a3d6f84c892cb66" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00314-of-01024.json.gz": { - "num_bytes": 318158197, - "checksum": "79de4fa2aed5e3efa71e75d13f08d7c1869aa59f42a819f4429430b3db6c1b27" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00315-of-01024.json.gz": { - "num_bytes": 319744521, - "checksum": "5a47a89a1537662a91853bbe2a5b3e243f5de74489f820621192cacef192593f" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00316-of-01024.json.gz": { - "num_bytes": 319861527, - "checksum": "1cd34f17f3ae3c8bf8e1636714a9ff600a26799d5ec02ba42abefa5db9d00e5e" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00317-of-01024.json.gz": { - "num_bytes": 319286030, - "checksum": "a3e34af81264a72b523b63fdc0268f450675f7993fa0885eb2b4c747b0d6703c" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00318-of-01024.json.gz": { - "num_bytes": 319054871, - "checksum": "02fa8cf278578108083bc9a3c5cf07b0a9d243f2162397091ede6c85a1df31e7" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00319-of-01024.json.gz": { - "num_bytes": 319943810, - "checksum": "93ef0d7f1610043a6f7634af73e89ee9f3d7e87828ad34558a4d688e6fa6b6dc" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00320-of-01024.json.gz": { - "num_bytes": 320037211, - "checksum": "06fbd99a3d64df293db2655f321117f1afcf1cda51e421edef9335a25cb1a902" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00321-of-01024.json.gz": { - "num_bytes": 318584237, - "checksum": "a224e4d902f7368f91d6a72fc9f5730996dc37de576bc2211eb632e3690f1b38" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00322-of-01024.json.gz": { - "num_bytes": 319686632, - "checksum": "57fba28c7104ff659f8a0f330ae89c68d3a392dd14a78247fa357a3bcc8b94dc" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00323-of-01024.json.gz": { - "num_bytes": 319834993, - "checksum": "e61c760cd3c42f71a1a7bb6adc4e0bc970bbf864b69e2a4a5d56bf0a14d4e0be" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00324-of-01024.json.gz": { - "num_bytes": 319243057, - "checksum": "61d21ab1e7729f172ade5ab6c0dcaf07eaeaee6e047ca1c24722c06ddd919678" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00325-of-01024.json.gz": { - "num_bytes": 318569583, - "checksum": "2192a891ecc2a6aa9f6ea64f1d76ce763e0a3963ae03c95275ccd626171835ce" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00326-of-01024.json.gz": { - "num_bytes": 319175980, - "checksum": "d35e4d5f8e924ad97520db51a2c361bbc02097721195932b6768e7460df092a6" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00327-of-01024.json.gz": { - "num_bytes": 319892298, - "checksum": "ce967065d3915d466982b5258e07ad2c46b02d7637057e0547586657ea0f53a4" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00328-of-01024.json.gz": { - "num_bytes": 318004026, - "checksum": "0676d556f46b1f057669d3378c6fc335db6e3ac67a02e11dce3823658730f4c5" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00329-of-01024.json.gz": { - "num_bytes": 319066225, - "checksum": "b00bb4bda957e1287b98c432165448b3899f9155363f7b61bfd0f0181181acfc" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00330-of-01024.json.gz": { - "num_bytes": 319268288, - "checksum": "d14d1883941966ef3b35203d06e6fa1bb485dd77118bd7b6c811b0d06fa72fae" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00331-of-01024.json.gz": { - "num_bytes": 319131311, - "checksum": "4d5d41c2b2242b299fb67fa8c9327db8b4f612bdf4ee9af4d4e45aba8cd1e409" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00332-of-01024.json.gz": { - "num_bytes": 318827508, - "checksum": "68cea08d4805b392bf4c2894a4501ee3fbbe9aac4b1b6533e686ea749ced2dcd" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00333-of-01024.json.gz": { - "num_bytes": 320572240, - "checksum": "06f211ae2fe1c4eef5e41caceda8ebbc289261057911fcf2583a59c730b7951a" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00334-of-01024.json.gz": { - "num_bytes": 318121862, - "checksum": "46c62769e04ce8acde4562ba24d72e245babacdfb50600da4e6217948ad71d24" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00335-of-01024.json.gz": { - "num_bytes": 318692168, - "checksum": "dca69a6976e7387a12c8da16b696ed4f604254693a3280be0f90fa694700b595" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00336-of-01024.json.gz": { - "num_bytes": 319479902, - "checksum": "c52969fad97f1dc0e1e115428e7dad1ac6cb6d804db0cd34f0fc7846b1b50c7f" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00337-of-01024.json.gz": { - "num_bytes": 319987407, - "checksum": "2c570f02aa6a6bac96be1e02663996c87f9a94c160f22101ce8ae1d549ae1de2" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00338-of-01024.json.gz": { - "num_bytes": 319051086, - "checksum": "77132df95b147c471ead74bef16ed4fa11e15209f518dd460110132358816834" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00339-of-01024.json.gz": { - "num_bytes": 319473192, - "checksum": "7f3ac20a72d395c02ed3cb50052821521dc2d8d97303d00e0d0982e2c29e7659" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00340-of-01024.json.gz": { - "num_bytes": 318423485, - "checksum": "d1127da89e960d939cfc06cf1985df415b60d4bf02b12b7fab02b796100feaee" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00341-of-01024.json.gz": { - "num_bytes": 320087690, - "checksum": "f753423f82157e95506566d3653d32af6a181e69ea0e10b4d4eb24b626d3ca49" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00342-of-01024.json.gz": { - "num_bytes": 319767100, - "checksum": "db7410e6a6ca74163098681038f497faa373e1d81434b45c1a2f273d467c0a2d" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00343-of-01024.json.gz": { - "num_bytes": 318389429, - "checksum": "7ea1e432a1ffbed8f4ad6cb985c5cf1b2584d8eb7d2fa091a2db3f104a3f7210" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00344-of-01024.json.gz": { - "num_bytes": 319117212, - "checksum": "c7317a81a6224dec9be07b41134ac7a7db4039b7c98b2061b20bb59b82ed0a1e" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00345-of-01024.json.gz": { - "num_bytes": 318504232, - "checksum": "1498efe8280609d9d66c324e332c9433c6351bb7b99c5891a8f27d6841410407" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00346-of-01024.json.gz": { - "num_bytes": 316721169, - "checksum": "0cbc6b494d653878c9d52a37572064b88356058ed291aa773e5f47259fbfc722" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00347-of-01024.json.gz": { - "num_bytes": 319007736, - "checksum": "6265505e19a42a01a159297d33b1a91cd0e042a31ba6a1a867404a143ae565a4" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00348-of-01024.json.gz": { - "num_bytes": 320167918, - "checksum": "cc8b29deb44c8348aa4d05836f89cbae995c946f38d9cb8e7fedbd4762168ba0" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00349-of-01024.json.gz": { - "num_bytes": 319901226, - "checksum": "2a0f2188b43ffedc8b95a8276c7647147587c5e544c9e6475e790f4b5e362992" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00350-of-01024.json.gz": { - "num_bytes": 318999223, - "checksum": "1fde48c503998872aa71fc524c7408dc84cbc1faa0d885895d5c57708a15fced" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00351-of-01024.json.gz": { - "num_bytes": 318935410, - "checksum": "72d577eabcd814a7ff61b894b3fe9089f483a793e692d3ab20ce4ee59921f975" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00352-of-01024.json.gz": { - "num_bytes": 318655907, - "checksum": "8686dc0e4ff7b35cbc4fa6f3abce50c06f8b95378031c132a117e1d458cb4616" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00353-of-01024.json.gz": { - "num_bytes": 320619683, - "checksum": "cd5816469ef54bfeb0db6b55a78e0d34eb2e1f82448a41f67dfb70061c3ea91e" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00354-of-01024.json.gz": { - "num_bytes": 319352400, - "checksum": "bf082c093423d562da4984b1f0428225d853a05b5f8fb3696273f36ebb5a235d" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00355-of-01024.json.gz": { - "num_bytes": 318868462, - "checksum": "3b8baeca48e55a2cd268d6aef75f7eed96ef10fceca593a5179d52a2b0121f8b" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00356-of-01024.json.gz": { - "num_bytes": 318903295, - "checksum": "4c9a9926a4bad6721807d99cc02a9b6bd28bb0a6254aa1c15527b745c56a06a2" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00357-of-01024.json.gz": { - "num_bytes": 318881446, - "checksum": "84b4c2e05bc162fef4824e97ba7a03b1cecb41eda08a3e0aedd264b66e859a30" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00358-of-01024.json.gz": { - "num_bytes": 318521100, - "checksum": "aee99528ffd0323fe81e4ed26ed1b9295baa2a3910771dd2a42f4f378fd82569" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00359-of-01024.json.gz": { - "num_bytes": 317796778, - "checksum": "7b01f2d5ae54f60c2aeb7b96bd366d21e558e2dac48c83a78df9850f37e02f1e" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00360-of-01024.json.gz": { - "num_bytes": 319502919, - "checksum": "5b54f9a050e6f9008a1806101ea553d90eead56c949a5f3f46c8ccb88812081b" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00361-of-01024.json.gz": { - "num_bytes": 318595505, - "checksum": "49f4164d66187d46adff7f9bbac97b232ab7906d812e571c2e0bf028895e7f47" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00362-of-01024.json.gz": { - "num_bytes": 318851572, - "checksum": "17accad3c0706c54530f128260cacbf986cbbb20427d4ba8d3444a3702a22c55" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00363-of-01024.json.gz": { - "num_bytes": 318555337, - "checksum": "2327866e541aa6aa73f7289c3ad82a19ff154d39657d98cb78a2f481a8765920" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00364-of-01024.json.gz": { - "num_bytes": 318641145, - "checksum": "6f52354d804e8d4a1af1f6c2c6b759ae115c4f23a63f1206a73e7e25acfbdd02" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00365-of-01024.json.gz": { - "num_bytes": 319212614, - "checksum": "8f1834eeacc9bbdee95b1f0a4078eb9488bd1a7c5693489bff7943869674cad3" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00366-of-01024.json.gz": { - "num_bytes": 319336585, - "checksum": "a9cf01b76104eebb4ef8462a924f61c262fa197a7c68a50e48d925cb81586e3f" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00367-of-01024.json.gz": { - "num_bytes": 319161263, - "checksum": "5ac822027d50c3196026fbaffc7d968e1ca702b947688a6f4d268b942b5067b5" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00368-of-01024.json.gz": { - "num_bytes": 317911640, - "checksum": "f9acffbe3c6617e85911ff9dcecec2378b3469ab4546a6973cceb460f9003cea" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00369-of-01024.json.gz": { - "num_bytes": 319585031, - "checksum": "9234553649cfa5265c5a9ccc88486402f88eb81275067c51d9deef16bbe7211f" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00370-of-01024.json.gz": { - "num_bytes": 318345879, - "checksum": "2fbb410346d31a33e8532602f4e3340fcc75c96be803250e9f0f1a6894ca0052" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00371-of-01024.json.gz": { - "num_bytes": 318996184, - "checksum": "b069b0c8a830ea841e82077548706f286308ef0420e163ff6d8312c8853af172" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00372-of-01024.json.gz": { - "num_bytes": 317989343, - "checksum": "bfd62e448d4d9f89353abaa384007b0b72bd860402ade3a9d938051a6446530b" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00373-of-01024.json.gz": { - "num_bytes": 319770759, - "checksum": "e4e176250aceb7362ce38d496556a46409e9872e69f45166afe71aa750de8fcb" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00374-of-01024.json.gz": { - "num_bytes": 319212902, - "checksum": "28aa4510c3ddb9ee0ac56aab3792bfe5e899531919ccc0214a4b68bbf2ba18a9" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00375-of-01024.json.gz": { - "num_bytes": 318968029, - "checksum": "35326b1f2280e07dd754e89dfa29989d0dfa5c78995d393b36a752d8364bfcd7" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00376-of-01024.json.gz": { - "num_bytes": 318685188, - "checksum": "0060dbaccf7f2f956fb8b57891cb176914ddac1bc485dd86c2fd110c46d174b9" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00377-of-01024.json.gz": { - "num_bytes": 319291982, - "checksum": "99fc38654197e506868e099c15b2cb15b93238dafd33f81a7d069b3e01c3b085" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00378-of-01024.json.gz": { - "num_bytes": 319259094, - "checksum": "9b8d97f9d57dd97373c4f57eae2b9c01a58e49017ee41d3969e94fb4dbabc260" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00379-of-01024.json.gz": { - "num_bytes": 320228224, - "checksum": "82913f2d182d2a57f6c93e9b229862cb72feaa6331d04cd4419113e1eb9d52cb" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00380-of-01024.json.gz": { - "num_bytes": 319738339, - "checksum": "e0de43f754ab97d103a02c708d1cd7e771ba079bd9e1f7c532a80a30bd5182ea" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00381-of-01024.json.gz": { - "num_bytes": 319210620, - "checksum": "df74823f78564b544677410508e675e2811905c56afe2a60d19d3e049dd65394" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00382-of-01024.json.gz": { - "num_bytes": 319810275, - "checksum": "f5d5291a695fe2cd228213fa2bf090bf6513c49c6911826aa43ecaefec0622ad" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00383-of-01024.json.gz": { - "num_bytes": 319190426, - "checksum": "a861ae79a66b72d6cd5e0a030daae52cffb85ba1272c36ae2be04a9b7c0287c4" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00384-of-01024.json.gz": { - "num_bytes": 318501845, - "checksum": "b8d0f5078ae82980f0f64120530bbeb20f627be0a8629d68885acb867091417f" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00385-of-01024.json.gz": { - "num_bytes": 319530458, - "checksum": "7da119f3f63e25ff63cacd8ba0d77987b2d576be1f4b86e7e45aa3f2d194624b" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00386-of-01024.json.gz": { - "num_bytes": 318938980, - "checksum": "c21f3de56fab26d7fb60bdb47c216b22793f67b8fa6d382520c79b88d1896f05" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00387-of-01024.json.gz": { - "num_bytes": 319207426, - "checksum": "e28b0884092f75836eed4d73ed24b7403d7b0530fc389386a68887420b0c2603" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00388-of-01024.json.gz": { - "num_bytes": 319835376, - "checksum": "b4f0db632cc9af66e8aea109c80d73a6281207e29ece131d5bf8b57ff8f81262" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00389-of-01024.json.gz": { - "num_bytes": 319346837, - "checksum": "413a8d8df1f6cf3094839b57231da5323f33f7115768c65d83f0af1574f71b6c" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00390-of-01024.json.gz": { - "num_bytes": 318632301, - "checksum": "a3e8664fbb3ec2af5a217225dbb7fcf3e93b427e5da1a88e35c04c319d61e4c3" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00391-of-01024.json.gz": { - "num_bytes": 319066082, - "checksum": "e22eed3415c90510e97768be5a685e0a8035e2635ef773c56e9ce2718c278658" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00392-of-01024.json.gz": { - "num_bytes": 318356286, - "checksum": "ddbf325390648d9d86f1e7901b75c99fe8db538d203de8dfb4c304282f82cd74" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00393-of-01024.json.gz": { - "num_bytes": 318048288, - "checksum": "974fd05f356c86be2f9109b0272eee69c5b2eaf0b16104cc573846c925d13b4b" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00394-of-01024.json.gz": { - "num_bytes": 319444683, - "checksum": "0d27d6f8c3b935cef23ea60abfa82bd6a4f5e2e061080419dc9c6bc455b9f868" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00395-of-01024.json.gz": { - "num_bytes": 318353166, - "checksum": "24d9956bd857484ffbabb3ba6f6ac688f48a94b50228238c7c9153a5c6878a7c" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00396-of-01024.json.gz": { - "num_bytes": 319960396, - "checksum": "9425f4f18e1690ded866c4b5313cbac8a6210092dc42f720200b7143b69eabe5" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00397-of-01024.json.gz": { - "num_bytes": 319030577, - "checksum": "dee166674b835b9849d281a87238aa136e14d26edaa72d0ecb6b7e82d556a72e" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00398-of-01024.json.gz": { - "num_bytes": 317664320, - "checksum": "f85e08272f73ce4aa602719d59205db54d230a6b7247830d78f91eac63d753be" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00399-of-01024.json.gz": { - "num_bytes": 319623875, - "checksum": "85dea0672a0362a08503b70623907c8c92bd105f788fbd7f3816212a9181e7c5" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00400-of-01024.json.gz": { - "num_bytes": 318840274, - "checksum": "a104345698500611cd1a71a6647555300d315490918740a8c6e3b8dcff315407" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00401-of-01024.json.gz": { - "num_bytes": 318336377, - "checksum": "808327d156e183e102fd75cfbdb7b5a1fbde3740168f59b767ea380608305b67" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00402-of-01024.json.gz": { - "num_bytes": 319270185, - "checksum": "b6a5f7c1ade628091fe86744a6011147ec32795ad694ccbc82929791b93aa307" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00403-of-01024.json.gz": { - "num_bytes": 318038520, - "checksum": "108904ab05b3ad23318f8aa0f7ddd00d97aae1872fb157eea73273e011cbec04" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00404-of-01024.json.gz": { - "num_bytes": 320933185, - "checksum": "cd0c068c0831218849149eaab8f8a98748823911c745ca0ea33ae839bd625e04" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00405-of-01024.json.gz": { - "num_bytes": 317694827, - "checksum": "d99909ccd59e2ec183b41a7c6d1bd5677798bd7fd784ab681546a7bf8292f353" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00406-of-01024.json.gz": { - "num_bytes": 317937468, - "checksum": "c7f2bd7a366b8c389e41fdfad4891068c86039e1a5fc3b8a0b993253badf33d2" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00407-of-01024.json.gz": { - "num_bytes": 320226074, - "checksum": "765db6f9f0c8c3d9bbb0499f0010928fe4f90d5915dfdd3b6d09d3dc78ad07a9" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00408-of-01024.json.gz": { - "num_bytes": 318613788, - "checksum": "165e78c858dfaf010307392474d4917846c9d21658558912e5ffc915803bd2fb" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00409-of-01024.json.gz": { - "num_bytes": 319212414, - "checksum": "5f7d5952aad1ae31413962983971b2b422d77c262ededd2ce1c1e186aeb6d87d" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00410-of-01024.json.gz": { - "num_bytes": 319023647, - "checksum": "24588d41f40e3fe389575b97d41ef761be46bc9a9b3965c5e3f994760f7a4070" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00411-of-01024.json.gz": { - "num_bytes": 318408922, - "checksum": "b35d4ada5a000f51169557b00e508706d51a7becd33370014ff07c8b8dac1af5" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00412-of-01024.json.gz": { - "num_bytes": 317166932, - "checksum": "d3ed1cae269ebefe4716843bd7954bf7e44ee889f72066afbdcd95f4e1f06703" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00413-of-01024.json.gz": { - "num_bytes": 318519121, - "checksum": "07fc61a7e164301113201e78c99d40289d88e0b463048e14aa5fe69c7490ccac" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00414-of-01024.json.gz": { - "num_bytes": 317417235, - "checksum": "c5a7222b2eb8e8fe690f29a0fff7e214ba94e4d9dae62f67281fe25dd385b721" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00415-of-01024.json.gz": { - "num_bytes": 319690993, - "checksum": "37052fff729bdff124577d5ba041906b2ea7420c5cb28195e6cfca0e41d560c8" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00416-of-01024.json.gz": { - "num_bytes": 319466518, - "checksum": "6e8ce2b9e6e8208ad7e43ce709454cb0b96572d793e0b11c15892f5df18f6137" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00417-of-01024.json.gz": { - "num_bytes": 319694381, - "checksum": "20892d7a33c31d7967ae0cf595a2108de96a61c0bbd773aebc5d3d083f6ed93b" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00418-of-01024.json.gz": { - "num_bytes": 319048918, - "checksum": "fd795ae8d53e632bb3e89a2becc5b801e10db781b14f2c0ed50b12def5376c8e" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00419-of-01024.json.gz": { - "num_bytes": 319791424, - "checksum": "5a8e56faaa0892249e5694ae01e2e4dcd22d9750a9aeea5ca390117c77b8de2d" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00420-of-01024.json.gz": { - "num_bytes": 318060925, - "checksum": "795ee64f4c9e2e35d9dc0c91ea593c9e41a3924162901fbf782dc7112f8094a8" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00421-of-01024.json.gz": { - "num_bytes": 319328927, - "checksum": "2670b7b6b53e9082c90e4a4e915f72673831ff15e9f55918a1244e0c19c8f963" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00422-of-01024.json.gz": { - "num_bytes": 320065363, - "checksum": "34df2d1afac2ae4699524492d6b93e4a2a1e551cb4a4ae35fc19353930afab8b" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00423-of-01024.json.gz": { - "num_bytes": 319349887, - "checksum": "a2b19afafb45cf30493ac2a3eb013e136e7213f63bd633374ca0d9fe2780efe9" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00424-of-01024.json.gz": { - "num_bytes": 317515288, - "checksum": "ec2a84fb16dd16f9547f0c3314a91968324f2c537118ca36e982b235e23527ee" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00425-of-01024.json.gz": { - "num_bytes": 319092219, - "checksum": "1ac0b93c0faae7d446add3af3173637a4b0d638dbd5285b0f4e1bf3abd0d1542" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00426-of-01024.json.gz": { - "num_bytes": 318421245, - "checksum": "bade501dc71c0b4968a9a7c833751cee5d8f7067a45dabd53aa03534df48886e" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00427-of-01024.json.gz": { - "num_bytes": 317847935, - "checksum": "7aef554aa2b120c4d787395e28aceba743e309f2540fab283e077a1429a2f7ef" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00428-of-01024.json.gz": { - "num_bytes": 318822008, - "checksum": "cd94547fe1953a1cc074d97558a70d1e55834606379a8f5e6e60e1b15b56fd35" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00429-of-01024.json.gz": { - "num_bytes": 318507684, - "checksum": "4d3c9245565a808058293558603c657d6e9a0c87b6d2d4b871b856cea2eb3a19" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00430-of-01024.json.gz": { - "num_bytes": 319042136, - "checksum": "9c5a4fe50db5d0822923fe29a5aa8ca6cb09e3629472b1bf61f670388b6c2076" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00431-of-01024.json.gz": { - "num_bytes": 318925124, - "checksum": "8f18b35bb952da090ade742753e30861ba39c6c54c8ff2d76b358ca7be475ed6" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00432-of-01024.json.gz": { - "num_bytes": 318680251, - "checksum": "7968c370d0efa4601ab8b5ee68e480b211fb969593608bf7e00a0153f00f99b3" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00433-of-01024.json.gz": { - "num_bytes": 317822797, - "checksum": "f62d7e74434d52c36b22f6a8cd56ed3937ed6aa03f140d0fbdf5e360632d51fe" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00434-of-01024.json.gz": { - "num_bytes": 320094364, - "checksum": "55d7678c7e197e165b4e09bf3f8ac159853120acbe5801ed6ab3ab0f801c11bb" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00435-of-01024.json.gz": { - "num_bytes": 319008936, - "checksum": "09b451c8ee06bc06507b3e75a60c544a6b70f27e3d07daa29c59803f785faaf5" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00436-of-01024.json.gz": { - "num_bytes": 319023456, - "checksum": "6fbcb93f9dfe65e12b7efeecc8af7823471787438b1ce90e5f48b68b2dcb1d14" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00437-of-01024.json.gz": { - "num_bytes": 319484997, - "checksum": "9e70c8c1ccbfe93ec9296811ae496a518dcafbf38c81b7972f885e297da9e726" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00438-of-01024.json.gz": { - "num_bytes": 320319141, - "checksum": "eaab759d8c603e8a2ad3ebacd99e30338fb904ba307aeaba0d2e0e63679cfadc" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00439-of-01024.json.gz": { - "num_bytes": 318410397, - "checksum": "7a03a92bf97b6750941c1070f933c68f1b2a3e13fb68b3a21a4726676ea75d34" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00440-of-01024.json.gz": { - "num_bytes": 319447470, - "checksum": "bc899e436da7b3bf13c1bfa2fd2bbf9d90b42a0c00f2971259a14d858ca3e5ef" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00441-of-01024.json.gz": { - "num_bytes": 317582955, - "checksum": "4d777860c2750e43038ef709d77bdc403b3b3bcf0f08e3c4562952c9ac70b113" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00442-of-01024.json.gz": { - "num_bytes": 319592118, - "checksum": "d9e5dc244bb6f0b629b2a929aedf506dadaf5eacc80f0997816b95279552fe8d" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00443-of-01024.json.gz": { - "num_bytes": 318104403, - "checksum": "56133bbd7cf96dbe87d48898b886a024af69ca405d7cea1799bbd30f185e9c1f" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00444-of-01024.json.gz": { - "num_bytes": 318547808, - "checksum": "8be0270c3cc96dd7f7b3aad08bde81ea245feff4a09923277fb0d38a7c095604" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00445-of-01024.json.gz": { - "num_bytes": 320463920, - "checksum": "e02316fcd355914e4d08ecf37036d4727ae9ebe45bdc5c98279aa3437c2c1eb0" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00446-of-01024.json.gz": { - "num_bytes": 319583221, - "checksum": "80c9b8c47665b2cef6c291b0eefdac5b14be1d7cd4a4c06c2e14cf48b42da92d" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00447-of-01024.json.gz": { - "num_bytes": 319546881, - "checksum": "a18d5aaca1717ec33fb1822a633268003bf88093dd7b48db080503c3d01b6ffb" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00448-of-01024.json.gz": { - "num_bytes": 320234711, - "checksum": "c41595d2b9cbf0e23fd65df1cb51499ee262d345d79d2625388cf149c3c39f8c" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00449-of-01024.json.gz": { - "num_bytes": 320043698, - "checksum": "3bef99334be9d39f41296f8f134c88f04fe66502da2d2639f0d6d2485338e607" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00450-of-01024.json.gz": { - "num_bytes": 318033740, - "checksum": "9cd05b1b70ffc3c004b4b4a2f21f91abee1395f3a485efd1aafda550193df9fc" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00451-of-01024.json.gz": { - "num_bytes": 318549622, - "checksum": "b2ef6cc4ac7c4c69fb1661d7ed9b2ce4da261c72f9e49dc3c934180501ef3a24" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00452-of-01024.json.gz": { - "num_bytes": 319317230, - "checksum": "89927f1fd79a5b1439988fd37e0377175176d9ed22d14611f67a81e185a336b3" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00453-of-01024.json.gz": { - "num_bytes": 318952561, - "checksum": "427f55bbcfb6c1a0ef12f96cb122f362b975169770ce1d392b763c4b4408cb34" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00454-of-01024.json.gz": { - "num_bytes": 317545286, - "checksum": "2fc3b172ea721bc92b0f7614e8fea61b0781e6f4f3e6b7263cf0190beef3ec52" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00455-of-01024.json.gz": { - "num_bytes": 318975631, - "checksum": "c96f688ecb19bdb1592b0124021fb80d48965303442de76751d82fa03ab8f6d5" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00456-of-01024.json.gz": { - "num_bytes": 320016575, - "checksum": "61d2be7a4b9e34cfb994ae2c120ed5a51a6669564046637445a46b9872812416" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00457-of-01024.json.gz": { - "num_bytes": 318236935, - "checksum": "a74dd51c3c490458ea0e61196d7e0085aff80d50cd149a673f54f661b364a671" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00458-of-01024.json.gz": { - "num_bytes": 318495925, - "checksum": "adf9cd717f2c79504dace22b5929d4c4064353e869457c20cc81a0b2db390c89" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00459-of-01024.json.gz": { - "num_bytes": 318956821, - "checksum": "d7be5bcb738a75586125e56a25aa234618528accda620eaac421beab6288b992" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00460-of-01024.json.gz": { - "num_bytes": 318968681, - "checksum": "6181280df5418fd9ebb52aa26a631100b6c3da0750dc5fbae152a6a44fccb942" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00461-of-01024.json.gz": { - "num_bytes": 320810761, - "checksum": "5e943c458674371dffb2466274b8f2a9df9902a370901ef97992bdf920cdae0a" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00462-of-01024.json.gz": { - "num_bytes": 320154899, - "checksum": "76b3d1b120cbb7cd71d004440e0c6bd9f9c4395424c568e8362973038017a90c" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00463-of-01024.json.gz": { - "num_bytes": 319247449, - "checksum": "9de2c86d85289113b24c2f7eb4771ec1391511930f5f26a12133d41faf0ce908" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00464-of-01024.json.gz": { - "num_bytes": 318150152, - "checksum": "85fce3104ef0b247798c1de8d9d616d3de754841fb6c49a01cca5b9da5efa94e" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00465-of-01024.json.gz": { - "num_bytes": 320342803, - "checksum": "ddf312f0b8de8f53ed556483fd998ae308d4829d18195a48869db6bf1866c332" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00466-of-01024.json.gz": { - "num_bytes": 318619029, - "checksum": "01239a1ff6ffe9032da320c5a7d1a93125d0724851e3e10746821c9452070887" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00467-of-01024.json.gz": { - "num_bytes": 317677227, - "checksum": "41783d20189a4bcfc33f543597a5473900e692ea13fa522f2724e27e810b4e9c" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00468-of-01024.json.gz": { - "num_bytes": 320038217, - "checksum": "7131b6f4dd423f2efe55c3f598893676300b31651cce7eed32ce633a015f8ca8" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00469-of-01024.json.gz": { - "num_bytes": 318359701, - "checksum": "925bc76c045f25532414f29820adb0cf1a56c54b406333a6f348c29e5efda9fe" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00470-of-01024.json.gz": { - "num_bytes": 319329235, - "checksum": "9be740483aa7bbaf94dce550f2c20404c89326f6ec4ebe1b7070f85f93507038" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00471-of-01024.json.gz": { - "num_bytes": 318792779, - "checksum": "0e3d9492f15dc9867bb0dc803bdf45608fbe67255014b4488902d7bf2e2554cc" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00472-of-01024.json.gz": { - "num_bytes": 319552622, - "checksum": "00484bbc10bace3dfd93b57fc53d6f5fac26b7dd54fd5b5428d75eb9e6dbb0e2" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00473-of-01024.json.gz": { - "num_bytes": 319466828, - "checksum": "5db5d585798e8ed8e4a3bc540871f1185f67125f397a12942d21b24e6b374519" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00474-of-01024.json.gz": { - "num_bytes": 320014669, - "checksum": "db07fd0e972c1a474806c1b4464ad4cefdd2e8fc15806ba0d259d4f9e594c3f1" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00475-of-01024.json.gz": { - "num_bytes": 320379280, - "checksum": "e6e36a9eed8be84c928980fffd8177b177182726c9e13b41a47343d431f76a7b" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00476-of-01024.json.gz": { - "num_bytes": 318820301, - "checksum": "0543ed2d0b3aaba0b0fccbf0311836143bd19175c5eed9bf0f024ffb9ce3c50a" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00477-of-01024.json.gz": { - "num_bytes": 320577830, - "checksum": "a62fd62ad771dbcfb7af73841e15a49e9d7239c53dbbbd84de2282131bca9c99" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00478-of-01024.json.gz": { - "num_bytes": 319593908, - "checksum": "beae9334a8e93e4b036c4a9b3c5b3a75fff17264177184d243d9e6da286dbe2b" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00479-of-01024.json.gz": { - "num_bytes": 319728825, - "checksum": "ae5b475c7be35d98b77d6c4aed5d61cbd1c98544c9a6e73a53ef2911757ab7f0" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00480-of-01024.json.gz": { - "num_bytes": 319903674, - "checksum": "51e0611378455d909e8b0f292eb62038848aa7afaa4f93c9c83061258b211a95" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00481-of-01024.json.gz": { - "num_bytes": 319998409, - "checksum": "68c640304ac952f544ea88c88d7c994c8d2955b95036f8352a67b57a836fa1bf" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00482-of-01024.json.gz": { - "num_bytes": 319047238, - "checksum": "74cefa57158d0008a06ae85b2a7a1c04d57a79b7ae3f7b4b3426dbe9918b36ca" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00483-of-01024.json.gz": { - "num_bytes": 318775875, - "checksum": "e99faa71222017521f1fc9999bbb0832df5c91f8b9f6e2ef501d3f827d3a1e85" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00484-of-01024.json.gz": { - "num_bytes": 319190491, - "checksum": "4518faae7c9d51a51f0b02cd895cf27e7c87a623b787346c844a8d9f0b52d6ce" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00485-of-01024.json.gz": { - "num_bytes": 318974502, - "checksum": "1bc8b207583b9f36169e0e9facd258de8eb73dee8bf831051dd1ab04b7726c6f" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00486-of-01024.json.gz": { - "num_bytes": 318599424, - "checksum": "0b1d9900e1921483b85305491f914b6b78fabcd0686a20695e61b89b7380a894" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00487-of-01024.json.gz": { - "num_bytes": 318958015, - "checksum": "c0c789c5f3b34d170d2aeb72642c70d2fa5eca567e7850d0c89b3d170f3bbf64" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00488-of-01024.json.gz": { - "num_bytes": 320205671, - "checksum": "6eef7a1ea80be43e84cb0c974215a477c909844899ac694afe1af2e8f4ac171c" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00489-of-01024.json.gz": { - "num_bytes": 319193967, - "checksum": "eccf5d7f682a76e11332f07e7d54a080f76c0be58a98a853a9fe90c815a22087" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00490-of-01024.json.gz": { - "num_bytes": 319833603, - "checksum": "afe99e32ba36134f23b59a2ee43965bf185432de947740fc19e26eef41027aef" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00491-of-01024.json.gz": { - "num_bytes": 318912982, - "checksum": "e981151b23b233bd3e5798f78658b5f52a73f69db39c30615f615069cf0c4984" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00492-of-01024.json.gz": { - "num_bytes": 320057824, - "checksum": "0cc5f7df318e0718fef93d24e7ff904b3e8e2728c4fc0b1d13893c81d8e6e2c7" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00493-of-01024.json.gz": { - "num_bytes": 317967559, - "checksum": "93749543b04a5a7093177d2a03acfc0bf6f26d5b53864ae35839a9421fb48169" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00494-of-01024.json.gz": { - "num_bytes": 320426917, - "checksum": "e461f56b461a4d5ce353c60889dcb99e10818985d3788440c6119bb145876277" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00495-of-01024.json.gz": { - "num_bytes": 319528392, - "checksum": "e530f3030ddbf7191bc4082e8209f63eb48733d7085d79a8469ce3611ccb79b9" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00496-of-01024.json.gz": { - "num_bytes": 317570766, - "checksum": "ddec34b528bd5314019d12089e600df27e781d78f43b6722b9c0202ccf385755" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00497-of-01024.json.gz": { - "num_bytes": 319154838, - "checksum": "e7438a08000fc7a158f887755cc496edcf51c8bdf2bc4a888ddd2c829bf8fa3b" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00498-of-01024.json.gz": { - "num_bytes": 317955368, - "checksum": "ad133d808ca5b6181bae1921ab1261d79630c09bf9d6c904db036f22e6f32e6c" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00499-of-01024.json.gz": { - "num_bytes": 318286671, - "checksum": "cb40879ea08db5a9eb6f2c23756574bda34deb9acf039b992f0ab90fdbb01594" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00500-of-01024.json.gz": { - "num_bytes": 318510936, - "checksum": "21e5f7468a907f38c3dc0a5c19f09921476f9186beff967e829329f191dad6b0" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00501-of-01024.json.gz": { - "num_bytes": 319611074, - "checksum": "38829434c8539bb9fa9ea32bfba3c6732c5021ffb60c16fc502fe61de83906ce" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00502-of-01024.json.gz": { - "num_bytes": 318630954, - "checksum": "22d1ca1edae179d2587495fcdf1d3e515c6f547cebafc54996c93a121731fd8d" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00503-of-01024.json.gz": { - "num_bytes": 318253198, - "checksum": "e95689993390086880e630ec4540e0629551076c0cad2c70f5aedd3aebfec181" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00504-of-01024.json.gz": { - "num_bytes": 319497151, - "checksum": "0cd7b986d247e010fd76fa2ab2b62d5f9eec292b28c1e7bd3e4c577042b598af" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00505-of-01024.json.gz": { - "num_bytes": 317498965, - "checksum": "f1504912fc53cc3690e26ec3babf736ddbeb8f7d9196dac83f757699310b30ad" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00506-of-01024.json.gz": { - "num_bytes": 319684193, - "checksum": "9f6defbac132e097cbf7cb7d181cb154bace6af48964fe09d111bc610fdcd2bc" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00507-of-01024.json.gz": { - "num_bytes": 318394726, - "checksum": "a58f39d0bef19abefc089342d8bb6d75dbb2c663f67127673ec395404bcf15ae" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00508-of-01024.json.gz": { - "num_bytes": 319013108, - "checksum": "176443b39840826bfb1db2cef2541449a6fd0c465ff9bbf0cb2479f07fb8baa8" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00509-of-01024.json.gz": { - "num_bytes": 319832758, - "checksum": "cce5a142cd7a121eba8c182d499442f4b0a397ea1484c33ccd79b1acbae832fb" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00510-of-01024.json.gz": { - "num_bytes": 318762241, - "checksum": "bfc910625f0fd6074955906bb86e789b0d0adcd1f8956cb8da276933dceac256" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00511-of-01024.json.gz": { - "num_bytes": 319240643, - "checksum": "ce53021b90d1c86e2d46293e7053aa174387d7408bf0cf907898be69b1a7befc" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00512-of-01024.json.gz": { - "num_bytes": 318353376, - "checksum": "e9333c6f73c30c9cb7f31794025eb9129455fac2edd64f8b3f22f879124c6a85" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00513-of-01024.json.gz": { - "num_bytes": 317653011, - "checksum": "d9450c6f541e82922b37d3b7cc25611707b44884f27825db4dbd65466b59e8b5" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00514-of-01024.json.gz": { - "num_bytes": 319391160, - "checksum": "20b77f5fc2a939fc291f901e8774acfbf04ffaacb08192b724673eadc9f83c12" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00515-of-01024.json.gz": { - "num_bytes": 317994258, - "checksum": "32ca1f60d0deb395538a93ce5044a48fde05864f2c26af42dc53405b6dc05031" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00516-of-01024.json.gz": { - "num_bytes": 318786801, - "checksum": "eba4f34749eef4da2b0729abbdfa2ada77bd65383c01213d4f86625670430a65" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00517-of-01024.json.gz": { - "num_bytes": 320010732, - "checksum": "617765f971b879182db7debf879025f8dad4fd8846b11728ee1230767c031c04" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00518-of-01024.json.gz": { - "num_bytes": 318681019, - "checksum": "6987893764c56b84fca014532824a05d4187db5c313be4f7bdcb363b7e8cc8db" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00519-of-01024.json.gz": { - "num_bytes": 319951543, - "checksum": "ba151c4734db52e7c220dbefe380825ac6d66a9c6abb901b8096a87d97a2deb5" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00520-of-01024.json.gz": { - "num_bytes": 317948056, - "checksum": "7e53ed26c3c068b0dedd026219b7cdab79775545ebbf31b5dadadb45364c9985" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00521-of-01024.json.gz": { - "num_bytes": 317993802, - "checksum": "4d1d4a5583430e373bd2cfd191e59cd8911953fbd73fa924e0c15be76499b54b" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00522-of-01024.json.gz": { - "num_bytes": 320189449, - "checksum": "71d851498785e312acf93861a43169794d4d576f5fe8b960303419316c8c898a" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00523-of-01024.json.gz": { - "num_bytes": 320443871, - "checksum": "587867d619115c2accb69322b197239b79f12de41ae80427fd369813ad8d81af" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00524-of-01024.json.gz": { - "num_bytes": 318192840, - "checksum": "7324c02db00b06d0f41d6e5ebfa4e4dd6554f5f4849d6de187ebb84162d0446d" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00525-of-01024.json.gz": { - "num_bytes": 319294602, - "checksum": "24ae3495e5b59883967c62b8fb3a4fa7525d33c40957fd5fa3be413d66c24eb5" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00526-of-01024.json.gz": { - "num_bytes": 319783465, - "checksum": "27cd95e7bc6a3f156f1f8f26dc5e490818fc4810562e3964a19fad401cceacd2" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00527-of-01024.json.gz": { - "num_bytes": 317240081, - "checksum": "6b84920fe7e28c01a03800512915c7a9e47816267ac652f9ee0314e3428bca72" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00528-of-01024.json.gz": { - "num_bytes": 318320694, - "checksum": "fec06589f714ffe1343cb6781898e29e5d0cb789deba3aa4a4ccf86514d3f690" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00529-of-01024.json.gz": { - "num_bytes": 318391515, - "checksum": "a98c34c04c1b6f0ca3acc9e10fdf4bd0ead2ea7271832ce4972df8677590918b" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00530-of-01024.json.gz": { - "num_bytes": 318473966, - "checksum": "1677d541c7bc10971c711f1eb030faa2e85e0967112ba57d7f04712908e4f040" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00531-of-01024.json.gz": { - "num_bytes": 319463272, - "checksum": "92b5d82a058554d3396a2b54504f45fa88581cb2951140c0f0bde67ed11bed0c" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00532-of-01024.json.gz": { - "num_bytes": 318228175, - "checksum": "291bb3d7613f7f00b6910a0de78dbab0d87602243c9c83014de341c131200853" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00533-of-01024.json.gz": { - "num_bytes": 318966937, - "checksum": "a0ce39eac6d6ecad3478373c264e88b2ea20b77fb2049537c229ad3da2769c85" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00534-of-01024.json.gz": { - "num_bytes": 318968162, - "checksum": "387db79d4aacf8fa4c512fb78023ff94a43d5d597d5a8c2ec6198e62e4b8c98b" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00535-of-01024.json.gz": { - "num_bytes": 319253588, - "checksum": "3ff8f4a926fdfb6201a94d75c17ec5afe662a339a65019eb5e1193c1238bd388" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00536-of-01024.json.gz": { - "num_bytes": 319662526, - "checksum": "0c805e83d8cfd979701df5714713d062e14853d7e2b0f77c0b414a626686cd33" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00537-of-01024.json.gz": { - "num_bytes": 319177095, - "checksum": "f9a0ac216e316075e5c2219449a954f989eb160ead2ca07ac9f3813274e18f2e" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00538-of-01024.json.gz": { - "num_bytes": 320109104, - "checksum": "a425ef4dddefb40bac5a8cd3191161a41737aea5088a614410d10d83bbab5e37" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00539-of-01024.json.gz": { - "num_bytes": 320600564, - "checksum": "3580ea8da9c4aff1296e89136c5d7f1a37d021e0b10f3ebd1e05612c092faebb" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00540-of-01024.json.gz": { - "num_bytes": 319993281, - "checksum": "ad8dc83bfbe7c8976f08708c5f0229cd4e1a2d80e272b225a8d208133b129dfc" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00541-of-01024.json.gz": { - "num_bytes": 318256020, - "checksum": "c7452669237323fdd09ce97624791a0261f3ec07d8a5f98e71a4b1252a2805e1" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00542-of-01024.json.gz": { - "num_bytes": 318843744, - "checksum": "1e5a11c25f82ce717302dbcd9acc1f8b916d83eca88d345d8434b1f88768137b" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00543-of-01024.json.gz": { - "num_bytes": 320482002, - "checksum": "bbf96edf50c913d5162ee154423242e7c8faf490ba229f325bac98a5e3eb9477" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00544-of-01024.json.gz": { - "num_bytes": 319059260, - "checksum": "22c04506b5744df8c71727fc6527fa2bc495a10a237c71762c66d09625d34097" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00545-of-01024.json.gz": { - "num_bytes": 317874034, - "checksum": "84a78bb62eb6f72de7a75325870d9ecd419f77c4f6728d29609b2f7ab1b8bcf7" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00546-of-01024.json.gz": { - "num_bytes": 319891407, - "checksum": "28631c527dc398c9626fc60b39ad94ed880b41c71f55b9c7c670f6a1837f98d8" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00547-of-01024.json.gz": { - "num_bytes": 319361268, - "checksum": "273b8598405def0165ceaf9723d1425c9b74368fc22a414616c7ac9327930225" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00548-of-01024.json.gz": { - "num_bytes": 318360761, - "checksum": "59990568c0ea055fab27f2b9cd028e1c7177df0479712d1e2d8372e9b017ccad" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00549-of-01024.json.gz": { - "num_bytes": 317320452, - "checksum": "fd1e361f28cf099df6088e26d06d79f7f62bd8bd89b4524b9baa80ea49a1a4a6" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00550-of-01024.json.gz": { - "num_bytes": 319017444, - "checksum": "4424833afcb143f6fdbfc2f5fa2508d6226a4a1df391969b2a751d2d0070158d" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00551-of-01024.json.gz": { - "num_bytes": 319118159, - "checksum": "77b78f94a8bc8f905cf8b1997df1fc3b8c6d77ce65fc28bef68c6083275a832b" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00552-of-01024.json.gz": { - "num_bytes": 320058125, - "checksum": "e7b71167c4ad947232b6acba26e4d3cc9214c25b50b853b5745333bba942f50f" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00553-of-01024.json.gz": { - "num_bytes": 319220671, - "checksum": "ce7891f3820ce065e3bd7afa006e90889428c80bd8e771d66fbbf023bb2a9eba" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00554-of-01024.json.gz": { - "num_bytes": 318858928, - "checksum": "015a707235f46f179a08d3f6674b6d368dc9612841e2bf39f700f11fef8e64c7" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00555-of-01024.json.gz": { - "num_bytes": 320490725, - "checksum": "041dd2e902ed04dfa143476da03d5fd00c30ce1259c0658150af5b77a5a092c0" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00556-of-01024.json.gz": { - "num_bytes": 319863694, - "checksum": "22e3d9e4dbdf2b1b822a7bc8c889f4747aa16c71f4c91436d028a228bffe4b87" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00557-of-01024.json.gz": { - "num_bytes": 318940362, - "checksum": "4cb8b113ad9687b7dee590242c5f50fb3ea3a8775c67492a8ce0cb5c15fc26d7" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00558-of-01024.json.gz": { - "num_bytes": 319797786, - "checksum": "ad157a34c6a8d496859f55b00c79fcedf7305d8502ca86a511026f39cdcaca59" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00559-of-01024.json.gz": { - "num_bytes": 320156705, - "checksum": "816d84753b71fae446428587f41de5b3490e88321f1fa0cfa2ef1fd5eef851e5" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00560-of-01024.json.gz": { - "num_bytes": 318346216, - "checksum": "0b1b3d26316f2c0e973ff19820793bcfffa957c3869f74f62fb40cb6839227e4" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00561-of-01024.json.gz": { - "num_bytes": 319571572, - "checksum": "4f92594382c897bf94211f1446dbb38c2cc1fff3647acba731dfe0ad89ba4061" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00562-of-01024.json.gz": { - "num_bytes": 319453711, - "checksum": "2a6ba0c64806add776081f417c8d1afdb324dd8b9aebb603372afd7fc2c4cd6e" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00563-of-01024.json.gz": { - "num_bytes": 318990092, - "checksum": "e3032365b9b86883c24bfe387d810c2d9fd1d0a55ff88acd1f5b5357246b13ba" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00564-of-01024.json.gz": { - "num_bytes": 319491917, - "checksum": "da6196ab8650fc9f8fa391b821ff070070946412277bd423c40d9fa1de325f93" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00565-of-01024.json.gz": { - "num_bytes": 318756269, - "checksum": "edeb5b13aa0d65354d78a5ca5d1698732e95f1fcba249c42825a0351d4a34f79" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00566-of-01024.json.gz": { - "num_bytes": 318461036, - "checksum": "f179addbca50d8612612b0e09138d7ecc89ba7ef2d6e857d7ef0b10223dc71d4" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00567-of-01024.json.gz": { - "num_bytes": 319625728, - "checksum": "eaa1d0ee28eb17c6ebe3d85c8af8b7adac28a720b2975f86ac83f3f4d2bffbcd" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00568-of-01024.json.gz": { - "num_bytes": 318428567, - "checksum": "3677e88545f2d76b601995cc3e2b6b12fcf65e350ed7eb4137ab4beef3d475c4" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00569-of-01024.json.gz": { - "num_bytes": 320114923, - "checksum": "2d8810d8bcfc0fc19d82313be6516b2fef4cf68f56b0448af48b512c98e1ae8c" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00570-of-01024.json.gz": { - "num_bytes": 319148416, - "checksum": "8e5356dc0fa2b4e5fa16b36a1586f16920306af1227c765e5d2f0818e74d30d2" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00571-of-01024.json.gz": { - "num_bytes": 318223973, - "checksum": "c87cf8b88e8e4fc0a664f4b3a381b78b317680253a83a672cb86e02adb43f2aa" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00572-of-01024.json.gz": { - "num_bytes": 318322508, - "checksum": "2bdc857dfeab99c8f83f0267ed5ed7529bca8ee086fce268534bc0264ff738f6" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00573-of-01024.json.gz": { - "num_bytes": 319203246, - "checksum": "564fc77dec25ce0d47f4e3d8d04bf114dc06119b28b3ab00d6092a799d496e51" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00574-of-01024.json.gz": { - "num_bytes": 318397937, - "checksum": "dc3f206e1b5da963184da72e47959844bb164335c76e3261f3a189a4b7b022cb" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00575-of-01024.json.gz": { - "num_bytes": 319183651, - "checksum": "7f0c46955e37d5d52b305f71b4ce4fca5368d72e8698e8b832ac0177f868e145" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00576-of-01024.json.gz": { - "num_bytes": 318690625, - "checksum": "b37d0fbd439bdc05021a71c192ce5e61ebce27448a17819bb53156d9d5f27e17" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00577-of-01024.json.gz": { - "num_bytes": 317926085, - "checksum": "3092d1ad70fb2d262ecb33f3fb6ea554af3ddd26498ba42b644c383f6d4bd1a4" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00578-of-01024.json.gz": { - "num_bytes": 319190472, - "checksum": "d9833fd591a618a167b31b7aaca420f3e719ded98987dbc0f46fd4bfd12564c5" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00579-of-01024.json.gz": { - "num_bytes": 318958744, - "checksum": "a11217af10c85ad828de38847eeddcde6af6899563585d581c20adaed3c9e7dd" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00580-of-01024.json.gz": { - "num_bytes": 319893900, - "checksum": "71e8be705bfa8563e33392d1c14decd84f52d6a0139b98344f1a0ed9bdc94198" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00581-of-01024.json.gz": { - "num_bytes": 320109861, - "checksum": "c5f13ba973803ef069762d22bc37ee02a4348af379c75848d93b2685fc4280cf" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00582-of-01024.json.gz": { - "num_bytes": 319238177, - "checksum": "da815527ca68b5c2ed604d00ccbcc7c631c60f33e3132f79212634a82c266844" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00583-of-01024.json.gz": { - "num_bytes": 319375634, - "checksum": "a332b791df0801f0b7227117f0ea3971563e8e420ae24dd94b38d532c1ab0573" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00584-of-01024.json.gz": { - "num_bytes": 318596018, - "checksum": "e6496d31f42921eaf9f85047e7c2eeb5fef46e01e99760fa676da96481d7d5bd" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00585-of-01024.json.gz": { - "num_bytes": 320156294, - "checksum": "08b978ec05d65edd22c301ddc6ab44174eeb7bef5c5997a84342b6faaa47a79b" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00586-of-01024.json.gz": { - "num_bytes": 318716838, - "checksum": "567ce600ad99e543507fdf27b9009fe1782bc867f44f3dabbeb93fab1208f337" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00587-of-01024.json.gz": { - "num_bytes": 320247814, - "checksum": "8f5c82f5eaac4a315d8615c9700cd81f3b9c2e1a17376d3b2482f8694dfe2492" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00588-of-01024.json.gz": { - "num_bytes": 319546079, - "checksum": "bae91422f87091b3974ca92781a14fae8f10c5c41de9c9132f745b3dcb8bc468" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00589-of-01024.json.gz": { - "num_bytes": 319771959, - "checksum": "babb615d77f80e5ef99aeed3889a26cef5c9918a7fe68b70a503815e69b0b189" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00590-of-01024.json.gz": { - "num_bytes": 318926571, - "checksum": "61f2ed732f3b2b5e24882f47b4eb84fea28bf89d112f6f173cbb50523a43c4b8" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00591-of-01024.json.gz": { - "num_bytes": 319669791, - "checksum": "3aa2e792ec775a52ee78447b81204867e58b0a46727bab4b7974977aaec2889d" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00592-of-01024.json.gz": { - "num_bytes": 320393142, - "checksum": "1419c263fb74409cb0e39ebd87b1c020ee6863a3a6f2f427be27d3c76b84043a" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00593-of-01024.json.gz": { - "num_bytes": 320977171, - "checksum": "4f16f33217c35a2b155d5b6fe8014c2e52014e63c419e7d3aaf71a35246c1323" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00594-of-01024.json.gz": { - "num_bytes": 318211092, - "checksum": "c9301ddcafea22d085ae48f551f486e73089a76c7990871f787064c61e4e60b4" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00595-of-01024.json.gz": { - "num_bytes": 318978629, - "checksum": "349e104763320eaae96ac3bc53c5fa7a73e7dec93b8cc3afaad108a97e7c170d" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00596-of-01024.json.gz": { - "num_bytes": 318573003, - "checksum": "0eb6c25cf57764ec3aa7f74d6d967c52003f872f2f3b140fe6d5ac6360241a8a" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00597-of-01024.json.gz": { - "num_bytes": 318931514, - "checksum": "b42b7b984aad729185ca9b3a6ffa856b2a79165ce2feebe519b10f8ff42c4ab9" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00598-of-01024.json.gz": { - "num_bytes": 319002677, - "checksum": "8306c5971408767b3735288fd0ee7ee7d01d9af4ef4cbec2e57c97b1f78e6d63" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00599-of-01024.json.gz": { - "num_bytes": 319637870, - "checksum": "844df34f2a263011f9d1d85eaad5a1d95243769e9cec5a104807dd55e1fe431c" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00600-of-01024.json.gz": { - "num_bytes": 318099852, - "checksum": "b05e66568a4472feee31f20918e9813aeae2d881f47b5281ff29fbcfedf4d5b2" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00601-of-01024.json.gz": { - "num_bytes": 319136069, - "checksum": "8dff2d56c9915d73e6154533e5de0ca9d867c5fdedcfeceb3e0ab22f3ba509cb" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00602-of-01024.json.gz": { - "num_bytes": 319369121, - "checksum": "45b2c1757260395afeb168b545892b315fa0bf14b3d144bfcab1fdaa6d79086f" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00603-of-01024.json.gz": { - "num_bytes": 319499076, - "checksum": "46edc9f556ccae692900b222b8e4843360dd5dbe0798a8ad9cb51c07a451dbb2" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00604-of-01024.json.gz": { - "num_bytes": 319132921, - "checksum": "0cba8c8738ea7ff9a08bd1bab215010b03c6c83fe35206d83344d78005bdee6b" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00605-of-01024.json.gz": { - "num_bytes": 319315562, - "checksum": "0dc0d37658fd672c8d72775bd8855dce9037cf9715feda35a76afb1f0e87bebb" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00606-of-01024.json.gz": { - "num_bytes": 319223528, - "checksum": "f679e437a3acda1a81013dc0f3fa93fde6c3309905e8142f8699a76bc04b7114" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00607-of-01024.json.gz": { - "num_bytes": 319326218, - "checksum": "7fe91f86f751b9aa3abf1c5ed0fdab89a76c7fa4eb7ab8b809ef29b0cf4a78d9" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00608-of-01024.json.gz": { - "num_bytes": 319393715, - "checksum": "a5daf706100eb797b5b0770fe0c790856637b22dc849aeda5b445ae5fa63cb3b" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00609-of-01024.json.gz": { - "num_bytes": 319554192, - "checksum": "4434338fe97d398d9565ae940c62539e868fa261be361ede1b5b0feb004160f8" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00610-of-01024.json.gz": { - "num_bytes": 319786301, - "checksum": "6b0d0e0457a721af6c67a31f5016432011e717302cfdc7ee39feb253fbae4754" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00611-of-01024.json.gz": { - "num_bytes": 319356910, - "checksum": "bfe201b1775270afef3a09fcfc074920cbb01093eef90d46f26b6b813d603994" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00612-of-01024.json.gz": { - "num_bytes": 318780229, - "checksum": "29248c4732fdfda2ba97ed38192ab391457e20fd70f713ef4a7cf084f9865846" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00613-of-01024.json.gz": { - "num_bytes": 320190496, - "checksum": "f5cb9be2442797d967b9041e48771196a6c0595933ef2102840b704e355f4d62" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00614-of-01024.json.gz": { - "num_bytes": 320245862, - "checksum": "89b74d0daea02fb69289ad259bbd0ddb1a64c5d6380848f7d51669be952f8a0b" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00615-of-01024.json.gz": { - "num_bytes": 316874605, - "checksum": "78600c8703d5ebf80c99c089bb7a7c1cde843a66d706fd219eeac304f80e8525" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00616-of-01024.json.gz": { - "num_bytes": 320237707, - "checksum": "630ee29d4dc4cd5062eeca7877e5c1b204b36eb0b3aeacadf036cdb75c1ce840" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00617-of-01024.json.gz": { - "num_bytes": 319739365, - "checksum": "d418fd284d06b1d2d9daebea3047ed06286640ac75d23893f1effc2ee9d7aa14" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00618-of-01024.json.gz": { - "num_bytes": 318634299, - "checksum": "f5d75d129ab6c0f052028cf0139c3cf20eed3a9c5cdb151cd88ae42d5d1a32d2" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00619-of-01024.json.gz": { - "num_bytes": 319086471, - "checksum": "c558908f6e08b0d02f377c9aed1655d80106f4cfe26e955774bb420d19b2f74f" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00620-of-01024.json.gz": { - "num_bytes": 320665446, - "checksum": "977f959e5b5eaa24081ce025d137647fffd65f1a54d2c45db9805a232e0c0364" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00621-of-01024.json.gz": { - "num_bytes": 318576410, - "checksum": "d07f3c31d7ec1c71b5ab9539a2ed49f6d5f46b48ee2e51800b9e28cee588a163" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00622-of-01024.json.gz": { - "num_bytes": 320053075, - "checksum": "58b897603eb83f789a1cfc6bf40a091093cbd8a0c20702018c411adc7b07a437" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00623-of-01024.json.gz": { - "num_bytes": 320045187, - "checksum": "3665d7579b3c57eb21ec9e55850e39307cc6f4ef8aa8b9937076ad6f142063a3" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00624-of-01024.json.gz": { - "num_bytes": 320136842, - "checksum": "35db069ae090e95c5a4d3db44eae73bcb29463c120584d7f6ccbe235983c5fef" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00625-of-01024.json.gz": { - "num_bytes": 317314201, - "checksum": "7f6ddbbc8815e8bd10c99361fd8113cbbd84ebd92799eb6958cf98af825d2aa3" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00626-of-01024.json.gz": { - "num_bytes": 320219970, - "checksum": "4e2c46d1e3a94957717bbbf1e1e4300bd27ac17e588d426e0ba688983e83f4e6" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00627-of-01024.json.gz": { - "num_bytes": 320083102, - "checksum": "851ce6dfa6a4d1a4e3b8bf439e36db9ceb59eefc60558d429e2fec80655e1775" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00628-of-01024.json.gz": { - "num_bytes": 320386844, - "checksum": "86d8927f16d0790a07d6c68e745501188d13887df4a137e937ae00497d07c055" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00629-of-01024.json.gz": { - "num_bytes": 319476643, - "checksum": "c48cff721137b641fe9d5bcf30462c7e4e3a3ae631b7b4e39979c8c77f0890ae" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00630-of-01024.json.gz": { - "num_bytes": 317961579, - "checksum": "cde626b34c6c8455227fbb18a577877b518f529b6c8e16881cfdf334f2875cd9" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00631-of-01024.json.gz": { - "num_bytes": 318952266, - "checksum": "0401582821f7b15f0b406f7ce00c56351b8e86a3c3282bdf4dd45b2f6146ea22" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00632-of-01024.json.gz": { - "num_bytes": 318261820, - "checksum": "be48396ef18ce0f3650eca86eb36039f90b51737f9848086494f34fa28d60e70" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00633-of-01024.json.gz": { - "num_bytes": 319748854, - "checksum": "9d5c342d82fcace21de2900202c3f2af47229aeae9d487a8b77b7f5b86c05f74" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00634-of-01024.json.gz": { - "num_bytes": 317806530, - "checksum": "00a70705afb91f6570d17257057c15b45386597b917061686f131bd41ddce421" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00635-of-01024.json.gz": { - "num_bytes": 320313573, - "checksum": "22a1286582d65975ed94f0ba25bf87e94d52a55214d0a51979a3e0fd9f95e3cb" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00636-of-01024.json.gz": { - "num_bytes": 318151690, - "checksum": "026c699ac6fa30f9e156a957026d8fa8df72daee3407c8fdc5e0bd7d6a3b50fe" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00637-of-01024.json.gz": { - "num_bytes": 318665365, - "checksum": "9bd931dfc074bc99df31d7fd31a5ac1dc8c8bc75f8e87b763545cd824edcdcbe" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00638-of-01024.json.gz": { - "num_bytes": 318521250, - "checksum": "4b30ad531f7502ef7bc6398ab286e5c6c63d340c22792da9258ea95b496d1c0d" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00639-of-01024.json.gz": { - "num_bytes": 319997068, - "checksum": "2bfdf36396e49ff625138d29925f54eb12b18d35f6d0bf5ca9e79194977cfb43" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00640-of-01024.json.gz": { - "num_bytes": 319355927, - "checksum": "d0d0ed7304b5d79318b5230a1ab48d3ed03183f1eb11d96070604a7008cd7b30" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00641-of-01024.json.gz": { - "num_bytes": 319002081, - "checksum": "1461ecb6b92819bfdc12808a5442d70f94538931f856c91dea602a23ba86ab98" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00642-of-01024.json.gz": { - "num_bytes": 317689465, - "checksum": "aa0af0169cf13db1f8133e8d76afeeae5f71d63d179794377a55b6c2eb938dc8" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00643-of-01024.json.gz": { - "num_bytes": 317523344, - "checksum": "5c060166e776f8efda48882c118dc0fd5e058d9ef40be578bad31e477114a16e" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00644-of-01024.json.gz": { - "num_bytes": 318876813, - "checksum": "ad98ee119742cb8a6efa1be46e9670969397c7bde10049886d7d6fceb82387ca" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00645-of-01024.json.gz": { - "num_bytes": 319981258, - "checksum": "8930ae8e14c124218793d2fd1bbfb1b624e918cb092b21c6ca74347abd9dea4c" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00646-of-01024.json.gz": { - "num_bytes": 319624889, - "checksum": "a40705c4f9a4db4d2d698cf96e43b99fa0790b886506300eb4986a26de7063e2" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00647-of-01024.json.gz": { - "num_bytes": 319240920, - "checksum": "7129182faeac82b47127458e92903a209acf8272166024e8313c167d6f358456" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00648-of-01024.json.gz": { - "num_bytes": 317305623, - "checksum": "3124091a6c438fecbfc948b1a35ffb1462287ae06866b02a6dbb1a6651ccf1e4" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00649-of-01024.json.gz": { - "num_bytes": 318998755, - "checksum": "fdb286cfe9e9091a57b31be61a56a425fae07d6b44f0b45f8743d7aab0e980dc" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00650-of-01024.json.gz": { - "num_bytes": 319612451, - "checksum": "ff88c4310f049344b8a3f701bce12d08ef5f9b037e82fef7f1f670b3d51e59c2" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00651-of-01024.json.gz": { - "num_bytes": 319098081, - "checksum": "9c3b1843082aae39b057bbc7364e69cbc39bbdf91d5bff4f52b12cf1a264adf2" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00652-of-01024.json.gz": { - "num_bytes": 317107981, - "checksum": "e6199d12a893ae5d05c5388ae7a679df419ef6a050c8e3ce3c15fe534943a774" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00653-of-01024.json.gz": { - "num_bytes": 319623884, - "checksum": "333ac93cf1f1f4da0f72c5e57b675052453b42dffe1e4d45ec680f4e3e075d97" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00654-of-01024.json.gz": { - "num_bytes": 319055728, - "checksum": "1efe352f2f2eba826231a5bff6c79390630b44039b226a5041a087e116b60f5e" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00655-of-01024.json.gz": { - "num_bytes": 318539829, - "checksum": "613c741cfb738017b3fa233512296d9127d661738721d3fccd806aad54d19d84" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00656-of-01024.json.gz": { - "num_bytes": 319970377, - "checksum": "51fa9b217b6bcf664c472cc2b258813e1f1d7a0f501c29b822221bccafa4e201" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00657-of-01024.json.gz": { - "num_bytes": 318548629, - "checksum": "c542c6fd2f3284d64f8d53b71ab8308bbba59f7f13e9d9eb20bbbaf13ad4782b" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00658-of-01024.json.gz": { - "num_bytes": 319845984, - "checksum": "b3d8fb6ed2258c463367108e2942742e88eac657c859cc8d128035110fc87e7e" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00659-of-01024.json.gz": { - "num_bytes": 318887872, - "checksum": "02feb4e03020d767a4468251786d4857d5dc833969626bee616c7882bfda9ce5" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00660-of-01024.json.gz": { - "num_bytes": 319854892, - "checksum": "a997d9187a185a29fb3bbeb1e696d32898efba8f5e9d6ed816493669f0c5ec02" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00661-of-01024.json.gz": { - "num_bytes": 317599289, - "checksum": "86d9189ebc534c99da5a4407624a623561b159f758fb04373a270887d0b45709" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00662-of-01024.json.gz": { - "num_bytes": 318138720, - "checksum": "9c626f7aebcc4fc9afd533b6c8a372d884d01f508ce49c01ddd830e4e9e8b2d0" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00663-of-01024.json.gz": { - "num_bytes": 318110835, - "checksum": "441d4dd0d5d2ea7b6098a3fe006b9d7afd526188824a3325d44538fc5655942c" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00664-of-01024.json.gz": { - "num_bytes": 318996945, - "checksum": "08ab0739c3565643b6a83d7091936f5d75a4d8418c956146114aa0315f205dd0" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00665-of-01024.json.gz": { - "num_bytes": 320612903, - "checksum": "1ab7bc2d0f7c6704c97848a9325015f06228339bc52cc1fb593d9c56145e7c48" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00666-of-01024.json.gz": { - "num_bytes": 319241006, - "checksum": "8b1213325ceb2a2c89dffb891a31317e903d08fff911e4ba1ae66fc3bcce9973" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00667-of-01024.json.gz": { - "num_bytes": 319650665, - "checksum": "14676f97937eb3d0734e5f121c5f63002ba2d2c62b6c41b4b46d2fcab9ea9614" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00668-of-01024.json.gz": { - "num_bytes": 319198651, - "checksum": "a406fceed5b7d17ff6d5773679c3df50e747215e39926228ddc9a60c6bf9d152" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00669-of-01024.json.gz": { - "num_bytes": 319363200, - "checksum": "1d3267d77f43d3d720dcd79c40bc3e8c0cd777d421b1b7d0e69e140199e34552" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00670-of-01024.json.gz": { - "num_bytes": 320079826, - "checksum": "85111c229b8fcc8428b3c13676bde8268f027fe06e1f576a3adcd82bce1603bb" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00671-of-01024.json.gz": { - "num_bytes": 319494773, - "checksum": "eeeed8d9f63a5c16ab9d62454fae5bef1896973cfa69cedfcfaac4565a793b27" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00672-of-01024.json.gz": { - "num_bytes": 318304853, - "checksum": "6793ec3ffbc147c36e471e1c06a664ac2143408c9ee46305694708eee0fb38cb" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00673-of-01024.json.gz": { - "num_bytes": 319031236, - "checksum": "3c886ff71973805a59312d8d43ee9e616bcfafd76c03a64d53ab548036b1fa90" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00674-of-01024.json.gz": { - "num_bytes": 318647345, - "checksum": "fd7f4efc0c8af611e7e137680342843d0471ca072421ab3c172a169ba2f5d217" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00675-of-01024.json.gz": { - "num_bytes": 318313871, - "checksum": "3b797b2ad717749a24866a97acb95aace0dd4e91ee7d51dcf1fdd46a9232b794" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00676-of-01024.json.gz": { - "num_bytes": 318858652, - "checksum": "2ccdf652fd413dc624643d35a76223e8a44e6241997841ec2d13ae11b56400fe" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00677-of-01024.json.gz": { - "num_bytes": 319236091, - "checksum": "bbf069c696f09e5467b17ba98479948a85101efa776094084e37581e72c01123" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00678-of-01024.json.gz": { - "num_bytes": 318996096, - "checksum": "3e3dd21861c713bd38d1803c32da1c0bc2496899648b4cffe1fa2e61b35ca056" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00679-of-01024.json.gz": { - "num_bytes": 319915466, - "checksum": "6ed56468a31564cb25668ceb5df325ff7138dd231afa85f676ac7af5e81e0642" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00680-of-01024.json.gz": { - "num_bytes": 318537417, - "checksum": "959ce407e7a892495c477b9e0071dff496fd20db9cfb04dd035ac59dd5b2f309" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00681-of-01024.json.gz": { - "num_bytes": 320181225, - "checksum": "0aa77d778f24bfdc8566b390a7a1ef1d7880a42b98b3e82e9b37ee3ed821a8e5" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00682-of-01024.json.gz": { - "num_bytes": 319087756, - "checksum": "a4da802570ee7bc27e752069612b633edf226078f48d5f55280f73a6dc934127" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00683-of-01024.json.gz": { - "num_bytes": 320019766, - "checksum": "587497efb7bcd4ca85ec0559e372ea285c1b95e3889d406f142cfe454d8e0e2f" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00684-of-01024.json.gz": { - "num_bytes": 318814245, - "checksum": "6e904f73976ca18aed3375d1c1b308d749b9a4405a333dd0a2cf85360822e205" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00685-of-01024.json.gz": { - "num_bytes": 318586686, - "checksum": "c51012772c5bae73821b67f72c035f22a40725d42bcf51e439bbdfcd84393ef2" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00686-of-01024.json.gz": { - "num_bytes": 319648436, - "checksum": "890b7408abd0cc04a84be3a3992d05714dbd30a9d33a8a9b05316a980fe51313" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00687-of-01024.json.gz": { - "num_bytes": 318909835, - "checksum": "b54b20c21ae9834b630a8aac057d47069cf137577d30b91fd1475f5824b61561" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00688-of-01024.json.gz": { - "num_bytes": 319381735, - "checksum": "422091d5ba0d44c64bb0c84ab4757318414bc01455a97f53190eddda89c2f3f4" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00689-of-01024.json.gz": { - "num_bytes": 318995026, - "checksum": "ad5080fbddc914c649027d5e2214f1d75e0cf0617eb3ca0b1fdb8ed9129f99cb" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00690-of-01024.json.gz": { - "num_bytes": 320745318, - "checksum": "d45492346bb4bf519e657356ecf1805b6b592683b98c20c93da2f07c50b06092" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00691-of-01024.json.gz": { - "num_bytes": 318575084, - "checksum": "43a07e8a98bc99f381558c938fc83acd4a37d565459c0f3f83aaadda816f66c8" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00692-of-01024.json.gz": { - "num_bytes": 320651368, - "checksum": "21a790ef1dcc9c6ffa071d1a2e21e330d6afcb45368dde9cfae8933c6d029742" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00693-of-01024.json.gz": { - "num_bytes": 318429145, - "checksum": "85558018ee61e33c4f3e05acc2029e69447a5717be880e9a0aa8fa715dbd0c05" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00694-of-01024.json.gz": { - "num_bytes": 319562061, - "checksum": "894f4c906a33c644ea80c3a00155ced807a62e1bcd9f6e254cb6c88efeedd142" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00695-of-01024.json.gz": { - "num_bytes": 318298964, - "checksum": "06eb05f651f1d2fff495c48475894420334070df10c051c7253b7afb0bc38291" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00696-of-01024.json.gz": { - "num_bytes": 317473664, - "checksum": "59ea4f951335553945a644f7628403ba1a99a27e0d93fcfe5db18cbc3dd48ce9" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00697-of-01024.json.gz": { - "num_bytes": 318839008, - "checksum": "f0203b0f2caa3287b8f7a64288af52bafbf033bcdf31dae54e501e4da47b9935" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00698-of-01024.json.gz": { - "num_bytes": 318288032, - "checksum": "fe2a581cd174429a81424e407aceb1d81b61d9796d74db4590327778fbd5016b" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00699-of-01024.json.gz": { - "num_bytes": 318696527, - "checksum": "edf3aabcdb28fa2feb532b3bd55cd167c2200a6d8e19f05152be194e48acf87b" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00700-of-01024.json.gz": { - "num_bytes": 318900366, - "checksum": "67d89417d1440afeeefd59a0993e4d12fb5731e917ec7f4e65d9319541b4b9e9" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00701-of-01024.json.gz": { - "num_bytes": 318901212, - "checksum": "64d302459e6871325282fd890d2922cb1fb25b47d677ce793bc065acc8d1bd07" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00702-of-01024.json.gz": { - "num_bytes": 318913325, - "checksum": "f0bb360189166a0bd717bad85edf06943333b1854687839864aef3ee02814795" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00703-of-01024.json.gz": { - "num_bytes": 318730274, - "checksum": "c4e027079b9cf9b1adae3e285c5cc5dafeee5c74cf3621c424b6df9801d508f5" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00704-of-01024.json.gz": { - "num_bytes": 320112232, - "checksum": "37540f6a00523cbf429764893aa15aae6a57e53c89cf51d82a815feef02b1210" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00705-of-01024.json.gz": { - "num_bytes": 319643559, - "checksum": "9dae018569fa4bf33674f67ba03732a2f85cfceb53ec2cbb9457eaea607b8dfa" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00706-of-01024.json.gz": { - "num_bytes": 319941519, - "checksum": "03926405dc629f0664a3d27c700a4fa2f606496f0b52a9bbf2fd2d75faae2f46" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00707-of-01024.json.gz": { - "num_bytes": 317628508, - "checksum": "fac92295e4c85f087d27e0a6f231d782be7b2448e99cfc42c09c0e1e20964c3f" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00708-of-01024.json.gz": { - "num_bytes": 318863059, - "checksum": "39d4880d3e47e65ab6351e94b015810d66295a86a9f08534260ccbef41fdaf04" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00709-of-01024.json.gz": { - "num_bytes": 318412651, - "checksum": "044fc99a1307737bc8d6d8a9b67997010309fc695eda6e8dd42e5b6bab2256d1" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00710-of-01024.json.gz": { - "num_bytes": 318631334, - "checksum": "0b2c93cf298051864b8660e57182b38408ad738cf930afc09afdde26d952f819" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00711-of-01024.json.gz": { - "num_bytes": 320587866, - "checksum": "f1f6bb9770b76742d0131495879fa38ed8aebe8a0b38463e7834f0697f174ede" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00712-of-01024.json.gz": { - "num_bytes": 318191204, - "checksum": "b6873a7d375aa29ff39ca17c3bbc7e328292b1671b59a35e7b01c0e992da90f6" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00713-of-01024.json.gz": { - "num_bytes": 319472539, - "checksum": "3bb12a0a806ecb8a5eeaa00188c655f399460609b8a19005a7141bbcb3a7a694" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00714-of-01024.json.gz": { - "num_bytes": 320196397, - "checksum": "ca6e1fa6f27c9dbadbbaa767fd21dddee7c84ca96bbb6735640ba2631668ad0e" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00715-of-01024.json.gz": { - "num_bytes": 320075706, - "checksum": "1a773eec7d738c0e1e253bfd4533f0c43c0d133e564c3458159e0c47d767689c" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00716-of-01024.json.gz": { - "num_bytes": 318736413, - "checksum": "c17a6b2115e56cc3d6bbbd94e8565fb14287057f80199528e6cba20adf557bf7" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00717-of-01024.json.gz": { - "num_bytes": 317351537, - "checksum": "cdba391e16c3bcb5569d978a8d11518103e7687714710ef4eba4f7c0821d67d5" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00718-of-01024.json.gz": { - "num_bytes": 318017965, - "checksum": "a25c494e4baead0af0afe6eabaa054bc15f80b6ca0ac8dadb1b354d72ffbe63b" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00719-of-01024.json.gz": { - "num_bytes": 318124432, - "checksum": "94f5dfbec85a8c5b22ff1368a16ec2eb7fb4be25c0c8f004096156ae40bfa2bd" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00720-of-01024.json.gz": { - "num_bytes": 318235852, - "checksum": "c0248326e698599dcad01eca25d747c138881c61b5636ba765b21f9cd0df996a" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00721-of-01024.json.gz": { - "num_bytes": 318817834, - "checksum": "c11df487a966e748cec522fae4ed76abf3e8cc9bcd28c301117fa52ddb83dc6d" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00722-of-01024.json.gz": { - "num_bytes": 318553851, - "checksum": "63d3d0c3f5dcdff29a0a6ef41e3a9df3fb505c73c8554839e3032293a78bae2e" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00723-of-01024.json.gz": { - "num_bytes": 320174720, - "checksum": "29c97bb8ff301080547255af29bb5019a2c1fbc74f0a2711e626461d5a5f0b54" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00724-of-01024.json.gz": { - "num_bytes": 317805413, - "checksum": "65f8932f3c77b0fee5f2224643a71ff95246720368fe66d45c22df25ea4b9c2d" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00725-of-01024.json.gz": { - "num_bytes": 319460597, - "checksum": "dc785a8aa3a1f4ed77512d51a9139dfb24b356b5499ae67dd5b860101b1e0e4b" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00726-of-01024.json.gz": { - "num_bytes": 320934004, - "checksum": "45d857536d3535d08cddb6cf50d08d89cc28138a5be082465c3a8c27c02ae2bd" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00727-of-01024.json.gz": { - "num_bytes": 318393879, - "checksum": "e4a02e43eeabbecb81b971f4201212104b6214078cafd9500d5b5f323595f060" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00728-of-01024.json.gz": { - "num_bytes": 318826577, - "checksum": "cfaa0d0c8dfb333899c73e0c2aa00dfdadd00e5b4a3d477e7518c4141899c8a7" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00729-of-01024.json.gz": { - "num_bytes": 320390067, - "checksum": "528fe99b0c8dc917ac0f02a555603f9ae81e690b4ce1040f65ebbad3390c0426" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00730-of-01024.json.gz": { - "num_bytes": 318156386, - "checksum": "786e6913b4417a87cd4cb1882e181d8b2e1eb4b4db5b4b9ad2120b5efdf3e2ba" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00731-of-01024.json.gz": { - "num_bytes": 320013543, - "checksum": "f28fc2794c280fc1de263b9b2a81e42423f8dac3af7c4fbd3b3aff888821ca9f" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00732-of-01024.json.gz": { - "num_bytes": 318753697, - "checksum": "69491eb25dbaef78235f769422e773de7a2578e678ecde29dcaa663f4ebfa78d" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00733-of-01024.json.gz": { - "num_bytes": 318640706, - "checksum": "dfde8960d738b873bcb75abe1661fcaa096d70c76aef21846b173b8adf049bbc" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00734-of-01024.json.gz": { - "num_bytes": 319447398, - "checksum": "145add76dcd73916b548e7e3b161757c1bdc1f22a0f127019f24827afd6f85e2" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00735-of-01024.json.gz": { - "num_bytes": 319868149, - "checksum": "dcd4ba95672630f89e75b70dc08cb918bbe896f5d32ffeba7d3e4921b27c1f4d" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00736-of-01024.json.gz": { - "num_bytes": 318404586, - "checksum": "4710b1569342b7aa7ca610d8b8cbb2248a1c5fcd8c6ab3b7f875657dff4779cd" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00737-of-01024.json.gz": { - "num_bytes": 319915151, - "checksum": "7091dc758fd14c206514663eed0ae446178ff38e76c4cb7e711c63d419506e49" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00738-of-01024.json.gz": { - "num_bytes": 319709793, - "checksum": "afe1a96ced49662b14bc60b4ff8fc1f610bbc6f3c515bb73f2fade7a0ba67678" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00739-of-01024.json.gz": { - "num_bytes": 319789716, - "checksum": "9e2332cfc994483d4b913c6556ca9c1698b95e81033b7bbc5a4f5271e5cce708" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00740-of-01024.json.gz": { - "num_bytes": 319102226, - "checksum": "61ddcc3af919b753638dd46f18f790d7783cdc3090dfddbbeb40faa93bed340e" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00741-of-01024.json.gz": { - "num_bytes": 318717589, - "checksum": "aa3038c23a37561f2ba92e95ffeaa3e3641c1a69f8688b724116edd128e9ba52" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00742-of-01024.json.gz": { - "num_bytes": 319456536, - "checksum": "ea9d23abfed6e3e8ab900291a3bc1faa27751ff94e35378f8c4eb07207036a9c" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00743-of-01024.json.gz": { - "num_bytes": 318641730, - "checksum": "6efcec6cd087be4eaa98491e463d0fb9c1253aca275971de08c56a20be9aa579" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00744-of-01024.json.gz": { - "num_bytes": 320264992, - "checksum": "71653351253c8f7fa18673a3f956bddebd158978708c5a4c9e9b5318f598e1f4" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00745-of-01024.json.gz": { - "num_bytes": 318665967, - "checksum": "347dfd824d6f4afe58c6f418ab5d332909038c880f4dcda7f774d3d7a588c3f3" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00746-of-01024.json.gz": { - "num_bytes": 320005833, - "checksum": "812bc3c082e3a65c8c77fc7767bb435f9be9a999961d84eadc9e0c602e5ce168" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00747-of-01024.json.gz": { - "num_bytes": 318575441, - "checksum": "a4414d376c69ae8dd5e60b206315cf920d5a797c6ef7c08fe0c4b4e28b4eb4ef" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00748-of-01024.json.gz": { - "num_bytes": 319266882, - "checksum": "f08aee694b85d5e7120652350bfafaa05495e609aa6d2fb0b913ed8a718d7dcf" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00749-of-01024.json.gz": { - "num_bytes": 320205042, - "checksum": "b3402b16a5cc817d89a19fd3456a50b5b6d5f3f555eea725167558cc85366d12" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00750-of-01024.json.gz": { - "num_bytes": 319198252, - "checksum": "6b95232f6d53cff8045bd5ebaa87d6e6c511a74dc646d2a960eb87e801ff4f2a" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00751-of-01024.json.gz": { - "num_bytes": 317855407, - "checksum": "badc9d82efdbc8db5dc328e8aa5e80155c52f00b105b136d8c5c948fe237d61d" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00752-of-01024.json.gz": { - "num_bytes": 320283992, - "checksum": "67c32eb497533d6fd20b206c38483d171275029ff525bba3da13b0c62e1ef073" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00753-of-01024.json.gz": { - "num_bytes": 321030653, - "checksum": "5e95b1cb54d7d7f12bec1559ababcab0c364a0af99e10a42a08357647ef5d3cc" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00754-of-01024.json.gz": { - "num_bytes": 319059779, - "checksum": "32cb59ad16dfda8a5b52615498fe2e6d85753fa44ab667af2f525a2467508da5" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00755-of-01024.json.gz": { - "num_bytes": 317737268, - "checksum": "0ad2fef2fe37d59b163e29c2287938a768ee87acc34752394809295d0710c602" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00756-of-01024.json.gz": { - "num_bytes": 317293218, - "checksum": "db737ceace329fb1f8fe1aca38db048a1dedcb5226a4132485f26afecdc6c3c8" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00757-of-01024.json.gz": { - "num_bytes": 319529375, - "checksum": "8b823e97964894189a13df393e1b3978342fb24bd81f07af6e54b7bfa2992796" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00758-of-01024.json.gz": { - "num_bytes": 319297548, - "checksum": "3f31d7ad99d88dde757a651b12db909a30cfcae5796fe3f85722598d92344ba5" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00759-of-01024.json.gz": { - "num_bytes": 318154496, - "checksum": "a4b780127d6f22aed49d155e234e21a847a60626143a8e7dc6e31a5f204e79f8" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00760-of-01024.json.gz": { - "num_bytes": 319386997, - "checksum": "020e68dc60004d0661de8a22fe2b9fa7f481fcecaef8fb06efa43093a2a9cc52" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00761-of-01024.json.gz": { - "num_bytes": 320035555, - "checksum": "8d7b5a97770a062276ca909a3bd20365cbaf3931fcbeb8b7e479f5ee03b47053" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00762-of-01024.json.gz": { - "num_bytes": 318099583, - "checksum": "b8fcbbf9b55cde2ff66ca046884870e1e5f2d2a729a8eedb253c16fe0d7658e0" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00763-of-01024.json.gz": { - "num_bytes": 318354409, - "checksum": "ce2d9e44161b13f6226cfb9f93ad42fa0edd18eeaee923c8ab31c25aec1fc976" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00764-of-01024.json.gz": { - "num_bytes": 319181291, - "checksum": "53ed1ef77f24bdd7c189aae0905d63be97f48aa3233fda139e59af53baab242a" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00765-of-01024.json.gz": { - "num_bytes": 318147738, - "checksum": "26b9b9ea2f94b322c03d1b83b25ab4e9a1a203fe9923728c5dd91f22d5f8fef5" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00766-of-01024.json.gz": { - "num_bytes": 317964368, - "checksum": "e59fec52abde3fb4cea58a5a4e511f4cc61e21062bfdd1e3ffd60131a847e0ea" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00767-of-01024.json.gz": { - "num_bytes": 318750919, - "checksum": "0e5eff983e793a3d7cdd1ec85a45d58e5e6ecf7a12cf83a01888e148ab08acf9" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00768-of-01024.json.gz": { - "num_bytes": 318978892, - "checksum": "171509b0bed8854b6de92fe146993be80ab31e0aa56953c7b0a66eeb738ff70a" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00769-of-01024.json.gz": { - "num_bytes": 319386097, - "checksum": "704e7daa85c0e3ac974d51a6e2cf6df2ee053613fd2b77b5fe16d10b29a50a4c" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00770-of-01024.json.gz": { - "num_bytes": 319623528, - "checksum": "e787064473427fe17ba95d9326d009e9723148fb314a7a9605dcb6698854dad5" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00771-of-01024.json.gz": { - "num_bytes": 318911381, - "checksum": "c54aaffd8162b30280e974e81e9d0669357b74394e0da2d1ca2ce613f5715e4a" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00772-of-01024.json.gz": { - "num_bytes": 319386949, - "checksum": "2f9c83681632482df6c65e4c70718c83f500305ee1d061626cdef35bd794a412" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00773-of-01024.json.gz": { - "num_bytes": 319962599, - "checksum": "f47c487ba09051c9a4bf320d69db9546e98948e3de68050ae2ba025c71e09146" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00774-of-01024.json.gz": { - "num_bytes": 320370991, - "checksum": "69a1eacfdb6f6fd49ea2b729a7ab291b96fd5bd42f993e2306d044871b069aa7" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00775-of-01024.json.gz": { - "num_bytes": 320433220, - "checksum": "d35934fb537d1283d40897d05c1486f629776fe9e4ef127694ecfd0221f860c5" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00776-of-01024.json.gz": { - "num_bytes": 318809986, - "checksum": "9079970aa1618b6be51caeab7a2cab26e61c30aa53af361a6184ef6249bf65a1" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00777-of-01024.json.gz": { - "num_bytes": 319617796, - "checksum": "5e200e354ece1713a32a3e1ebcea33412de814dd5843df3523afa1ec9a4d5275" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00778-of-01024.json.gz": { - "num_bytes": 318039278, - "checksum": "b79309eb335c0c860c85d2b724df52c3613f61b92ab6cd6276c2be8c25a7b01e" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00779-of-01024.json.gz": { - "num_bytes": 319078058, - "checksum": "fc6053d53255e4d4a4c22c42049ce3eabc224320a51c94c1116f3201f87b377b" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00780-of-01024.json.gz": { - "num_bytes": 317637428, - "checksum": "e38c933003910b02beef64af2d330f32af6e6f3b7346fa121e89045c136c13af" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00781-of-01024.json.gz": { - "num_bytes": 318792407, - "checksum": "b6795b4db199f7a7a92ef195aee3753e5e00df05fad2d8401b2b9feb56d71a76" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00782-of-01024.json.gz": { - "num_bytes": 319081289, - "checksum": "dc20640bded03596eeec689f1293be55e72d138cf0c576df9768c7631931ceb9" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00783-of-01024.json.gz": { - "num_bytes": 318663257, - "checksum": "ac2b4ee9ab8f25ec010a17358d2f3f1fb9d8d50c9f4b73357429277710e6564f" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00784-of-01024.json.gz": { - "num_bytes": 319687102, - "checksum": "fb93dee8a974f2ea204c240ed4c24e1b64f91ccb421070be305487e4e53ca083" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00785-of-01024.json.gz": { - "num_bytes": 318909034, - "checksum": "2f298b358cc619fa72097e3dbd9ac91e7dc3f7c5f9c4f2ff6881c988921d2a6c" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00786-of-01024.json.gz": { - "num_bytes": 319213094, - "checksum": "60ebe35e0f23ccc61fc0eedc891ea9deb43001beb8205d31360a05b5d58e31f0" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00787-of-01024.json.gz": { - "num_bytes": 318335621, - "checksum": "a7b0aa4dafdda2f3dc3c1832b71d4a92af08f99a70a315b4cf9f60c1768bf2c8" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00788-of-01024.json.gz": { - "num_bytes": 319444037, - "checksum": "874dda510a01a2f78e51d917d309bcf1a0f21e7e1ca46661f93931a6200b3d01" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00789-of-01024.json.gz": { - "num_bytes": 317955670, - "checksum": "ec949a05ec7750dacfdf692c1ba118a33454097fdcaa56626fb042eb93933811" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00790-of-01024.json.gz": { - "num_bytes": 319033823, - "checksum": "0939164a602d7c7140c619130977b6814639122d0038aff7bb840093def5172d" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00791-of-01024.json.gz": { - "num_bytes": 319366402, - "checksum": "fd6ea942b3402b5da4acb1a03bf59b17df402e90c47dbb66fb198ca2f4b5e1cc" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00792-of-01024.json.gz": { - "num_bytes": 319218667, - "checksum": "9e8af5aaa6d5ed915eae334c6101948fbcc7bcf6c8c6beaf80fd1adecd67b078" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00793-of-01024.json.gz": { - "num_bytes": 318865241, - "checksum": "675330d6736a677760d854dcdd9a174eb7c1d426f94e34836a048c2139befac0" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00794-of-01024.json.gz": { - "num_bytes": 319384084, - "checksum": "fd4c2623d9cbaed3fefd6bb88c2d88b58fe8f08e9e8ef0cea6bb22cac68dabd2" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00795-of-01024.json.gz": { - "num_bytes": 317654308, - "checksum": "157533ddb56290662e25cb60842327daec23e377e116496338c9313cbf6991b3" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00796-of-01024.json.gz": { - "num_bytes": 319298258, - "checksum": "fd90f055499095efa9cb848dee62406d25820f929554b0e07674d4c95db574b3" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00797-of-01024.json.gz": { - "num_bytes": 320048871, - "checksum": "e089a95e96a081dd76e38acf9506bfc7b86c682892d3a8774e9784019db39306" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00798-of-01024.json.gz": { - "num_bytes": 319291246, - "checksum": "e29133ab6f83c84a69752a451053dfe20887ea884e09cc373afd89bba7458664" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00799-of-01024.json.gz": { - "num_bytes": 319175282, - "checksum": "8f3f3a67946615bdf499d64341d200477280947e5be8538748e28db768115947" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00800-of-01024.json.gz": { - "num_bytes": 316687275, - "checksum": "c9a17dc92658ce5d062af25e5c8610a7fbae501627cfc7324ace7ca6a8d75d8d" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00801-of-01024.json.gz": { - "num_bytes": 318710698, - "checksum": "4b7d1e130fd8ba536da073069221f68d567492b2bff27d8769fb4ef124cec3a1" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00802-of-01024.json.gz": { - "num_bytes": 318914381, - "checksum": "9f186b8d08f5d3090b7c9eb8a6954cf3202caec7cbf5c308221333cd115af561" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00803-of-01024.json.gz": { - "num_bytes": 319111424, - "checksum": "117b0590a976805001a879c49c42db55579e5bb9a5d4db9ce20e42746f59d574" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00804-of-01024.json.gz": { - "num_bytes": 318186018, - "checksum": "ea376d6cc1043dee9a00e1eca1c431aa59755d8966162701817f9cf274a758c2" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00805-of-01024.json.gz": { - "num_bytes": 320382848, - "checksum": "1e69e7896202206f9f804b2497c4d99cca5c1d139efc782b8ede2cb88f68b48b" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00806-of-01024.json.gz": { - "num_bytes": 319508172, - "checksum": "9da7e230c7abed9beaed9d6090efa8ae1029a418dbbf6d04bb4386aafde3dbce" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00807-of-01024.json.gz": { - "num_bytes": 319995091, - "checksum": "2e3ba0dbe85c004c6a23b4caf340282e0d0004ab574a14bedc9c83c67cc2c0c9" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00808-of-01024.json.gz": { - "num_bytes": 319880961, - "checksum": "f53fd08fea0f874d727422357521176c6810a54abf4fcc7019357b50f1928daa" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00809-of-01024.json.gz": { - "num_bytes": 317100774, - "checksum": "dbeed220f330b489cc262fbd7cbe84f04ba8a5118ebbd8f48bc7a4f5f63ae7b8" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00810-of-01024.json.gz": { - "num_bytes": 319625750, - "checksum": "fe5dced88ccd54b258c6740d8988e10b128a869ecf28e7096e689c59fa147d4b" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00811-of-01024.json.gz": { - "num_bytes": 318375975, - "checksum": "e4bcc5571fdc4f51b733d975e78ff02939d3463264a02d7e651271ab91c81df8" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00812-of-01024.json.gz": { - "num_bytes": 319663092, - "checksum": "b1e41c198bc69d026ab997fdeaa4e687f7a8ddfca751add9bc85f00481708a63" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00813-of-01024.json.gz": { - "num_bytes": 319094357, - "checksum": "c07287aedf6854f581aaf83b75c4939aa4b10181977d4c4be97c20989ab8f992" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00814-of-01024.json.gz": { - "num_bytes": 319521327, - "checksum": "c96203ba5461ef92a7a2b0d4e598efda943b5b3adf42a7268c26f1c224410c01" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00815-of-01024.json.gz": { - "num_bytes": 319098749, - "checksum": "72f2e65c5b482be0d9e3a3d8f5cdb703cec7a515e927bc4411e2f6ff5085ed5d" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00816-of-01024.json.gz": { - "num_bytes": 320377295, - "checksum": "df95ac17a25cebb854088cca345f60c2634d07f088e45e251d7f9afdb334c0c7" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00817-of-01024.json.gz": { - "num_bytes": 319007451, - "checksum": "bad1cc25de4f66ff36c69284e6b615f68bdc25e45f08e04e33ee463a0c6ef0b5" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00818-of-01024.json.gz": { - "num_bytes": 319609737, - "checksum": "acf1b390f1c492d97bf027f06898f1dd5cf8cc6def41f4d43b38a0c99f4a85e7" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00819-of-01024.json.gz": { - "num_bytes": 319164157, - "checksum": "3d973eb401876c57e9cd1420fc938da9dd7b08f97d4596c66a8c159e2b56b1b3" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00820-of-01024.json.gz": { - "num_bytes": 320181073, - "checksum": "101d5f0079caa840b934c14800ba5cbb7fca22e9e6915b98b4dc5f37c57f5b4d" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00821-of-01024.json.gz": { - "num_bytes": 320949305, - "checksum": "34ba423c93c4262234e6e2005aba0436daa99b05570cff0a58e9d27b65d76896" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00822-of-01024.json.gz": { - "num_bytes": 318392521, - "checksum": "4a586e220fe34f544dd068f4e1c310459cabd5dbea9a991c21c09f70079eb4c9" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00823-of-01024.json.gz": { - "num_bytes": 318526893, - "checksum": "3b10a8e32a3a8f6541400d697516fcd3fffba3554e8d8a96451f01fc6b729d8b" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00824-of-01024.json.gz": { - "num_bytes": 318640792, - "checksum": "c921270db8004d309f91e3209340c476191793d47b3cfa9d19fdc602d43dfe65" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00825-of-01024.json.gz": { - "num_bytes": 319524026, - "checksum": "a6eb347db464976ba5d1aaa4fa64e103ba36520dd1e9c103644caf187be471a5" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00826-of-01024.json.gz": { - "num_bytes": 318469810, - "checksum": "dc5f88e6161ac06165f3cd4cb91a00cdff75d2f900e8f53d62bacfd833e352b0" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00827-of-01024.json.gz": { - "num_bytes": 319391185, - "checksum": "66a240be851d6622adf7801d9634a456e83e9edfd135601c0dc1aab48902d7cf" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00828-of-01024.json.gz": { - "num_bytes": 319625277, - "checksum": "2e989beeeb2a63bfb87a5a401619a8e4155a961b44441cb5f627c29f25962dd4" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00829-of-01024.json.gz": { - "num_bytes": 320001237, - "checksum": "0653e4052fb7a4ef503bdfbbee332d650492e99c130a85c04250e18d91cfd30c" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00830-of-01024.json.gz": { - "num_bytes": 319240468, - "checksum": "bd56e55e75a8237b5292fa65e5ecb0dfbabef6ef0dec6695b13522803210f40c" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00831-of-01024.json.gz": { - "num_bytes": 319174603, - "checksum": "ca9d6c643127a390823655256a45462ee6e75aa2485141f6530a3bdf6ce4f572" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00832-of-01024.json.gz": { - "num_bytes": 318909883, - "checksum": "e91c35d94e183515e660cd8c874c12bbf22e1fd683312446f02287b0d032fb68" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00833-of-01024.json.gz": { - "num_bytes": 319095835, - "checksum": "971d9a4f8bfce564d42dc0a80009acfa7d2f47557ac19836ab426defe1877714" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00834-of-01024.json.gz": { - "num_bytes": 318319786, - "checksum": "159412a58fb8deb59e039fa0102bdb746065cbc6b4d1d3da892930fbf8b0f178" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00835-of-01024.json.gz": { - "num_bytes": 319959334, - "checksum": "814518d53b3023e3b8ac22dad9d65dd50d455a4c7db1490022f447f793f4d24f" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00836-of-01024.json.gz": { - "num_bytes": 317642779, - "checksum": "19ad4fbaa3ff5c638b77980300b8c162c21a8237b87d054a30c46aee67d0ad94" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00837-of-01024.json.gz": { - "num_bytes": 320687986, - "checksum": "190de7948a4b163047ecdfc856e5f78bbff52ca883edfad26b32fbc0b57ffe36" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00838-of-01024.json.gz": { - "num_bytes": 319802866, - "checksum": "ccb4d342791a187f3bde225e008ff8cf70465f7fd3eacaa8bbce1ec4e52c2622" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00839-of-01024.json.gz": { - "num_bytes": 318621894, - "checksum": "3ff5cf5b33996a663df5783f3f41a5b5b2f6e08a2cf91e74cad3bf82291192fa" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00840-of-01024.json.gz": { - "num_bytes": 319757379, - "checksum": "8292e0854c01ca79ef03dcc1752ddc1f0df747ad67551b7c0fa5208b6aa3f822" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00841-of-01024.json.gz": { - "num_bytes": 318779722, - "checksum": "9eee9e089bd396adf5a276eddca9f6352e07f8c33877f85c1f65968aa0c06128" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00842-of-01024.json.gz": { - "num_bytes": 318692591, - "checksum": "caf3f40a144b43af08687e41a1eb7d08da1b78cd1600574566e11f29fde9cd34" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00843-of-01024.json.gz": { - "num_bytes": 318944616, - "checksum": "e74d624534091173546755ca236e5912cc8acf8cfef5f9c197b541ebe76f0818" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00844-of-01024.json.gz": { - "num_bytes": 319392887, - "checksum": "e47d3f44f996398b54f18729f4e81d88d04b19bc529847e86277a6a91ae74e6c" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00845-of-01024.json.gz": { - "num_bytes": 319215311, - "checksum": "de7cffe64f422b02668137272943537946c15539954b564345d6722c4eb06345" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00846-of-01024.json.gz": { - "num_bytes": 318129297, - "checksum": "1d5ea0ab8fcb3975735aa421d646cea4544087f60a79ec209b63c93b6318523f" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00847-of-01024.json.gz": { - "num_bytes": 318134095, - "checksum": "6fa4c50808df2aa8efebae3bbf832ba2b0be2f7113633fef720cffb3c50143a0" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00848-of-01024.json.gz": { - "num_bytes": 318521356, - "checksum": "3aeb657aa448af82551c653802c669c985c00b7daa593de07f80733ae5dee84d" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00849-of-01024.json.gz": { - "num_bytes": 319541694, - "checksum": "1cc016f58a4a2c54625214f028df05247ed319b8c1868c96c2efe8147a73d08a" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00850-of-01024.json.gz": { - "num_bytes": 318861613, - "checksum": "eb5fbe6eeb4b0281604df264a5b04a3a0db96ff0d04f252375a788a0d3345c67" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00851-of-01024.json.gz": { - "num_bytes": 319356648, - "checksum": "ffe1397f1d412979cc66820555ef27345f3a2a48b8bcfe682d48301135e8c12a" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00852-of-01024.json.gz": { - "num_bytes": 319662372, - "checksum": "fa78ed98d602276520e823e17adc7f796320d95e27e08d84d06e66e415b79161" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00853-of-01024.json.gz": { - "num_bytes": 317625507, - "checksum": "b10cff62fac5191b9cb5e2025227adb838088773e79bfec0937a34bb857e1b1f" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00854-of-01024.json.gz": { - "num_bytes": 319665550, - "checksum": "15441b2a7c09a477389a8fbd7401c549dc8281f2bd44251b1546077301e24624" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00855-of-01024.json.gz": { - "num_bytes": 319059897, - "checksum": "f6127845b162181dd7157dd316021a4e6b5d41393c66d3e577491cdb74657f2e" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00856-of-01024.json.gz": { - "num_bytes": 319243991, - "checksum": "ec9f0884c5ddf82550105f969222d3ee8b0d4907a0a2540ea6c8c67c2d2e9179" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00857-of-01024.json.gz": { - "num_bytes": 318546680, - "checksum": "840205fa73336ff51d75008ce8c530164ebcef3b50f1ad8deab879a67acf8d5e" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00858-of-01024.json.gz": { - "num_bytes": 318306547, - "checksum": "e9b3819e9dc98d66a61f8f4e8f6ecb03099c79ae87a175fe1ae484174b173b44" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00859-of-01024.json.gz": { - "num_bytes": 319088302, - "checksum": "eced8de72f8755fa0dfb690c626cefcacf5fbbce97029d4589058913c31b9339" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00860-of-01024.json.gz": { - "num_bytes": 319704792, - "checksum": "90a169718609f16abe120c4b63a20adc0bbedba51de14b004d34dabe530339f0" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00861-of-01024.json.gz": { - "num_bytes": 318444445, - "checksum": "d020840f09fa426ee15d19f05e5afd9cf674048e0dc4438dae0b6f02c7227d9f" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00862-of-01024.json.gz": { - "num_bytes": 318606300, - "checksum": "e02bf9d3f1a398972f7d78b9b1aaff9a92146554a1358ea1b16ce7873a9f8fd8" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00863-of-01024.json.gz": { - "num_bytes": 319273730, - "checksum": "c977f143cbb5e61160ce76f1cabf7bea6c158abb7e159ec3362aad1cc7af0ade" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00864-of-01024.json.gz": { - "num_bytes": 318143165, - "checksum": "bdf20dbde61f0663feb70be419c39c60acdc7ecbbe1430d47bf79ae2e114f168" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00865-of-01024.json.gz": { - "num_bytes": 319041356, - "checksum": "11c9c068ec5c1b612494c1473b7cace67a55ee66155559b19035df180ee260a1" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00866-of-01024.json.gz": { - "num_bytes": 319758401, - "checksum": "ab4436f283af0ef2d33b93cf026907cf68255beee9d9dc1d6c542dee9c3f48a3" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00867-of-01024.json.gz": { - "num_bytes": 318991336, - "checksum": "56beb5edbca3b66981f5f8e65f2a13a0f6e99e68ff50cc263cc529a4d8ebf371" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00868-of-01024.json.gz": { - "num_bytes": 319984390, - "checksum": "b9368d2ae0eff869c70c1a1214126c1d084f56887102d3d46e450b2c934102be" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00869-of-01024.json.gz": { - "num_bytes": 319462888, - "checksum": "68ab404e0ca2247686eb264a0d7feeb9d2460162434f5babb2b1da82d865343e" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00870-of-01024.json.gz": { - "num_bytes": 318426018, - "checksum": "2d60208a558f6ba92d6c6307e1ab626acd7ff3b7bc25963b09e87e464751c42b" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00871-of-01024.json.gz": { - "num_bytes": 320233396, - "checksum": "ee2517922079c713605dafffe6bc0db0a947abf64ff92c409aa1015b92cdb099" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00872-of-01024.json.gz": { - "num_bytes": 319570251, - "checksum": "83ca4f125bd628cb28210fb874db717635009e36c60b42237bda48fcb611a53f" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00873-of-01024.json.gz": { - "num_bytes": 318755978, - "checksum": "d94ce49fd17da5f70d1a89bc9e5323daa54f0b8417e1ee5d991467c80c068ec7" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00874-of-01024.json.gz": { - "num_bytes": 318986904, - "checksum": "f634915d1b529d9d728fd96993bb151dc07016767cd44ceeedddec73eaf37074" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00875-of-01024.json.gz": { - "num_bytes": 319116193, - "checksum": "6367b1216e1c6ab18af66471d866f39caeb9a538209134a9e6bbbcb81bc51db7" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00876-of-01024.json.gz": { - "num_bytes": 320829257, - "checksum": "c9ad4ab8c6e5995aaacd72ebc6654b43b4756804bf3cea808610f9b618f98fac" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00877-of-01024.json.gz": { - "num_bytes": 320082625, - "checksum": "835ae7d54732c309bc9aff231268474af66653b06ad6ca17b54dab6f4a7d30c5" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00878-of-01024.json.gz": { - "num_bytes": 318964554, - "checksum": "49c761449d5052dd6c408268c77196bffc5125eb5189390f73ba0ce8550f0175" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00879-of-01024.json.gz": { - "num_bytes": 318699617, - "checksum": "521e1c5fa967a6f29641e7c4c2b210acda0736b32f318e24aef0e587895ed492" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00880-of-01024.json.gz": { - "num_bytes": 318723630, - "checksum": "dee1814b24f9bbc3aa3430cd80302b08b863eb1b92698158960b6be216845843" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00881-of-01024.json.gz": { - "num_bytes": 319839271, - "checksum": "9e57ea6a0e3d8a7798a0cb3e6344e1711e8fd879e2e396294718ff360fc7c4df" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00882-of-01024.json.gz": { - "num_bytes": 317773196, - "checksum": "2e5e5749618e53668222c7d310929e2177772dd7c14592e61dc86f163e353c8a" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00883-of-01024.json.gz": { - "num_bytes": 320262049, - "checksum": "f80afaa4495a2d41ad4d7380b79040569179b24ef5c2df17f75ce8e135d786b1" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00884-of-01024.json.gz": { - "num_bytes": 319146213, - "checksum": "77338479b420dab9316a4737fc243de84b5e88392cbbb46fa0619045a42432cc" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00885-of-01024.json.gz": { - "num_bytes": 319022605, - "checksum": "3a67fee2fb77e64aa13fd595d7786b432203f36712ff723ec5999a341834b38c" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00886-of-01024.json.gz": { - "num_bytes": 318624429, - "checksum": "2afe387f2500c57294acf1403a8c27f27f6c7c2d228dee0f1ed70a02c438f838" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00887-of-01024.json.gz": { - "num_bytes": 318733911, - "checksum": "3fe087b3441f74730ab137ba9486650cfedfe2d724573c3d166565d7d1e40938" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00888-of-01024.json.gz": { - "num_bytes": 319926754, - "checksum": "dd2df1977458cac34ef1e52059bbc28738e541761d7ad11c0ffc8ef3ca061190" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00889-of-01024.json.gz": { - "num_bytes": 319085344, - "checksum": "4172244cc3fc4a4e9e09f04f8097cbc678aebaedb9d1fb97b1daae16b0b8ef45" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00890-of-01024.json.gz": { - "num_bytes": 319838671, - "checksum": "8ffaf34eb8209e7ec250303298f9eebd2833fedcf80414c20331e8dbed42251c" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00891-of-01024.json.gz": { - "num_bytes": 318169092, - "checksum": "daaf74ba5d12a7415da94be0f4454336aa3d86ad5cd300dbe30cef596835ac8e" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00892-of-01024.json.gz": { - "num_bytes": 319662776, - "checksum": "6d99c0419a6c9633620fb0aa7b7610cc5d06696e839a1a52953fd7db7a18e053" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00893-of-01024.json.gz": { - "num_bytes": 319541919, - "checksum": "5f246aeacef0dc8d40a036bb1eeecf278f66d7215a134fb746d30f3420d18c18" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00894-of-01024.json.gz": { - "num_bytes": 319528897, - "checksum": "9975fd5d23d25938f00de3fc9240d77c27b4784c2f443b1914652a06d3b59fcf" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00895-of-01024.json.gz": { - "num_bytes": 317548307, - "checksum": "7af9e2abfaebd4afe05a0e28d3e6e3126800a8b9b7ad49de360e42f2eb2c8506" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00896-of-01024.json.gz": { - "num_bytes": 320278601, - "checksum": "1941689d6a0e449423faad6e41714f33d5b23cdb1bb73961a888a87678fc74b0" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00897-of-01024.json.gz": { - "num_bytes": 320161831, - "checksum": "3d951cb1ae4a9b3c6ff70555139435febda83d24bb04ea27b229a05424b470c2" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00898-of-01024.json.gz": { - "num_bytes": 319341305, - "checksum": "3227b97aa9ff57b62be2a26fd8131e9ea45f7731673acb43432e529ea4978a25" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00899-of-01024.json.gz": { - "num_bytes": 319658969, - "checksum": "c746f8bd5fffac933640ff39db0b9d7b022edb28d7a4b3237d8c69fd919b7b48" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00900-of-01024.json.gz": { - "num_bytes": 317494627, - "checksum": "0327f0c57a668b2b34e72f4c53d4cfaeed787d879843d0bba27b5be58d1ee5fe" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00901-of-01024.json.gz": { - "num_bytes": 319683481, - "checksum": "886449092779ee26fccd11e0c89c36e449346dc6b1f0a7cb15b6b53c897790a3" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00902-of-01024.json.gz": { - "num_bytes": 320228529, - "checksum": "6960d8539df78e98858ba8cebb2e637b6c2ef20890b5f2af1cbf4621b52c364e" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00903-of-01024.json.gz": { - "num_bytes": 318961279, - "checksum": "4ddb3c9e9276d220f1d4dfc32bb61a090e895e9e3c9f53c169db99a024e7cd95" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00904-of-01024.json.gz": { - "num_bytes": 319926290, - "checksum": "69a941cbbcb673efdb254c162854fcfff6fe1132182210235b91d1d21ed4d2ed" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00905-of-01024.json.gz": { - "num_bytes": 317982280, - "checksum": "1d9613f366b91102d018e57894df520aaf1910aa98e06cf369d9676e498610c5" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00906-of-01024.json.gz": { - "num_bytes": 319012210, - "checksum": "4855989c814582f5cc0a5e9b8f9d1f642ae33de81625d4bbafaafb709c1cd260" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00907-of-01024.json.gz": { - "num_bytes": 318515420, - "checksum": "8f34dbaa454215922a29fea975357e4e705381a65e4dcaf8b0d8c200f9a277bd" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00908-of-01024.json.gz": { - "num_bytes": 319286320, - "checksum": "536bf0610a2c14d1d59aea0b52fdc29cec19cd7eaa4c3a5e5fec04dee103b29e" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00909-of-01024.json.gz": { - "num_bytes": 319938295, - "checksum": "3bb3943183f579c15d0d30440f6c82d0c9c64d6ded398dfc7c67502d73868781" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00910-of-01024.json.gz": { - "num_bytes": 318423425, - "checksum": "adbdcf170531c725b54c1e5713676b789589b2fb77310f3e64a0cc30b83602ee" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00911-of-01024.json.gz": { - "num_bytes": 319578185, - "checksum": "a1342a95ce77013820c36e7d038ed47ca4d40cdf3584a66abc310132435b25fd" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00912-of-01024.json.gz": { - "num_bytes": 319154715, - "checksum": "4973afcb1d7b4816e3a3df1b9ce1e48a0eea4fe8ead5f83ea753e46a934e5ddc" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00913-of-01024.json.gz": { - "num_bytes": 319011218, - "checksum": "c9a158f69a123859569e1cdd475355afda32d7e5c48001591f0b6c20dc17d572" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00914-of-01024.json.gz": { - "num_bytes": 320027387, - "checksum": "61f6c0f839908e7d3105a6926c501bcacd293d1ba50c3b8639ee227c9a8270b1" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00915-of-01024.json.gz": { - "num_bytes": 320280632, - "checksum": "a74fb91d8f7d79b09017a7f996b6ca5d59e4ecad9fec354ac977c0076d53fc66" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00916-of-01024.json.gz": { - "num_bytes": 319278877, - "checksum": "cbbb8dc274fabb4435db5fef5da1d91671e1a4c7f3f652742324f9632b01c5dd" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00917-of-01024.json.gz": { - "num_bytes": 319616831, - "checksum": "31e62cbd6209fb7831078e4a262d1b25c0590f9425c62b2b208d4030ed5722d4" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00918-of-01024.json.gz": { - "num_bytes": 318635363, - "checksum": "95e5c2f51abc9ef4c0422e91b77f79ff83c8cc38e585df621fbc0dfef48a84c7" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00919-of-01024.json.gz": { - "num_bytes": 318885096, - "checksum": "ea5960d4fbc7d5e7097edbf2c9c706e6b7c7e9d3e36633be9bd68c4038955f10" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00920-of-01024.json.gz": { - "num_bytes": 319228627, - "checksum": "73b721ae576dcfa83bd963e49530f73d76b788a669e3abc1c02189900c80cf02" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00921-of-01024.json.gz": { - "num_bytes": 319557114, - "checksum": "710c65cd504e87b5019c01f658e669d1e023473d879913a9522760d33546cf24" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00922-of-01024.json.gz": { - "num_bytes": 319356053, - "checksum": "f0b54b3c6b51a356debc9414df0438ee525ae5114cbb7c8176634b7493095022" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00923-of-01024.json.gz": { - "num_bytes": 319766600, - "checksum": "d5b80091c8113c283d91ff5826b46068b96c423c0dc74a646e2c8d1c5d815cea" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00924-of-01024.json.gz": { - "num_bytes": 319733540, - "checksum": "56a54c7d4114c21c1657df0d295839c2bd4904cd1b651104e2a155c2bf1b5aca" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00925-of-01024.json.gz": { - "num_bytes": 318944357, - "checksum": "4d396c29cd1d9ba16016fac37c333c0a872f6cb0e9faae7966e53f6e5c879d67" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00926-of-01024.json.gz": { - "num_bytes": 320276135, - "checksum": "39a64c261a76d5e13f187f12c886b22e2db08fba968bc9d0c1cb0d3c241abda7" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00927-of-01024.json.gz": { - "num_bytes": 319181837, - "checksum": "86db529dd52fb67173588fcbc9f0e52c99ad6dd34e44865150bc6c962de5b3c1" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00928-of-01024.json.gz": { - "num_bytes": 318966114, - "checksum": "d232df8033ddaa7397dbcfa8ba4ded9421ee9bfc091c725b311fd963b29f13eb" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00929-of-01024.json.gz": { - "num_bytes": 320087917, - "checksum": "fca6bfe8fe17c867681c58df081f2186dcc6bf22e46ce3783f85b918644c0b6a" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00930-of-01024.json.gz": { - "num_bytes": 318921677, - "checksum": "b8031359e758cd835c44e81303e04ef7b2137d2e1a9472d7e04552c353d883c7" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00931-of-01024.json.gz": { - "num_bytes": 318978028, - "checksum": "bb5f2ea8a2e56c69813bdc08cb243c0763126e7b5f6c5cb57e7f4767d2126f89" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00932-of-01024.json.gz": { - "num_bytes": 318627424, - "checksum": "f6fd2065ce202d5347243a2b396707bb606be20c1829989bd7dff6d9fb7adec9" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00933-of-01024.json.gz": { - "num_bytes": 320226802, - "checksum": "b303d2ece81c1f7b882703b915765212796518010aea6a108a441dd0a84a6128" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00934-of-01024.json.gz": { - "num_bytes": 319908526, - "checksum": "e5b05714922d132073122e83933853f52f0046c9f51f985cfbdbd310e8d677de" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00935-of-01024.json.gz": { - "num_bytes": 318941663, - "checksum": "4296055a31409a778c516afe25a8108f23dfffaf13cac33e5ed834a37c46b37c" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00936-of-01024.json.gz": { - "num_bytes": 318430860, - "checksum": "4634630c012ed184b264ea01c97f7bb3f1af030f2466f1d99d20bb0472f74511" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00937-of-01024.json.gz": { - "num_bytes": 318008229, - "checksum": "131cc9a2fef4ebe81749f1844b7c4b194b97de7db4f5253ce59207e68d8b4df8" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00938-of-01024.json.gz": { - "num_bytes": 319099506, - "checksum": "fff55e3b2ff8b53e56ab99def626a7334ce67d2414351b2e83d84298052dd9b6" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00939-of-01024.json.gz": { - "num_bytes": 320457851, - "checksum": "8431e38c86516ed88d5c028f4a1dad32b02bcccdc03f9687d18f8312e493bcb7" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00940-of-01024.json.gz": { - "num_bytes": 320607829, - "checksum": "a68c577555781adc777c09c68f623431469d67e9b66af7b0813f09a512b7d777" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00941-of-01024.json.gz": { - "num_bytes": 318923471, - "checksum": "807ffde4034b6b95a5eacb71f093686586ca11e417517894cca99dfe7b12563d" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00942-of-01024.json.gz": { - "num_bytes": 319880902, - "checksum": "d03d04f619a8f3afbefa6d67986f50d5ee264c45de36c0ba67b069e343e002ad" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00943-of-01024.json.gz": { - "num_bytes": 319079341, - "checksum": "e482c4dee03a34a1a5756e6def26134c9a3f18ee386f5569d6cbf16d3875a429" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00944-of-01024.json.gz": { - "num_bytes": 319436318, - "checksum": "6241f9f35640598c05bc5cd00d8cc024dde59c0065c8935da229a8a583de32fd" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00945-of-01024.json.gz": { - "num_bytes": 318998098, - "checksum": "85f192c1ee9734da0f1dcad31c2b8111076977582e139ecc1ba959bf2df6b262" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00946-of-01024.json.gz": { - "num_bytes": 321951470, - "checksum": "44bccedf6a8db115bb6563d6775ff03c67511ce4e23a2de77e79edcb568c9fa1" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00947-of-01024.json.gz": { - "num_bytes": 318689631, - "checksum": "36f0bfa191ad7d51452d51249c724150f8c3774142df3720f176f2772f42f3fc" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00948-of-01024.json.gz": { - "num_bytes": 320347661, - "checksum": "f4a7afa90b6d81a4cdc99100b75b4d3174c4d5d670042766c3e0418b7a97ef80" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00949-of-01024.json.gz": { - "num_bytes": 318054841, - "checksum": "f39d0c9bfc0a562ede67b8cfc57e6974a8a999e2bbc1b6940f107169b4f06e4a" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00950-of-01024.json.gz": { - "num_bytes": 319722042, - "checksum": "bf376260e5a838b3b901ceb22f922829619be710718446ee95c24400cbc73495" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00951-of-01024.json.gz": { - "num_bytes": 318315382, - "checksum": "987cd895f63bb74c9d4ce229ee853c7bce53c75c324366a0d06377c36030e39f" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00952-of-01024.json.gz": { - "num_bytes": 319247792, - "checksum": "d218dda02748a22821c2ecccf1cbb136dc8772a25ddfacc7ab354fc089470e87" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00953-of-01024.json.gz": { - "num_bytes": 318411551, - "checksum": "698768f3d7959b33fa74a3827e995b0c184bb3b4c46eba667d7dc3365fdd07f3" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00954-of-01024.json.gz": { - "num_bytes": 318809810, - "checksum": "651d9ff43d5a3f7f5945ccf26b9410018248bf64956f3485c50b0df9034fb2ee" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00955-of-01024.json.gz": { - "num_bytes": 319761211, - "checksum": "29fa5c68fb8d3719e5f5f17568ce888522de64499554b5f0f4dafafb4ee5b40b" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00956-of-01024.json.gz": { - "num_bytes": 319255736, - "checksum": "333a90a9c13f71e41a7cdd4784684bc142c79ef99155b9d62d062db318798b93" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00957-of-01024.json.gz": { - "num_bytes": 319504417, - "checksum": "730c90615fca09c81d9644cfae40d325851bb9bbc1af696caaadd67d8282ab5b" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00958-of-01024.json.gz": { - "num_bytes": 319066016, - "checksum": "bb565af6529720ba2a3e989769b33d978ef49cb2aae49c60f2ff98a981414280" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00959-of-01024.json.gz": { - "num_bytes": 319887940, - "checksum": "8992783693dd0ad5ce07427f6b5739c818f13952d90bb61312ec98f9c813f313" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00960-of-01024.json.gz": { - "num_bytes": 318051437, - "checksum": "4773edbc822ff8d51ec13af6c371214aea7545047d9babeeac0b29180d52fa0b" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00961-of-01024.json.gz": { - "num_bytes": 318373291, - "checksum": "ff33854746566f7d3b4ba9eadd1329ece48c034345fda000d9af73cb26d197af" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00962-of-01024.json.gz": { - "num_bytes": 318572513, - "checksum": "a6d07f7caf55fda0df74a22b454d196fb2e29312d433bc5506b00448c22b579c" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00963-of-01024.json.gz": { - "num_bytes": 319488084, - "checksum": "453f666c6578376508b1fe8bd3fb8ea5bf030aca5cfedf383cd23b27de15228f" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00964-of-01024.json.gz": { - "num_bytes": 318905670, - "checksum": "74f64ed6583e6a4df4b3c3f8a76263a2d63905d51d5680d9683d86f5039d5b56" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00965-of-01024.json.gz": { - "num_bytes": 319452844, - "checksum": "88016c1a0663b89dc3d76689c827c82a6d128401ae05f7b70c8727d75302cd47" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00966-of-01024.json.gz": { - "num_bytes": 319334588, - "checksum": "dd9300bdc27513dd62578e1cf3c8302647b49c61185c282a684011d788c43d17" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00967-of-01024.json.gz": { - "num_bytes": 317872396, - "checksum": "90747ee63ac7d8176fde1f2afce8deb7e39bf19e682e17d0fcc1711d09d5f1d8" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00968-of-01024.json.gz": { - "num_bytes": 318988069, - "checksum": "2cc785d650013d35d5d31b1e85c5530b197687c69117881362bf6b98f47c22fa" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00969-of-01024.json.gz": { - "num_bytes": 318324244, - "checksum": "83750d93c788ad32a256862b8173db3549eedf52ac131f09f662f1fe0f46bd13" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00970-of-01024.json.gz": { - "num_bytes": 319494164, - "checksum": "e0e46e185851ec569dc13a18519988ad926bdcd9bf448eff00aebf6df141f5cf" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00971-of-01024.json.gz": { - "num_bytes": 318714665, - "checksum": "941c9bf116353230417950d292c38b12b00935184162227eaec01870ab7f4510" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00972-of-01024.json.gz": { - "num_bytes": 319518275, - "checksum": "de30e19a155a6f4303afb0311416aa84cc3baf5a09cef55b8e2adc2a4f478f6e" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00973-of-01024.json.gz": { - "num_bytes": 318092574, - "checksum": "f70bf6727f1f308d93684ca41e9c2c68dfbd737a90da6375b58f162e8470fdea" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00974-of-01024.json.gz": { - "num_bytes": 318555677, - "checksum": "109fe184ac9498ac571cd9c6cb38ae5ed566b0e98e8b7718984656a70cc6b224" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00975-of-01024.json.gz": { - "num_bytes": 319045215, - "checksum": "03c4257851857450f7397ac3d627a60ffc98708ad5aac6e1f73e6ce818fe7be8" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00976-of-01024.json.gz": { - "num_bytes": 319172031, - "checksum": "7d98fa662aa9d0ff7ed50cc72195bdda2147212b34a3d22f0f757a4eb158d5b7" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00977-of-01024.json.gz": { - "num_bytes": 318650530, - "checksum": "bb8ccc07ecc6fd39ae97136418efc543efe5541e85910a7f333ee5cebaa3b595" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00978-of-01024.json.gz": { - "num_bytes": 318609909, - "checksum": "40b49f3fbb2fce73bb1851304b290fc7fb400d13c2448ac7e5e559dccfda7ce5" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00979-of-01024.json.gz": { - "num_bytes": 318881197, - "checksum": "b29f96cfba574428cb66f54b20c4a848bc83438256167afdaed576a3931117a0" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00980-of-01024.json.gz": { - "num_bytes": 318506081, - "checksum": "a15996adaaf41e5615cb5c7fa2ef1b4e3003836542d0851d1c6907522f534fee" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00981-of-01024.json.gz": { - "num_bytes": 320000305, - "checksum": "38e282b433c4e3dcc9fc2b056f6ddbe4eb857c5137f7c51301d53ca259d6bdc2" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00982-of-01024.json.gz": { - "num_bytes": 319959158, - "checksum": "97d5e58088a87a15b71db975d5e09b69daf497b7dff3ef809e1b8292caa27905" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00983-of-01024.json.gz": { - "num_bytes": 318921242, - "checksum": "f062e04f89132576ac1969fdaa43db761a0ff7e4269a6f173d87fa011a4c289b" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00984-of-01024.json.gz": { - "num_bytes": 319577980, - "checksum": "e52a6c08d5243717f21120b4c3ebc8fcf77168928945adf68bc665392a6e8d11" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00985-of-01024.json.gz": { - "num_bytes": 319812101, - "checksum": "8b4f5645ae0e0b190af4ca5335c57735ae919d3c6402438af506c7907f1d1494" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00986-of-01024.json.gz": { - "num_bytes": 319582409, - "checksum": "3654109968d918aa4d8db17cb7057111c42894cfc7eee093df13036cfb3ac6fa" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00987-of-01024.json.gz": { - "num_bytes": 319957581, - "checksum": "4b9e6febb461940b993c50945a2ed06736c6786aa8f758565ff545814ebfddcd" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00988-of-01024.json.gz": { - "num_bytes": 320346479, - "checksum": "2891565dd75fd4354777b4f4f393983180584ee9c64b5d9b4557dbf26a3c4cfd" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00989-of-01024.json.gz": { - "num_bytes": 318546717, - "checksum": "929d0236c9fb77d638e0a18aa97b00004316bbb0ef3c4323e39f61aaf7c0af53" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00990-of-01024.json.gz": { - "num_bytes": 319606761, - "checksum": "6ebd2552ecdcce7b194d4f6d5b5e66ede9d65da4e4999ee8ec4705d847e473ac" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00991-of-01024.json.gz": { - "num_bytes": 319117521, - "checksum": "1b3496964d0a895b347529ddb7b712d211c9419317fb41cdd6e20bba43f39f05" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00992-of-01024.json.gz": { - "num_bytes": 317781551, - "checksum": "9f9cfb5f9152b9a60121b03c24d944129c1ee43e862112fe3896e2772fef99a2" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00993-of-01024.json.gz": { - "num_bytes": 319341839, - "checksum": "fb329b7470ae127efe1be4adc960b06eec4f55bbcbe1f3f0f0b794d70a8aca14" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00994-of-01024.json.gz": { - "num_bytes": 320357337, - "checksum": "bbe9a60c3c2b3b5b11a5d531d1d85f0a90ebe3dbc79189b3825e169ae302932f" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00995-of-01024.json.gz": { - "num_bytes": 317824612, - "checksum": "26643091ae3425b63036453ffca7ed82c85c24b6a24264197e6516b68a39a4c4" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00996-of-01024.json.gz": { - "num_bytes": 320453890, - "checksum": "db33809437e62bf1f086f40e4d66ad0133db7c7d406b2ce52ce5d9c9b0809961" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00997-of-01024.json.gz": { - "num_bytes": 319469732, - "checksum": "3447b74f09dc4d63dd04d6bbd4382147071504338e6ea428b37c3a5174877537" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00998-of-01024.json.gz": { - "num_bytes": 319562604, - "checksum": "270a1c19e6321541398836d3d982c2e396db99abf94317912714251d1f68e8ac" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00999-of-01024.json.gz": { - "num_bytes": 318895764, - "checksum": "d68f8f4d85d91679c20e972b2b1955d41a8f6601873bb311a2621f4b3f3152a2" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.01000-of-01024.json.gz": { - "num_bytes": 317697031, - "checksum": "68b47464ca3e97e9d3f4075b656f804c1bab667f231701db9cce1f0b0a921088" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.01001-of-01024.json.gz": { - "num_bytes": 318915840, - "checksum": "582216879b058ccd4d0ca2edccaa2db49b64459371f8798a1d9c66c06a0cf908" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.01002-of-01024.json.gz": { - "num_bytes": 317811256, - "checksum": "6864299a7d0174f92abc696dc293524291623891b86cd69132348fdf78760a4e" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.01003-of-01024.json.gz": { - "num_bytes": 318605529, - "checksum": "4ef35b7546266f99eae5f332cbe3e284801c5d7b39f840297d67e71c036edf62" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.01004-of-01024.json.gz": { - "num_bytes": 319379897, - "checksum": "040dfa80eaf8355370d8a50692bc3ad03a1d57272af340d70031a4398f37b9ee" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.01005-of-01024.json.gz": { - "num_bytes": 319515177, - "checksum": "012ac70ef2715181ec1fb578a2366d68e786d3a9ea41c59c08d7c494b89b429c" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.01006-of-01024.json.gz": { - "num_bytes": 320078217, - "checksum": "46030d85d8333ae224320fa54e487f3770de7de280cd0001344136b0bd87c431" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.01007-of-01024.json.gz": { - "num_bytes": 318526753, - "checksum": "dd432d865ef3dba4b5af30e42b11ace96900bd7b97af053ea892292e75bd142c" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.01008-of-01024.json.gz": { - "num_bytes": 319407137, - "checksum": "165cd3a688be6f9f5a4cedde198a9dda4f9d3dbc1d275d1e99411f3ee96a0d62" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.01009-of-01024.json.gz": { - "num_bytes": 319763066, - "checksum": "e44e86d497f8471e53531374b0e6ee61aac54996b6af64a4af0f5620673f9f7d" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.01010-of-01024.json.gz": { - "num_bytes": 318653930, - "checksum": "61115f16e718d3a2b66574cc17841aa5d02739762138abe3c9a7f325cf9f2e31" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.01011-of-01024.json.gz": { - "num_bytes": 320037079, - "checksum": "65e18df845f1e6cce1bb92a45f71274dca94d3f0ece1d556116085b5c0e6338f" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.01012-of-01024.json.gz": { - "num_bytes": 319753418, - "checksum": "cd5a8ee1bc7d9ad58e98aa6fe56d60501115592519a19efcf9fa370668c6327b" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.01013-of-01024.json.gz": { - "num_bytes": 318657671, - "checksum": "986ead2c1b37f4094aa6f7a7882824ff013e6393323d5290d7f3e9215589d07b" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.01014-of-01024.json.gz": { - "num_bytes": 318028602, - "checksum": "3c82c0611fb1fb0f635eaedd2bbe7cfc9d53d1ae967a9cbd0416def046e4b104" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.01015-of-01024.json.gz": { - "num_bytes": 319164504, - "checksum": "5eb5cf76022b12d8751a2fce5c4d4831066785a68edd7b3cd3dfc10017f91621" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.01016-of-01024.json.gz": { - "num_bytes": 318474894, - "checksum": "a99d827be814e27d948264d6ae55c6a032a664f3ff0ef6ae94bda90f7faf29bc" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.01017-of-01024.json.gz": { - "num_bytes": 319516762, - "checksum": "7eac25ebb9383a4592023634b852d88a128604c494972a8fd9e2b183fbb303a2" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.01018-of-01024.json.gz": { - "num_bytes": 319433935, - "checksum": "35adb751748043a36f22b412d3ea0e01166037cd96216f516abc547e9d2609ea" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.01019-of-01024.json.gz": { - "num_bytes": 320305440, - "checksum": "54c4d52564221e48dc5354cb51d447658707ab8edaa3d6d8fec5ec379a29d462" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.01020-of-01024.json.gz": { - "num_bytes": 317445661, - "checksum": "edf1c6ab9900d75b91738fc7e9e3db8cdde3f9ef2234ff249833b5cdb04c65a2" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.01021-of-01024.json.gz": { - "num_bytes": 318134525, - "checksum": "1c5e670ec9d815637e9bdbd75289c7ef7f3ecf384e32f403ae8a9fe2595cc983" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.01022-of-01024.json.gz": { - "num_bytes": 319809162, - "checksum": "9def881764ca614c88ceabb41032d3e145f06c843a7ceebd87dba6b93c974a6e" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.01023-of-01024.json.gz": { - "num_bytes": 318155801, - "checksum": "552a6a2be423c0ecbb767611074200c5b85c1cf76c8640c79e3be5e967b293b5" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-validation.00000-of-00008.json.gz": { - "num_bytes": 40471190, - "checksum": "1f25b6af12da84115301d4ee93ea5246c8fea5bb4a2008472794d95b917cc97f" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-validation.00001-of-00008.json.gz": { - "num_bytes": 40675053, - "checksum": "db4c23d7a336032de37dfe2f3ed39653c8afd94004d4e8d9c73c03222299292c" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-validation.00002-of-00008.json.gz": { - "num_bytes": 41175078, - "checksum": "4bf6b248b0f910dcde2cdf2118d6369d8208c8f9515ec29ab73e531f380b18e2" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-validation.00003-of-00008.json.gz": { - "num_bytes": 40728516, - "checksum": "082b72c1ec600502df2e4403df6884390c85627ffdf37a5b700397c9a1ac6b8e" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-validation.00004-of-00008.json.gz": { - "num_bytes": 40920200, - "checksum": "37c2ce46864db0b6f1fe89220ebf4ef811ea10485c8336f1712227bbbdb530e1" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-validation.00005-of-00008.json.gz": { - "num_bytes": 40921460, - "checksum": "00b164e59df49df5dc1df170db99bb0d9207a6329cb9272ed8b6ef7a55058359" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-validation.00006-of-00008.json.gz": { - "num_bytes": 40549809, - "checksum": "86896a9baffe0ab9df39a2901f0e515009989ca1fec9a42583d718ce16166b5a" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-validation.00007-of-00008.json.gz": { - "num_bytes": 40446172, - "checksum": "0bf87534c7050091c60466df50f174c3147d052ec7dc645da9574c902445beaf" - } - }, - "download_size": 327104523018, - "post_processing_size": null, - "dataset_size": 1658004128680, - "size_in_bytes": 1985108651698 - }, - "en.noblocklist": { - "description": "A colossal, cleaned version of Common Crawl's web crawl corpus.\n\nBased on Common Crawl dataset: \"https://commoncrawl.org\".\n\nThis is the processed version of Google's C4 dataset by AllenAI.\n\n", - "citation": "\n@article{2019t5,\n author = {Colin Raffel and Noam Shazeer and Adam Roberts and Katherine Lee and Sharan Narang and Michael Matena and Yanqi Zhou and Wei Li and Peter J. Liu},\n title = {Exploring the Limits of Transfer Learning with a Unified Text-to-Text Transformer},\n journal = {arXiv e-prints},\n year = {2019},\n archivePrefix = {arXiv},\n eprint = {1910.10683},\n}\n", - "homepage": "https://github.com/allenai/allennlp/discussions/5056", - "license": "", - "features": { - "text": { - "dtype": "string", - "id": null, - "_type": "Value" - }, - "timestamp": { - "dtype": "string", - "id": null, - "_type": "Value" - }, - "url": { - "dtype": "string", - "id": null, - "_type": "Value" - } - }, - "post_processed": null, - "supervised_keys": null, - "task_templates": null, - "builder_name": "c4", - "config_name": "en.noblocklist", - "version": { - "version_str": "0.0.0", - "description": null, - "major": 0, - "minor": 0, - "patch": 0 - }, - "splits": { - "train": { - "name": "train", - "num_bytes": 1029628201361, - "num_examples": 393391519, - "dataset_name": "c4" - }, - "validation": { - "name": "validation", - "num_bytes": 1025606012, - "num_examples": 393226, - "dataset_name": "c4" - } - }, - "download_checksums": { - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00000-of-01024.json.gz": { - "num_bytes": 396728190, - "checksum": "06fcf4d9bf6ae45fac94245952f000c924d2a0b5cc8841c916b3ee949333410d" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00001-of-01024.json.gz": { - "num_bytes": 395686133, - "checksum": "8a0b64c5efb1db1ebcc0a664c801221049f5812652dc1a727a0e9f8d0df0cd0e" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00002-of-01024.json.gz": { - "num_bytes": 397762165, - "checksum": "087fabf9563297a6eab8bc39b68c0c6d15169032001d3a17c9bd964080759f2c" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00003-of-01024.json.gz": { - "num_bytes": 395307518, - "checksum": "1e5b89200528320e354f60be0868a3ab6dbbe667a6b16b48e4739b988a6360e8" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00004-of-01024.json.gz": { - "num_bytes": 396280504, - "checksum": "8291badbe84854960c0ddac3d6c226cb519268d1b3fd267bd72cfb4f10800de1" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00005-of-01024.json.gz": { - "num_bytes": 396636600, - "checksum": "c74226ceada7d78e3e7a2ad931d0a99df93f4cc4377ec69d4f1fab4164c3d845" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00006-of-01024.json.gz": { - "num_bytes": 395364336, - "checksum": "4e52e99dfc4e55c41226978b4dbf48fac2f886b9b0446bc3bd576f32bdd7cfea" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00007-of-01024.json.gz": { - "num_bytes": 396428805, - "checksum": "283ae93ecc3f8daefa9c47651ded763dc5f339ddc619c8cb5e32dce9cb9cfe4c" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00008-of-01024.json.gz": { - "num_bytes": 395030041, - "checksum": "d3fc7fffdf9c2172d233bea3bb7dc485d753319e6196672d0186b8ba04a1d903" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00009-of-01024.json.gz": { - "num_bytes": 398255693, - "checksum": "61e10cef5c2cab162fb1d26f97fd9d76b30c9ee989c01ef8597d2a4e35b303da" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00010-of-01024.json.gz": { - "num_bytes": 397825333, - "checksum": "f72040887c2a2c17564c2c6a9a4b5ff95fce6a0eed4f0800cdeff8277af651ff" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00011-of-01024.json.gz": { - "num_bytes": 397877458, - "checksum": "ee34ff11164e10a86f76593205cb13986c70ea3d3a8849174a6dfb5b4ec91262" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00012-of-01024.json.gz": { - "num_bytes": 398317059, - "checksum": "7a3ef558efaca3e5d19e9ad02b47dd61f9639dd806130b62d66e9c3341c0edce" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00013-of-01024.json.gz": { - "num_bytes": 398518794, - "checksum": "f5a6c18992ab2b59a9c02469d20768bf5757624e03bcaf92957ce736a3a9edb5" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00014-of-01024.json.gz": { - "num_bytes": 397026214, - "checksum": "c174b625c1534c69814f8e4879169b58af96f801dbb433113740af0d78535abd" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00015-of-01024.json.gz": { - "num_bytes": 395621683, - "checksum": "4e8e52a602d4eb4b27104780f4a36617505505fb66a82f36e90631a4e668f5b9" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00016-of-01024.json.gz": { - "num_bytes": 398138551, - "checksum": "a3e7a95b16f09e09e45f1c3bed3524415581e21b065d8efcc66cece705dee4d2" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00017-of-01024.json.gz": { - "num_bytes": 398720813, - "checksum": "79cdb89052e8dcecd1f1319e47f4c4ae1d350ab81777a9ba8077cebdb558e795" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00018-of-01024.json.gz": { - "num_bytes": 398538940, - "checksum": "8da6aac3a794ce326b5a3971fb75a2ee848f008940d4f1bedd724ce7c5874278" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00019-of-01024.json.gz": { - "num_bytes": 396834319, - "checksum": "b57c93502949dad9001e89847947f6c65943927eb519e16de4eaf5590b235faa" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00020-of-01024.json.gz": { - "num_bytes": 396402861, - "checksum": "05e14c7e21df3d4af7be7a597fa22463868464d6475282376536e12e82367401" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00021-of-01024.json.gz": { - "num_bytes": 397560852, - "checksum": "756d15d8b07414dffd7cff3efde606aa62cf8f73b85d8e1cd17408d6a339414b" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00022-of-01024.json.gz": { - "num_bytes": 397210987, - "checksum": "60aa08d9c5d813d5f2448d910bc23a705cdd0828a9403c18ec223e53623889cb" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00023-of-01024.json.gz": { - "num_bytes": 397563062, - "checksum": "bd865213ffb2b40c2cd3eb16724b68c0f37e29f68215990dc84d91852c7c0d72" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00024-of-01024.json.gz": { - "num_bytes": 395799120, - "checksum": "08ff3615ecea3eb5b55703e123475c95afbecfe7107eedf05750147c9ffd12ef" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00025-of-01024.json.gz": { - "num_bytes": 398336372, - "checksum": "e3e30b97e585fd881b3a1b006775854a11a2b967d992e7eea886338d8beefb13" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00026-of-01024.json.gz": { - "num_bytes": 396819084, - "checksum": "fddc9e1a8405c5e05e63ce98b19c7833c0fd46392b4b55532b317e7f81426590" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00027-of-01024.json.gz": { - "num_bytes": 397912380, - "checksum": "d3e597b3a96b993840e47adb761cce2f2ae1c96aefcbd6c250198dedaecde15a" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00028-of-01024.json.gz": { - "num_bytes": 399078461, - "checksum": "abd6d2341b6c61cdb89b80a8b9bfd938bb6d8a423a89e6a9f997c22c6479d537" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00029-of-01024.json.gz": { - "num_bytes": 397303107, - "checksum": "ee35a3af1056cdab79b644f6352150aeb6fb19a630cd6bc893a072e35fbfbad2" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00030-of-01024.json.gz": { - "num_bytes": 396602401, - "checksum": "1d04d4bc295aee2ab80b24f587f8c483599db7d5a8157acc99a1d8b001f8353e" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00031-of-01024.json.gz": { - "num_bytes": 395941329, - "checksum": "cf1dd244555511245c0e6a5b1dc9c24f747b8377674aa3690677ce08ebb8c26f" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00032-of-01024.json.gz": { - "num_bytes": 398049663, - "checksum": "c83e5572647eba5ab14fdc4dcba8efb6981740b99b8f634e2c6b1942a051c249" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00033-of-01024.json.gz": { - "num_bytes": 398044404, - "checksum": "b76815aadcf4ad802071428864ce0b406cabd73dfc2be5e20b44885ec6a85419" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00034-of-01024.json.gz": { - "num_bytes": 396885224, - "checksum": "da00d92418fbdb9799d8f16977b3a33f67cb98a31808544cb68cf3b42ea9adf1" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00035-of-01024.json.gz": { - "num_bytes": 396185021, - "checksum": "265ad43ce00666c83fd441d35ff29ba1ebf7d62442cc3e3c176091b4c725ea9d" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00036-of-01024.json.gz": { - "num_bytes": 396702503, - "checksum": "4733156df48f2dd0f2e859fef28f56d12a84e8012085ca9318073ae647b0fcdc" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00037-of-01024.json.gz": { - "num_bytes": 397582277, - "checksum": "7d62d03c3496ee2e17ab6b9635710efef9e4cefb88ddccdc16ed720a414c38c2" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00038-of-01024.json.gz": { - "num_bytes": 396186761, - "checksum": "670affddf8fcca6933af3f5b30efd1bf490c3e38c3e90f2e8e9a464994d613f1" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00039-of-01024.json.gz": { - "num_bytes": 397056953, - "checksum": "4acbd97f9c8fd9a930a6f4284a11cfe37f6cca3b5858ae3c2cde747dae35e0d2" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00040-of-01024.json.gz": { - "num_bytes": 397809786, - "checksum": "d350e48a36bb1ba3125f72a07ed8024d26eae6d89ecac686ac0bdf3d5d89e1a7" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00041-of-01024.json.gz": { - "num_bytes": 396944358, - "checksum": "817a58dc40440b8b1f54d129db08ae9124e0293e5a0e45f034fbffb2140d90c0" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00042-of-01024.json.gz": { - "num_bytes": 394327995, - "checksum": "6bd6bc1269c2dd81db466ae9c41f76b8b8cf71cc7bd6e131452fa1a1318ff459" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00043-of-01024.json.gz": { - "num_bytes": 396476043, - "checksum": "f3525d9c861d984ea0cdacba7fddffaef058d8f95aa99ef1f09f9f0792fde5e3" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00044-of-01024.json.gz": { - "num_bytes": 396893614, - "checksum": "292ca2b6b9ba41567fe7cc60e5424aa1f3e431ac874d06ae8eb98794563a7d35" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00045-of-01024.json.gz": { - "num_bytes": 395885483, - "checksum": "ea2c8fac41ededba7da8bf2bb48463d83f148e5c0970a689876d4932ab18a3c7" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00046-of-01024.json.gz": { - "num_bytes": 396963386, - "checksum": "97672d9bca357cd2721f51301aa37d37a271dd3ca7487244c057570b995da66d" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00047-of-01024.json.gz": { - "num_bytes": 395856712, - "checksum": "52c517670ba4eefb262cb71373d6370f86ddeb0aea7391a47a22d52a55bff7a8" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00048-of-01024.json.gz": { - "num_bytes": 396091027, - "checksum": "49f5b68e29c55eb50da941eab1cf446c7d8c9d0b30290318977edb39ef0b887f" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00049-of-01024.json.gz": { - "num_bytes": 396892998, - "checksum": "82a51eb6f301c00d927ca7920338247038cf4e9e0072d74c02bac897701f5859" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00050-of-01024.json.gz": { - "num_bytes": 396308050, - "checksum": "d72f92ecd27b716cd90cc4abe562d25fe6d49740b4a3d1fb9beac2526a61988e" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00051-of-01024.json.gz": { - "num_bytes": 396137777, - "checksum": "a956e4d086077f7ab309ff10b0eaf4833e4d3ed74435293e96588f4361e1536d" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00052-of-01024.json.gz": { - "num_bytes": 398302544, - "checksum": "5a54f7faa07661ea6a5f0585ca49ad66c8f7025fd9627b3af832dc886d50f78e" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00053-of-01024.json.gz": { - "num_bytes": 399616791, - "checksum": "7f8fa496d50a0b7c399faff4c1864e24717b3f9c86b2552536c8f91e3e0cf9d6" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00054-of-01024.json.gz": { - "num_bytes": 397332881, - "checksum": "ab862f26b4fa38b6c16d8cfd0d63a9f0973827e45915e85aefb95d4e182b7b9c" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00055-of-01024.json.gz": { - "num_bytes": 397075146, - "checksum": "cb67aa9229bec8b88e496829aa0a60ca1c3ff4a2293632cf7782b69aa71aebfd" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00056-of-01024.json.gz": { - "num_bytes": 397827600, - "checksum": "2f63e3ec40d32237d4a50c873b966d7fc2c16ef5c04a2bcfc33328b128654e7c" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00057-of-01024.json.gz": { - "num_bytes": 397533583, - "checksum": "7c90bf39bddf8ad0c6a8bb3dff02caea8bbc2abbd76047c5d523930d2a00dbc9" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00058-of-01024.json.gz": { - "num_bytes": 396411363, - "checksum": "ee6059f3c8a2df34858a0110a06ec4e9673555fa56c1a2b40930337ba5b1b39c" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00059-of-01024.json.gz": { - "num_bytes": 396735510, - "checksum": "d9dbe2421edba1820294e757d88aa25455db42ce8992f8933b51cd84cfc35a36" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00060-of-01024.json.gz": { - "num_bytes": 395694553, - "checksum": "b05d6502fc95587fa7047fac64978d6be13761dcc6954629332812e5937c2731" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00061-of-01024.json.gz": { - "num_bytes": 397740757, - "checksum": "39303faa5dc33995dfec683b44fc24066ecccdf6b5001b9c0644d8e9899d45f5" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00062-of-01024.json.gz": { - "num_bytes": 397358263, - "checksum": "fe27dd467cc2c34abe5b0bb34473ee68859f2198eeb78304e1d2e54460a67383" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00063-of-01024.json.gz": { - "num_bytes": 396826654, - "checksum": "1da2c414bd03e5547d8c9c7447e42b8dcff5f6ca8ba35c53076f2895e8ea63f6" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00064-of-01024.json.gz": { - "num_bytes": 395781869, - "checksum": "af96de4d6b5bc1ab0527efa33a73d7eb788dca15829acbb7291ce72ad05e6c66" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00065-of-01024.json.gz": { - "num_bytes": 398192274, - "checksum": "7f46ccfc1703fee106e932bc9a1bc5dedf7de944172cfa34ec9b31413bf0bbda" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00066-of-01024.json.gz": { - "num_bytes": 397133438, - "checksum": "dd3b67d8578927d7474dae76bdca35f35a2aa125fc50873e4a9f6e73d7a81831" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00067-of-01024.json.gz": { - "num_bytes": 397204214, - "checksum": "4cdc87a7c9fea33e15d638e5c921f45149212769bfba5f59f0a5943398ca0d55" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00068-of-01024.json.gz": { - "num_bytes": 396489592, - "checksum": "64d175c23574998f8c5d28ce3d3f3934144b1fd4f6527ede1aa3420c28bb90d0" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00069-of-01024.json.gz": { - "num_bytes": 397697351, - "checksum": "3329857f531c9fa22d98bd567638f0564f73062da1478ca84385246f71baabff" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00070-of-01024.json.gz": { - "num_bytes": 398449973, - "checksum": "bd13494aa03a95d943a01f3436f62c46ee3390b30f6ff0fec0636f3c0b09fa1b" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00071-of-01024.json.gz": { - "num_bytes": 395498960, - "checksum": "5e69529ae82c305acbf1f58a7021b4e3fc67285a871dcbcaaff0781d0e721070" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00072-of-01024.json.gz": { - "num_bytes": 396170387, - "checksum": "9b9c7e11b9bb2cf6ea0fcdfd58754f522a95070feae74c29559522e12e1b41f4" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00073-of-01024.json.gz": { - "num_bytes": 395915819, - "checksum": "87a2069589fee8de23730b8b994ba59d63d5128175b5326ba0a8c8ac9e01a3dd" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00074-of-01024.json.gz": { - "num_bytes": 396986018, - "checksum": "e073efb3f00db65c1ee14e8bfa6e8c807f7827d0f3dd4d4026f823bc6f61b1cc" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00075-of-01024.json.gz": { - "num_bytes": 398555103, - "checksum": "a1793748c7979e241ca34291c843ca3cc90dd7643f04810b6cd324220efbd6e7" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00076-of-01024.json.gz": { - "num_bytes": 396357420, - "checksum": "7b1cd69788ca9a7e614de70a8b908183f41f316eaadf3b0236a7c4e126db9844" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00077-of-01024.json.gz": { - "num_bytes": 396666167, - "checksum": "aec828d3c2a1f7fa970de328a8fd1a85a90493dbcbec4f50816ccbc2275a1fac" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00078-of-01024.json.gz": { - "num_bytes": 398167446, - "checksum": "e14bdf5af810574aca7c6f3daa67e503f24ab1705435a62129c66c248667ee97" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00079-of-01024.json.gz": { - "num_bytes": 399696096, - "checksum": "b63756f81b8b19ecdc9bf227045df10840cbf973b60bd8ffdf28f58a53cdb028" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00080-of-01024.json.gz": { - "num_bytes": 398755610, - "checksum": "dfc118f680b79260e7ece75f27c0459484eb8458f2422df9f1918f726b54ccb6" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00081-of-01024.json.gz": { - "num_bytes": 396606787, - "checksum": "17d6a503947f5132728f53ea62fd093f55bf2dc6a32316a5c0413353cf13eff3" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00082-of-01024.json.gz": { - "num_bytes": 395714484, - "checksum": "8ca41818ee6a0ffd5b00714779289c18cd97d620258c5d3d741c482b72344300" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00083-of-01024.json.gz": { - "num_bytes": 396807173, - "checksum": "12d87c0a948f32f788497858751c3ef22f289136e6ae58518a97a2e976f5cdc8" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00084-of-01024.json.gz": { - "num_bytes": 397241529, - "checksum": "7c3da4ca4d2b2077f0ab7be511038255732fc88d954f2f17cb0f3ab144216206" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00085-of-01024.json.gz": { - "num_bytes": 398357369, - "checksum": "26df55183e78f8d69fb16e21d07edf98659b69bcb3c48f340da6a5bc44007f4d" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00086-of-01024.json.gz": { - "num_bytes": 396997317, - "checksum": "09f0641e9075cb88800d0eaae3f7b99b047552edbc71d1fd2d8594f645d22c2a" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00087-of-01024.json.gz": { - "num_bytes": 397978000, - "checksum": "c9437ef5f58a46b8a6d8efcae37fa658da3f2c4f1cad0f9cf47fbcd09bb82f8c" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00088-of-01024.json.gz": { - "num_bytes": 398468913, - "checksum": "be187fc14017f666b84ed7049c169c1a28654441c2f523eee8b655b3b9d9ba8e" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00089-of-01024.json.gz": { - "num_bytes": 397071121, - "checksum": "637c3f964ee2c750a0a175f2e5d24b786a37d37701f10616b448804d68b72f4e" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00090-of-01024.json.gz": { - "num_bytes": 395753807, - "checksum": "8eef7ff1a8080aebe5226cc3539baac46ab64d93f8e3ffb6e8b7ab3346e151dc" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00091-of-01024.json.gz": { - "num_bytes": 397039764, - "checksum": "a2904ae5bf69b393a697afd62ae9b8a560c1f076e8a141e6f3feef29cb5d1352" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00092-of-01024.json.gz": { - "num_bytes": 397058578, - "checksum": "eb4d7e2712a9983bc1581133fa8eaa2e1d28b314861833bd8d810d615ec1ed81" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00093-of-01024.json.gz": { - "num_bytes": 395855981, - "checksum": "5c9a7573a5644d89d46666306d333ff1e4af3213f287cb9adb48ef87a023d479" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00094-of-01024.json.gz": { - "num_bytes": 399516118, - "checksum": "de7ae1508815e48ba031762c084cf6946b084871463821407090d23c197c6474" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00095-of-01024.json.gz": { - "num_bytes": 398236235, - "checksum": "616cef1f21ef078ffb9fc2b4148735668debdd15a8bc1be281183ba3659e9fcd" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00096-of-01024.json.gz": { - "num_bytes": 399526010, - "checksum": "eb754381b8a6f3c74dda5ee5852958f7b69c707a3908cbaa9410c972e002a0cb" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00097-of-01024.json.gz": { - "num_bytes": 397935028, - "checksum": "6d6d2ca80708b7c6ad4240a042dddc2170060e8976c2e7b4ace446d2f2395076" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00098-of-01024.json.gz": { - "num_bytes": 398645934, - "checksum": "568db6971230fb42df8973ecb5a2a6d77204aa8cf0bdf47b386c04370da8dfd1" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00099-of-01024.json.gz": { - "num_bytes": 398110916, - "checksum": "9bacb381e3b06976619e816e40ac2ccd3bcf3cb9ecd30c294b388cfb75c8bf77" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00100-of-01024.json.gz": { - "num_bytes": 397631228, - "checksum": "7d515ac0f767736600a216ebe7280b9751f16e70df969ba601d1aaae15f201e5" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00101-of-01024.json.gz": { - "num_bytes": 395102356, - "checksum": "87c5c81e154e136f3e090ba91682ad54fe678653f86f6f32002ae5ec3c9aa743" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00102-of-01024.json.gz": { - "num_bytes": 398926159, - "checksum": "2df85a9ac13812c3870180901dbba99b52e53fc045da019160a3f06d0dfa5e95" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00103-of-01024.json.gz": { - "num_bytes": 398383820, - "checksum": "8134d12e84ed4a58a5f8f6eff8a4349f7d6ded6a1d7539b5c23193571569d6c7" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00104-of-01024.json.gz": { - "num_bytes": 396628542, - "checksum": "208f0cb3365b0243d70e7b4e52ff977e9b11d8e451adea521a5bf6e10cd40ee0" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00105-of-01024.json.gz": { - "num_bytes": 398737797, - "checksum": "855ac7b8cb621a240319ef00197d2f20338d17db71a1aec68fb66930bc17c59c" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00106-of-01024.json.gz": { - "num_bytes": 397281064, - "checksum": "544d5d91d066f2450bfe622ce55bdfe16a300aee9c05aaffae8a645966bc695e" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00107-of-01024.json.gz": { - "num_bytes": 397919761, - "checksum": "f4af405c0f19c9139d93b3073f3fe328be998c9dc6f74afc7e21ad068964b92c" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00108-of-01024.json.gz": { - "num_bytes": 398810219, - "checksum": "bdfce29353c6caa33b178bdebbf7e48526c391bc6c71180e3fa378b723879563" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00109-of-01024.json.gz": { - "num_bytes": 396605124, - "checksum": "ed6acc172bc9af0e31170f5533001a8fcd344e6732a4b3a714b7ad43740f25f4" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00110-of-01024.json.gz": { - "num_bytes": 397491755, - "checksum": "428b6c91f12c4f7032fa692bbe887f1a4c02635eb88b91d876da4c71f3da5e4e" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00111-of-01024.json.gz": { - "num_bytes": 395754897, - "checksum": "a723863559edf291fd8a6c2736cc1cefed70dd3c8625b967df049ce0d373f68a" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00112-of-01024.json.gz": { - "num_bytes": 398567649, - "checksum": "a90ddc9ccfbca20b9c75bd2b7d63ee6abd03236a0f0dd2827eb9f7350d9c3931" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00113-of-01024.json.gz": { - "num_bytes": 396706569, - "checksum": "479052b6b9edcc2bbda40b982976e7e28d84fad7b2dce46b017f4e3d1f61e0d2" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00114-of-01024.json.gz": { - "num_bytes": 397384355, - "checksum": "a95984e4c261a3057d1bc51939aefd9413853111e19030b19c5d26f778be00ba" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00115-of-01024.json.gz": { - "num_bytes": 397702826, - "checksum": "5eaf7fc2c9d4b2ee3e216c215da7f4fc7558e89d6993033b95a940a78061ab05" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00116-of-01024.json.gz": { - "num_bytes": 397252590, - "checksum": "268033cbbdf3be9790cb6010791693f1b490af06f9fef91b0b307420a4e30a08" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00117-of-01024.json.gz": { - "num_bytes": 395506730, - "checksum": "cb80908eee1054ddaf7e2e5d66c9a41505025c2b6dc7fe6aa287db0a9f3829ff" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00118-of-01024.json.gz": { - "num_bytes": 396452136, - "checksum": "d75bf895c88ff2e9c4031c1f65b067222cfbb1a937d685ab4dd33369f5f5ff7b" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00119-of-01024.json.gz": { - "num_bytes": 396777389, - "checksum": "2c00362f4d99cef2bae2f13f17b79ec56a5ef8aca18ffd56a12fea2308e5017b" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00120-of-01024.json.gz": { - "num_bytes": 397730478, - "checksum": "e31296949f7ce2e2a74fd2443552cb64b9f3cddcca691097a56992f51033fd11" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00121-of-01024.json.gz": { - "num_bytes": 396593647, - "checksum": "c2f0f81e3c835848a47532d8fd1c215a624f47740196a7bb45b5099916853014" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00122-of-01024.json.gz": { - "num_bytes": 396576172, - "checksum": "72edb7581a623e20f26cae4885f3b9d7f329581921253ca4d7ceedfbca17b7b9" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00123-of-01024.json.gz": { - "num_bytes": 397378329, - "checksum": "4f045ce7bd077b7f878012aead8c51073022448de66d2e35a755d4c8c4a6f59d" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00124-of-01024.json.gz": { - "num_bytes": 396545003, - "checksum": "dc7949657328520d31a27d8e267c2ab07cd4e8639036d4b1bb59454c309f862d" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00125-of-01024.json.gz": { - "num_bytes": 397630505, - "checksum": "530bd95e5ef9a1d5989c595e60e0ab11583e0f42d16b2bd37c49ed09a67af207" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00126-of-01024.json.gz": { - "num_bytes": 395483747, - "checksum": "d9df071edec6959ba842509f72ad43be3ea3f529b60d48f3dfbf390908887a5f" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00127-of-01024.json.gz": { - "num_bytes": 397295159, - "checksum": "02b61f5bc7d1d241484c4f04fd517960ae755a69f35192bdd5bb471baeba5614" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00128-of-01024.json.gz": { - "num_bytes": 396276865, - "checksum": "0c7d618df232c36ba018269ddf3b2863cd6d63bb7fabeaae33fd508715bd8ce2" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00129-of-01024.json.gz": { - "num_bytes": 395314703, - "checksum": "03443afda032187d2dc2e696ce6eaecbf2219e6dabbdd593379e97c0e00e3112" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00130-of-01024.json.gz": { - "num_bytes": 397411481, - "checksum": "8969873d5efd3df0cef1742e4bc67f2df7a5b5d9e641f7a12e77c7e8e96a1bf1" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00131-of-01024.json.gz": { - "num_bytes": 396925311, - "checksum": "31adc39ea4eda8667662608bdad6bb32bbc82b1ee1ad53ceb4df50924a933bdf" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00132-of-01024.json.gz": { - "num_bytes": 395826124, - "checksum": "d2f035ba2c388fec2d847bd43449c885eadd0bcab5fb8afdf031a53e72c4ec32" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00133-of-01024.json.gz": { - "num_bytes": 398892794, - "checksum": "b7ed60983058a5f9f0ef72602789f50359f415ecbe60dc967e7a869866d833b6" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00134-of-01024.json.gz": { - "num_bytes": 398206890, - "checksum": "9ba78624879aabb72bae0b4119fa2625793915382031ed897a0b4c3f2863b8aa" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00135-of-01024.json.gz": { - "num_bytes": 397161888, - "checksum": "9fa6fee55f5e8f887dcc64d94cc65ada6f283a580edc7926cb159b80d0084ea8" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00136-of-01024.json.gz": { - "num_bytes": 396185585, - "checksum": "81a1fcafcedfdd9bcb32d2467d9c963cc7d8b2f32e13e52ee04db41b0d3f5483" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00137-of-01024.json.gz": { - "num_bytes": 396933735, - "checksum": "c7558304b614e1cff13b0f6e967fc5ef77e4953a1eea1f39ed925c33076d7723" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00138-of-01024.json.gz": { - "num_bytes": 396371698, - "checksum": "3e896da8bf296403f7b4061ba0b24d3c3978993de4854fabd688cfce9fbf7bba" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00139-of-01024.json.gz": { - "num_bytes": 397289537, - "checksum": "1a5ffa3aaf565ccf4db7444983643ad06e386938a0a2d313aecdb972c36111e4" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00140-of-01024.json.gz": { - "num_bytes": 396983259, - "checksum": "4047916916fd9dd7b76a8cbc595d52803344467135f744b23bd10296004a47d7" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00141-of-01024.json.gz": { - "num_bytes": 394947050, - "checksum": "7edfc9e5870d80d470e3797e8bef5183e9d170eab410ab50957e946dde2e8199" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00142-of-01024.json.gz": { - "num_bytes": 396852755, - "checksum": "4affc3a24616858fab84211e3825e90a1ea7d9c8f2cfabbe9a5c9b24c21a116b" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00143-of-01024.json.gz": { - "num_bytes": 397579248, - "checksum": "d5aa9ba68e9b30576bd640f647d4069b6c56db276cc5229573440e4a38a7f1e9" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00144-of-01024.json.gz": { - "num_bytes": 398800367, - "checksum": "fa104e63eb7a8a6b066a5f00bf05b3ea095bad35a902bc728251f096173f1417" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00145-of-01024.json.gz": { - "num_bytes": 396709510, - "checksum": "b615ecd58821b1697c82094cb3435375924263827c342ab1b87e53907d4aa63b" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00146-of-01024.json.gz": { - "num_bytes": 396042389, - "checksum": "6004c782f3235490865b6634b2c4840a989745b70ef2da674e75c62aeedf8a6f" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00147-of-01024.json.gz": { - "num_bytes": 399840661, - "checksum": "5e8b46726f7ff2c3dfd381fb252f1b4bddf9436fd9ffd10fa300cb0fbe76998c" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00148-of-01024.json.gz": { - "num_bytes": 397098215, - "checksum": "0851cb274aff2ec4f781c82af11c94f8938a797aca5097fb0089299cb4c75aff" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00149-of-01024.json.gz": { - "num_bytes": 397540697, - "checksum": "7cadf4ef9b0e29d9e8f68474464dc072b78e909a0f03c74e61b67912ff9b551d" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00150-of-01024.json.gz": { - "num_bytes": 396347701, - "checksum": "521e4f67d12ae47b8f2a02b6f77e0c85cdf9a0efbcb45602d09ae116110ebe66" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00151-of-01024.json.gz": { - "num_bytes": 394890490, - "checksum": "2255bf3e1940ea28da9656028dee26865a9ee682cbaab4d5aeb34c081062f8fe" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00152-of-01024.json.gz": { - "num_bytes": 399584675, - "checksum": "f8ca4aaf5706ffb0f5518c7461d9045d18c645df068aa436137299e5ca77df82" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00153-of-01024.json.gz": { - "num_bytes": 395606567, - "checksum": "24f0e81dc3140f063ac89173fc262b01f2420133025b114f29632262cdd2e7fa" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00154-of-01024.json.gz": { - "num_bytes": 397925578, - "checksum": "5f40a87b15b0acebbd324e7c5cd2c0f31f911558d57f774f278634db94f2d5f7" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00155-of-01024.json.gz": { - "num_bytes": 395428741, - "checksum": "36281c154f187a09a83822878da815cd9b7f659a41cd90ac64653b437e798c72" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00156-of-01024.json.gz": { - "num_bytes": 396799274, - "checksum": "0fb66965107e54c9fed0013962763e874b940b0e174d775b21fa5e688fa53b33" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00157-of-01024.json.gz": { - "num_bytes": 397321211, - "checksum": "014d1443a4940fe95089bf87e245817d3a90c50e3e371a703098f5b9c3f6c759" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00158-of-01024.json.gz": { - "num_bytes": 398736992, - "checksum": "f912d27d68318fc0089fbaf8e0481ebe8dc5d2963cb89ed315f3bec637460bfc" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00159-of-01024.json.gz": { - "num_bytes": 397250687, - "checksum": "1bfd02a301b09bfd53058522d0613e1fbecb788d3173eb30b58115cd1cbdb477" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00160-of-01024.json.gz": { - "num_bytes": 397492158, - "checksum": "149a7bd76e9ea41185d99d21df870ddd4f32857fdd628cee927d6bee7d6a527d" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00161-of-01024.json.gz": { - "num_bytes": 398383574, - "checksum": "0c385b4c9b33574cdc75070309a0aed46aa7b2e3b8754a7692035a3c5a04f916" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00162-of-01024.json.gz": { - "num_bytes": 397126197, - "checksum": "5c012b2a6bbc9413914ed1420b6150a5549cd74185bf2788d8809005034d433f" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00163-of-01024.json.gz": { - "num_bytes": 398201223, - "checksum": "79448c338e86cea2609399705268fc6011cb21c4f0aff82e3fb7660391ce85c4" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00164-of-01024.json.gz": { - "num_bytes": 397914908, - "checksum": "dfb89631dce146ab4713a03f184e864472eb133b2cd04db8b4bccab688e9e287" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00165-of-01024.json.gz": { - "num_bytes": 398142696, - "checksum": "74acc88d6612aae7bdf5187d3b9eddcdb04cf60f1cc350661ffa50219a747f9f" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00166-of-01024.json.gz": { - "num_bytes": 397533050, - "checksum": "757d23402b3a155cfcb6b30bdc305c8014c9b64ba4e067753664670c2c5e9534" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00167-of-01024.json.gz": { - "num_bytes": 396241119, - "checksum": "521bd7a9dcfa0390c35e50a3d0cde3ea627ca538dfc419a97ed83b251d8a3005" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00168-of-01024.json.gz": { - "num_bytes": 396041761, - "checksum": "dc540ec27d5999f6a4c71f075ae1ec64ea84415c720cd2b6ef3fdac925e576da" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00169-of-01024.json.gz": { - "num_bytes": 396350882, - "checksum": "36d5d35075a82038dfdd5abd29a839f4e9ab79d51f0bbc635d3dcf3f5f1e2732" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00170-of-01024.json.gz": { - "num_bytes": 396885157, - "checksum": "db9a3f6a7e085007eee381357ea9e4d5d6f702580d38220860967ec441ba3525" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00171-of-01024.json.gz": { - "num_bytes": 397266368, - "checksum": "7f8098cb6532bc888d3c1f0ea5072cf8419ce1689b9ffe1c370ca20071e7e1c2" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00172-of-01024.json.gz": { - "num_bytes": 397140430, - "checksum": "90ae7e2551b1f3bf2e5ccf4fb3fac8fa3512add5e299ba7c90319611baf8c840" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00173-of-01024.json.gz": { - "num_bytes": 397069631, - "checksum": "a86f5ab72e1a9b1d491988154fd6400e6ee8c74378a9e64276df438a3c4edf9f" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00174-of-01024.json.gz": { - "num_bytes": 396743897, - "checksum": "451cfe8e14c17113a2f6673ece27e01f8d54bed1b57d1b20cb84f125879939ec" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00175-of-01024.json.gz": { - "num_bytes": 395780705, - "checksum": "3252e9781545bc3f9f19ac6e8fdb87d81cdc5a94838798daf6037c9f4f473db4" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00176-of-01024.json.gz": { - "num_bytes": 396205053, - "checksum": "49d1648d37150b90632a6459828eedd82deb2fce7f108bf4e1b050f2f9ad1668" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00177-of-01024.json.gz": { - "num_bytes": 396248718, - "checksum": "99346ccda762ae85038a10baba937ef8ef668a0beab483c4005dce77e331768b" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00178-of-01024.json.gz": { - "num_bytes": 396634813, - "checksum": "8d3bb1610ce79cf359d75f32e7624b6203140ed3eb276362b040615e9ffd4b54" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00179-of-01024.json.gz": { - "num_bytes": 396524113, - "checksum": "971e5c9499425294cf5945436b2ee419379a75bdd72d4cd6a33b1d17c17de298" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00180-of-01024.json.gz": { - "num_bytes": 397938782, - "checksum": "dd6b3e60219788b82ab3fc63a9e65f38f64aa2f7b294135ec2d16b36350f1f40" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00181-of-01024.json.gz": { - "num_bytes": 399155769, - "checksum": "c6a806d627a9d197789bfc6257a92b0223ca51e724c3c2ad10fe2397dbe30848" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00182-of-01024.json.gz": { - "num_bytes": 396136228, - "checksum": "2c48e3237253eaad9afc121e6946a9e1856bbe82c5a7cb287b05cff3e6ea8e8d" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00183-of-01024.json.gz": { - "num_bytes": 397083292, - "checksum": "52645e03ab47da01bb40226eb90042be914f1170688ae940314871e16cbb1037" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00184-of-01024.json.gz": { - "num_bytes": 397402964, - "checksum": "1edbdb41edeabc108f0147e18b439a75e390e0a843ed915f1cbf73a7c7f7867d" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00185-of-01024.json.gz": { - "num_bytes": 398411052, - "checksum": "ef071e52174a19597e567696262470906275c2cd1cbbb0b1e98864999ea2d463" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00186-of-01024.json.gz": { - "num_bytes": 397122443, - "checksum": "0d87080bc08f7f8a1952a7df57ce2bdbf61e40c05b61937c8c19ae0ecd952b1b" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00187-of-01024.json.gz": { - "num_bytes": 397244868, - "checksum": "4aed75ea9f885fc3dab599c19c7bb98f7d57ce2b2ec11ac8ab3258fa479fc0db" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00188-of-01024.json.gz": { - "num_bytes": 395677432, - "checksum": "342882e436ea826cda9fd38c0caca68bb35444a2a07596f8de0e53a3e2169f59" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00189-of-01024.json.gz": { - "num_bytes": 393653750, - "checksum": "22ed9e389f6c8410c9bde898d97ad798c236c2da4d0b2c76b86d013f8686da03" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00190-of-01024.json.gz": { - "num_bytes": 395437920, - "checksum": "b3f9ba5834d4f0280d6defd3bd50fdf961bee6be4c71ed47046cf4e115acab01" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00191-of-01024.json.gz": { - "num_bytes": 396944861, - "checksum": "4e7ed636a60edc44b5ba709dcd83bf4263ad8d5a06a02827d3d27191bf3731a3" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00192-of-01024.json.gz": { - "num_bytes": 396611165, - "checksum": "4fea34466d9b470bf0bc44455183b2c61994c4e71e4bfb684dff3b5e3870d1e4" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00193-of-01024.json.gz": { - "num_bytes": 398283211, - "checksum": "4c4e6d31f455831330971ed1e0c33221203401b817adbda5b53de16f8299a9ba" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00194-of-01024.json.gz": { - "num_bytes": 398915952, - "checksum": "dfd0b1ceb2a437da8cd38c9c791af809e94f2e36ab4399b2a45a5b916f4ccaa9" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00195-of-01024.json.gz": { - "num_bytes": 396352694, - "checksum": "0ccd90ced34b3ff28c21d015a87eca3f31eae2bf31f11f25ac073139f9d50c22" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00196-of-01024.json.gz": { - "num_bytes": 398582922, - "checksum": "f22e59765cec074a0c687c500f4e6348250d0e418d12dcba211e39c133aaf290" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00197-of-01024.json.gz": { - "num_bytes": 398839554, - "checksum": "95fa68cd75d77a1b5bb526dd5ef16a2f04a3520604f734baeb6e2d95608b5973" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00198-of-01024.json.gz": { - "num_bytes": 396202192, - "checksum": "f0e6343e8105178b38f75eade6774aa6e85b62a271622fcfcbe2745f1cae11ec" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00199-of-01024.json.gz": { - "num_bytes": 398029364, - "checksum": "4c58736410c8d3c7174ce011e2f281cb16e4949d756ff4ace86b4a9d4795c04e" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00200-of-01024.json.gz": { - "num_bytes": 395867629, - "checksum": "1cb798ee6609e670053987d881d130d5b73db19d9f37fecff7a6da41152aba05" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00201-of-01024.json.gz": { - "num_bytes": 396858169, - "checksum": "7357eb22b2aa75c55885252c62d12e08cf8f7ef285c0052cf1d706c3f0f74fef" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00202-of-01024.json.gz": { - "num_bytes": 397955766, - "checksum": "8901d0f27c4c11916cda7cf806cd00000771b6351954c8503bc312cca5ad3a10" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00203-of-01024.json.gz": { - "num_bytes": 397737882, - "checksum": "ed51917fc8936701b681cfc49ef95b2dab451ca597e76b34ba90be9405a1a0b8" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00204-of-01024.json.gz": { - "num_bytes": 396094006, - "checksum": "88692bb8da78347cb97c0e0849d1a10a97b1686cde1f75626236b89bd507e2b0" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00205-of-01024.json.gz": { - "num_bytes": 399027636, - "checksum": "fb17fe19d1f0fcaa43fb31a3ad9b105b3d93fa287351c7f93fb599edb7f40bc3" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00206-of-01024.json.gz": { - "num_bytes": 399406254, - "checksum": "668d2a9927080b686a4d728236e4cfc780b262f9045dfe9575cfc48cb69d6adb" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00207-of-01024.json.gz": { - "num_bytes": 396291803, - "checksum": "928f451dddfe42bb2ca791dbc61c36ddc618006ef709eaccbc2beb665c8427e4" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00208-of-01024.json.gz": { - "num_bytes": 397807368, - "checksum": "11e8627b758588056b61d31de07c50092222013a38ba802b7a9ae34b6b8b84a6" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00209-of-01024.json.gz": { - "num_bytes": 398085408, - "checksum": "d49d31d1719698ab7a2b9ee91d887f3192c8fc1b6108152a75b39de2a0ad25a6" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00210-of-01024.json.gz": { - "num_bytes": 397670254, - "checksum": "049b3294c3e22e6db6c115979a4a55f0650966c600ca17250e91b241cc97bbd4" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00211-of-01024.json.gz": { - "num_bytes": 399643598, - "checksum": "7772f26fd90f47033670e7f1d3f6fe092116486bb9a991577f9560b54ed3832c" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00212-of-01024.json.gz": { - "num_bytes": 397390768, - "checksum": "7a24e4a70f43f6227fe6491fcc7bb6b2a19cae203521c803bedf8882c995d7e6" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00213-of-01024.json.gz": { - "num_bytes": 398657925, - "checksum": "21d0ee8d1a01957b56ac503aa88c6f3269b4e4692762a3f929fe0e7069be8c0a" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00214-of-01024.json.gz": { - "num_bytes": 398282324, - "checksum": "ede2d9824d8f99dd578a36ea82caae942ebcafd99f308cf5d0ff8aa4a56f0a05" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00215-of-01024.json.gz": { - "num_bytes": 399178235, - "checksum": "82516fa361dec02c7ed59ea2d0510d9ee4187609b449dca649a04141b12bc037" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00216-of-01024.json.gz": { - "num_bytes": 397630870, - "checksum": "4a6d5e60354b7b93f005010c6fc55c0a81596e98a116cdeec99e1ab4e58fd03e" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00217-of-01024.json.gz": { - "num_bytes": 398628848, - "checksum": "02dffb623b628a3a3ea38084fe6bb840aafab8419feed3d1f2bd3598cfa80aab" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00218-of-01024.json.gz": { - "num_bytes": 395087998, - "checksum": "e1e9a7ac7a922d6a9bb90f82cb48dff11ab7208dac08511e9613cd2726ca67ec" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00219-of-01024.json.gz": { - "num_bytes": 397622792, - "checksum": "955afc7d45a080ae137e9dc25ba3d85629a6a14c3d9bbe4065aa37d710345b7a" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00220-of-01024.json.gz": { - "num_bytes": 395112655, - "checksum": "a3560918bec20087e9908009a362957ecb06401924789e20b36c26e363db5ae7" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00221-of-01024.json.gz": { - "num_bytes": 397132000, - "checksum": "d8459bb5b6fb6b341b24fe517cfc5dc099765ad70c3383bae913229e06cf99e0" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00222-of-01024.json.gz": { - "num_bytes": 397138513, - "checksum": "20d3c6219921dc9c2928d637000e488635fd9a12b5636de5a6a7e52c1b67d781" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00223-of-01024.json.gz": { - "num_bytes": 397167661, - "checksum": "43a18accd194646893324537991e0162f6f98a9cec5ff59fe8fb510d81d707bc" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00224-of-01024.json.gz": { - "num_bytes": 397905941, - "checksum": "a516485cbefdef2e31a493cd8827a5f936f10674ff3525b71d414e17f48241c3" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00225-of-01024.json.gz": { - "num_bytes": 397218123, - "checksum": "791c85c78c5e7f3557855a1fc71acd860521710515b89f92e54e02960549f46e" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00226-of-01024.json.gz": { - "num_bytes": 396619135, - "checksum": "52a36037696e6245efad80e00d1f123c36dbd79e7ff52b1fb99f579e712d2b30" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00227-of-01024.json.gz": { - "num_bytes": 396654998, - "checksum": "e31123ab579fe95bd50afa10d52a51e9c15a4af28c06583fb5aeac4e3418f129" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00228-of-01024.json.gz": { - "num_bytes": 396899165, - "checksum": "86481361fff334dee3183fac8ab3f346e44ab3e6e7b35bbd7e6e062b2d2fa0d7" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00229-of-01024.json.gz": { - "num_bytes": 397489378, - "checksum": "bbb717711fb4c78ebe8a0476296a21a50285ec41d9fb9f08d5d66d899577e04a" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00230-of-01024.json.gz": { - "num_bytes": 397462301, - "checksum": "054414aac29b5c8faee71a918f2586ad3fce8ee44c71e7a2e2af4b91e0169523" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00231-of-01024.json.gz": { - "num_bytes": 396097584, - "checksum": "8136e320fccba75a493954fefbb560f92532be44a6e0990404edae659d48ce1e" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00232-of-01024.json.gz": { - "num_bytes": 398984795, - "checksum": "3d9362aab157beef3b5fcd4a0a0236d59de635a565b1c86423f45b26e8b437b5" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00233-of-01024.json.gz": { - "num_bytes": 397258012, - "checksum": "e1a532922477d17f7cbea7db72c2391d26b4db580e526ebd5a90be23607a8d31" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00234-of-01024.json.gz": { - "num_bytes": 398350453, - "checksum": "c464829565bcaafdba165b2d886be4580f3c0a516b5417853ffc4fe30049cffe" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00235-of-01024.json.gz": { - "num_bytes": 397147353, - "checksum": "573a6a1d33ccc6c5b605d381f04d73989504bb6d24514b938e92c3d4f61501e8" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00236-of-01024.json.gz": { - "num_bytes": 396963006, - "checksum": "21318462014bc185d0da7cbd342fddd07521401ca2b73e47eb5cb4bd42a82bbe" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00237-of-01024.json.gz": { - "num_bytes": 397087111, - "checksum": "49459c97b078726bf8377748d4bb2066bdfa47e2717315a9b3c8075cfc4b9b10" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00238-of-01024.json.gz": { - "num_bytes": 396984031, - "checksum": "befb46e9f928876edc580c60ea4242f63cf6df77c6c107fec6e4280d279e348d" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00239-of-01024.json.gz": { - "num_bytes": 395915197, - "checksum": "dc5ab17e04e4f2678771094af67909dcaa8be36a6cb047cfa66e75f986c91312" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00240-of-01024.json.gz": { - "num_bytes": 398321096, - "checksum": "25b92f7a499e9aaf0496a57f6292a7f65941b34dd6c78f14b08358d180070029" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00241-of-01024.json.gz": { - "num_bytes": 396626980, - "checksum": "1ae21ee5585ec718763a3c7bd70d9338aaf77d0e02f92a41f6ed213d1eefa5b4" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00242-of-01024.json.gz": { - "num_bytes": 398220596, - "checksum": "c29f98174a0c02a817d5cfa3ebb2a92d5f49df8a34fa40abd360f1b39b4bde05" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00243-of-01024.json.gz": { - "num_bytes": 398250083, - "checksum": "819387c95ea7183b1f9e1e78d077de65023c4809198ef3a0c946f46f8b6c19b4" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00244-of-01024.json.gz": { - "num_bytes": 396943969, - "checksum": "7a0b0b984d7afc4181827705212f917cf4ac12412f640a2c8120513763cdb390" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00245-of-01024.json.gz": { - "num_bytes": 398365865, - "checksum": "a424157137a5eeca89819d600deea2a1619ea8f5ae1ed395c88ac600a85e3afa" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00246-of-01024.json.gz": { - "num_bytes": 397285385, - "checksum": "73029f721bdaccd9d126e871973e70a551f48f077f5903656b305ea9885c4798" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00247-of-01024.json.gz": { - "num_bytes": 397132841, - "checksum": "b223cf1270d2c728592ec65b09599bbdef8d64f7df2eb525e114f86268500daa" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00248-of-01024.json.gz": { - "num_bytes": 396316645, - "checksum": "94102d9bcc086ed5b203bc0c6b830dd245c9bf6c695b23b19922b2a98eeb6a52" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00249-of-01024.json.gz": { - "num_bytes": 396644237, - "checksum": "36be793f4d76070ba1c696b3274e6dbab43f415c8fbaf752145cc99af6558680" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00250-of-01024.json.gz": { - "num_bytes": 395860541, - "checksum": "313febcf026d2cd1495fdd3d5ba3b492ce5d5749153e189672b6d9dff3e26a61" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00251-of-01024.json.gz": { - "num_bytes": 396709140, - "checksum": "7e2480b3d5869ba35007c40e18585f3fa208cdf8e004078cc8de4fac36773507" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00252-of-01024.json.gz": { - "num_bytes": 396508847, - "checksum": "25df46ae56c0d4a6f945922e31fc697d12e0b7c525be9bc2b8eced802641488d" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00253-of-01024.json.gz": { - "num_bytes": 396364816, - "checksum": "6b2125b9eab9bf893e7f8913a6beedbeeef5de53893fbd6172f706e33bab5177" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00254-of-01024.json.gz": { - "num_bytes": 396122930, - "checksum": "7947e5152c5305863e2d664622e3de49f9386b4384eb09630c5bfcad21fb458e" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00255-of-01024.json.gz": { - "num_bytes": 396929803, - "checksum": "a1ec8c609ac969c24e2524f0f3dc31ef43ca0147ffe66569d3135e4f28394325" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00256-of-01024.json.gz": { - "num_bytes": 398432943, - "checksum": "3fd0373f5a8974a3499c436d96ea73be95f5619b8388dc316f51aff01e9ecad7" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00257-of-01024.json.gz": { - "num_bytes": 396003748, - "checksum": "516cf3626076f083962983b2d6c596ef355609492f2e81c6c3cdec01acf8c5d7" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00258-of-01024.json.gz": { - "num_bytes": 393890690, - "checksum": "700760a7764f890c8aae337e7ee458c8467eb9048347edd237e341dd2bd5d236" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00259-of-01024.json.gz": { - "num_bytes": 398130606, - "checksum": "d868f8ef5e1cc971ffd00908bdc7eace32ec151d7405d7cac5fac22df9ea10c0" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00260-of-01024.json.gz": { - "num_bytes": 399765969, - "checksum": "7d5eb3b88eb8a0291ae70c1997458cf5aecac645397e50a67fab3d1193064353" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00261-of-01024.json.gz": { - "num_bytes": 397418895, - "checksum": "ca607c9e13d7cfb73a29ee3131f77e6bef3130d8627037cef9f57ed459185f0a" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00262-of-01024.json.gz": { - "num_bytes": 397925991, - "checksum": "ca789394ab4398c41490ec6147a41ffc8847155ea9ff74d7ff8b3402ed0634e8" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00263-of-01024.json.gz": { - "num_bytes": 397082336, - "checksum": "aac81d1bf0ade80758c14d01842b9b06c89ebf2fcdb9a06b1472bf2f70bbc348" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00264-of-01024.json.gz": { - "num_bytes": 398101079, - "checksum": "3cf56a2989b5c3f26ba94124cc534f5c9ae9770bdc6a3431dd745603b480ab19" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00265-of-01024.json.gz": { - "num_bytes": 396949669, - "checksum": "d4f252a6c2f43833d6d89bf69337449b4cae5dc88fd08fb20b35fe7194a50ddb" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00266-of-01024.json.gz": { - "num_bytes": 396242007, - "checksum": "71c745968d8ee4a0d64f38930a76e65d68ea094ba3e0b963d5d6878f65f51b34" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00267-of-01024.json.gz": { - "num_bytes": 398342031, - "checksum": "706a560c862979594265925c3200d4bd0981a9eaa279841f2cba673634f7074b" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00268-of-01024.json.gz": { - "num_bytes": 396399468, - "checksum": "eb3dea553c37f220b3b9b5f377d5a4ef94243b3c0b6b46981e3e5b7ba5b4a935" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00269-of-01024.json.gz": { - "num_bytes": 397181296, - "checksum": "4f0feae035dacaeb720ca3b6ea17685144895a0d78cfa358e30983f8d6c4ec76" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00270-of-01024.json.gz": { - "num_bytes": 395712883, - "checksum": "6e0f6de1e5a5c6d4bf23d0539ee72ecc2b4285da2b0f1ec2cdcc443d2e22aa88" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00271-of-01024.json.gz": { - "num_bytes": 398066980, - "checksum": "4c5cd1ef1917ed762d7d8c5c54e1da05db74e45721697df8b0626e0aeac96966" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00272-of-01024.json.gz": { - "num_bytes": 396667308, - "checksum": "77a33c37a5d88e419e2b31cf560d53f129a38e5bc2306b5baccc187b7e94e589" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00273-of-01024.json.gz": { - "num_bytes": 396020214, - "checksum": "b18e40c00b8e0e02dfac40ea0519964e231c8a2f28bc1294b044fb090f41a9fb" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00274-of-01024.json.gz": { - "num_bytes": 396300833, - "checksum": "34c8945a6ebac564fe87881d6968d05363a89985f297692a3df7104128b9c26c" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00275-of-01024.json.gz": { - "num_bytes": 395206463, - "checksum": "1e41d7e2a6117224dc23fbaae8e9d20df9d7744adb4687d2b0e570bf8d9e47f2" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00276-of-01024.json.gz": { - "num_bytes": 396667995, - "checksum": "45973b91c2f1140f79265a24f484fc6d6653f43f83d5bd2d18954892dfa4dfae" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00277-of-01024.json.gz": { - "num_bytes": 398134029, - "checksum": "b7da91889b6695cf01bceddfc139b23f9465bda5cad54088b84a1f5a4d7a4f9a" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00278-of-01024.json.gz": { - "num_bytes": 397422615, - "checksum": "e794a2903bda1f3c082e8f590383c714a518c202ecb99eda5513d6b320f70e86" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00279-of-01024.json.gz": { - "num_bytes": 398776175, - "checksum": "a5528d3e33151138ef9bdc2433744f1797de2b20673a570de5bd4d81b306354a" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00280-of-01024.json.gz": { - "num_bytes": 396208086, - "checksum": "1be2d8c3d0eca510fac7b06a5401b2b8873bc6dfbf85a3c736301756f9681309" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00281-of-01024.json.gz": { - "num_bytes": 396893734, - "checksum": "1db3e9017561d38a91c417ffef875b7a948c4f64c51b90b0983c71bc9d950903" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00282-of-01024.json.gz": { - "num_bytes": 397411883, - "checksum": "4e23d39fcec2c310cbde3fdc5d9c185046086877ac03bbf9d772b092614f93da" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00283-of-01024.json.gz": { - "num_bytes": 397906911, - "checksum": "850eb5e60b84bca4d2f10b2e511fdb2661e3d08444a07db1782ad85c754fe808" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00284-of-01024.json.gz": { - "num_bytes": 396043261, - "checksum": "fea24050c6aec13eb706a6f3854b4debde62b1b842f2992fc027820c66218b0f" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00285-of-01024.json.gz": { - "num_bytes": 396961329, - "checksum": "6052f82887cd2362320f72f6545d2e5b5a775e9bef95783c9b9995ecb7a5ecc4" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00286-of-01024.json.gz": { - "num_bytes": 395697481, - "checksum": "f4361838b5b679c8306447364166c1c3083af392b4c8793399c122af09c7312a" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00287-of-01024.json.gz": { - "num_bytes": 398773520, - "checksum": "9add91f23f31ff8c5d8d84e6a0af75fc6fa08ceef8ccd9b633d8c49aa1d0104d" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00288-of-01024.json.gz": { - "num_bytes": 397684645, - "checksum": "64dc94555a122353c3a3c9999e67d17b0e4b682096ba80be2258c791ce1c2b9d" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00289-of-01024.json.gz": { - "num_bytes": 396655864, - "checksum": "2472c76b1cbcfc3cb82126795673126e8f532119a03722a304396ceee9b7db3a" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00290-of-01024.json.gz": { - "num_bytes": 397415313, - "checksum": "960b71edbdc6a6a62a0d3cc1069bbbfb11893cc017aba543e10c9a23cb759d1b" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00291-of-01024.json.gz": { - "num_bytes": 395617977, - "checksum": "96e582d7a750bee597331f373ec2e16d3a9686f48a49d39765d39550c8cbbad8" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00292-of-01024.json.gz": { - "num_bytes": 399332500, - "checksum": "cd6ec4941aa5babbe274684945bf899447ec2459b8f7076ec8c74d2b3fe794c5" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00293-of-01024.json.gz": { - "num_bytes": 397021546, - "checksum": "d0d0c4d80e75c5d02103b49027d9e2e6f7db74c12f8b53f600d7fe420b2d0a7a" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00294-of-01024.json.gz": { - "num_bytes": 396272726, - "checksum": "caf5708a6989f867ec6c4c56f338aca9f3a43a1806a27ef473d9b0f219001cb4" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00295-of-01024.json.gz": { - "num_bytes": 395233811, - "checksum": "a7b5f904e34c0b370238e6beb19149d4bb96d0cce43a1eca3bfaf181952ede53" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00296-of-01024.json.gz": { - "num_bytes": 396480926, - "checksum": "4fcf284d98c2f7b63e47573e9d084eeec2516fbfa62be42c3ff94e1cf518e313" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00297-of-01024.json.gz": { - "num_bytes": 398883718, - "checksum": "c1cb458076497e7dee645f50281d1af2fe5dad556d28a2cbbd73abe6537c8a9d" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00298-of-01024.json.gz": { - "num_bytes": 398733629, - "checksum": "4a612c715025292e62860fb0018e9fa2d3fade692342746d044be6297e25a034" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00299-of-01024.json.gz": { - "num_bytes": 398155026, - "checksum": "d33f4043fad9551f92084a45b7f54d920ded9d6fec271cbbf85f71b021f9ee4f" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00300-of-01024.json.gz": { - "num_bytes": 398612975, - "checksum": "61b1181b796a2f40db3cb6954f2890397c3722c486dccd4075d74679cf61a70c" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00301-of-01024.json.gz": { - "num_bytes": 395385748, - "checksum": "95a78e9d3cece0620430c85822fedf4021ebd88ece57d6714933c268d3b6af6c" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00302-of-01024.json.gz": { - "num_bytes": 397620059, - "checksum": "321aed402a5e779febe9766294ad040a3f8dcf57bae68648c03d3c59023aafa3" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00303-of-01024.json.gz": { - "num_bytes": 396549027, - "checksum": "4198f6a2b5bdaf90ac4251f013908123a5964429870ccd6b245a9069278c4e17" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00304-of-01024.json.gz": { - "num_bytes": 396596460, - "checksum": "74a6440e93d18d0d6d0622ab7d8832d7ccc91c03297faf20c8090d16f7c042d6" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00305-of-01024.json.gz": { - "num_bytes": 394881271, - "checksum": "654deec494bba4eece19c27140426049574cf529c93ccb422fcc09fe4496af15" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00306-of-01024.json.gz": { - "num_bytes": 397760377, - "checksum": "e0840cbc94db6cfc35df66d413a11261756392dd59b0fdf89d9ff166ec76f3e5" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00307-of-01024.json.gz": { - "num_bytes": 396671816, - "checksum": "31ceb8cfcd09fda621a9a483b09dfb43f5436e867363f6736ea3f710a6af10fa" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00308-of-01024.json.gz": { - "num_bytes": 395961013, - "checksum": "8c1e5acc3f964eaa5aff300731a74dde84ed0671cd764b121ea638fb08c3dd0b" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00309-of-01024.json.gz": { - "num_bytes": 396035179, - "checksum": "7d555942b1bcb2518aa5ff9c0549d98fabe7bb563cdc6c73d3f11e6a0bc502b4" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00310-of-01024.json.gz": { - "num_bytes": 397140669, - "checksum": "859eeb7a9d2ed03d5299bbf7f1c3e719236477950d7601112a458ea5a2adf7c9" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00311-of-01024.json.gz": { - "num_bytes": 398170419, - "checksum": "1e7661637b0a4445119ba403e4f8ede129c829fb7d1907ca7660870b536b8b29" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00312-of-01024.json.gz": { - "num_bytes": 395605627, - "checksum": "87a3ccd2ac9deff1ac4a5dd02bba269a48692d4598c5899630e8d2e4136dbb99" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00313-of-01024.json.gz": { - "num_bytes": 397081206, - "checksum": "c6952116cf573a6e20c849cf1b7d8d0edf3b9d00fc7e717e7bacde915c4c52a8" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00314-of-01024.json.gz": { - "num_bytes": 395555727, - "checksum": "762066fd85c596ee01b3b8070708517cc5759bb1e3c4bb65f4645fd62b550d13" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00315-of-01024.json.gz": { - "num_bytes": 397871218, - "checksum": "814f19cc5e81144f5bfd7037f5f522dd5c44faf150c10337c675174a5965a5b9" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00316-of-01024.json.gz": { - "num_bytes": 398577523, - "checksum": "27643c7c3c0a1a78c9003b936ea27785709a2df80d09817278a179eecaedc352" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00317-of-01024.json.gz": { - "num_bytes": 396388623, - "checksum": "5f840180e2017c41c6b1c865784788dc3b002478a9ecb43c3859174af788ba5b" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00318-of-01024.json.gz": { - "num_bytes": 396173471, - "checksum": "2aeab99fbc84a2640a05081e2c7438451e75f76cbece3cbe5d82e85463a61966" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00319-of-01024.json.gz": { - "num_bytes": 397912127, - "checksum": "fda805ed19f4b996b048386f4bd73924dc965a069e85b8b4452a54a1372375fb" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00320-of-01024.json.gz": { - "num_bytes": 398765416, - "checksum": "bce244d024c076911c1c6dbd35609be5442c8b0440690e2cbb342ac64bdc494b" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00321-of-01024.json.gz": { - "num_bytes": 396005962, - "checksum": "763584ee096223b8aeffb1576ec6e4f3bea674ec4de40fa163c2f2221b3701d9" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00322-of-01024.json.gz": { - "num_bytes": 398615672, - "checksum": "5c12ec1d0c450fb7515c586f24311bad145050dfc64180d65bacbd346c2ce9c4" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00323-of-01024.json.gz": { - "num_bytes": 397861187, - "checksum": "93326f43273fb963593e0b1caab1e9588387291c23d5c14b5ae40b46b199998c" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00324-of-01024.json.gz": { - "num_bytes": 396679008, - "checksum": "6ebfe6e28851e6d79cfdbf370602373fc2136e88936eece302ecaa8ef8251827" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00325-of-01024.json.gz": { - "num_bytes": 396358086, - "checksum": "51190fbfd48479842ec3c7d910b5519e01ff797ca0143c39be142c1650c5e893" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00326-of-01024.json.gz": { - "num_bytes": 396490692, - "checksum": "f4d9bbfd1bbc6e939fce9a2df26e45c79be73dbe2650fe79af395bdaa39cd121" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00327-of-01024.json.gz": { - "num_bytes": 398354656, - "checksum": "c70c824b6c16e5fad922ec9b8d363d97bed90501522b641b0eb0f66b8c086325" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00328-of-01024.json.gz": { - "num_bytes": 397326336, - "checksum": "7e6008433a0e5bc6eed28a13b9dba17246e7d65ca96c31092086c3546a3a397b" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00329-of-01024.json.gz": { - "num_bytes": 396390524, - "checksum": "f379d844a35172424554bb82a65c790c354b76c0e7abfd868225d1968017d1a5" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00330-of-01024.json.gz": { - "num_bytes": 398259199, - "checksum": "ea15be4a83c3de66c42410e13e5ef9c93baf86099a8eded1c1d10b0cd5ad0f29" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00331-of-01024.json.gz": { - "num_bytes": 397618860, - "checksum": "7b6aad6224ead9ee3a0c860cfd991301ef5e97093b23c76d713e73f4911d0e44" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00332-of-01024.json.gz": { - "num_bytes": 396743573, - "checksum": "bc5333d383020d2296aa0f6ec940ab586a367efe50d1c597f9db55ca72fa66e0" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00333-of-01024.json.gz": { - "num_bytes": 397460128, - "checksum": "095b3a85a9598009638622ca21cb00142efa0d68196c8c3a8bb922cccb465e8c" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00334-of-01024.json.gz": { - "num_bytes": 396900262, - "checksum": "6f005575f4843b84f4512e1b7c1b748edf497e4e9f55eaae47f9b4637161ccab" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00335-of-01024.json.gz": { - "num_bytes": 396106895, - "checksum": "66bfe399d0859f71c20db01de53ca7bf997b33afcd3d181f181d9f265a2c2fa2" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00336-of-01024.json.gz": { - "num_bytes": 397732616, - "checksum": "1f1e0435de870b98b119e91edd4a0d32d078dbb810f919a70b85360cd860f0cc" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00337-of-01024.json.gz": { - "num_bytes": 397834763, - "checksum": "1db4bcdaa6fca612c3f1b38dad6d5402679ca21aa6a545850d61bcda10103697" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00338-of-01024.json.gz": { - "num_bytes": 396712179, - "checksum": "810c104a8862699c490fc8625a7be4115872fe2de4d8c061e095dc5a81eb4d19" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00339-of-01024.json.gz": { - "num_bytes": 396838831, - "checksum": "9bbc616d5c4aba46475957a22544dbdb0557f8de31cdf919718fbfe55bc70ac8" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00340-of-01024.json.gz": { - "num_bytes": 395587861, - "checksum": "48c8411ee2b5fc8cffe1589ed204d0ac8a12b5b3bb1857373f84bae984d49e8b" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00341-of-01024.json.gz": { - "num_bytes": 398093153, - "checksum": "4ff8ba83e489580da2401aaa23ca3329befe8fc08b6f299b612950c358688604" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00342-of-01024.json.gz": { - "num_bytes": 397248009, - "checksum": "c72e063f95d10ce661b4bc97538eccf6da6ad493b7e54da555a46e4a47aabbed" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00343-of-01024.json.gz": { - "num_bytes": 395939409, - "checksum": "249eb2080c55402aab34a31a442b06bcaa25d2df3f4319ea1a5f50dc6bb709b0" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00344-of-01024.json.gz": { - "num_bytes": 397608807, - "checksum": "8cc57604fcc5fa920b0d16df6e8d8b7f4ca88c0c76c86f9ac81f42a615b330e7" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00345-of-01024.json.gz": { - "num_bytes": 395751274, - "checksum": "13fbc76e49a8b856f7563b945bef10d786a86caff63b4cebea50416ca34932ad" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00346-of-01024.json.gz": { - "num_bytes": 395516794, - "checksum": "61d43da2e3e7770016ba7235eaa74a1e6a180e64cd2cfacefed5c34e8b72eca7" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00347-of-01024.json.gz": { - "num_bytes": 396180000, - "checksum": "4a0ca2103de168d05d0090c8800d47f216cc167a9cfe9e736403aedf040c5e46" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00348-of-01024.json.gz": { - "num_bytes": 398461180, - "checksum": "a56396961496499ac289a85d126b916132e787d0dc4fbd9961aca7dbbc7cfcff" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00349-of-01024.json.gz": { - "num_bytes": 398049366, - "checksum": "ca012572c575f6a8e6ad6453296ff93f22118995c17928e76b655da44ce5810b" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00350-of-01024.json.gz": { - "num_bytes": 396532962, - "checksum": "bb35d17862201063b46d8745dc182756d1bb09e809c4c355452ab1967e655491" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00351-of-01024.json.gz": { - "num_bytes": 396576223, - "checksum": "19ea45ab2fe5487d2a69cca7c9a1db7a09c8d5dfdf130412bbcd241cc60a61c5" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00352-of-01024.json.gz": { - "num_bytes": 395956381, - "checksum": "bb5869b8649fffadd5f1945ca9a79588e84081a8fc45b7e4cb5507149b5be2d9" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00353-of-01024.json.gz": { - "num_bytes": 398903623, - "checksum": "cb16a7ecadd28a8b5622c4e581f463f0ae2fe20a3e6582fa6885d76e7523715a" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00354-of-01024.json.gz": { - "num_bytes": 397316693, - "checksum": "42aea18548695c458ddc229d8c837356845609aca3bb64ce6e07b185443b9468" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00355-of-01024.json.gz": { - "num_bytes": 396240550, - "checksum": "1577d76807548d83427293b9f534a3261fb72a345569f0491a1fd2691047bd92" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00356-of-01024.json.gz": { - "num_bytes": 396132315, - "checksum": "b6e17a39292e082e517082b23b381305ebe889c2530fb5eb74a2683d36d07a86" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00357-of-01024.json.gz": { - "num_bytes": 395948117, - "checksum": "524ebed10c881f52f155db5d6690806f5a97aa8f811deadae916323b50427ed5" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00358-of-01024.json.gz": { - "num_bytes": 397397242, - "checksum": "8e23d852bc3a0dda4684d5fd511003ad6f18232e5f54e32638c8db62e9d18c6b" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00359-of-01024.json.gz": { - "num_bytes": 396141321, - "checksum": "345c34dafbc59f5e93355c8b2e6fcde6bf59bc9e1ebbf5cb962d54228e6d3204" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00360-of-01024.json.gz": { - "num_bytes": 397258644, - "checksum": "51db06055d95e2b43fddebf8c2b7d76b7572745f129d89fe005f8e5d3f12b758" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00361-of-01024.json.gz": { - "num_bytes": 397913411, - "checksum": "2c0f6054fef084d3e7cd10e2de0b1d3a48dc716af1e9146548195df128bdaba9" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00362-of-01024.json.gz": { - "num_bytes": 397722576, - "checksum": "664b390b20498eb6e78fc09604b3a947fc1847a01e3eaae4c7861d1dde3b90fb" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00363-of-01024.json.gz": { - "num_bytes": 395416894, - "checksum": "c57529884c6d4977a279a097c0dfbcc31d52048cdcf64950182c743583d7989a" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00364-of-01024.json.gz": { - "num_bytes": 397028679, - "checksum": "ed4f252d63c679f6e3f35847e0871c3360e072b0d6963f662d7e808b6615457f" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00365-of-01024.json.gz": { - "num_bytes": 397574891, - "checksum": "68e8e44a531d98897245fee90ad349f4fdee891b2f68dfda78a1dedcc9474326" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00366-of-01024.json.gz": { - "num_bytes": 396905692, - "checksum": "9e88b888d85633671e009ed7093763b934a42054ed6a1252222dc64781a20e22" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00367-of-01024.json.gz": { - "num_bytes": 396802011, - "checksum": "2abaf3f3946788258b8543fa2ccccc0c20e6980b9d26a38decd356e67f575fa1" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00368-of-01024.json.gz": { - "num_bytes": 395630737, - "checksum": "b4960e3395d8a1bf8350f57e5f6280b00443a4c6b85e6fd47478fbbfc1733caf" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00369-of-01024.json.gz": { - "num_bytes": 396228047, - "checksum": "08e8210426e6c6ef9746675592a3eea4a92eff9aa4bb7ffc6bf6ba54bc411f72" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00370-of-01024.json.gz": { - "num_bytes": 396548482, - "checksum": "10e0305ac4d1e410d749637e0c03386d969563f8eb73bbbc376fc1d21025e4ee" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00371-of-01024.json.gz": { - "num_bytes": 397344482, - "checksum": "03df0f4aa5c377f6b45db3c3b863240bfb1211ddb226bc055433fbcd9ee8e873" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00372-of-01024.json.gz": { - "num_bytes": 395872223, - "checksum": "9b70549213cb01595179928cdb020daaf7bcd2085c5e947d111f3cc66e406d2c" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00373-of-01024.json.gz": { - "num_bytes": 397399096, - "checksum": "945c204cdb107669a8d1252a91323eb300c902bdd6c6a8167a90805ec02cba9b" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00374-of-01024.json.gz": { - "num_bytes": 397755002, - "checksum": "8353d4383f73caceb5d112f260b37d1349dc7898af2d05b98ffe17d22aea97ca" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00375-of-01024.json.gz": { - "num_bytes": 396534763, - "checksum": "a3de41388a6d8ce3b605c6586e47b74a565dd2f54175551987bda0a0ff95036f" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00376-of-01024.json.gz": { - "num_bytes": 395594630, - "checksum": "7cadf813f2b31a1bfe44fdfc84aef4eb65e889c2616c56b189890734c22b731f" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00377-of-01024.json.gz": { - "num_bytes": 398241040, - "checksum": "15df154b52cb4d9314dbc4ac26ca4b4df7125b12131d538fd480f8a6b3fbdfc8" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00378-of-01024.json.gz": { - "num_bytes": 397217224, - "checksum": "208ce680427f62d78dad857bee91122a79f968589b4e44f2f89919e91f4dea30" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00379-of-01024.json.gz": { - "num_bytes": 398504097, - "checksum": "0052fe7f27e720423b6143f401b8618428d913b22fc2af2950874785e2ef7528" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00380-of-01024.json.gz": { - "num_bytes": 397494149, - "checksum": "15c4f07a2629c7bd79b243c97367e3e18de02b5ab09eccc0f85b1eba0e0b071a" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00381-of-01024.json.gz": { - "num_bytes": 397190859, - "checksum": "77c71b4a79ac2f462040ea0e8408fdb8f719fac0f09fadb760ed00b709e9dea5" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00382-of-01024.json.gz": { - "num_bytes": 398126420, - "checksum": "aa44d029398c33f733065c489ab3ded9395f6e53263407173b6e9c27b6fb9c45" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00383-of-01024.json.gz": { - "num_bytes": 399108296, - "checksum": "f507161fbe96f8abe9dedccba2458448719e6b153bcc1256ecee6b4b9c82256e" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00384-of-01024.json.gz": { - "num_bytes": 396156787, - "checksum": "83c236bbc8508fb81992c837751a4d8ad4b9bc138dd1f4bb5c1fcc68203e12da" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00385-of-01024.json.gz": { - "num_bytes": 396878483, - "checksum": "df45b4749951a46695f88789fc536617ee3470083e55562292f606e09185e4a6" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00386-of-01024.json.gz": { - "num_bytes": 397495799, - "checksum": "a8240c9e7266e47bda8880e38ac8a5afa8541aed4b989d6642b31497716a51ac" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00387-of-01024.json.gz": { - "num_bytes": 397062301, - "checksum": "e6fd54ea6f17d5570fa4cc97554813a7a33bd4e44cbc456b27b0c87c1af22c60" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00388-of-01024.json.gz": { - "num_bytes": 397074091, - "checksum": "fdc2a134df4a669deb839f26947c86b7e7a4bc7596a6a1c25562cb97fbb6b089" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00389-of-01024.json.gz": { - "num_bytes": 397056868, - "checksum": "e7390f0007582a3460fa67375b2628c85a1aa85954796d8e6584fadcb35761cc" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00390-of-01024.json.gz": { - "num_bytes": 396404332, - "checksum": "820a97060abd3172852f38e1636706c8389adad8495de56f4c3a2c3ba6008235" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00391-of-01024.json.gz": { - "num_bytes": 397125489, - "checksum": "68732c5ab9f4b6945e79ce2a1b45b97a97822d6a107aa79aa9135f29d91173ab" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00392-of-01024.json.gz": { - "num_bytes": 394992472, - "checksum": "c9d1e8cfd481631a76544e5880ceee9990e7553c88c5978a91b48ec8aa47717d" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00393-of-01024.json.gz": { - "num_bytes": 394778146, - "checksum": "7a5ec4f0878f676a3ac2c417f512186066d793f28d611f97135c3626b3b60fdd" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00394-of-01024.json.gz": { - "num_bytes": 397024190, - "checksum": "44e32db5a39684ab1789cfe97b6e9cbd3c539390e7a4c8ec9298e7177945452b" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00395-of-01024.json.gz": { - "num_bytes": 396537190, - "checksum": "601ec281240753ac5793ec7cb83802a788c4d88e56dfd83e6c875cf2ef9bd8f1" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00396-of-01024.json.gz": { - "num_bytes": 398049705, - "checksum": "b1024b69e191b2c7073f5f4f3ea51e8710be54db8603ce8aaabbfb919ea6694d" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00397-of-01024.json.gz": { - "num_bytes": 396670567, - "checksum": "11357bc600f9b0c443f124c7fa4046d10cf03e19016e5ba8cdde884d2ff76c9b" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00398-of-01024.json.gz": { - "num_bytes": 394706629, - "checksum": "778eca6d845b9a7d49e22941b959a95e5e4d2d9714720f27b810230d136acfde" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00399-of-01024.json.gz": { - "num_bytes": 398257272, - "checksum": "27c2a30af83975d32469e85fb2e27953a3aa9f97514f621063325cb9af1829fa" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00400-of-01024.json.gz": { - "num_bytes": 398732278, - "checksum": "aff9a39748526a03d3476288cdbce122c3683baf113362e9085895609d03c3c8" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00401-of-01024.json.gz": { - "num_bytes": 396372632, - "checksum": "a6af262bb962eb1c45d2003ee1bb2be1a3a12cb3e53d4ffe58b4b68dd852957f" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00402-of-01024.json.gz": { - "num_bytes": 396783625, - "checksum": "db9aca12012da21fc5a0619a47e9c3075959786d6d6d74f6a244af1cb33c402d" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00403-of-01024.json.gz": { - "num_bytes": 396950960, - "checksum": "b3566f7b9251f6aea9343d1344151f10fc104464f92e8f10a97742defffc2244" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00404-of-01024.json.gz": { - "num_bytes": 398481154, - "checksum": "897904040b5887620b9996cf89656f5bff329a430a8c3dfd6802d0c879675376" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00405-of-01024.json.gz": { - "num_bytes": 396065216, - "checksum": "45e0108549ab06d9a8ad5c45dc53250798d0e58f7e940080a754106801250009" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00406-of-01024.json.gz": { - "num_bytes": 395637879, - "checksum": "bda70f3a19b19e2ffdd1c3a26b959945b447acd450cab49e72ce727d2218af5f" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00407-of-01024.json.gz": { - "num_bytes": 398356109, - "checksum": "1df9e8b4715d9a3f02a0b06aef6095f81d38acd1be0b4fa402acaac0258c3116" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00408-of-01024.json.gz": { - "num_bytes": 396041456, - "checksum": "e89ebf354280543204e78f4308a8f8751cc26094524628cd8e9cb691d9911b82" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00409-of-01024.json.gz": { - "num_bytes": 396254329, - "checksum": "15729474174d6a5adb5935f25afa6de2f03a8dd2f73b780e23795ede92f5762d" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00410-of-01024.json.gz": { - "num_bytes": 397850848, - "checksum": "98f1b8fc845e0005b76d7eac70a430ce98e6989569344ea92266f8391b1396fe" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00411-of-01024.json.gz": { - "num_bytes": 395527322, - "checksum": "52b2e31f2adb61c8e703c6758016cbfc650f8104dcd5f78867c81434be155ea6" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00412-of-01024.json.gz": { - "num_bytes": 396155992, - "checksum": "7b6b4192f9bec4fdeaf9d6dcabd9cbba6b4c8ebb42d26730fea21bad139823c0" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00413-of-01024.json.gz": { - "num_bytes": 395766377, - "checksum": "775d1fac6b1708ba0384d922640b2f372b3ee146fc79fbe692ff69a7c6c699b1" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00414-of-01024.json.gz": { - "num_bytes": 394860848, - "checksum": "0386d8a8e0cc9d5d613b1f84085791de57ad05751d94d25681d86dff5cec1afb" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00415-of-01024.json.gz": { - "num_bytes": 397566065, - "checksum": "1957b0d185943b1952dc66e78f0a7d449f49f8f55fc0978bf77e8dde10f4714d" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00416-of-01024.json.gz": { - "num_bytes": 396297306, - "checksum": "3f8796934edb79d172e682511a5ed7666aa09ff541ce55e2c66406bdb6eeda9d" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00417-of-01024.json.gz": { - "num_bytes": 398314475, - "checksum": "8da08075b966c04aa7859275eefd34c78cd2b9edc366684733d027ad6d619ba7" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00418-of-01024.json.gz": { - "num_bytes": 396296110, - "checksum": "efe43733ebfc7b65c646aee68b883cf40124c1446a28e70ff2bfa9e1bb1377cc" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00419-of-01024.json.gz": { - "num_bytes": 397614415, - "checksum": "c0f02d78715de9c3ea0c684dad36a506386081fed2011ec298ca0ee623c7792e" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00420-of-01024.json.gz": { - "num_bytes": 395133656, - "checksum": "6237f5797a35dcdd89a0b70cac4dedcfb3fe418560f8dbbf6cad685f11c870b2" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00421-of-01024.json.gz": { - "num_bytes": 397061849, - "checksum": "ee37899a6a49269026633ec79577491ff4b11e219e0236dcba68eb168279067b" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00422-of-01024.json.gz": { - "num_bytes": 396539584, - "checksum": "e5914a4b97c27da82eaee2f4f67a165de946bb38a00d6126b1527f5eb1200417" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00423-of-01024.json.gz": { - "num_bytes": 397715346, - "checksum": "b99e628f8790a7baa8ee7828e31f2ec72374f9a8390c1d64c9b8092b10d9c7fe" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00424-of-01024.json.gz": { - "num_bytes": 396335469, - "checksum": "9cb3b9eb00760bb68f3df4b66b96f1e5798c338231500472fd64c49cd87c6599" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00425-of-01024.json.gz": { - "num_bytes": 396714466, - "checksum": "f28d4901ccde8eb7afcede9732ab94fd18c49e0e3731659ef587058d6ea2ab28" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00426-of-01024.json.gz": { - "num_bytes": 395566563, - "checksum": "9ab75a89a425ce974fd36e936476a30db913c2d7c9ca6e5522b91ffbcbbe30cf" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00427-of-01024.json.gz": { - "num_bytes": 395379035, - "checksum": "5e1ca658bea5ba5506afbb9ae5a5da4d35cdc3a215478c68e11652a7d5d918f5" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00428-of-01024.json.gz": { - "num_bytes": 396419259, - "checksum": "d740b37b576bcde0e1c8eee27c3bfb3b58c1a0d3c5b471001804b2a37f277ac9" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00429-of-01024.json.gz": { - "num_bytes": 397116774, - "checksum": "d1c10b0ba72aa2d4cb4640d1263c32868190942b1e93b4bb4e9798e25f10ba67" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00430-of-01024.json.gz": { - "num_bytes": 396634586, - "checksum": "11dec038b4c1c35d32d000915812b6ec8da9abbbec2e15f7493551198b6a1ef3" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00431-of-01024.json.gz": { - "num_bytes": 396704705, - "checksum": "efdfdef444cf68fc05090107033ffe2ac906b6efe2fc138e90f47cd4bd0b6204" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00432-of-01024.json.gz": { - "num_bytes": 396264701, - "checksum": "fa649c2e2dbc992408c3a60327e5d5ace4697c84010446bb286e544eb6c604be" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00433-of-01024.json.gz": { - "num_bytes": 396887722, - "checksum": "3d5fd3fbf209dfff2057143a3dcf7eceeccb1e85967a9a85a992f465e3522335" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00434-of-01024.json.gz": { - "num_bytes": 398856291, - "checksum": "ab6dc5343b052da901f4671c1cb3173850fbc6bbfac2623ca14936b2b83d9667" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00435-of-01024.json.gz": { - "num_bytes": 395888569, - "checksum": "26abd1e2263af02f998705501bd02ead2edc3d7f68fadc7b198e7fcf4dffc454" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00436-of-01024.json.gz": { - "num_bytes": 396976077, - "checksum": "a5dadf6ec93e8dcd62b0e1de3cb03c866147bafe0da8e631341663ccc03bb801" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00437-of-01024.json.gz": { - "num_bytes": 395809168, - "checksum": "7f98e98270f9b88570b5e498511ee65d07428db604af349ef9107dbcf65ac4e5" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00438-of-01024.json.gz": { - "num_bytes": 399136723, - "checksum": "0e03ec507b90b38d5b6d7dfe27d40e127efdc9a0bae349bea2e743375ea29b9d" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00439-of-01024.json.gz": { - "num_bytes": 396435416, - "checksum": "5f868ba66ea32a23be4a926fda0a86d0d2ab4948326e1ebac615fa16a2a6864d" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00440-of-01024.json.gz": { - "num_bytes": 397487165, - "checksum": "d30005787e7472313982cf2860e0a0764900b82a7bf616da27e6c1c3298eb215" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00441-of-01024.json.gz": { - "num_bytes": 395968030, - "checksum": "181461b447d88040130c3348ae7d22f220e0f97ace030d6f54301a9a3d483fc7" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00442-of-01024.json.gz": { - "num_bytes": 396909150, - "checksum": "0854cd3454047e0c6a0746ef21e0cbbb22fbdf4349c2e668f4fa1e49add183c1" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00443-of-01024.json.gz": { - "num_bytes": 396271897, - "checksum": "2493db29dd3cadef3719576c34213496eff807df5ae8cf538f13e84d403fec77" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00444-of-01024.json.gz": { - "num_bytes": 395540084, - "checksum": "5e717d9e0c1b6f728df0f206e422a0958a537dddf31fffa4d699e5bf4b3c2b16" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00445-of-01024.json.gz": { - "num_bytes": 398750991, - "checksum": "b8af9d413da48fb5f9a9174b12ad253b2eb2c1ed7709cab710d66710841568e3" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00446-of-01024.json.gz": { - "num_bytes": 397575547, - "checksum": "2bad5a914cb9f2e5e99d76afbf85eef66c18e7c1cf2e11c5d455792ae86ab441" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00447-of-01024.json.gz": { - "num_bytes": 398035036, - "checksum": "d834925674a33ed5eb8fcb335fd81b95e4ab882010e434e3fb9323e0f23be2bc" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00448-of-01024.json.gz": { - "num_bytes": 398658613, - "checksum": "16f3ac40180e47b9b97998f5d1d7c0e9336e2fee5612a3397fd161937f7a2b07" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00449-of-01024.json.gz": { - "num_bytes": 397934476, - "checksum": "09dd3d5a529f62b10d1ec97f37ed142315190fb437be3f50987ee955b11f7672" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00450-of-01024.json.gz": { - "num_bytes": 396444119, - "checksum": "8a25c11e0adc5fdf50944767fbfbf01a9c35b3c0e07205c7c06288d1f68b4c10" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00451-of-01024.json.gz": { - "num_bytes": 395963541, - "checksum": "f3ac2e295ca4b3ca1f55c8b500ea2588f1519163cec381297ad4bef390fbbe1c" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00452-of-01024.json.gz": { - "num_bytes": 396594911, - "checksum": "25a57709e934077c2972f0f8a1a9db7afe9b7558ab023bd6ee5224b2f8cd770a" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00453-of-01024.json.gz": { - "num_bytes": 396745507, - "checksum": "75c1a4803bb58efe5df885bccd13596d46dd1f3ea30899a7e83812167b990bde" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00454-of-01024.json.gz": { - "num_bytes": 396193342, - "checksum": "c151679573ea5f5b52e26e8b50da7e14760d1ec15c63a5b864b648190efd48f4" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00455-of-01024.json.gz": { - "num_bytes": 398096160, - "checksum": "7f86270b13ee4133adaa06de809f26ef581229407813fca05db521d9d36880dd" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00456-of-01024.json.gz": { - "num_bytes": 398965570, - "checksum": "d5b292189c5d318e0ad622eec1e764993084d0477147f51f29acd637935fec5c" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00457-of-01024.json.gz": { - "num_bytes": 396672892, - "checksum": "8b490f615b3ed701390ed671d5645dec4aa3fc576a032da8f9d434087c1eb8c0" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00458-of-01024.json.gz": { - "num_bytes": 396911580, - "checksum": "8bcadc16baaa4e36fe17ffc0862c264230385e18bbd861671ad5fd8cbb86404d" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00459-of-01024.json.gz": { - "num_bytes": 395969213, - "checksum": "b8ff8371a01d7bd1782044058ee0f53d4d1275ebca0870ba16104c1c4b12f07c" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00460-of-01024.json.gz": { - "num_bytes": 396928338, - "checksum": "23dde1fe55277467d6d2385684b71e90e9066e6a3c349a1da30a1487e87c8539" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00461-of-01024.json.gz": { - "num_bytes": 400009637, - "checksum": "34b98d46d207c5b6ea7416fab6f3cfcb1444cdc19376464ae9abb9296fd14c3b" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00462-of-01024.json.gz": { - "num_bytes": 398107677, - "checksum": "2031735c0f38ce43e37a5bb1b9728fc37c758fc4af71758c3d3b9535716a3253" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00463-of-01024.json.gz": { - "num_bytes": 395503017, - "checksum": "7820184904183fad9a61b6c638df9de11d4624bb3aca08885b842255172cecee" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00464-of-01024.json.gz": { - "num_bytes": 397493281, - "checksum": "b39b1b1e6686014a3c62e74912ec3b915dfc161b62e2d1108410354e6dec760a" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00465-of-01024.json.gz": { - "num_bytes": 397080149, - "checksum": "a65cc7f590cc498da334d5a8653e818421e09e5e6ce2e8bc2a29ac67a02c3d43" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00466-of-01024.json.gz": { - "num_bytes": 396633690, - "checksum": "15d891873ba02923893cbc8c42adc0468bb39161f898a810037cc2e9f82e0796" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00467-of-01024.json.gz": { - "num_bytes": 395045117, - "checksum": "711686ff5478ec35ccaaf1549b7a33b941e322585f702257dfe2d31630245ba9" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00468-of-01024.json.gz": { - "num_bytes": 399486439, - "checksum": "59c4599c8610f4c54778daedbb358f5e26fa527f8f94c3364b70565ebc90571e" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00469-of-01024.json.gz": { - "num_bytes": 396170105, - "checksum": "4263dbb03135c2d8b16fb323208f98fe1a1ff1223e76a7ba085f881411a0ab95" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00470-of-01024.json.gz": { - "num_bytes": 397479432, - "checksum": "2db90de8f4d2bde9af453478ed4667166f636af701bb487095311f99b28e59bd" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00471-of-01024.json.gz": { - "num_bytes": 396679096, - "checksum": "caea3c4744adb89f006d9b0d9ef93241a55c1fc165cb0cd62b6d07fa3a40cdc0" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00472-of-01024.json.gz": { - "num_bytes": 397080237, - "checksum": "34995676d953f4c95f8bd4f54fba8f92b86189cd73298ab77ee2702611b86e5e" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00473-of-01024.json.gz": { - "num_bytes": 397881706, - "checksum": "c0fc6c68ae509d8273e7ca0efbe24f1452a57dcb000f44f550fe9600fd305e62" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00474-of-01024.json.gz": { - "num_bytes": 397705270, - "checksum": "50aeb620f8c03a2e4f2346a0c79a4509adfae084ffbeff0b86d8892b858a821d" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00475-of-01024.json.gz": { - "num_bytes": 397201717, - "checksum": "4fa508d23abd417bdb0b0e7a61f9aedfb770609214cd85b10b4bde7ced7f12b4" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00476-of-01024.json.gz": { - "num_bytes": 397522775, - "checksum": "27da6164865687041e4f53d9ecec2edc877b147da5b424acbac2c69480132a08" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00477-of-01024.json.gz": { - "num_bytes": 397323156, - "checksum": "e40115fc4901a3930494652ce9ee7abb0c3f41abc6d6c58c81fa75a0ee752db8" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00478-of-01024.json.gz": { - "num_bytes": 397380721, - "checksum": "79a16b7016aed0eec375ca383eb316765687f12421f786b2e133faa5690ef197" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00479-of-01024.json.gz": { - "num_bytes": 396828680, - "checksum": "08185ce3c3e5b01552be7d8f08ed5b27a6b1b121bb2d7d70a78b7074fee02fa3" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00480-of-01024.json.gz": { - "num_bytes": 398678311, - "checksum": "37a5804dafb2f4aff9e393af5b127c3577ab8a5dd23f1e41f2304b25a4c428a6" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00481-of-01024.json.gz": { - "num_bytes": 397654112, - "checksum": "47ce12535b753d8936ce3b569675e76cb6f638bfb74a93caf201f3ffc409d71a" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00482-of-01024.json.gz": { - "num_bytes": 396387301, - "checksum": "1d07828a199bb1e1c0c8342ba99e484093557188370d1ced90803c2615d24b7b" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00483-of-01024.json.gz": { - "num_bytes": 397178863, - "checksum": "b6499612fac654798010e11c27ee8a25fc05d1dbed8aaf2338fd0ea377dc4732" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00484-of-01024.json.gz": { - "num_bytes": 395826769, - "checksum": "ce197ad5a226249bbba53c34b9f3c83508b542853748c3094a5b98befb537f2d" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00485-of-01024.json.gz": { - "num_bytes": 397100006, - "checksum": "f483044a4a0418b695e0b989f0fd03bfa79df01b649991f2356443bcb29d0820" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00486-of-01024.json.gz": { - "num_bytes": 397658615, - "checksum": "297beef7b85dc128a6a58d834c5fd1b24bd7fe84c7a317500461720c742235f1" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00487-of-01024.json.gz": { - "num_bytes": 396904673, - "checksum": "06751938694fad1645ed575208e8e2c1efebb7165b4feb2d0ea871dc348741f8" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00488-of-01024.json.gz": { - "num_bytes": 398019631, - "checksum": "eb58bf8b011fedf15835841317e445e9e757c9939b4453a013233f020f98a697" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00489-of-01024.json.gz": { - "num_bytes": 395822836, - "checksum": "b339e33e7affbdaf691852d3668ff79adf8476a3c33eb86ad9f4ad4a6ebbf3dc" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00490-of-01024.json.gz": { - "num_bytes": 398410737, - "checksum": "4d8356cf804474538772c5520e77e75ac750dce3e6b103c9feab49ccd46a58ff" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00491-of-01024.json.gz": { - "num_bytes": 396607853, - "checksum": "1757097fb884d03aa288a05870016b1c2b9f1700ac5913d85c9821cf2e367702" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00492-of-01024.json.gz": { - "num_bytes": 397612443, - "checksum": "92e98e431a378e0402d81299c49209c66d39b0ba7ae63711f8d6ecf542f5fdf7" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00493-of-01024.json.gz": { - "num_bytes": 395595466, - "checksum": "d839e1763aa6ebc7cbcf1b870d947ba45b0b4ac95b0adbe4941a0b121690a311" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00494-of-01024.json.gz": { - "num_bytes": 400397068, - "checksum": "31caeb5f0ef694c06ce434df44c01f4a91fcd48e4acb4f1bf167eae6e59a02de" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00495-of-01024.json.gz": { - "num_bytes": 396458630, - "checksum": "26291dfcae5145cdc306317ecf95851a3f693b4a7c6e132e55384ec69d85ef3c" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00496-of-01024.json.gz": { - "num_bytes": 395037560, - "checksum": "b32344b92f81006ad9e2e471f5ef8133e87924c5150145b13d51c3d7a0f68c46" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00497-of-01024.json.gz": { - "num_bytes": 396247929, - "checksum": "0396f0bb16b06ff130e955f260233ec868ada1daef6e8cbd480ce388628d49b9" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00498-of-01024.json.gz": { - "num_bytes": 394798084, - "checksum": "28d43d4e7bbce4e20167741ea2bbc3f17981aa51f9c040cfc41c522e732c6d32" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00499-of-01024.json.gz": { - "num_bytes": 396699883, - "checksum": "c6f6deff919b375fb08c74e159c25aa66362e4cddb0700f9b1e0e2701293ae70" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00500-of-01024.json.gz": { - "num_bytes": 397014521, - "checksum": "7ee22957fdfad0880f132f47860612331afce7a48975b9312233ba8ddf537bed" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00501-of-01024.json.gz": { - "num_bytes": 399063718, - "checksum": "ec94186b620037002819cd40347e6aaf67cb847848483790cd687222c9addbbf" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00502-of-01024.json.gz": { - "num_bytes": 396938850, - "checksum": "a218de10cee75c4bb5a7102fbe208e6e65142ba5f960ecdc2b56b6f85fa30840" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00503-of-01024.json.gz": { - "num_bytes": 394631309, - "checksum": "8189de9454986f63253fa1ad44c63d5c2f692ff4bc3a848c7c2fd02e08f4e1b9" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00504-of-01024.json.gz": { - "num_bytes": 397884411, - "checksum": "b7b268545c27573840bf8a6abb7361c209f92f9b5f0f8028fffd49b0c773854b" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00505-of-01024.json.gz": { - "num_bytes": 395784113, - "checksum": "b9f1610be9f045c15e43a7343bd2918743a71585a7122a4e781533dd39a73132" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00506-of-01024.json.gz": { - "num_bytes": 397939195, - "checksum": "f07b77d1be71c5922321e8683140f9a63a90903f1fbd1515d908807e12fc4597" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00507-of-01024.json.gz": { - "num_bytes": 395925741, - "checksum": "23e9927e9e83fd03e9d99c3fac05f1bf63d6c296a2b02d1aa208798d27d8dc1c" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00508-of-01024.json.gz": { - "num_bytes": 397426015, - "checksum": "f4b8a74c610cea50a6b144337f65fcfed11fff21df6683503f25d4b82e29a4e4" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00509-of-01024.json.gz": { - "num_bytes": 399072341, - "checksum": "c3069ae9658273cbaeaed1730f171837c8d3042e31d1093cf0f519f601309a41" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00510-of-01024.json.gz": { - "num_bytes": 395859781, - "checksum": "e5863648f64423397ca1a7838df18aeddbb3d5d3a2551321fd99a480508fa86f" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00511-of-01024.json.gz": { - "num_bytes": 396948832, - "checksum": "a2209ec05a794f083cf163c102c6ddd8d5e5627674686950e17e586128a81e60" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00512-of-01024.json.gz": { - "num_bytes": 396585426, - "checksum": "1c6fdb002dab490e6ddd7fe6023b2124bb944b7ebe95ee3b7faca9a92f4b5de3" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00513-of-01024.json.gz": { - "num_bytes": 396789970, - "checksum": "83b02c0cf9ffea9d021adc102269c30a33ab3a803d331ba8d39aaa9b3b7acb43" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00514-of-01024.json.gz": { - "num_bytes": 397131474, - "checksum": "783f25460641cd3532c3bb3920c7d3f0c68b5e674d44cba33b1ed755608cf8ba" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00515-of-01024.json.gz": { - "num_bytes": 396127068, - "checksum": "61e5b9947f77d929442f23fe84465d88044631aa1eb6438a0b86372cba7286fa" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00516-of-01024.json.gz": { - "num_bytes": 397526020, - "checksum": "539b032f528d1ec3a8e8420514ef2118f05482297b052f6d28876a8bf776a080" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00517-of-01024.json.gz": { - "num_bytes": 397748661, - "checksum": "03b85a51aa7bcde672cc017fcbb0f11976cbd1447fc0ccb4f4bc822b2b04b27b" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00518-of-01024.json.gz": { - "num_bytes": 397915751, - "checksum": "80dec6dc7d15459c113c16f23978c38cdc1157ca18468d8a00e0d2192bb2ffd9" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00519-of-01024.json.gz": { - "num_bytes": 397847480, - "checksum": "7125e7915fd03c6312cfe448e4e7a8629249765c13d8558b17c240c2aef713b4" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00520-of-01024.json.gz": { - "num_bytes": 396232144, - "checksum": "27974f9766c18fd0b652c94eafa3493243c8e1b25b6e850e857ab6246b193b48" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00521-of-01024.json.gz": { - "num_bytes": 395111538, - "checksum": "61406e92a8f9a6ab800b3dd25cbac842e3487a4c7db7b1bb2070a41d627367a0" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00522-of-01024.json.gz": { - "num_bytes": 397690206, - "checksum": "b2e29801d120132a5fbbd3662a54290e46ff5e178b3146ebfc2169facf72e7e4" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00523-of-01024.json.gz": { - "num_bytes": 398274007, - "checksum": "79905dbc45756c9f1c225120709d39cbf3caf435e322a531a4add690a1d0440c" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00524-of-01024.json.gz": { - "num_bytes": 395689218, - "checksum": "1dc3086cb869abb13862970186f6a77cb29b687cd49518173f639c148d937f6b" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00525-of-01024.json.gz": { - "num_bytes": 397979085, - "checksum": "6958bbc6029c00229fb0059d016a6b7a2bd21cfdc69392893423d2657c35c7c5" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00526-of-01024.json.gz": { - "num_bytes": 398473877, - "checksum": "895f42c4e7569f0db3832af13e56499f65fff74e93fc0cdf60c1c4b4b08881c9" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00527-of-01024.json.gz": { - "num_bytes": 395879939, - "checksum": "e84e72048b56878b1ff904ee83d92c208e15b16663b99a9d763edc23c2e0e55f" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00528-of-01024.json.gz": { - "num_bytes": 396472889, - "checksum": "badcc3cda339c61936591e9333787ea032c42d7ff2288fdaff791bdc8504ce96" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00529-of-01024.json.gz": { - "num_bytes": 396983038, - "checksum": "ad20643f9d50c7c508fa136ceed0039ce39708e0e7a5e743c1981f1000bc3c4e" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00530-of-01024.json.gz": { - "num_bytes": 395774249, - "checksum": "9453fa3fd296150b436f0146171ea8317512c6735ee9434622a83765a5d9e310" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00531-of-01024.json.gz": { - "num_bytes": 396171120, - "checksum": "3e3c230ab6beda13e4dd4747c7c6291e57b1ccb4a96ac2edb46ffdb4c3cb05b5" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00532-of-01024.json.gz": { - "num_bytes": 396200411, - "checksum": "e9b52c3dad233fd1c4310cf5f76c2e6d0788ed084abcf931f99ab7002976d75b" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00533-of-01024.json.gz": { - "num_bytes": 395580851, - "checksum": "e135cc4420d9f4d17ab523f7db8c559021a46a9a6bcdd21a6c4075047465906e" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00534-of-01024.json.gz": { - "num_bytes": 397459281, - "checksum": "bb4f32ee1c1bedf4582b0f4f9ec7644be73fa25bf18cca7506e3c26e98818bad" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00535-of-01024.json.gz": { - "num_bytes": 397344480, - "checksum": "3766ddf8313c5cee08a575fa96bdde06a5b293f1964e58293ea583d72bd18e20" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00536-of-01024.json.gz": { - "num_bytes": 396588089, - "checksum": "56d236a4250f9488d80b93c0c005962d018da256ea5632c7e16ae26c54188749" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00537-of-01024.json.gz": { - "num_bytes": 397606873, - "checksum": "d7ec24ef99de2769937b89e0ca7e291eca2bd0438d501d9228d5ab035f49d83e" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00538-of-01024.json.gz": { - "num_bytes": 397608864, - "checksum": "1a60378a0f1a200b11f85577bbd0f373ae47022eab16fad53da492ca1ed35bfd" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00539-of-01024.json.gz": { - "num_bytes": 398377669, - "checksum": "787d263107eb09e852b015c17d1d0f54d8b93e78292c0c1e60cf99f27535c608" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00540-of-01024.json.gz": { - "num_bytes": 398516980, - "checksum": "dce03ef0813ef66e27df8730da7e341b49bf7e684bffd3a9cf700905501d1d72" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00541-of-01024.json.gz": { - "num_bytes": 395557685, - "checksum": "e4035222d65124bd3e33372b76b65c2dad9e696701607ceeb5968d483595645c" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00542-of-01024.json.gz": { - "num_bytes": 395725875, - "checksum": "4e7ae0b1c0c4d514e0208e21336d095fea5970475077d6690a917faadb2b72b4" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00543-of-01024.json.gz": { - "num_bytes": 397625187, - "checksum": "a96ac467b6ace74a08f7dbc4bb8e3fc57fae36abc8975d6b60a7b7353ca9ca88" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00544-of-01024.json.gz": { - "num_bytes": 397078230, - "checksum": "337470c84cde5d02bc6a89003a6796de9e63db269e7800637ef2d220d75bd3ae" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00545-of-01024.json.gz": { - "num_bytes": 396145060, - "checksum": "da65d66aa4cfff77c754f8017eedd92cb82494b9425c2d5c5491d64603b2231e" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00546-of-01024.json.gz": { - "num_bytes": 396093007, - "checksum": "399f7b70d1c1b45ce315f396d5fa0db2c69e41c522b0514e19bcc6802b953b1f" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00547-of-01024.json.gz": { - "num_bytes": 397457696, - "checksum": "47fc8fd82271e6b1fb074512da45dc005e22cb7f0aca3b7b621ea87613aeff9b" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00548-of-01024.json.gz": { - "num_bytes": 396246097, - "checksum": "3108770b39746852d7c048d9a8777722480505bbf4592732c7d1f231e2505c55" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00549-of-01024.json.gz": { - "num_bytes": 393096516, - "checksum": "9bb2b88775593afe4060349985ff4417a37f1ba9b4ef33399c58644c01a92b89" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00550-of-01024.json.gz": { - "num_bytes": 396631619, - "checksum": "cbb55d645d145ecc2ff9b96524463f82d5548c0bdf42381fc6faaad256e7ead7" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00551-of-01024.json.gz": { - "num_bytes": 396806780, - "checksum": "ece03d7f12daa39473b6b8d5faed08a3f751efb9b1ee99f69c5188633d4a0f43" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00552-of-01024.json.gz": { - "num_bytes": 398608968, - "checksum": "7fbbde9c39d67d8d7f9f16c0848188b743c6ff5bc44e6339d5fd88c32e1aafef" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00553-of-01024.json.gz": { - "num_bytes": 397696672, - "checksum": "85f9c5c5fbcfd06f715b520a1a3a63a014b1831d2f65de5f02cfea49a18ddf63" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00554-of-01024.json.gz": { - "num_bytes": 397122204, - "checksum": "78e3d43c3d2b71d8483788a085cd5706648767de7a2fc4aab707d6a05257ff00" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00555-of-01024.json.gz": { - "num_bytes": 398704893, - "checksum": "113e5fd99ada6ca96c086487b6e4012bad711d1d482d580e22d3af5b9d118572" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00556-of-01024.json.gz": { - "num_bytes": 398099675, - "checksum": "c7a816f8f2f74b4554ac17ffc41e67ebbcabb7c8b0c94292b4569bea372bea3d" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00557-of-01024.json.gz": { - "num_bytes": 396538561, - "checksum": "7af6d2c9886481a0d393e026739b5ad7d0fc358ecc216d2fc124160402d4b50a" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00558-of-01024.json.gz": { - "num_bytes": 397660839, - "checksum": "c1033428189671d4e1ba55c822040f307748c6ec31b80be3e4ed8e7a4325066b" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00559-of-01024.json.gz": { - "num_bytes": 398754128, - "checksum": "69c9f88840166363f2b7ddaef05ac9d10441fd184d8451abfde76eb105572342" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00560-of-01024.json.gz": { - "num_bytes": 394988981, - "checksum": "a2dc4fc315a0db8f1a868d631d2941ab2806f44c2ae698e94bb7e8308bd67c70" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00561-of-01024.json.gz": { - "num_bytes": 395801300, - "checksum": "dc1b2b4594e3fc7f8795f7649d1c524405edce56d617f1e214692565de8c8937" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00562-of-01024.json.gz": { - "num_bytes": 398322250, - "checksum": "c23404fef6a6b5b887cc2dddfe341e983939ae36078d62842919a3739c96b43a" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00563-of-01024.json.gz": { - "num_bytes": 397584845, - "checksum": "c909fe429772c8198f904496ea6cf239d669c6c787889cefcb7623e08a988db0" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00564-of-01024.json.gz": { - "num_bytes": 396436964, - "checksum": "8e7cb1863057a3b9929af4da29b4e1cca1f71c254f5eba91a657d9e8c1fd6dea" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00565-of-01024.json.gz": { - "num_bytes": 396486039, - "checksum": "23ba56e78c4edc4d58fd7fbfcf784b29037204a641e43a9894c95c68bdb982fc" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00566-of-01024.json.gz": { - "num_bytes": 395358745, - "checksum": "71259a300ff096b49e3461c91824a8185037ca85ef2018dff2617f335ab304b6" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00567-of-01024.json.gz": { - "num_bytes": 396405726, - "checksum": "d9b56ed523376681dd81cb9831727467461bdfb87c80d3932937338370093033" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00568-of-01024.json.gz": { - "num_bytes": 397509797, - "checksum": "c650aad13a48d5b0c51162ad19c9eb3135559d0a3318dba701a90e8138a8cd24" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00569-of-01024.json.gz": { - "num_bytes": 396514261, - "checksum": "d71e4126c2deffae8ee55077cee9dd2b70ce27adec767bce06e02afb23b42416" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00570-of-01024.json.gz": { - "num_bytes": 397072833, - "checksum": "519a32e1bdf7f5b97e1a438242a79218317e04e44021dc61aa65c526d35ce8ed" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00571-of-01024.json.gz": { - "num_bytes": 397170114, - "checksum": "919a9659156cafb26b87190fc00b9d33c4fd536dd35544cbef8e5ddc018ae365" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00572-of-01024.json.gz": { - "num_bytes": 396475017, - "checksum": "3d7e4e548f01c9ad5fc99b4342cbf9a9004737058dd93aae8b7d95b2c00856bf" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00573-of-01024.json.gz": { - "num_bytes": 396749955, - "checksum": "032f8e37328c9f0fc046e5a6ff5a79cbb744f3100c4cbea78e397c449471bb10" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00574-of-01024.json.gz": { - "num_bytes": 396036505, - "checksum": "8e795341527712be32a69307ce8cbd2d6195c6b2fea596d326a279734505198e" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00575-of-01024.json.gz": { - "num_bytes": 396722381, - "checksum": "45a43576cfc61842bde146eaa566b4f22a128c3c2eb8f30c59a6b6cae4bcd4e7" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00576-of-01024.json.gz": { - "num_bytes": 396163377, - "checksum": "38429d2d6176ee42ddd495e052c01735a9a7f0076cde107d24a0a9c7a26bf2a1" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00577-of-01024.json.gz": { - "num_bytes": 396813305, - "checksum": "eae77c319bba236feaffc9f74eaa38e911fa48eb06f4794c9b1a6d17edab91a7" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00578-of-01024.json.gz": { - "num_bytes": 397797226, - "checksum": "1dd2b3d7e99fde8903bc12625568ec4fc6fe653737b3af5e9c71432e311cf5f0" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00579-of-01024.json.gz": { - "num_bytes": 396012631, - "checksum": "d9322e66701b4ada3788b91a07e87b03af6c91eb4cfaaefee23c0330987a1840" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00580-of-01024.json.gz": { - "num_bytes": 397943129, - "checksum": "23deb32e1b0f07a55a5cf1572cb8e313ce716c748a07f58bd90cbae97290d0a0" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00581-of-01024.json.gz": { - "num_bytes": 397614648, - "checksum": "6193f8b848c7930fc04b9f2429dbccf36f1b291271b3eaf646c655433bf3ff9f" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00582-of-01024.json.gz": { - "num_bytes": 396659280, - "checksum": "40997ef02c7040356cd1c5acd8e6a5121e00b31253713cad4f529ab2922affc9" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00583-of-01024.json.gz": { - "num_bytes": 397686445, - "checksum": "5cd21271e4ae036f8d1e0c320330a6c93a8b1ffbb9293a80c56c2d7f123f9ee7" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00584-of-01024.json.gz": { - "num_bytes": 395500815, - "checksum": "c25befb7c735b2340b092a04375d2109c1b876d2b0057dd8d4ed4beac87118ad" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00585-of-01024.json.gz": { - "num_bytes": 398413461, - "checksum": "073f632e95c218fdf17274fc21915c94f56bdfbb58a6b1a0550de249ce4d2129" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00586-of-01024.json.gz": { - "num_bytes": 396849745, - "checksum": "647cbe9bd7709c0d8a01485096fd88ad0fc09b27de324eae141a8d841536b71b" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00587-of-01024.json.gz": { - "num_bytes": 398567154, - "checksum": "557af97a8d2b2656149bc25ee5b362116d173e6a48911b860ec10d512b4b763d" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00588-of-01024.json.gz": { - "num_bytes": 398086388, - "checksum": "9e9afa15ee3534e497c9fc7c8cd967388183193dade3d1ec82a8e2b0e82c5118" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00589-of-01024.json.gz": { - "num_bytes": 397335823, - "checksum": "ed8a1d0b9c55f465b5d4a4e5ea022f6d17aaa8b82569be7cfec55629c1bf26c6" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00590-of-01024.json.gz": { - "num_bytes": 394931693, - "checksum": "3fbe539fcf64f0d914c19b383de9953b0605d4a69f48801145f0db1972f9c6b6" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00591-of-01024.json.gz": { - "num_bytes": 397828770, - "checksum": "9165de8866384d3d03c3876c39c96706e33a24b9f95acc09999c2dbfb85cd9cf" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00592-of-01024.json.gz": { - "num_bytes": 398782493, - "checksum": "433a9cb730d7ab024b56ad662a3ea53633f7ff26c625051c4c02f252beeb87a6" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00593-of-01024.json.gz": { - "num_bytes": 399264489, - "checksum": "4a7e5f40aa8b692cfa0519d33a868e9a05e579ad430204bc13c48b533eadc5ce" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00594-of-01024.json.gz": { - "num_bytes": 396629833, - "checksum": "521d5e90550dbc97ab26a18a0b75da81e38ce2083ff5fd93340fded2e54e1ca1" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00595-of-01024.json.gz": { - "num_bytes": 396916313, - "checksum": "30c9be1d99ce0a41b214fdbd5115988c82ca317d4aceb30c19fbca05e0a409e0" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00596-of-01024.json.gz": { - "num_bytes": 397013253, - "checksum": "b16bd9d7d893b4a71056575fa0799bef96120c03cfc6e2a88c292469a67f2614" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00597-of-01024.json.gz": { - "num_bytes": 395980036, - "checksum": "3bd15089b6fff342df2b3109d7ebadca35cead4f44ca5b1b55e55d8892aab82f" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00598-of-01024.json.gz": { - "num_bytes": 396295935, - "checksum": "6252d951a9570baea9767cf3350a6d09ac5a5fc34ba80eae3b5c40adb8361ab9" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00599-of-01024.json.gz": { - "num_bytes": 398608239, - "checksum": "b265a385cdd5e64d1fb2ffce739e72f2fe2cc8944621f20e2084dc52b91cdd9d" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00600-of-01024.json.gz": { - "num_bytes": 396563743, - "checksum": "43d12028cbe738e8f450911f6a55dcb00f8742cefc2a2c4da5f9e9220b0572c1" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00601-of-01024.json.gz": { - "num_bytes": 398256993, - "checksum": "9368dcfc581e6d572d899ef25b129bc0268901a2fa009500174a0985bcf330df" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00602-of-01024.json.gz": { - "num_bytes": 396202546, - "checksum": "3cc57d7afd161fcd411f73da8369d98db4c6d8e30643ee01450adef21e8ea3ea" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00603-of-01024.json.gz": { - "num_bytes": 396338425, - "checksum": "cc21fc5b8ed6e5115bd8924954d685ed52cd5b773ab63d37188343443c95851a" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00604-of-01024.json.gz": { - "num_bytes": 397597307, - "checksum": "d24f6d807ae35037e695e19917ed446f74448166fa464c862e31fe7ba2bea196" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00605-of-01024.json.gz": { - "num_bytes": 398278313, - "checksum": "99166183c752aed8d0f2cc9c010f1ebdd4fb93d40e936fd6c082eb3542baa956" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00606-of-01024.json.gz": { - "num_bytes": 396590468, - "checksum": "657ce79340c15524a5897459a6cf712fa4127def2445f7eb3de21c9b46db3794" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00607-of-01024.json.gz": { - "num_bytes": 396603228, - "checksum": "3705441435f18d1e4aeea9e794e1216fcd29b48213763a554808e3d3697951a6" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00608-of-01024.json.gz": { - "num_bytes": 397280580, - "checksum": "be0bef2c16e9bdd0387276402dc99fe5a9a0a7a105a44e88bdb783139f2de474" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00609-of-01024.json.gz": { - "num_bytes": 398284528, - "checksum": "3a7c7a8cb01f6d7589152a1483682a5fa99e119490f3e70d8a02f582f2e2b19c" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00610-of-01024.json.gz": { - "num_bytes": 398872039, - "checksum": "c349aac5b64227397ec2870992ac9e4fac9fe39f1fd4e0a7b8c727e171655e14" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00611-of-01024.json.gz": { - "num_bytes": 398736440, - "checksum": "63ca5eb2d27632b3b4dde8e40f9925e71e21ef737262bcda7a99324a67e0fab5" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00612-of-01024.json.gz": { - "num_bytes": 395170895, - "checksum": "3b4bb3e14ee981a9edb9828ce40b86b5d83dfafcc1a5e0e02642cb40924bd6ed" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00613-of-01024.json.gz": { - "num_bytes": 398443337, - "checksum": "e95adbd7d55024b7e62145860f217a6f04f5fcef79ac23e92dd9e14f9a0b2a30" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00614-of-01024.json.gz": { - "num_bytes": 398854661, - "checksum": "def8cb789f8f79fa169e855816c5e4bc7d5c253e565502691a9abb826d7436d4" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00615-of-01024.json.gz": { - "num_bytes": 395505189, - "checksum": "6775ca6aa4f834289396a438906b90936ed0ff6390213dac2b0861f40d7761e7" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00616-of-01024.json.gz": { - "num_bytes": 398999454, - "checksum": "6cd5efddacb09cc80ec1eb79f93b562044787903b3cb1c879be2acec64a9dbdb" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00617-of-01024.json.gz": { - "num_bytes": 398570431, - "checksum": "26d1f587377446e8b1499be7a3b6776d437baa40353fb04c591203a420eb0cc2" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00618-of-01024.json.gz": { - "num_bytes": 397064982, - "checksum": "e59a87fd1cd3d87fff4b15c3a9331521d7587ac7f4a7fd51ec3906b484ef9ad0" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00619-of-01024.json.gz": { - "num_bytes": 396676338, - "checksum": "8077c3a15d93579d0fbf00bd9d117bf4f50092c5be3acf46c7d4433ef7be9dfc" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00620-of-01024.json.gz": { - "num_bytes": 398186471, - "checksum": "ee3fb91d7797ebf1daf8dcb81563b7dae7b161d97732efd35e3eb6ebea732ee2" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00621-of-01024.json.gz": { - "num_bytes": 396467968, - "checksum": "386adb83129a7306ef4da37c1cbedc39b3971e7633d516d406a982f307577e67" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00622-of-01024.json.gz": { - "num_bytes": 398293882, - "checksum": "b708cad0e04c56174d0feec84d7224a4490cb8db023d38e57398cad89b78568f" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00623-of-01024.json.gz": { - "num_bytes": 397396780, - "checksum": "c50c4568c6f103b3e6a3702cbd915ecb530df954df808156bc38a98f36a0b944" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00624-of-01024.json.gz": { - "num_bytes": 396971282, - "checksum": "11351ef83c9fb883d6c0f484af5c10f0d686b7ac4a2f08fae9ac3d9837df0a0b" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00625-of-01024.json.gz": { - "num_bytes": 395882440, - "checksum": "dfa97ea7949c9bbf7af43d43ac5c8d0034bdbd1ad572895159b7c7846ab89676" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00626-of-01024.json.gz": { - "num_bytes": 398292846, - "checksum": "fbc9c23dc286ad6fd7f01f344de97ef5789733af581de278488869bd36f3b246" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00627-of-01024.json.gz": { - "num_bytes": 399890427, - "checksum": "f43bbde36b8bd34ed9998b99b42c85434b8bbc8bbaa1cf5b38cec6393099c23f" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00628-of-01024.json.gz": { - "num_bytes": 399589466, - "checksum": "c50058a4937912b678d33d34ff91e2287e8701365f4f71fce61f9002652556cf" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00629-of-01024.json.gz": { - "num_bytes": 397355095, - "checksum": "051c4631d0587b6f65827410ad2f2121c05c849a009274415bc5e7f72db42d44" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00630-of-01024.json.gz": { - "num_bytes": 397860559, - "checksum": "07b48a86a8a3245fe5b78f6943c8970c839942b8d86abf173507225b0d1520d0" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00631-of-01024.json.gz": { - "num_bytes": 396161304, - "checksum": "70a03f0308105de5266c4a40803b51f99888b362b71409719b7f71f73761b590" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00632-of-01024.json.gz": { - "num_bytes": 395620184, - "checksum": "c6923984c419f08bb4e6effc27dd25dd986513034338debc9b238592dad9f607" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00633-of-01024.json.gz": { - "num_bytes": 397572527, - "checksum": "900fc701703234031e825a1eb2d11b364f1dda97eb0c7943e17ef278695f7bea" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00634-of-01024.json.gz": { - "num_bytes": 396215174, - "checksum": "0cc838e395581933123fc57c6690afbdd2be1b67d213336d9b8c08b3876f8458" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00635-of-01024.json.gz": { - "num_bytes": 399176005, - "checksum": "5a3daa1bd0be8c997da56257f063a7d1c7b2b271648a46615b26ca4beeb42863" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00636-of-01024.json.gz": { - "num_bytes": 396035356, - "checksum": "9d21ce1c8b5a7c1330cc95b1f45286fb8578d5dcec0686724ff6e25a97f38a7e" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00637-of-01024.json.gz": { - "num_bytes": 397214839, - "checksum": "83cd34e1ba09c268b515fda7699e12bfa2531fb7e60e2f861946ffdc01e54a04" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00638-of-01024.json.gz": { - "num_bytes": 396292535, - "checksum": "82a7bae9a7d35fa707bcb6d90f7b244f1509e112dfdbd604c9be1f8b8ce7150b" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00639-of-01024.json.gz": { - "num_bytes": 398009954, - "checksum": "b6d7ebd102c67960413caf5fcdc5b4aea728b6d3d6369ab8dd3cd6bee6c769de" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00640-of-01024.json.gz": { - "num_bytes": 397558496, - "checksum": "151c55d019fd84fdc0eab73d24984e5d88ac964c86f89a361a03dc776a22b5b4" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00641-of-01024.json.gz": { - "num_bytes": 398031508, - "checksum": "e0e87304a8ac408adca2badf2564ec52caf155295ea303a121c30f3b1ce797b7" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00642-of-01024.json.gz": { - "num_bytes": 396594124, - "checksum": "73d08c99b6b96d96b82d88267b2a392a7dda2084ba5142b8eefd0d23212702d5" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00643-of-01024.json.gz": { - "num_bytes": 394552252, - "checksum": "ebccf3b935d63c30f626d317af250b6bd0f04ef5e1cced829287ba64fbb0d25f" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00644-of-01024.json.gz": { - "num_bytes": 397586341, - "checksum": "674c0965a9a880c057b6f2dbb785a4a6ae048954d44ba4f5266dd5e65095d06e" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00645-of-01024.json.gz": { - "num_bytes": 397950976, - "checksum": "7ac8d4dacd682a2977818f01d860c3dfa5a5e5a78f7d2d95be0353a675452e93" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00646-of-01024.json.gz": { - "num_bytes": 397511840, - "checksum": "452a9cc03facf9151552f914f9a8a3507a96fd8ea40f7d04951a29ecbf6aa1e5" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00647-of-01024.json.gz": { - "num_bytes": 396692070, - "checksum": "5a795a238203444596c711bcedc634e653e5240c9a800a9884c51f878340b494" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00648-of-01024.json.gz": { - "num_bytes": 392707626, - "checksum": "9cc366c37950624df6af318ee52a97d32a40e278fcb519cbe8545b04bee3204e" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00649-of-01024.json.gz": { - "num_bytes": 396283284, - "checksum": "4ddeec31a30b5c563838b17e1115ad30041e08c70a94f299ea324ee4b71fd82b" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00650-of-01024.json.gz": { - "num_bytes": 396349662, - "checksum": "f5bc63114ec9d73d6cea7f8e38a95031ae2bcde849b27440afd840a3e72aac13" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00651-of-01024.json.gz": { - "num_bytes": 397187042, - "checksum": "7199c0242b2654509af187c9c8bbfc22cc5067aafa1ff69949b1f0e5b718425b" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00652-of-01024.json.gz": { - "num_bytes": 396263026, - "checksum": "c9e62b6df7213ea5b71913fbf736403f33c51e5a868bf1035cebcc39d80635bb" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00653-of-01024.json.gz": { - "num_bytes": 398689010, - "checksum": "f3bcc9eca4d71043e920db6399a032f916c23b1da329d2ef86434a74f8e7b318" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00654-of-01024.json.gz": { - "num_bytes": 396938678, - "checksum": "fb41df26e1f68e1e9d12ae8740535ca66e80910320be2270d680fec40d6fe9a7" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00655-of-01024.json.gz": { - "num_bytes": 395995226, - "checksum": "018b40ddf6d88c4c346c8018439d16f6ca66ee0720970e84ddc34b1010ae35d7" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00656-of-01024.json.gz": { - "num_bytes": 397860049, - "checksum": "8f3847e9bb5a8145e2959b340f86cc06f85e6646f32d5d785c5c90ec11a9f404" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00657-of-01024.json.gz": { - "num_bytes": 397142407, - "checksum": "a1ae8735a39bd099dac2e50c22e312f1a010f2644774ef53c995f3437c0a5524" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00658-of-01024.json.gz": { - "num_bytes": 397827609, - "checksum": "f6154377cfff2453392fb899f81514a7c0ffd40dbc35d8842d61a115d0aeef35" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00659-of-01024.json.gz": { - "num_bytes": 396861858, - "checksum": "4299633524667921549573c469a73e33abae89d107375d5ccc6a6d987c2a2a26" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00660-of-01024.json.gz": { - "num_bytes": 397773823, - "checksum": "44eaf6c1739d8a9c13c54750c473ac04aaf9d2223d8893cd8094f1769b1f6f8c" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00661-of-01024.json.gz": { - "num_bytes": 396311257, - "checksum": "18edb60444b660c7cc68dbe59ac71989be0e20ff13639725a5f05e4d4d512514" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00662-of-01024.json.gz": { - "num_bytes": 396176936, - "checksum": "7b60541181fbb92f361fbdf0bee80d086c75279610aab792a7b3877d49a3e1bb" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00663-of-01024.json.gz": { - "num_bytes": 396274985, - "checksum": "59e057ee5f5e8c7267138c18c5c88f3ca24d30f86c484e4bb0c0a4eb5169c4a4" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00664-of-01024.json.gz": { - "num_bytes": 397483935, - "checksum": "585f45d3ac3f88c3bf1c86e01daa46537f8f5c5165521412de0e67393cb6da33" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00665-of-01024.json.gz": { - "num_bytes": 398831104, - "checksum": "e403d2f4ff6e74abc9639749f93f77cc868453908c10821fea7fafdbcc981a06" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00666-of-01024.json.gz": { - "num_bytes": 397668116, - "checksum": "f9bbafa396a466b24630a259a01804b2857c1dde2fa3cec60b2967a88ad9f528" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00667-of-01024.json.gz": { - "num_bytes": 398123165, - "checksum": "ed693d5ecb9dfcaf545e831b5769b877e927125794cae61a0ec7821c3c85dfe6" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00668-of-01024.json.gz": { - "num_bytes": 398152096, - "checksum": "51c33c07d503743704f564bc6a372c2f6f8f13a1ddd00b0b9a2c44c94cc57444" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00669-of-01024.json.gz": { - "num_bytes": 397927981, - "checksum": "d356b5268ba39e38ffccd20e95803f3218407e0a1ca3b4d1165ff82796ec1bae" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00670-of-01024.json.gz": { - "num_bytes": 399074605, - "checksum": "bb96ea8154ae01275a9197709820e670c4e6212c740e92a7f1cfb7c618a49bea" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00671-of-01024.json.gz": { - "num_bytes": 397864381, - "checksum": "afca3dbcaefdc368e996259fd595b77fd98a885ec005a93069a01b83227c827b" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00672-of-01024.json.gz": { - "num_bytes": 396077133, - "checksum": "3da96ebd1b28b55b03bbab8e85f78295cffdad9020f869cb456da27058ffa090" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00673-of-01024.json.gz": { - "num_bytes": 396943842, - "checksum": "6a4c344a8af68a95e20d58b64fff8fe616c2a406cf26f642cdfea65fce5883d1" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00674-of-01024.json.gz": { - "num_bytes": 396975969, - "checksum": "e6b0f7727d78143fa180abb76e617b37660b35f6323f19bf1dcbc78fb9374508" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00675-of-01024.json.gz": { - "num_bytes": 396692800, - "checksum": "e4ed97b19c6d83e618a3fcaff75460d828ca419b1e62842a1493b0ec4c9703e5" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00676-of-01024.json.gz": { - "num_bytes": 396514400, - "checksum": "a5672f1561ab85f071395de43e702791aaacff77a9f67f6ec9e14b12aba675b2" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00677-of-01024.json.gz": { - "num_bytes": 395939125, - "checksum": "3dacd3bb90b5e645d1b9a962d8df87f571b0fcf227996068535bb98a68f9191d" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00678-of-01024.json.gz": { - "num_bytes": 397022852, - "checksum": "c1a0ef31342161369b7fb709be17e3c86191c1a52cb04b704fc58190818302c3" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00679-of-01024.json.gz": { - "num_bytes": 398325372, - "checksum": "47ddd1056ad977407f61b2eac3ff803d17b1aa8fa0719279bf911caf49bbb7c8" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00680-of-01024.json.gz": { - "num_bytes": 395502228, - "checksum": "cbb93f322d684ed558cbf8d92b9f83958ba772fe4177093a334b4596343f3cd4" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00681-of-01024.json.gz": { - "num_bytes": 397981781, - "checksum": "9ec2dec493733846a1ec9f68ff5130cd461d7ab9c07b22d4aae94463bcf03146" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00682-of-01024.json.gz": { - "num_bytes": 395265758, - "checksum": "7731cb9a2898c730a650e5d1b358886ed562228928aefe55d991cfaaa61a9a99" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00683-of-01024.json.gz": { - "num_bytes": 398783283, - "checksum": "6f2bb48070e809ac17fc90e1117d63bd8c7cd0079d9e44c9f262c4ce60f5d373" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00684-of-01024.json.gz": { - "num_bytes": 396160769, - "checksum": "fd07413637b97b68cb3a7a6cb86c4656017b7841728e806485ae196294e79f8c" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00685-of-01024.json.gz": { - "num_bytes": 395594461, - "checksum": "939925a9169da729891fbeef926f420b80bcc60e0f170bcf9a2095449a22d424" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00686-of-01024.json.gz": { - "num_bytes": 398275260, - "checksum": "13836c45719ba10f2d581cf17cdab1daa4cc207a49db2b4786b451605842ac4b" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00687-of-01024.json.gz": { - "num_bytes": 395256765, - "checksum": "0c0d0e6c1e3cb9a024c184a8510066a005c031a15af74d117d0e736a358a91d0" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00688-of-01024.json.gz": { - "num_bytes": 396635904, - "checksum": "2462e084563f8b8de68c6e826289949ff8ebf8cfaf323344c07ab93e56373539" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00689-of-01024.json.gz": { - "num_bytes": 397749444, - "checksum": "d03746220f3374c80102ed39d8f6ae0daec40fc1b23312c08ecdee82a65ac6df" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00690-of-01024.json.gz": { - "num_bytes": 399380060, - "checksum": "217d032ecce8d0b7e448befe83aa051a3bfab8cb0e167d043b6abc833f5e9b4a" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00691-of-01024.json.gz": { - "num_bytes": 396975651, - "checksum": "354fe9bc07aefc55cbbf8752f53ad69d45761da928bc8deb6fee1de9e244e93e" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00692-of-01024.json.gz": { - "num_bytes": 399720848, - "checksum": "21f88940b6cbceefd66ea5e8d466467806370ae24a5833ca308cd840daf5ff8d" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00693-of-01024.json.gz": { - "num_bytes": 396787846, - "checksum": "c8d28980ffa1eff4459d2fbf0043a1f8eeaf840a3b1d1ea4989b2192c7a82041" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00694-of-01024.json.gz": { - "num_bytes": 397945967, - "checksum": "1936570da24c4bab9fe0559826f1cc509c4ab6eb3679e26d697efa6e7e5c8a81" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00695-of-01024.json.gz": { - "num_bytes": 396349049, - "checksum": "8e497506f84513272a8a0694e7d4efb004b1e3b515887e3b5762f59b6c659dc3" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00696-of-01024.json.gz": { - "num_bytes": 394901418, - "checksum": "9e1d6cc187ff67ee734bbadc6cbd57eae05634a448edfde184fa8d6fc3259836" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00697-of-01024.json.gz": { - "num_bytes": 399142528, - "checksum": "9584496113a8612620748aaba35e185b8f47b7c96b4ff0dc7bfdd6024a3faa14" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00698-of-01024.json.gz": { - "num_bytes": 395923784, - "checksum": "83a3c57b3870ed9beeaf3ec8ab694e0be458106f3128b14b2a44a036e89d32b1" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00699-of-01024.json.gz": { - "num_bytes": 397137494, - "checksum": "0befea64fe749d79592e337bc359bcef70ca8816d0126ebf89d4b8fbfbdcbec6" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00700-of-01024.json.gz": { - "num_bytes": 396554785, - "checksum": "34739b543636aeadb6dcce3e7c97ca49026cc9897c13add6b592fe60e5c40338" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00701-of-01024.json.gz": { - "num_bytes": 398091188, - "checksum": "c9bcc7c9e91de707ee548e67452d6970af2e19bef91f966b19fa71504e5305fc" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00702-of-01024.json.gz": { - "num_bytes": 396039798, - "checksum": "fcda5f8ddc5ed163db84aa70c565f8181731af9a29918a2ece0436d3146d7125" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00703-of-01024.json.gz": { - "num_bytes": 396889704, - "checksum": "c80445d442a766d2e87ecf5804e87bf7f8b23c2238476fc2b51f657400739306" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00704-of-01024.json.gz": { - "num_bytes": 399465260, - "checksum": "0bb73674d579523fcbe079fbea7190138911711f023404ae46ea7b685fc09c73" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00705-of-01024.json.gz": { - "num_bytes": 398579507, - "checksum": "97d6fd9cea2a47913c6ee9d1e34c3440858f25f3d670cc81c8f83f2346fce6e2" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00706-of-01024.json.gz": { - "num_bytes": 398761590, - "checksum": "2f4836001b8b80066ae09b6e385ed0048770c13ba2410e0f0309ab4b9200e37d" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00707-of-01024.json.gz": { - "num_bytes": 395576626, - "checksum": "8e0c0c635a7a7c32d4fdb1a7906ee95a9f334a55b2ff3881cdc7d5e816a9c817" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00708-of-01024.json.gz": { - "num_bytes": 395930921, - "checksum": "e6978b92f333230972e2b4c31cb86b5286fb899948c7680c7a9cbe75a9d60296" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00709-of-01024.json.gz": { - "num_bytes": 395734676, - "checksum": "13071a3527071f06570c6cfa485073f2f3980c83cac782db6bf66a75dd865df3" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00710-of-01024.json.gz": { - "num_bytes": 396501107, - "checksum": "6562cb3675a42a58b8c8b2a232043adf532fe49420e30c3c237a6d8889a8de30" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00711-of-01024.json.gz": { - "num_bytes": 398422179, - "checksum": "f38b59c4739d3c15e5bf5dbc0965d1a5dcc0f49a3c89eb7a6822003aaa1ae7c3" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00712-of-01024.json.gz": { - "num_bytes": 395905103, - "checksum": "500b4914f3c42d5e24ced7d36dbd3143c49e4fd5dfc3d53a172d1a55ae738889" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00713-of-01024.json.gz": { - "num_bytes": 396009909, - "checksum": "4f50bfa762db1435a89195fd180615e9f569c1668e128d343c87c40ac5cf60ef" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00714-of-01024.json.gz": { - "num_bytes": 396963447, - "checksum": "fd9eea7dfb93916a3798a8b69d29fb5d4bf0fec448b8a24427f729e7a41205e8" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00715-of-01024.json.gz": { - "num_bytes": 397474378, - "checksum": "3c61bcf6f24e21d2584bb4ae008230540d9a375e35f3c4ba1668621b80d85c5d" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00716-of-01024.json.gz": { - "num_bytes": 396285471, - "checksum": "c554e562a369d9696219ea8b0e363907c50f626d7c410a26515e07de801da74a" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00717-of-01024.json.gz": { - "num_bytes": 394827995, - "checksum": "f8b4678c21d93c19d50cb576f0910050d24dfd606238bbf8013c45f98defda12" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00718-of-01024.json.gz": { - "num_bytes": 395517823, - "checksum": "1bf63affd6914d98e197b6e1ce526cae7754ecdc750184154d3cb8e3bdd21a9d" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00719-of-01024.json.gz": { - "num_bytes": 395561934, - "checksum": "c04b162d984ff2ada9f39aa6c0fac04a1531fbde05175f856d2e3ca2797a448a" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00720-of-01024.json.gz": { - "num_bytes": 396227762, - "checksum": "25da2ac7c1f3cbc361807f67e8826ffa95f4caa25f81f66832cbd0a08f1a51f5" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00721-of-01024.json.gz": { - "num_bytes": 397716450, - "checksum": "28180c6396deaf34e2a197f5cad1b53ba1c9532db8b5c21dd7d81332b2793181" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00722-of-01024.json.gz": { - "num_bytes": 398022279, - "checksum": "9c3a8038a7f9431b90f67ea0d3b77353d0508b09865f49af575b6aaf5e32d6b7" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00723-of-01024.json.gz": { - "num_bytes": 398064523, - "checksum": "4b18959f604bd5f379a73b52947261cb8d63f2243f5afeb5807a13669ef4a800" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00724-of-01024.json.gz": { - "num_bytes": 394747045, - "checksum": "615f13a1b2a6942931519b7a7f6aba286f6045aad65b041c2c6643ce906de1a6" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00725-of-01024.json.gz": { - "num_bytes": 396726374, - "checksum": "4099a416eccbb56818efda68bd027c993c1a5fa1a8e722bc268041fd3f804cfb" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00726-of-01024.json.gz": { - "num_bytes": 397361407, - "checksum": "152d5e2bad0de3b6b48fb26066891b160ea79c4c382ce6aec6047196e3b08ef6" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00727-of-01024.json.gz": { - "num_bytes": 395542925, - "checksum": "ce1d46b0cd7d9e4075db3feab71d2f72939817ebf45819e73ec277c9cc07307b" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00728-of-01024.json.gz": { - "num_bytes": 396647931, - "checksum": "c859626b14584c1bab396c867ad5eb11ff3af39628206b03612ee2d2b3058497" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00729-of-01024.json.gz": { - "num_bytes": 398272080, - "checksum": "758fbdc5bf6d66a36d69d31141742b2a917bf0341494b844f22ab82cd54e7ead" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00730-of-01024.json.gz": { - "num_bytes": 395977662, - "checksum": "56a7fcb59ece26d4b19be0bd5e6c2d0f05e4b1b23e8ce7b4fab064a29b229c02" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00731-of-01024.json.gz": { - "num_bytes": 397530948, - "checksum": "bf0f4dc8796a737daf80b977a6e3656cb1e244fc40d6df92852da45e53e6cfdd" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00732-of-01024.json.gz": { - "num_bytes": 398314575, - "checksum": "1862bcc85d48f59283eae56836e5598f20287ce36a185252abb24bcfbd1377cc" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00733-of-01024.json.gz": { - "num_bytes": 398547748, - "checksum": "476389cb582df3c214f3f5a45268bdb47b581a432c08723bd811daa5f5990083" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00734-of-01024.json.gz": { - "num_bytes": 397380175, - "checksum": "2b6fd36a8f8bc3edfcd8a486de44d2f3132f7b8f4bb2d4c93453dbf1a1b6667a" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00735-of-01024.json.gz": { - "num_bytes": 399584382, - "checksum": "3e0a067fef0b40edcd23ce6680efc07253660b8c00699630bb7629b9d803a198" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00736-of-01024.json.gz": { - "num_bytes": 395312038, - "checksum": "e4f92413c837d269481ecc0b5d0fc87548bd2ae718ef7f9bff18674ece289bc7" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00737-of-01024.json.gz": { - "num_bytes": 396820243, - "checksum": "e61680c57505f027ef8cbd28a45e706936befa2ab40a24a63e638019a1717b63" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00738-of-01024.json.gz": { - "num_bytes": 397691872, - "checksum": "d3acc0c9c76ef2df89f49896744dac53f488f830d3d42f0c481f2321ed60fa67" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00739-of-01024.json.gz": { - "num_bytes": 397912166, - "checksum": "18d281ed9831f28c4c54256a844ab2cff7a5b681da1b7c8eab2565b106381aa9" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00740-of-01024.json.gz": { - "num_bytes": 397093867, - "checksum": "6a65230910384587f5e7f34b52c2a6d9a86a8b1f7a23d26f890b6e810c051815" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00741-of-01024.json.gz": { - "num_bytes": 396371058, - "checksum": "26eb40e98075ab716b4edec76d1723a679e648258d6812119b46f7522dfa9b07" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00742-of-01024.json.gz": { - "num_bytes": 398346941, - "checksum": "466043ec98eb806916806cff7495f0bae89cfeb2835204ea34328030b92a27f2" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00743-of-01024.json.gz": { - "num_bytes": 397366055, - "checksum": "d98d31aaadf95dd0d1cf0548db515c8e77c95bbc4b611ae9ab5650429c171889" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00744-of-01024.json.gz": { - "num_bytes": 398722902, - "checksum": "a43c80ab3bd8d12d12b4ea41d9054b90214fd3ea2ef957f317d6ed6fa7b60e34" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00745-of-01024.json.gz": { - "num_bytes": 397562514, - "checksum": "1e6dad94e0f90bfa0fdc5557c58873aaa95fa9ce1c7b70a1fe76817289cff78b" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00746-of-01024.json.gz": { - "num_bytes": 397731351, - "checksum": "21fefd6cffa9032c9ca7cec91cd775c83bbd37419ae236eeec9589f8bc4be0dc" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00747-of-01024.json.gz": { - "num_bytes": 397781450, - "checksum": "b84c74bf1caecf92777fb85129bb009eb3a27fbab1b97af567f36a8bf100e704" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00748-of-01024.json.gz": { - "num_bytes": 397425031, - "checksum": "fe9bb225f6d03b44e552ec985c844e5012e90c4ad99f699ec4ed4297db91349d" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00749-of-01024.json.gz": { - "num_bytes": 397925850, - "checksum": "3913b2955fee02e2ba716d843559bc4bf4e85a2884ae4495446a379f857a30e1" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00750-of-01024.json.gz": { - "num_bytes": 397089489, - "checksum": "773486144d3008cb3207c3c8b65fe6081c9e64dda09728d3586bc82e6bb73fca" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00751-of-01024.json.gz": { - "num_bytes": 394819424, - "checksum": "d728b117a7b74150b03ed7d562514c2e45ccc03b0bceb120eddfa8333166a923" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00752-of-01024.json.gz": { - "num_bytes": 397199683, - "checksum": "6c10c3f4e3737db6a70375bd605139de61ae8b09a1aa91dd1cfdb82c183f0cb3" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00753-of-01024.json.gz": { - "num_bytes": 399197199, - "checksum": "101c4ed5426b586a4aeeb7dbd377306eae9eec2eaf934e79d25583abff70b15b" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00754-of-01024.json.gz": { - "num_bytes": 396415619, - "checksum": "732f4dedcf1266bcabf15a6a1cdead617ea37d428d8cfbccb5a9dd7521133075" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00755-of-01024.json.gz": { - "num_bytes": 394564662, - "checksum": "a23f1bb1de23554efff68e730d85802a6491936fb54e256744af641f97ec155b" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00756-of-01024.json.gz": { - "num_bytes": 395577258, - "checksum": "2f4275994a103dca517d4eb3656009c8138930079e00303c7b8746ab6094fd19" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00757-of-01024.json.gz": { - "num_bytes": 397161772, - "checksum": "ab16360173283b22a7e19d181fbf55a6a8d07f0d9007b51aa159c1e81661f5e1" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00758-of-01024.json.gz": { - "num_bytes": 397545456, - "checksum": "ff5a6292bc557aa9895de39697e8aea5843fa5a00c83c7983eaa36640d446ecf" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00759-of-01024.json.gz": { - "num_bytes": 395470957, - "checksum": "66a64accfa6c281d2bdfa7b6846397f56c2d4f8a22ae8925a07af853e42f5521" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00760-of-01024.json.gz": { - "num_bytes": 397328304, - "checksum": "46778c90bcc6da96cf02e66956a1bcabcb9a95bad538cfc0d5190db473a278a9" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00761-of-01024.json.gz": { - "num_bytes": 397706141, - "checksum": "4825f25d6e1d13c70e6e65ce13ccd7b1922344c48ee2806952f3ba1b6e26d3ae" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00762-of-01024.json.gz": { - "num_bytes": 396983663, - "checksum": "25e1645f05d342b5f872ca809b36d516c7336c22035bfa86cf295d0865e08789" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00763-of-01024.json.gz": { - "num_bytes": 396355038, - "checksum": "d4c3a92808f0bfb042423cd4166abc57d20603ef07a0f0912058a718a38f26d0" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00764-of-01024.json.gz": { - "num_bytes": 395434042, - "checksum": "aa4384f587fd64c24fad9a27defb0345eb44cc536b3d45c710017d225c191ded" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00765-of-01024.json.gz": { - "num_bytes": 397204482, - "checksum": "cf419554f6c4f6201ebe92e7a232013e5949910f3d54f5cf3d1d65845685c7ca" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00766-of-01024.json.gz": { - "num_bytes": 396420917, - "checksum": "32076dd8004ebe35f46d6e790fd6330ad1d7df2b7ae3c4ede325b0da73a673ad" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00767-of-01024.json.gz": { - "num_bytes": 396840905, - "checksum": "08e5fd0fc1578a337f3dafdb3c718ade437256119e1968e9f958a8ea9d052c81" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00768-of-01024.json.gz": { - "num_bytes": 398085225, - "checksum": "3579e0756bb6cbf1eddfca27de5cf067a212d683134bc6f8c26a79b7d802bfce" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00769-of-01024.json.gz": { - "num_bytes": 396879117, - "checksum": "0913c93203a084521212e473d08c1d11e8136a8e37f1891330fbce0397bd431b" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00770-of-01024.json.gz": { - "num_bytes": 396386647, - "checksum": "6c12ab51c92b9c92336a6142a1a4e2f7c3725beb7e61dcb004551d13e8d5488e" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00771-of-01024.json.gz": { - "num_bytes": 396279989, - "checksum": "752deaefbf22dd1b1adb36561e8524c1dc555fd105bf3acb78611be9bce72318" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00772-of-01024.json.gz": { - "num_bytes": 397850815, - "checksum": "4f1969284d1f448caf0bff5d05eeb995cf2339801f6a71e01286f4f7f387c564" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00773-of-01024.json.gz": { - "num_bytes": 399466666, - "checksum": "20ba552cd30349bc8a2c0b6a8701d4587a005e7ebdf6e3f2a3bf95462c304447" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00774-of-01024.json.gz": { - "num_bytes": 398051538, - "checksum": "1f66196e8fbf0ebef977f235d2aacb7245f4033b53ecf75ada2f8007465a629d" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00775-of-01024.json.gz": { - "num_bytes": 399284061, - "checksum": "97df92baa605c34ce857d380f1ca42f9e2a0de499ccaa9bab26a5c449451d1ef" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00776-of-01024.json.gz": { - "num_bytes": 396710162, - "checksum": "4b1ec54b82c8e5d969d3000ce547f4c20df16d9cc0b889b2b58c8839e9d8e27f" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00777-of-01024.json.gz": { - "num_bytes": 397265441, - "checksum": "03827ccc3c5bebbd12a04019e9797945c55becabf7f9c1f3fe5353513f5c5a38" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00778-of-01024.json.gz": { - "num_bytes": 396050013, - "checksum": "54aeadf4fe16949b2ee9438feabe979570e7587bb07b3c57e47422f662191936" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00779-of-01024.json.gz": { - "num_bytes": 397124991, - "checksum": "913e268b5474a8b4cf1426f5a0a06c7f437eeabbc35f0126481328b419f85bf6" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00780-of-01024.json.gz": { - "num_bytes": 395196367, - "checksum": "4c1a4f296916c30103a5dacacf8a167e43bb424d085ed3491b19f0ec1985d9f9" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00781-of-01024.json.gz": { - "num_bytes": 396578403, - "checksum": "a54f26c233662299ec8f0ae1bd266879e93cf4676707b0955114a1a80e2fcf61" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00782-of-01024.json.gz": { - "num_bytes": 396142106, - "checksum": "3713c6b725afd833063402e6577bc0ed003a87720f700f9272864c2360bfd260" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00783-of-01024.json.gz": { - "num_bytes": 396470511, - "checksum": "fe9d904a07ffb2581b6734c8dd847435b867d3043ce4b4840b1c54374919d757" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00784-of-01024.json.gz": { - "num_bytes": 398156228, - "checksum": "af762a9ff3eeb7ed4a56f54702911f0c190b97f8efaa02cb89b1626a1c44c9f4" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00785-of-01024.json.gz": { - "num_bytes": 397185035, - "checksum": "6629e1827aab88f55d53de24625f8362daccf910663db8584d959aa44f8043a8" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00786-of-01024.json.gz": { - "num_bytes": 396556703, - "checksum": "ce51603900ea0aad8981fbfa8d05d684bfef5360413dadc6933246c2dc81c413" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00787-of-01024.json.gz": { - "num_bytes": 396214799, - "checksum": "6eed5802b89d63eea115cbfd9e00f6d1b4970bb3600a887b904b548181a4acef" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00788-of-01024.json.gz": { - "num_bytes": 397965162, - "checksum": "eaa948fdaa744576f006bd70d54f129968772a479fb0bd8e946d7605857545d2" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00789-of-01024.json.gz": { - "num_bytes": 396280999, - "checksum": "e0b80ec73507f96310abf070e5cd17d5a67ffb4a337820a8b79a02afe81a0b99" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00790-of-01024.json.gz": { - "num_bytes": 396224660, - "checksum": "2b4a06fb6f68c773da34f8d4c33d7746b6a3206bb242042841e5e007fe3cb6ea" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00791-of-01024.json.gz": { - "num_bytes": 397681975, - "checksum": "1b167c20d0414d970cda74cd357cf07d69abd1d3fb0f57222028b369551d513b" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00792-of-01024.json.gz": { - "num_bytes": 396210611, - "checksum": "ab55128753a1e58d1032b8fd747c48158a721b12e85990627478f22b78e156ff" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00793-of-01024.json.gz": { - "num_bytes": 397534599, - "checksum": "e7476bde08e0065c523d09932cf2cf6ffe8ba023ae0ee435238efb5dd6f93d7c" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00794-of-01024.json.gz": { - "num_bytes": 396536137, - "checksum": "6228922504b2d3ebeef4735abdff06cc786d6533a6c150d50f34042aeeae1544" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00795-of-01024.json.gz": { - "num_bytes": 395235406, - "checksum": "9dae151c15898d7991417596a364e30f00e0ff6280f1505953e6de40c2e228e2" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00796-of-01024.json.gz": { - "num_bytes": 396226178, - "checksum": "1dc8decde490324087fcd06e4b1e17117606f2d61a80d506d89a12cce11ba291" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00797-of-01024.json.gz": { - "num_bytes": 398556774, - "checksum": "a454758e8cffccc88f83517a241f2457e683647949cde6aaf1e217de42f6a52b" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00798-of-01024.json.gz": { - "num_bytes": 396109677, - "checksum": "3daa6b8602517b9873db96522a2852d940d52cdf0fa86f259ac41a9cd688751f" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00799-of-01024.json.gz": { - "num_bytes": 397930210, - "checksum": "09dec669699a437d6fb78b3f2705028fb380b2eaa20ee73b77270216a48b8a95" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00800-of-01024.json.gz": { - "num_bytes": 394545441, - "checksum": "726f99301047519de253e3edbaef5f4a4f95e3850b1b98e01c7864499dad7833" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00801-of-01024.json.gz": { - "num_bytes": 395867151, - "checksum": "a97ef657bd8ea718427ffc686f55fc1786f0834755fce3ea3ae8402d9f75c11b" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00802-of-01024.json.gz": { - "num_bytes": 398573429, - "checksum": "20ee1f30272a0d5db74e8589be12c17173580cc9f14b039b3d33f3197816ef95" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00803-of-01024.json.gz": { - "num_bytes": 398084513, - "checksum": "31d1a8f6965d3a8cb7e28fa8bf2cb9a5609d4a129dbc630a8e2a939f475b2003" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00804-of-01024.json.gz": { - "num_bytes": 397815811, - "checksum": "edb758146d462848bdb113df90fa4b9f451eca6658cbd2cab147c8b0eaf88a70" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00805-of-01024.json.gz": { - "num_bytes": 398641802, - "checksum": "b916bafa7269ad4ed09c58c74dc3f098b529444609dafc57e6e4056aa6496ee9" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00806-of-01024.json.gz": { - "num_bytes": 397993720, - "checksum": "92fcc5881ca81b808c14f8c9960d873be70f857f95fd1e777b1ae1d4c62bbbaa" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00807-of-01024.json.gz": { - "num_bytes": 397743279, - "checksum": "79aca62194176964b66a90dda7631d01acc2a6abea1ba19a90076139e390170a" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00808-of-01024.json.gz": { - "num_bytes": 397076817, - "checksum": "a469391e432dac6967e841d46eaeabe9429849492a3df5e91431777fe9b9f164" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00809-of-01024.json.gz": { - "num_bytes": 395533122, - "checksum": "1278d928e105ea7d9c397ef1da79dcc8791dfad9177727aba098bd451734ce45" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00810-of-01024.json.gz": { - "num_bytes": 397468683, - "checksum": "5c6f3e7550827de9d7028decd82320a55722785394ea4951ee78f3ffadb2d4e0" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00811-of-01024.json.gz": { - "num_bytes": 397348260, - "checksum": "8c1ece72814dd82bf1bb663b76a40c58129c08540195f9b2134eff5837faa366" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00812-of-01024.json.gz": { - "num_bytes": 396753479, - "checksum": "b3770924d0576f7cd1706771c411f0f288277c6c6c922dc7af4017b665109a88" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00813-of-01024.json.gz": { - "num_bytes": 397977743, - "checksum": "864040da6f03f4d2ed2a9eae4daedf304e0d27196f0b522cee4e8fee55f9ea71" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00814-of-01024.json.gz": { - "num_bytes": 396168620, - "checksum": "542986bb3b75ffcfc853af11a80edb6a31e12527d2588f1c5b2119fe35d3f150" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00815-of-01024.json.gz": { - "num_bytes": 397639162, - "checksum": "a617c2f27306ce5de74ab756cbf74707fddeb0aa92277b66d0cd65be230f386a" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00816-of-01024.json.gz": { - "num_bytes": 398296204, - "checksum": "174a2e77e6562384cc4e7459ebf536db5cf4b530e4f1d7714e60d082ac7a19c6" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00817-of-01024.json.gz": { - "num_bytes": 396112543, - "checksum": "95af2c4f32efb4ed2a41cfa38dd2be09d51d4b0dc53ca8763309503f0276d56b" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00818-of-01024.json.gz": { - "num_bytes": 398371592, - "checksum": "67789e3525f2daf6af2551df12a50341c3ef51c89a9c714a8def76209b5b7460" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00819-of-01024.json.gz": { - "num_bytes": 396751420, - "checksum": "07431a263e2bb92c048fadbab74ce1399f76fc57a04d7f9e90cb33aa60a4c5e9" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00820-of-01024.json.gz": { - "num_bytes": 399213859, - "checksum": "83c03df95869973c2ed46c909c0e92e7ecd75317c06b09e447a62b592421d1c7" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00821-of-01024.json.gz": { - "num_bytes": 398408628, - "checksum": "b5cb8c52a8713c5291ccf29c171e9bd9b57a54211392a19e8f31182d1053a032" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00822-of-01024.json.gz": { - "num_bytes": 395429180, - "checksum": "8c47bf7a0d2b9c84d255df0e7da058fba2b4ca6da3c20cbdfe5a686e01cf5c45" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00823-of-01024.json.gz": { - "num_bytes": 395437149, - "checksum": "62818e45f34e70728494c74daa583e30c70aebf91c2f057470039f6d35059691" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00824-of-01024.json.gz": { - "num_bytes": 394503147, - "checksum": "e9fd88994b23531ba26e6859ec1985798a2ab9b300c2fdb1e202ac553ab305b0" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00825-of-01024.json.gz": { - "num_bytes": 398841091, - "checksum": "77ad5a9ac5e3c1d1180981bffbbdbf8a429854001d990258c615e0e16c8a9f6a" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00826-of-01024.json.gz": { - "num_bytes": 397404278, - "checksum": "06a39374c1cda19cc4b034c4877e1fd3bdc84290fdb621fdcdc77f3c5eea9a47" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00827-of-01024.json.gz": { - "num_bytes": 399316947, - "checksum": "fd27a73b130c1cf8256f22212e23799d0dd31281cd29bcf9bb658bcda457b66e" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00828-of-01024.json.gz": { - "num_bytes": 397514415, - "checksum": "3e7d199d05f885e8bba769d21a55a3f2ef2114b66ed738428ceb506fdf272ff2" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00829-of-01024.json.gz": { - "num_bytes": 397251538, - "checksum": "91650563e9520b2d1ec2cd726304b781b4156ffb68bc172635a53f425fa6bb0a" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00830-of-01024.json.gz": { - "num_bytes": 397653118, - "checksum": "893ef017cbf7d46c99d9c69ba74344cfc2800bb23faf93e7400c0c282422945f" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00831-of-01024.json.gz": { - "num_bytes": 397299276, - "checksum": "4eb3c91e52547f3b4af586f5bbdb0cdaf6a345b202a09c6aabff5c5f628b2948" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00832-of-01024.json.gz": { - "num_bytes": 396915924, - "checksum": "9fffd46fc1f1bce010484f2850102e2e153c5695c277efb67f65811630c2493d" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00833-of-01024.json.gz": { - "num_bytes": 397652261, - "checksum": "3b89df9375a906c96eb1e21a6572a07de2f5d875996c01c744933984edb1af1a" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00834-of-01024.json.gz": { - "num_bytes": 396070735, - "checksum": "b758b4cbfdfb799a8615ec9c3678b27dcd9b1d63af4f272879e0dae84cac9d63" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00835-of-01024.json.gz": { - "num_bytes": 398028152, - "checksum": "6e07f1e6a099aa496fef3015514fe5f3cc665c742f8a783389c7da4ce0e0e72d" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00836-of-01024.json.gz": { - "num_bytes": 395941604, - "checksum": "6bef1291a741ea5976749456185a3e3a03c3fcc9ac00370f28672ab39c552db8" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00837-of-01024.json.gz": { - "num_bytes": 398655070, - "checksum": "b0b7e1c826302417630c3e1b1877bf106beefb5a7a11feb9bbf1ac3712714fed" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00838-of-01024.json.gz": { - "num_bytes": 396374435, - "checksum": "3e9bdde8b73397a5fce143e91c92f9e66f46b45edfb30da1cac400b9aa7b2ecc" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00839-of-01024.json.gz": { - "num_bytes": 396388725, - "checksum": "4154322b97c600742660125e6458787e603cf1a44b49267f4d1c569387fd132e" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00840-of-01024.json.gz": { - "num_bytes": 397564603, - "checksum": "f9560028196fc934378389e355101e5e7f8fde9e5c921722704a18b24ebc5804" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00841-of-01024.json.gz": { - "num_bytes": 397001678, - "checksum": "0dad99ac959765280e6bf6d9d1a1468ef9dc9cc781e8f5bb832f7295e4e79f69" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00842-of-01024.json.gz": { - "num_bytes": 397139167, - "checksum": "e81fd683da081349629a0a7ae8ff7813351ed23caf4ef87041b64524034abc83" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00843-of-01024.json.gz": { - "num_bytes": 396044889, - "checksum": "d8e3a5b4148c7e86dea50ee5ba89ef55629d3550fd926c41754e5a26e7e52c36" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00844-of-01024.json.gz": { - "num_bytes": 397365441, - "checksum": "c4d2ffe853b55464961b707b6d0264d6852817077204a0380c906184c077012c" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00845-of-01024.json.gz": { - "num_bytes": 396477802, - "checksum": "7b3c4d435eca57a0fad05c106ec5928750aa01d95047618a3bc84e5342e912c4" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00846-of-01024.json.gz": { - "num_bytes": 395983616, - "checksum": "bdad2ba411291435ac0cdd083e46aa8369499f014a788fa85ed8c419fe9cb2de" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00847-of-01024.json.gz": { - "num_bytes": 397646062, - "checksum": "3f6bddcefcceaa4184161432e4f0b9292ae4fe7dac3079d4191a31a38f48c7bf" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00848-of-01024.json.gz": { - "num_bytes": 395958111, - "checksum": "5ed10d926e5fd1dcbc777df82391eb3ba57276c7303d488d6f3591022d20cc4a" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00849-of-01024.json.gz": { - "num_bytes": 396960036, - "checksum": "ab82adc6f66ab0403cbbb38859009a460e6c8c38c789bc2b2420da8b87096a9d" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00850-of-01024.json.gz": { - "num_bytes": 396603592, - "checksum": "5a6aa59a01504f5655d429dd5cb3ebc39e3994b22cbaeb5b09ceb29a26b94031" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00851-of-01024.json.gz": { - "num_bytes": 396511886, - "checksum": "f1954da7e217d893a0237a0f431dd2a9071723e543bf0f4943ce38fab048a44e" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00852-of-01024.json.gz": { - "num_bytes": 397626831, - "checksum": "f5cdcd7ec4f3c855a1006f9278ed4df50574a3fa7aa1c5a2e255ea5fa1a770cd" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00853-of-01024.json.gz": { - "num_bytes": 395811873, - "checksum": "24b1033da877ebddc09cfe2d3325868448dab9083b5147d6cfc4fa63ab402a94" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00854-of-01024.json.gz": { - "num_bytes": 396513614, - "checksum": "419952e0bc38cce474190c0b9ea581ccbce77da5e045dd60f5ff1fa1d2833d19" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00855-of-01024.json.gz": { - "num_bytes": 396493352, - "checksum": "3d2b529871c625fc9c1c59b9d5cede2a77e609041f1ea044d68ac16e9fa6a30c" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00856-of-01024.json.gz": { - "num_bytes": 396852729, - "checksum": "a3b56e6171fc2b14ebe67f6a71af688ea6135597bb8f8cf83e2fb460727aa5eb" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00857-of-01024.json.gz": { - "num_bytes": 396428653, - "checksum": "de550a5d608bffde45c149bc0d4c1165cbd3b5baab3d3529f006a02aba6d53e7" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00858-of-01024.json.gz": { - "num_bytes": 397039613, - "checksum": "11374c2685676ac2eb3dd0d281b44b512ff1d2968ab320d9c857b44304eb8ab8" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00859-of-01024.json.gz": { - "num_bytes": 396515194, - "checksum": "64879e565e5c467e630566ab75524bb300d58798c814637ffebd15646544cd5e" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00860-of-01024.json.gz": { - "num_bytes": 397764125, - "checksum": "7e22be61b3413c8fca2414087655b7ef7bef2ab5ee373fee74d13c8fb991675b" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00861-of-01024.json.gz": { - "num_bytes": 395314420, - "checksum": "29c451c69c8c05f6eee2741b9ef6c241f551257a45da8342a1d6bb341f80314a" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00862-of-01024.json.gz": { - "num_bytes": 397763845, - "checksum": "679668616899f548fb35da32c3e5f121002670cc3296c0c90f5bf45eb3ea1d79" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00863-of-01024.json.gz": { - "num_bytes": 397356206, - "checksum": "43c5b3af2173d4293396f336ec363aa2f31580b65128f44ca8bb891f2022859c" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00864-of-01024.json.gz": { - "num_bytes": 395463092, - "checksum": "77b7b6299955f4869e5db994fa6b20fe3007cf8cf2b6609442fb1ed49284cee6" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00865-of-01024.json.gz": { - "num_bytes": 396909291, - "checksum": "7eca0e82842b52f99640ab574e4b2446309aba6ac262f980fc6d249a337d06a4" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00866-of-01024.json.gz": { - "num_bytes": 397587651, - "checksum": "931014d99ab2a765ebf90e876694647c265ca5e6bf2b459eb027d6b06643a8ac" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00867-of-01024.json.gz": { - "num_bytes": 395992645, - "checksum": "0976a5389aed40e4bca89cf22382cf121390c75bd755437be474c097c8fee0ed" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00868-of-01024.json.gz": { - "num_bytes": 397789857, - "checksum": "6ffd848d165290a746a21767e79a9f046b70534aaf7b14fc01f9365e4e3f7d93" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00869-of-01024.json.gz": { - "num_bytes": 398124116, - "checksum": "5fb85058bdf40c0ee6cf748cda7483b1b3cfad18c26a90c2150c2a3f30ceeeca" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00870-of-01024.json.gz": { - "num_bytes": 396432487, - "checksum": "89d50aaa3620eac4ad593a403ea637b2ff090361ead05c3aa8c7a3351c66ad65" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00871-of-01024.json.gz": { - "num_bytes": 397484772, - "checksum": "490f4104981a9ab3ef04600a4865b9a2a18239e335d7fb7fff79ec1b7a225318" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00872-of-01024.json.gz": { - "num_bytes": 397240896, - "checksum": "d344994866bc49475f66e9937636afa787e1ff560e3f62dc1a0e4d0220d6ed39" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00873-of-01024.json.gz": { - "num_bytes": 395450398, - "checksum": "5d3b320aab1f7f09450531649666ded1aba8a9bbcf0f47992c43cb40a6d7a929" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00874-of-01024.json.gz": { - "num_bytes": 396365056, - "checksum": "346aae20204537ba2f4a865ca80b5d1c6da1e3a3b78d306d7570a69f185cc4fb" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00875-of-01024.json.gz": { - "num_bytes": 396679348, - "checksum": "ba81f9c1650d30853edbb9886dde84658c254dee5a3ac1062484f7194cd413f6" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00876-of-01024.json.gz": { - "num_bytes": 398278881, - "checksum": "88fb38aad7cadd76c818dbe7a372144dfe17d110f7d2123a80d14686fb43a6dd" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00877-of-01024.json.gz": { - "num_bytes": 397051868, - "checksum": "049e4a62056c98284b35d10a74ad5ef7014265a6dccb99a71f93a409933a685f" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00878-of-01024.json.gz": { - "num_bytes": 396132123, - "checksum": "bb7b97a82bd6d31612de66a03af35d404b15808b925e7fd94bd0a8e9e928b927" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00879-of-01024.json.gz": { - "num_bytes": 396520374, - "checksum": "2a56fed53aa022e6a7956f604d54d99af89a15b6c7fc6b037f94d347f1d15f51" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00880-of-01024.json.gz": { - "num_bytes": 397004524, - "checksum": "1cadef434909d4508a9a6bf40d6a9323256f3089615a5d2963c83040d5f549f8" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00881-of-01024.json.gz": { - "num_bytes": 397336334, - "checksum": "0e36dcd0eb1773eec15ffd0fbbe8951343bb6961dd1838b51e74da2e055db176" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00882-of-01024.json.gz": { - "num_bytes": 394949798, - "checksum": "78c99406cb921c2b8f5b86e4e7eeed24c799678732e5a5450db6b12b7ceeef61" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00883-of-01024.json.gz": { - "num_bytes": 398647721, - "checksum": "f0e7a0a9970c7fdb5f629771e76bb06bf62b79e9cbf5008e866f954dd436401b" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00884-of-01024.json.gz": { - "num_bytes": 396040500, - "checksum": "05272a55eb2840f94a7dcc30a8d09b957511b983b0fc3fa618a8995bc594d055" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00885-of-01024.json.gz": { - "num_bytes": 396460591, - "checksum": "27511aa50410260d261866dc970b897b10a95dd4dfd92b0bc3a5fc41e6c75335" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00886-of-01024.json.gz": { - "num_bytes": 396149133, - "checksum": "e66ba9c7ceca631a4b43ecff1e151524a209368f298ca83624476ee9144cc3cd" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00887-of-01024.json.gz": { - "num_bytes": 397164216, - "checksum": "95e341054bd8a21e7f49e4a5aaa5fbe51517ff631e66e67ff1cdaea6e3178002" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00888-of-01024.json.gz": { - "num_bytes": 398216402, - "checksum": "6fef57de31fa1692d8a4021b317554688657fad3f55dc144e2971d63083e7879" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00889-of-01024.json.gz": { - "num_bytes": 396976936, - "checksum": "36da1bd0eaa27ca6e8510a3c005695fbbd7b0fedf63f077e3787590d4b1af625" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00890-of-01024.json.gz": { - "num_bytes": 396903125, - "checksum": "6bbbe5db2c0938efe5f8afe7b30765f45cedc9fd4209bb7826c489381175bc5e" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00891-of-01024.json.gz": { - "num_bytes": 396404354, - "checksum": "47601b1b1a0a725c32ae0c32364f7ac188b7e8c68d29a2dffbe1a4dbe39393f4" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00892-of-01024.json.gz": { - "num_bytes": 398144052, - "checksum": "a7b6bdafa5a226c22ccdf97c873e4915ed8dd8b59e2820a4dc62f600b4710175" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00893-of-01024.json.gz": { - "num_bytes": 397990484, - "checksum": "12f08cfa1fb4f94a3d7d9584cc3f5ae9fa518cc095e4cb07939d02ecfb7ffd9b" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00894-of-01024.json.gz": { - "num_bytes": 398271782, - "checksum": "004bf46ac7c8d7770b458ec341322f5cef643926aff9255954f08faa1dd43d53" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00895-of-01024.json.gz": { - "num_bytes": 395489909, - "checksum": "3ea14b3dbd7a4c9cb7aad83d1311d335714aaea5b2dd0374debd63c56d02dcbb" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00896-of-01024.json.gz": { - "num_bytes": 397589097, - "checksum": "c0f1c7e54bf7a808f66d2acc9aec79f1ce936ba480f5d1e379c6853714413175" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00897-of-01024.json.gz": { - "num_bytes": 399215096, - "checksum": "20958123acf2d578448a5166f1209b0452db33ed395cfe512015106bf99ad31d" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00898-of-01024.json.gz": { - "num_bytes": 397044516, - "checksum": "46c5145069d861c04b2ac1afe80c4c4453f91869f6cb6a1d9f7b648f1b08942e" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00899-of-01024.json.gz": { - "num_bytes": 397687759, - "checksum": "2a3923d8ff2ce0eab5978a8e0198bc2d1512cfa19c69e673e048b8eaa72f82b6" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00900-of-01024.json.gz": { - "num_bytes": 395192267, - "checksum": "9cc72deeea7fbc0fa3782c41938d66315923dd9f53d89f47c00f85f93e454ce5" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00901-of-01024.json.gz": { - "num_bytes": 397806320, - "checksum": "8cfff74f280636416f523c271f75e5704a570db4cddb8a70d033158868c21347" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00902-of-01024.json.gz": { - "num_bytes": 398450537, - "checksum": "7df8804eb5ecb79177001f9ce3c66f0ad20cccd8151e817816e9342d07c392be" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00903-of-01024.json.gz": { - "num_bytes": 396733151, - "checksum": "89551a52d1e97b4ec3007f8c43191c1ae1475d0ba5b48d20818a12c85b0add74" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00904-of-01024.json.gz": { - "num_bytes": 397497719, - "checksum": "2bcde59dfaa642722969d1401a4ce43a35c57930bb1d664371efece1e2e91c32" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00905-of-01024.json.gz": { - "num_bytes": 395760696, - "checksum": "ec844272b0666a455dfe0cab065e00df44e8da2156a03797100418307c96830c" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00906-of-01024.json.gz": { - "num_bytes": 398496346, - "checksum": "ff68909d470edef08929a91068e1de02841c16a000fbbd17ef042cb76f1fff37" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00907-of-01024.json.gz": { - "num_bytes": 397085405, - "checksum": "a9b26676af61a6a1355225bce5bbcd67aeaf0fb7dc2209f30235b275536baa85" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00908-of-01024.json.gz": { - "num_bytes": 397037103, - "checksum": "e86688677a46103b0b224333faf1b4f89da062e4ec0ee35752c91ff9772697c7" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00909-of-01024.json.gz": { - "num_bytes": 397394775, - "checksum": "93082177607900bfce7fc53f1665a831093bb50caea33e014f327181579c0012" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00910-of-01024.json.gz": { - "num_bytes": 396668466, - "checksum": "dcfe639607c18a309e2c91864a6912dce3851abd62bbed3ba16390899e637327" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00911-of-01024.json.gz": { - "num_bytes": 397926997, - "checksum": "aa995c38d953237b1d6d53be7237958a00ca2dbab4a753c7c4404849fb416d5d" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00912-of-01024.json.gz": { - "num_bytes": 397810240, - "checksum": "e3f17ac285e8c9b04713713a957602a63e176f476d4a67018012e9cf2a3e5a84" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00913-of-01024.json.gz": { - "num_bytes": 397143597, - "checksum": "4082ab833be47cf881693ea4442e3940625e0d2c1117e15234886fdfa779bce3" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00914-of-01024.json.gz": { - "num_bytes": 396398347, - "checksum": "7c62dfd17b21ff64af640e4aca8fea0240998596d11ca551a3ab045d5041fcac" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00915-of-01024.json.gz": { - "num_bytes": 398622100, - "checksum": "69abe67cda4b1613d5f741804ccdb294cd5f457027818d9366db8cf2f5f40871" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00916-of-01024.json.gz": { - "num_bytes": 397387266, - "checksum": "6effa83cbf3345fd7e41e432ef82156bb1334f2cf17589bce313aebee9727131" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00917-of-01024.json.gz": { - "num_bytes": 399730979, - "checksum": "f0d0ff1ae76a84c07647fa1517410533862f1927fa85dbf38017dabf4607bc1f" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00918-of-01024.json.gz": { - "num_bytes": 396895902, - "checksum": "84cc56e725be31047d0b6a025cfacefc462f4a1a546feaa34af95a6f25a4e1a7" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00919-of-01024.json.gz": { - "num_bytes": 395247578, - "checksum": "daa3156989ddaa9a7eba228848697ccf6a385679359ab765881d2293bef107aa" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00920-of-01024.json.gz": { - "num_bytes": 398305242, - "checksum": "2a9e02ef643962f6009e42304b983c87bae7b74c1edcbf8e6808b320ea7ea776" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00921-of-01024.json.gz": { - "num_bytes": 396446011, - "checksum": "f83526ad11d81820fce4231e3303d613dbbe56a8fae878d9442c8d7e98023437" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00922-of-01024.json.gz": { - "num_bytes": 398010331, - "checksum": "e47cb9d7550644ef807c3ea9e19ca4aa1df54eb908b54651bf0e17f0ded9157d" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00923-of-01024.json.gz": { - "num_bytes": 399160018, - "checksum": "470401e5b0777096806113a36dcb92b8d453d6e8f5f4f0b15df2788e382ca03f" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00924-of-01024.json.gz": { - "num_bytes": 396880756, - "checksum": "c86e546c68bf8458951fa723c086d6efa5b210f53cd4fcb2de4b9efc7a71a275" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00925-of-01024.json.gz": { - "num_bytes": 396806561, - "checksum": "5d9b1105c0053dc9530c911046f4da458f41d92c771282d0df8a3a22838feaec" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00926-of-01024.json.gz": { - "num_bytes": 397479994, - "checksum": "c3253305ac4ef226501e4fd4a6acfc6067a76c084ad852eb2a9f5916aa3d51a2" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00927-of-01024.json.gz": { - "num_bytes": 397083225, - "checksum": "8931df0ee597f72ea3592d0a4d236ce655a92cf4e7eb9298145f496246c18c21" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00928-of-01024.json.gz": { - "num_bytes": 398000839, - "checksum": "5e29e75231bdb413dedd1211bd87e9fc3f4ab8bba41999afc1ddcddc16f4599a" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00929-of-01024.json.gz": { - "num_bytes": 397731309, - "checksum": "03f7a9199b7927a6d78a8aa4eed32c250d32dc409e3bb2847d7db948ee63d46c" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00930-of-01024.json.gz": { - "num_bytes": 398133003, - "checksum": "b22a79dc228697394d0ce25b7d31112f9e1a6508cdc4b57af35e84e65167bfeb" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00931-of-01024.json.gz": { - "num_bytes": 396694508, - "checksum": "dbbc65db3d442f9ace85498a3b27bb598c20cea171b3de17d409f9b989c262d5" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00932-of-01024.json.gz": { - "num_bytes": 396255463, - "checksum": "02af4162b084004e99dc6862c88749545593e342a83523597cada140e57a0ab7" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00933-of-01024.json.gz": { - "num_bytes": 399013035, - "checksum": "dc4d3b4f03c36a8f1393ba15195c3f64b128862b812839689fa387e708ffabaa" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00934-of-01024.json.gz": { - "num_bytes": 396593138, - "checksum": "02a5a8e02b2636c9e912a9ef8a79ececde4f4fc92bea74e59791d181bec104cd" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00935-of-01024.json.gz": { - "num_bytes": 396748502, - "checksum": "05d1d6290580d5c74b906ab03fe6773ecaaa1ff3be84dfdef48d1a2e7f5e1120" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00936-of-01024.json.gz": { - "num_bytes": 397737673, - "checksum": "351d3543b1457da9719061948a1b4bdd79be8a0b786ecd6a9a8cc0db49cd2181" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00937-of-01024.json.gz": { - "num_bytes": 395377872, - "checksum": "d431b01bddcf911d7da5bad74a78d0d1527d60d9720f77868ef08e1a65850986" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00938-of-01024.json.gz": { - "num_bytes": 397193715, - "checksum": "bff5e755b174e3608ba72b39898a2bb5e9ca6d3362b70bd66143566aeff52690" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00939-of-01024.json.gz": { - "num_bytes": 398044482, - "checksum": "03facf22c376f03a8078e99d1dcc1c22ed5d7e179de472019cae894f40c7a4ad" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00940-of-01024.json.gz": { - "num_bytes": 398894204, - "checksum": "3d3a2125262ee8ca498cd54db52fe626d010a2a93c000ea2b45f931e491ea9e5" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00941-of-01024.json.gz": { - "num_bytes": 396758197, - "checksum": "b3957de08e7779d8ec23af02a6d709189796314c70a99f46c90d0bfbd14ad561" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00942-of-01024.json.gz": { - "num_bytes": 398181993, - "checksum": "74aec8dec794c79683dfe43d8aece4c1c47c5389aa6d4bea847ac461cb5ba21f" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00943-of-01024.json.gz": { - "num_bytes": 396271547, - "checksum": "231f63d05f81d249f618768c9f712cc31314dacf55a6004902a0e7d0bfb13724" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00944-of-01024.json.gz": { - "num_bytes": 396603419, - "checksum": "d5661730f3ed6cc5bbc5d935a6f1ac7d241b40c52dc83775a421e7a1a672f518" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00945-of-01024.json.gz": { - "num_bytes": 396596660, - "checksum": "3b5aeb0786dddf0b9cabe2ca071283b276822e2861d8688e38f927595c159b02" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00946-of-01024.json.gz": { - "num_bytes": 399900563, - "checksum": "6d5549970af2c6987583477991552e1944b411642782c07d17eb52f91e714a1b" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00947-of-01024.json.gz": { - "num_bytes": 395391489, - "checksum": "f5544ecb42c385cd5d5120c82140e4a36051f6a401d89ce30c8f2fc08cd69804" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00948-of-01024.json.gz": { - "num_bytes": 399257562, - "checksum": "1448cca7f1b9824adcf8437a33d14a7e95b705396611f82e7aba9a69e0a25118" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00949-of-01024.json.gz": { - "num_bytes": 396371965, - "checksum": "a7eb228f1d1ff2744af3d1a1358a94611cd92c25d81edac0e209b9f81c8a0a60" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00950-of-01024.json.gz": { - "num_bytes": 398022110, - "checksum": "8651693d2180e518039da487f638c532c53f6d79a33356922b2d8706aa6a83cc" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00951-of-01024.json.gz": { - "num_bytes": 396224338, - "checksum": "c46bc8aa1621153fbd913b5d0b23a82352a28b36ec997c4df4b92dcc6ef26895" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00952-of-01024.json.gz": { - "num_bytes": 397581207, - "checksum": "02775930e3c420978a9d2785ee0137c3963dba7bc34538b2155eb38dd6ee89a0" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00953-of-01024.json.gz": { - "num_bytes": 397045599, - "checksum": "9d54940cb594de6e0f8593f64293e96375f0a5c56f3569c72720476bcef1f1a5" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00954-of-01024.json.gz": { - "num_bytes": 395457873, - "checksum": "3c12a1c3061164f345d9e402bed28be9af84ef56d5df1b22a3cf9f818ed47ae8" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00955-of-01024.json.gz": { - "num_bytes": 396450938, - "checksum": "45db78bea4fae6cd69d900c581fccda873d2aa9f24ac5e9dfc18b486c15c3788" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00956-of-01024.json.gz": { - "num_bytes": 397120474, - "checksum": "7db7ea23446bd8a66737546c5daa0c2dec7bd5c4743f52eb53685ccbf54d9b17" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00957-of-01024.json.gz": { - "num_bytes": 397403279, - "checksum": "89de2950bc3f7dd4f95d8a0b7cba19e9678bfbc23175bc22d9f9599ec1ad9cd0" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00958-of-01024.json.gz": { - "num_bytes": 396861933, - "checksum": "f325478647cbec9d79bff2266672144147276a82f665d3014c5d2fa9c112c387" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00959-of-01024.json.gz": { - "num_bytes": 398439950, - "checksum": "70d786bb337c012269caf6aeea3bf9604d279d3e4335294c72ca6cb5a9fbd951" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00960-of-01024.json.gz": { - "num_bytes": 395684257, - "checksum": "e1d170b0a4d6954a920ef3923688a7dbf40398609ed2ae04b2635df9ceb07821" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00961-of-01024.json.gz": { - "num_bytes": 397526287, - "checksum": "47b90e3747f35bf67c872d65d843f6dd9bfca15dcb769b31bf3586c6645858bd" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00962-of-01024.json.gz": { - "num_bytes": 397473683, - "checksum": "d0ddb2c104f515144265bd3eed526a65ada46f848183688b420694751b113272" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00963-of-01024.json.gz": { - "num_bytes": 397964876, - "checksum": "74725b631c1699b1166589eaebb66374c031b170eab3ab359230cd4a23a8ae79" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00964-of-01024.json.gz": { - "num_bytes": 396523661, - "checksum": "fa0d49a2cc726628d9a1b5ae2ace52ee90401af8ae15add27c3f4566dd99a79b" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00965-of-01024.json.gz": { - "num_bytes": 399289514, - "checksum": "11fb1878a8b204181f7f776a764f5e9e577d0fe62d4b2e4ce2164ce9fcc30b8f" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00966-of-01024.json.gz": { - "num_bytes": 397411408, - "checksum": "5646014ca3c99f53bd13183187b1e6e8f84cb6c846d6f1f3a3c82edb4accc47e" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00967-of-01024.json.gz": { - "num_bytes": 395095282, - "checksum": "b799b17f36d85235eaf1bed9f4f760a22b75fca736744218e44fae5917a2286c" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00968-of-01024.json.gz": { - "num_bytes": 397189410, - "checksum": "8d9748f5a92a9e0b836fe74b962bd2da04b62a0a2943ea5e440cef19166a5479" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00969-of-01024.json.gz": { - "num_bytes": 395651742, - "checksum": "f42c71219641fa302692698b4944864f27b7f87d4477a86babe23745dad72715" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00970-of-01024.json.gz": { - "num_bytes": 396180197, - "checksum": "383d9586f27579b4a97c5901013b3e025f10dc813047d65158d6621430803aec" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00971-of-01024.json.gz": { - "num_bytes": 396574555, - "checksum": "d2c9700fbac454d3b3a42b2a3c4eb0111eb7cca7cab3d545b0912aba60415c91" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00972-of-01024.json.gz": { - "num_bytes": 399639122, - "checksum": "5d59e643bf20156a28e5e9dfcd811c5a6c3779e1875f375db09a0fa1871dcc90" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00973-of-01024.json.gz": { - "num_bytes": 395456709, - "checksum": "8b22e82588e30f30f664895b9716cbb0cf38d5ff4331d3be31ab25663c634a00" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00974-of-01024.json.gz": { - "num_bytes": 396693438, - "checksum": "5fba4f9d634d968f15d5d4fb29d253646494e3e125aaf1c2f8fab38a7e60180b" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00975-of-01024.json.gz": { - "num_bytes": 395697641, - "checksum": "b4c5fceb9fa2397a9b7c75249bd3386b8dbf999d5b52521051a86e067d698448" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00976-of-01024.json.gz": { - "num_bytes": 397172005, - "checksum": "093aa01a944a222828656d31dacd8ecd57a24a51d361a8742514bb6af009dce9" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00977-of-01024.json.gz": { - "num_bytes": 396182407, - "checksum": "1beef6e248c00abee5f8952641b12d3f5b12d58adc05c8d461c0a073a6ca9b39" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00978-of-01024.json.gz": { - "num_bytes": 396180428, - "checksum": "0f2bb125af300de2c9fe347899673a4bd2842ba8298146bfe94c9eddc41893cf" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00979-of-01024.json.gz": { - "num_bytes": 396479117, - "checksum": "1fe9d0e54b9be79722e6483e386801263ca51d6e9ad925dabbb58a38c4df877e" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00980-of-01024.json.gz": { - "num_bytes": 395119279, - "checksum": "0f262ff2d4701497f6fd6d4f9d3cb1aa3a730ad6bef1961d890a3b0cb4747ee8" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00981-of-01024.json.gz": { - "num_bytes": 398285798, - "checksum": "a295b85e63c176cecd9f5222ba417eeda307e41847eb38c61dec9b83101a8256" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00982-of-01024.json.gz": { - "num_bytes": 397811687, - "checksum": "2a3a0e0f454dd72a68ed1dd71c508a9b24fb2349ffdfc588cbfcef728cbaff05" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00983-of-01024.json.gz": { - "num_bytes": 397069906, - "checksum": "5b4256392755c4dd79cd37cd6ede645a9a549c4436acd27495e974ebe1d80bc7" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00984-of-01024.json.gz": { - "num_bytes": 397670152, - "checksum": "68d4f5dbb3fa349a6811edce8056eb297e771cb9c9939c3a84d30c6ba3ad9dc2" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00985-of-01024.json.gz": { - "num_bytes": 397949975, - "checksum": "6ba478b8a1ebf3b1dd67ed7b4a055cc9cc3c01bc90c1852aea8f5a99f6c07e69" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00986-of-01024.json.gz": { - "num_bytes": 397730984, - "checksum": "a39a23589cc434e573613e3ead44f33adb005c2c13cea8b33601647c97300fce" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00987-of-01024.json.gz": { - "num_bytes": 399173506, - "checksum": "eab46d9d0a0cf05dc5ba475017d98f02f1cfd756c8e707d9823a0463713ebf23" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00988-of-01024.json.gz": { - "num_bytes": 398674037, - "checksum": "88749d380aac85314df66448542b696e9ae6f61f1b27dc395556737f59ad9024" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00989-of-01024.json.gz": { - "num_bytes": 395313344, - "checksum": "bc565b662396e3ab4e108635e01873014515663bd5216926a59ae80f6cd4273b" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00990-of-01024.json.gz": { - "num_bytes": 398567254, - "checksum": "e9b9bd97a30ccac353a2386babbd01c3a3bbede8c07bc28d17aecc7ef5af6330" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00991-of-01024.json.gz": { - "num_bytes": 396958611, - "checksum": "505ab5458d5e52d656048284fd22cc0fcd16e49ba19331669239be37645cb04e" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00992-of-01024.json.gz": { - "num_bytes": 396102263, - "checksum": "59ac5b2b04f224be04a4ceac6a16e29a33681f19cd40cbce3d3e8eb961b9f33f" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00993-of-01024.json.gz": { - "num_bytes": 396935362, - "checksum": "c804f2311de9f7ae5691280e16261b9f8385ef9a71929b2111dfade532b6bdd7" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00994-of-01024.json.gz": { - "num_bytes": 398832432, - "checksum": "594727bdc3756e678bd4d156216712ed6c8fc98d3f8e9594cfbed10b2e414554" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00995-of-01024.json.gz": { - "num_bytes": 396699737, - "checksum": "bb3c73c6d48aebf9c60cde56944faa5bb6727db4cc48ae23d67650742462c42d" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00996-of-01024.json.gz": { - "num_bytes": 398059244, - "checksum": "ac1a7e6e2c2a5468c704f5a2318b5617dd4ce140b98271e2034e00015db6cd76" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00997-of-01024.json.gz": { - "num_bytes": 397439167, - "checksum": "ce9664b29c86c05d3541aee377acdca7a32ef8f0220e0b4b6bf18276b692529f" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00998-of-01024.json.gz": { - "num_bytes": 397383159, - "checksum": "1b4db1b59255f106dd2af7510112eef6d6b611d9f9e000a0e585b623fdb8ae98" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00999-of-01024.json.gz": { - "num_bytes": 396339114, - "checksum": "ee5e1508704b03f0a9cb3c4bfb578c08fb83a4d20760e3b40f101c58cbbb3ec7" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.01000-of-01024.json.gz": { - "num_bytes": 395172166, - "checksum": "f8cbf0bd9c2b90e588942048848fbfa1a20cf775364cb9c84b4d5dd7cf19e603" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.01001-of-01024.json.gz": { - "num_bytes": 396629363, - "checksum": "7cad3f9a28e5988ef91073c48e9d85ea7030289690f817545cfa9f1165dd33d9" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.01002-of-01024.json.gz": { - "num_bytes": 396507390, - "checksum": "b4ae1017913509855d6d8d4413ff3de4a8d519d91f354b6e5b5267219d20658b" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.01003-of-01024.json.gz": { - "num_bytes": 397652598, - "checksum": "0c115446c159d27e6e1354173ebec29e6dff5f38c4d2ddb46c07c450523309c9" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.01004-of-01024.json.gz": { - "num_bytes": 397408971, - "checksum": "f0b559a832a9ee50225fe1417d936d6b898026d80a105b976deaeae75f9e30a0" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.01005-of-01024.json.gz": { - "num_bytes": 397753911, - "checksum": "e001c9285ade7de6ac23716b596ddcc733f05bd6abd7e1a67874894c93fbd43a" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.01006-of-01024.json.gz": { - "num_bytes": 397962701, - "checksum": "acf13433824104e4bfc3a8aaf8805eb16712cd97b2dc1d48e7d771bee4bd41c0" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.01007-of-01024.json.gz": { - "num_bytes": 395966285, - "checksum": "4c6069f6a95d036fd3e05a4246db932ad5ab89b9470274f23a17df0b77b9b717" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.01008-of-01024.json.gz": { - "num_bytes": 397075505, - "checksum": "9b3b9c0cd4ee02e18a5d22142183874586da8fd23b4f97033e354f9681d150a2" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.01009-of-01024.json.gz": { - "num_bytes": 396881470, - "checksum": "14d2d7cf2ebf3b2c73bad4a6099fa1d2b1cb341b100976b03232fb664a7d020e" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.01010-of-01024.json.gz": { - "num_bytes": 397471393, - "checksum": "01e6f56bebe0c874d82135f551a6b917759c41af48d127df181267dc9b8f6486" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.01011-of-01024.json.gz": { - "num_bytes": 398092801, - "checksum": "ead5b6b13bd09136fccd9548c224398401bda0ca7ff62ca4db852760760f13d3" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.01012-of-01024.json.gz": { - "num_bytes": 397831436, - "checksum": "daa2d1507f9b56de0c4aa9d86d93259c1e6f73f0cdfd553ce075a16807dbcb56" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.01013-of-01024.json.gz": { - "num_bytes": 395098326, - "checksum": "c2b21a1a56e9879335c72008919e8f7998dcc1e8df2258fdf2196ea86194e3cc" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.01014-of-01024.json.gz": { - "num_bytes": 396164077, - "checksum": "0df125946c83c66c6961eae2aa45ad7eea7038d808281d633ce30686a8245e01" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.01015-of-01024.json.gz": { - "num_bytes": 397895284, - "checksum": "f6f6eee8fc113b7e717654b9305cc5129c3ee1ce9f263b91f0202762f078a526" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.01016-of-01024.json.gz": { - "num_bytes": 397723033, - "checksum": "48426df1f4665d3179251904c96a0e73c041ed5b57885b4dd852809e632685b6" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.01017-of-01024.json.gz": { - "num_bytes": 396761053, - "checksum": "f33cf2d744585e0338b29a5a5638752123b7b59f9ae3b723cf7e7b536f9f80ed" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.01018-of-01024.json.gz": { - "num_bytes": 396562520, - "checksum": "72adb0869cac573282c4bd938cdff556f659540dd4a0a6663711974cb2dc147a" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.01019-of-01024.json.gz": { - "num_bytes": 397564701, - "checksum": "3b64235effaf41ad61698b2c28f4d73ced1b6ec6b6d79e0f52314176fa0feb12" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.01020-of-01024.json.gz": { - "num_bytes": 396053080, - "checksum": "b16b9f815823d176f94388d4c482652ac656aa763ec738ccd8c8a2a3bdefc1e9" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.01021-of-01024.json.gz": { - "num_bytes": 394731398, - "checksum": "f4c0044abadd339055bf13843938eef4c066856757250fc15f77060fc0881ba6" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.01022-of-01024.json.gz": { - "num_bytes": 396548645, - "checksum": "5ecd8432526eda57065e6161f0618a19cd5993c7dfe86575775f1bf01836f750" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.01023-of-01024.json.gz": { - "num_bytes": 396863581, - "checksum": "c6cd29b8f6067152ccd584ded81df1f9cb905515d48815b8a546d104ec7a3565" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-validation.00000-of-00008.json.gz": { - "num_bytes": 50774357, - "checksum": "7cd6c8b1072af3f3ca3fa160d9411960908142743b101f7229223e6658acb42c" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-validation.00001-of-00008.json.gz": { - "num_bytes": 51252663, - "checksum": "d36ef5fc04b24117a19d992de06400e5f290f11786be99be9de68818f7495694" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-validation.00002-of-00008.json.gz": { - "num_bytes": 50860289, - "checksum": "ab8b3dee7c0698c3cc3a74f159d85495b6bb9529600ef9246bec218ae6775e28" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-validation.00003-of-00008.json.gz": { - "num_bytes": 50141661, - "checksum": "54d62c9359000b99713a8a0a0fdfa415f1c09824555526f01dc7217b068542ad" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-validation.00004-of-00008.json.gz": { - "num_bytes": 51141505, - "checksum": "c11e31de558613237533b41354ca29f0635b599a1c9232517dbf4c2cb1197319" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-validation.00005-of-00008.json.gz": { - "num_bytes": 50797157, - "checksum": "20d39c0f52c34a3148c0a235238ed3849576ed895c3a43cb47b0159bf233c7d5" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-validation.00006-of-00008.json.gz": { - "num_bytes": 50158887, - "checksum": "754a2b7f134bf45f17db7450d5c0eaf2b8824e4a6072be7b20db434f9cb7968f" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-validation.00007-of-00008.json.gz": { - "num_bytes": 50232244, - "checksum": "f90c1d79c51ee1a009dc05930fc40e9ee4c3840ca2412cc129855156aaddc279" - } - }, - "download_size": 407016751197, - "post_processing_size": null, - "dataset_size": 2060282008734, - "size_in_bytes": 2467298759931 - }, - "realnewslike": { - "description": "A colossal, cleaned version of Common Crawl's web crawl corpus.\n\nBased on Common Crawl dataset: \"https://commoncrawl.org\".\n\nThis is the processed version of Google's C4 dataset by AllenAI.\n\n", - "citation": "\n@article{2019t5,\n author = {Colin Raffel and Noam Shazeer and Adam Roberts and Katherine Lee and Sharan Narang and Michael Matena and Yanqi Zhou and Wei Li and Peter J. Liu},\n title = {Exploring the Limits of Transfer Learning with a Unified Text-to-Text Transformer},\n journal = {arXiv e-prints},\n year = {2019},\n archivePrefix = {arXiv},\n eprint = {1910.10683},\n}\n", - "homepage": "https://github.com/allenai/allennlp/discussions/5056", - "license": "", - "features": { - "text": { - "dtype": "string", - "id": null, - "_type": "Value" - }, - "timestamp": { - "dtype": "string", - "id": null, - "_type": "Value" - }, - "url": { - "dtype": "string", - "id": null, - "_type": "Value" - } - }, - "post_processed": null, - "supervised_keys": null, - "task_templates": null, - "builder_name": "c4", - "config_name": "realnewslike", - "version": "0.0.0", - "splits": { - "train": { - "name": "train", - "num_bytes": 38165657946, - "num_examples": 13799838, - "dataset_name": "c4" - }, - "validation": { - "name": "validation", - "num_bytes": 37875873, - "num_examples": 13863, - "dataset_name": "c4" - } - }, - "download_checksums": { - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00000-of-00512.json.gz": { - "num_bytes": 30085821, - "checksum": "6666a680b0a34eb8756dcb5fd2b12f0078237f3502e8a513bd3e5b71bb92be00" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00001-of-00512.json.gz": { - "num_bytes": 30065900, - "checksum": "61c3f9ab763067f76d9bea349d86efb97af7539d481b5d2807f362204971c327" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00002-of-00512.json.gz": { - "num_bytes": 30028880, - "checksum": "3aa4405d957ed42d10d643efe7c0f51b05e8f29cf4ad8783448083c1cd3f2a24" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00003-of-00512.json.gz": { - "num_bytes": 30136880, - "checksum": "f6eb49e4c0d691e67fe96ddeb3f8370c5e63a7297a31a8da0c58f5cb3a9f6061" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00004-of-00512.json.gz": { - "num_bytes": 30110499, - "checksum": "6e0908780f555f4b74c6a5055e2c9708333a8466f0b8723a8ea38cc04828ce44" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00005-of-00512.json.gz": { - "num_bytes": 30097927, - "checksum": "a333562df3fcd4c5ccf51b4c00e11f6619ac4a28a878383aefad277bd30131a6" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00006-of-00512.json.gz": { - "num_bytes": 30013820, - "checksum": "7c436cd0993077187988239cf74c3e64de440dacad62ba4b02bd4ac0a8d219b6" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00007-of-00512.json.gz": { - "num_bytes": 30557005, - "checksum": "dc9e43681c404fef1741e9608295b8dfae0953473993f3fc44fb83af07a6b82b" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00008-of-00512.json.gz": { - "num_bytes": 30369535, - "checksum": "8de7a4005acdb60436b4e5d7274084e28df3aee31a5457c6837452094544c541" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00009-of-00512.json.gz": { - "num_bytes": 30033048, - "checksum": "32310a6c74cbee1dbb8b196e0cfad41f79e88e48d8f04c88692d42506113b903" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00010-of-00512.json.gz": { - "num_bytes": 29948345, - "checksum": "b7df217de849e26ecce5ed7a35b6e6238fcc1c08e969023f209307842dd496c0" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00011-of-00512.json.gz": { - "num_bytes": 30558885, - "checksum": "82e5428aaeecf27141a7105e48b78dc02516ae6ebc3d6cd4ef13963316279e1f" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00012-of-00512.json.gz": { - "num_bytes": 29888513, - "checksum": "f3d7e496b7c85ed7d020c8f8a24a0b27f9b2535abdb22b45c08441a29398c44c" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00013-of-00512.json.gz": { - "num_bytes": 29936292, - "checksum": "bf04d82f0cdddc09ce4aecd9f71910b9858badaf6456253d43d89e6a8c56cba7" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00014-of-00512.json.gz": { - "num_bytes": 30169338, - "checksum": "15b4611513154de0dfc1c9d470326fd053adf70de814ecfe8ba7ccee66de947e" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00015-of-00512.json.gz": { - "num_bytes": 30071363, - "checksum": "887bdea83bdefc50786c93e8014d1d49999f8090ff15168598c884cd0724fec2" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00016-of-00512.json.gz": { - "num_bytes": 30451660, - "checksum": "288ad0d553d54052354be506f87878fa7c54b0fa65811c6e456b3262e1d117e1" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00017-of-00512.json.gz": { - "num_bytes": 29940254, - "checksum": "b13ad58ae9f38598cb9d560e3ab34c1d0200db73fe86da12230e50086b532463" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00018-of-00512.json.gz": { - "num_bytes": 30282186, - "checksum": "5a67e71955ab2d8f6531bd3949cd8ab71f4ff91863ea5a6ec3e7b33c31a05dd6" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00019-of-00512.json.gz": { - "num_bytes": 30373907, - "checksum": "a70682315a0cfe0af815c7b2abbcd63310fabbc33ad6e19daad19f1f51506955" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00020-of-00512.json.gz": { - "num_bytes": 30104199, - "checksum": "980e544ce130a06e9e99ec906342eb0ab8aeaa96ac26eca01c56ebb463f5d688" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00021-of-00512.json.gz": { - "num_bytes": 29733696, - "checksum": "a69729b8f3ccb9db12476a31917783c1c6e036e7bbbb4089f430362aef71f467" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00022-of-00512.json.gz": { - "num_bytes": 30012894, - "checksum": "589e698fe450e22cba47813a5a28da5393e79702a528f6a8469f72f6d630caad" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00023-of-00512.json.gz": { - "num_bytes": 30024851, - "checksum": "2a7b036c38fb4d2df6535631018c23d001931e5bf8d8a815fd5b2f9343ec4529" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00024-of-00512.json.gz": { - "num_bytes": 29906809, - "checksum": "7e512306cb6ebb0b0c3e96ceb16dade9e1e1f484e754bebd0078e7f545fc5b6a" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00025-of-00512.json.gz": { - "num_bytes": 30332268, - "checksum": "b636b91fcd9a91ce05b8cbeea6f591a0e916175ab23b0cfaf688171c8a98ae8c" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00026-of-00512.json.gz": { - "num_bytes": 30288490, - "checksum": "9e2f8e2a37dcfe66873cc5355740448ef75a1de2deeb2d8c047c3c3a7ee485c0" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00027-of-00512.json.gz": { - "num_bytes": 29897688, - "checksum": "882616d1e8ca66c0b6e7aa2ccb18d9239021603ab1b9486638a9a3447ddebe0b" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00028-of-00512.json.gz": { - "num_bytes": 30201690, - "checksum": "0312b12f50c64fbe7b894a28e0940089ad57af95df8116cd7d43c0435ec2e79b" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00029-of-00512.json.gz": { - "num_bytes": 30237920, - "checksum": "1e8677140186b219d32e764889dcc344ccac9db51685363324d1bc13ddef2bb7" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00030-of-00512.json.gz": { - "num_bytes": 30048903, - "checksum": "43558e81c291cbf53a5b6a016aecb0e07e26a98b8fb32f4a000037b281afa363" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00031-of-00512.json.gz": { - "num_bytes": 30294528, - "checksum": "c33ae8a2fad7e5264d093fbe89ed1611357110a4f0f26dd5a93a4dc15560f205" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00032-of-00512.json.gz": { - "num_bytes": 29868168, - "checksum": "5dc2a8f96db8da87607efc0b708e6a2172530f0c9b43665dc01286109b5c55bc" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00033-of-00512.json.gz": { - "num_bytes": 30105916, - "checksum": "c4cdc2b39a86eff251f903d7f3d39605b721615aeffa6a2753f3588b7dbef6c4" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00034-of-00512.json.gz": { - "num_bytes": 30126174, - "checksum": "6d874182112b0881dc929c0182a30ec4f9f1633372a2b822200a7b1faaf4f1bf" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00035-of-00512.json.gz": { - "num_bytes": 30084101, - "checksum": "5bea17f0cd4dd888f5d8a2d4092138e4777d80493a1f410d618d4cedf353b914" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00036-of-00512.json.gz": { - "num_bytes": 30095974, - "checksum": "6e7f42f3012d8ca7500c7e2ec82d27c26b3cd8bb5b8b66a7fc8355d77284f433" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00037-of-00512.json.gz": { - "num_bytes": 30239345, - "checksum": "54ee45bf25152060679bab3e5fc6f5cb5a3add6acd2664cb152f88c223f83239" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00038-of-00512.json.gz": { - "num_bytes": 30247683, - "checksum": "f738a2f0f156f7bd897d9d822748d4192a5fe46b566c7288ed5b840c4ffeda64" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00039-of-00512.json.gz": { - "num_bytes": 30057005, - "checksum": "60235900d69579334660c153c4fe384c08f14f4e729a06a1e8247e8b4ab8a213" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00040-of-00512.json.gz": { - "num_bytes": 30185136, - "checksum": "5a059d64fd6a1b42a2faeb4088db327c47f9e8328737ab74a0e0457f84433374" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00041-of-00512.json.gz": { - "num_bytes": 30314653, - "checksum": "2cfdc460c8dd0fb4766191ef2aec0af856af7c95d11eb3f1d731f63b71db4daa" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00042-of-00512.json.gz": { - "num_bytes": 30123256, - "checksum": "64e59b8ebde3c12b0a1d218a302252b96aeb5bb4976927463101a9509579ec22" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00043-of-00512.json.gz": { - "num_bytes": 30057043, - "checksum": "edd200b97394f15f9cf0a6289406a83b42c3d6f961456f031f5814db4f6d482a" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00044-of-00512.json.gz": { - "num_bytes": 30029900, - "checksum": "1b2980f21ee5cffb271591adc8eaa414438841426442f194b5f4b703356f4e5e" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00045-of-00512.json.gz": { - "num_bytes": 30367170, - "checksum": "83967210891345b831956722e8dcd29cf55fb17b786c85c2dd2778528ab4d1c2" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00046-of-00512.json.gz": { - "num_bytes": 30105866, - "checksum": "6921ac4854e2eacaeb4be07669faab85f2bab33f744c7efae1ce17be25176bb5" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00047-of-00512.json.gz": { - "num_bytes": 29957618, - "checksum": "e8eba2ba9f51e76a06a2df43b6b120c47b6e41f61e46a2e3331518ebb2d0c84b" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00048-of-00512.json.gz": { - "num_bytes": 30329887, - "checksum": "6af9c44a53d7eb9df9d86ee4d895fb9f7f2b9b3863fd30aae325e79fb792a10c" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00049-of-00512.json.gz": { - "num_bytes": 30116207, - "checksum": "57dc1e94f73b55e0be5690b01d61188a62186ea9f5f85b556ecef3bcaa36fb92" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00050-of-00512.json.gz": { - "num_bytes": 30236341, - "checksum": "eb75bdf0e63e798838b3d7abfc6a3bfab5de2ba39af833c38048dfe39c1175b1" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00051-of-00512.json.gz": { - "num_bytes": 30357091, - "checksum": "f48b1f5e07311ca9d69787019a56ad849932e6868d1f7778681cf7e4cc9fc562" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00052-of-00512.json.gz": { - "num_bytes": 29944959, - "checksum": "debf9490c057f11e404898b4a57cb424c1eb523fa90bb7899b1317f970481638" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00053-of-00512.json.gz": { - "num_bytes": 30240416, - "checksum": "9e847a5c6eb80e5c045fbb405729c695911674bd8d29b1d0be0791303d02f41d" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00054-of-00512.json.gz": { - "num_bytes": 30174556, - "checksum": "65a80db1cdde9153e08277ad2d9074dfba1682c0f771fbb9f4aa8f88ca557f43" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00055-of-00512.json.gz": { - "num_bytes": 30134394, - "checksum": "beb8d280d322520ded21aec92ae087867d0bce64aac4e243a127a88f143ff578" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00056-of-00512.json.gz": { - "num_bytes": 29891026, - "checksum": "82fceaec35a2456487a59ae652d72f41a940d2d6bafdc4f05a6e02bcd7ed4dc9" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00057-of-00512.json.gz": { - "num_bytes": 29920525, - "checksum": "e4fd55ba5fb2825ef4209aec87706ecdd3db040242c6aacfc82f350765fbeff8" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00058-of-00512.json.gz": { - "num_bytes": 30060421, - "checksum": "3cfc894a1853e3d1f2daa314873b7919fa52b7208b590637f8face6536305770" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00059-of-00512.json.gz": { - "num_bytes": 30038488, - "checksum": "4f06ab7b5ce8e8c696445db4a3e32896b6396e3f67d7414a593e7398d752e564" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00060-of-00512.json.gz": { - "num_bytes": 30129718, - "checksum": "7923385ee0c6801073feb10437ee3c59e5f5dfe82c2311ad8c4ec670dcc0ec87" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00061-of-00512.json.gz": { - "num_bytes": 30130505, - "checksum": "5cd682e148b8488775622098214fc2009ef9c95355f46341bd78434f1b560fa2" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00062-of-00512.json.gz": { - "num_bytes": 29968130, - "checksum": "53562fc23501f3a1d11c8ae6a59e719d6f4e67db8b8ea1d55e2b1b80849afd08" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00063-of-00512.json.gz": { - "num_bytes": 30116532, - "checksum": "008cc5c0cb7d60e84ffdfe2132f6bb49aafbb31083fd026067b3859326ca64fb" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00064-of-00512.json.gz": { - "num_bytes": 30236194, - "checksum": "8f9eee169071e80c94c248f1c37b7fa631bd75a7f6e401f6a963aecd8815910b" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00065-of-00512.json.gz": { - "num_bytes": 30077312, - "checksum": "8c5e18ea3575cd350e98d062ef88d3fd1df068e4bd410be8732723bda03656c0" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00066-of-00512.json.gz": { - "num_bytes": 29920862, - "checksum": "e377b8112dc6ff6834607c27b927636429e887f4ab8edc0824363941b7bb311d" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00067-of-00512.json.gz": { - "num_bytes": 30278223, - "checksum": "ec2c2ac74cc3f4f814d645410cccda266151949dd36aae518b8082b948b47edb" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00068-of-00512.json.gz": { - "num_bytes": 29940464, - "checksum": "ddfc16a17cabf48a2c59fa8ef25ccd12d899d3462d08b45f2a301567ccc105c4" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00069-of-00512.json.gz": { - "num_bytes": 29903118, - "checksum": "66d9d1791cda56607b2561199503cef216df86b28d4519d5862905671a4ec4c5" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00070-of-00512.json.gz": { - "num_bytes": 30082323, - "checksum": "8072d3bd5e19c005493c0332b73ca5be253397f54be90be1bb7b2ef8df7ad117" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00071-of-00512.json.gz": { - "num_bytes": 30128276, - "checksum": "b7c68af5a6dcac3fbb3dcbe12123d1045a79baf657a8b3bdada60c1a97404c48" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00072-of-00512.json.gz": { - "num_bytes": 30458419, - "checksum": "cfe5c6ae2ad1531271b0039042e033bdd7caf9604bfa219980ca27513cea755f" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00073-of-00512.json.gz": { - "num_bytes": 30366974, - "checksum": "a132f5e85376b0d0a06c6ae6af9c226dcbc98394461578c4fbc6cd439ba6e721" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00074-of-00512.json.gz": { - "num_bytes": 29987779, - "checksum": "f905e808b50908a7d2a7f0944e7e6c01ffd97ec16e5f0b6ed7169a60d66b0100" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00075-of-00512.json.gz": { - "num_bytes": 30070204, - "checksum": "b57458683803936f6bc03b06fc26be9d1a09ba09517b5c1518676f468e404595" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00076-of-00512.json.gz": { - "num_bytes": 30129238, - "checksum": "81e88ec53e39d6191e40e5852564f592b745abf99c71ff78302292632f636792" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00077-of-00512.json.gz": { - "num_bytes": 30051399, - "checksum": "218b0f6e219e42113e35d99458861f8511266dee6c17d9e2780a17af8877f822" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00078-of-00512.json.gz": { - "num_bytes": 30144230, - "checksum": "c0a337619559362e0e1cd0fe87c9ced5c987313a7f3cb65eb44f8b861c41c616" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00079-of-00512.json.gz": { - "num_bytes": 30544297, - "checksum": "27e257efda6adbce01585b3b6cdeefa95d31f607012fed5dd4310bfb5a790ba7" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00080-of-00512.json.gz": { - "num_bytes": 30188866, - "checksum": "26411f1a0a7b299d0bf6cf78db04b0bcc617894cd87d59e54614f3258dd393ee" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00081-of-00512.json.gz": { - "num_bytes": 30418881, - "checksum": "87a659f6b24560a754ccbfb6aee019484e48e3ddc7955a6c7a18aa9098952cfe" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00082-of-00512.json.gz": { - "num_bytes": 30086460, - "checksum": "708fe5108042b957688817625c84059c11700b18ddcea3814b86b6c8c66af8a5" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00083-of-00512.json.gz": { - "num_bytes": 30138639, - "checksum": "8d8681519538afdb7622b677ca5d3ae2a643382bae9639e3ad90c82d36477653" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00084-of-00512.json.gz": { - "num_bytes": 30228150, - "checksum": "db708760b9d45e0b20c8dde9b0008f01761d9bb0f37a194845b4d097a60e477c" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00085-of-00512.json.gz": { - "num_bytes": 30004564, - "checksum": "19ba55c7cbc44ae30a6497373fc15b548e5c45667f790c392857f6fdaa7e2bf6" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00086-of-00512.json.gz": { - "num_bytes": 29696360, - "checksum": "4cb07dd259a084818f9a79a4fe4fb7b24ea1adda0cd4fd405ba003e7bd481f12" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00087-of-00512.json.gz": { - "num_bytes": 29927300, - "checksum": "7c3c07dbc9c57881a3c1abab85a927f1ba609c58da9dcec22d7415079cd336b6" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00088-of-00512.json.gz": { - "num_bytes": 30038333, - "checksum": "59158c87d7e9e5011516f98dec1313758072ca6685c7ad9df5ee4a075d9ff8a2" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00089-of-00512.json.gz": { - "num_bytes": 30223506, - "checksum": "d3f39f7e90b4a82257779290a3f2de5619049d69b2169577f1e3c81791d85419" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00090-of-00512.json.gz": { - "num_bytes": 30266969, - "checksum": "88ed3237aadff809cec186fa378e176774d3f32aef1a6d8bfdbc530f64e8aed4" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00091-of-00512.json.gz": { - "num_bytes": 29885840, - "checksum": "b9a247993a8eec31b3f853d1329ae79da29397dd27eb4acdc196b71c091335e3" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00092-of-00512.json.gz": { - "num_bytes": 29942337, - "checksum": "3d83cc54c06cad8effdb7a38ed6666b5d912e6fffcf4c82471af064b0aabe05e" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00093-of-00512.json.gz": { - "num_bytes": 30129376, - "checksum": "d72ed9855fa86ceb4089435da3d78e8d4151b92185f828329b534d1adf3821db" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00094-of-00512.json.gz": { - "num_bytes": 29613450, - "checksum": "f61f74aa65a81616b97cbc34a8be1b563f83f69709642b8156eb76cdda02103f" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00095-of-00512.json.gz": { - "num_bytes": 30469526, - "checksum": "926d1ba2e4b191e75b0bce0cbe4c15f95f244445ec03a6095c009c34e36f897e" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00096-of-00512.json.gz": { - "num_bytes": 30126036, - "checksum": "e74818ad94e408498644dc71f1ed967f356f539418222f1dfea467a21c99badc" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00097-of-00512.json.gz": { - "num_bytes": 30374980, - "checksum": "d9cc8827ee38bddd1a31e48b2b0064a567520e3c0f2e1be745acef57d267e4d5" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00098-of-00512.json.gz": { - "num_bytes": 29928579, - "checksum": "090ad37fd9eaeb53308599f2da1053b19b1c6478adaea5a8a1c35d6c35340111" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00099-of-00512.json.gz": { - "num_bytes": 29901456, - "checksum": "c0e7d9a7cbc3b9b940077508441e471a1eb70e822479fcad726b900e6c196382" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00100-of-00512.json.gz": { - "num_bytes": 30033459, - "checksum": "b62033de618191de3200205e6e40725baf045e403060d10417211d47854d6bb0" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00101-of-00512.json.gz": { - "num_bytes": 30280468, - "checksum": "8726d092785856ec690dcd8a9edcd968cd04af1cfafe8a83192e3c0782f02b4a" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00102-of-00512.json.gz": { - "num_bytes": 29805195, - "checksum": "248edf4dd6c9a1137c7b45ab0b5a05a5fc93fd14cec17a5da4d758b9f7b359df" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00103-of-00512.json.gz": { - "num_bytes": 29995494, - "checksum": "d66b75c3f08a0db141d2c0162eb3dbc351e656ba1ba480e77eda051435d1390f" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00104-of-00512.json.gz": { - "num_bytes": 30318447, - "checksum": "09bd2068c20d33783f39322c95756fd3dbd0da91f4380fae3822cb33b7d06779" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00105-of-00512.json.gz": { - "num_bytes": 30209523, - "checksum": "0a399ecb1116890e1a0189cd2842d64d8ed53213b1623ae38229a6ac4f5c1c76" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00106-of-00512.json.gz": { - "num_bytes": 30476739, - "checksum": "540f682a7c977d20f920b5af1ec7e40c14a0d54f1718b43271e22dece9cdce16" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00107-of-00512.json.gz": { - "num_bytes": 30203291, - "checksum": "0dd51deb74ab391c54b20862f7df561f74d00be2ee4fc13987f91771870c099b" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00108-of-00512.json.gz": { - "num_bytes": 30265100, - "checksum": "172b09a108b154014077a415f644cd16db6a66f178bf780c120a6c4fecc3c0a8" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00109-of-00512.json.gz": { - "num_bytes": 30342649, - "checksum": "214a8f147f2d77ec0f3889b0a2d782e5d44230878359e695e9523561e6723a1d" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00110-of-00512.json.gz": { - "num_bytes": 30152418, - "checksum": "dc0d34ce7918b80ecef3528ec2b063edf7b12223c453ac7fb9d39232fecd81d7" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00111-of-00512.json.gz": { - "num_bytes": 30160329, - "checksum": "d0594cb69d26f0e853575d86f92b1aa233b5bb236804a2f496a792fa031014ee" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00112-of-00512.json.gz": { - "num_bytes": 30428351, - "checksum": "2b0542d973bab88e696fb9efbe042167600da397d776ef65344dce868bbcb0b9" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00113-of-00512.json.gz": { - "num_bytes": 30200133, - "checksum": "10dcb929692795fefcf4623040191d9cb6199fbb3b164648b62b9867e8392379" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00114-of-00512.json.gz": { - "num_bytes": 30205273, - "checksum": "f16631d5bcbbe133a01675286ca7667400ecc7e6df13d728015381d21ec71cfc" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00115-of-00512.json.gz": { - "num_bytes": 30164849, - "checksum": "bed27819db4bb7e02cb42cdda18acd232659a2eaa43eed910ba26d686cb3f837" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00116-of-00512.json.gz": { - "num_bytes": 30117752, - "checksum": "4eb4bec7adac3c2f431d356212f8a9d47136f0011f5f9e71dd29d82b1b823e2a" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00117-of-00512.json.gz": { - "num_bytes": 30062588, - "checksum": "79639624734885b3051b10f052f5486d7124bbc4bcd18d99348f3683ee2fc54f" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00118-of-00512.json.gz": { - "num_bytes": 30125828, - "checksum": "e922a4a5332a4182ddcf6ac8ba910024fe4fa878b524f7368b27373f75bbfe44" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00119-of-00512.json.gz": { - "num_bytes": 30156741, - "checksum": "a44aba8779b99ace2f212789389af058d12dfb0706221b296676d5e10528dd78" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00120-of-00512.json.gz": { - "num_bytes": 30489925, - "checksum": "82bec41bbea7bc5ddb67b3bccea51122da7d0922768f8bda7a0c9d489bd20cdb" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00121-of-00512.json.gz": { - "num_bytes": 29606989, - "checksum": "b49238f5b75aaf876657826cfbd4346d250f564a86bdb010aa1e85b44a969229" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00122-of-00512.json.gz": { - "num_bytes": 29770557, - "checksum": "0803ccbd505db47cd09b20d86cc6ad459c7a8d1c583a5ee756b0397369d8b6fc" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00123-of-00512.json.gz": { - "num_bytes": 30248121, - "checksum": "d73a1bf285a0355bd61a25891cd8c5fd9da66535ec515dc7e1602a769b994727" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00124-of-00512.json.gz": { - "num_bytes": 30131013, - "checksum": "65d2dcc7e63a28e1911717d149b907d0c74fda6e36db2840353a0290f7880324" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00125-of-00512.json.gz": { - "num_bytes": 30348971, - "checksum": "5dee3c7afe0364ccb8e36647d01e78ffe61690f29f29aa033efac9a0413c2a47" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00126-of-00512.json.gz": { - "num_bytes": 30370074, - "checksum": "1dc04b3755291842711623d1d6cf042e2d66987103a0c708f01c9136a8c42db6" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00127-of-00512.json.gz": { - "num_bytes": 30320846, - "checksum": "e31a27ba25bdf13e6f929fd38d53409dd3f50be78ad955b69b1956709de5aedb" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00128-of-00512.json.gz": { - "num_bytes": 30076235, - "checksum": "122ee9d293428a7a823c17b3a432b5b2198fa2a68bbb246b97e981bd09f78f0c" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00129-of-00512.json.gz": { - "num_bytes": 30569486, - "checksum": "918bf43ce3ab54d535dd02cbcd09f1081890be3287e23fd81bfa032beec61ebc" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00130-of-00512.json.gz": { - "num_bytes": 30280169, - "checksum": "ab0a53e8c10dfdd139281175b5fcfe3090fa238fcb383e27b1dcdfdbbe8a879c" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00131-of-00512.json.gz": { - "num_bytes": 30338899, - "checksum": "e54771e12a6f3583c3accf9bcc01b598819231f367e7f80cbd44cf6683c5c852" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00132-of-00512.json.gz": { - "num_bytes": 29969011, - "checksum": "f69d7052ca7657fdebe547a6e196b109285d5d4e4f1a68f3900a37ba6fecc22f" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00133-of-00512.json.gz": { - "num_bytes": 30179558, - "checksum": "cf2130dedafd8f47e97661a5b1555813433e3f7293b5c5cb222cf551d90a0604" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00134-of-00512.json.gz": { - "num_bytes": 30080257, - "checksum": "1a32902fc21633ae8d41e4e5518804f4c719dc8729b866ebc32d3c36fdadbc10" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00135-of-00512.json.gz": { - "num_bytes": 30284972, - "checksum": "6e3a78e7a530d91ee4578caf462a4c685a5f221f0cd8eb9639c9067e2b655a7f" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00136-of-00512.json.gz": { - "num_bytes": 30130265, - "checksum": "defc57340cbaa5f325994a91b5134789c84a76a4ca7b9fdbf993b0e634735f05" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00137-of-00512.json.gz": { - "num_bytes": 30146793, - "checksum": "7ce5035f452eb2e1adeff36d0c6d6d65c245d139a86ef48bbe10c5275975183b" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00138-of-00512.json.gz": { - "num_bytes": 30180265, - "checksum": "298849a53a8ea0e68d01cc137195bc36d686077bed722e1198337a1dee3c51cf" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00139-of-00512.json.gz": { - "num_bytes": 30398387, - "checksum": "ef2ac4b8f195141a79a357d934d5d97bd4d2c64027ec7509b5873a4ae32fcb9d" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00140-of-00512.json.gz": { - "num_bytes": 29652990, - "checksum": "290f1c99b696e345aaa6ac6d5a882a87dcf5d3939b08ba859a359d2459498785" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00141-of-00512.json.gz": { - "num_bytes": 30083642, - "checksum": "fb6a38388a25261d86fbd8ffea63e06bcbcbd6846a4eb6f13fd09d7fe5a1fbc3" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00142-of-00512.json.gz": { - "num_bytes": 30131064, - "checksum": "b61ccf6166ea4b777629bdc07d543f299bf7569deab18228ec5bb9edc8cd3eb5" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00143-of-00512.json.gz": { - "num_bytes": 30244435, - "checksum": "22812c50efdfcf2c0fdcf593639dfea09ffee8068321c30effc669c8234d4f3b" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00144-of-00512.json.gz": { - "num_bytes": 29725094, - "checksum": "79cfa65a3115193629d16606643d90dcf27d3108c320cc9e364ba19fdb9fb1d6" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00145-of-00512.json.gz": { - "num_bytes": 30335033, - "checksum": "e836f0bc9acba85fd1721d19cc24054e97defb0d12678bdc0d086f40deb9b1a6" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00146-of-00512.json.gz": { - "num_bytes": 29905680, - "checksum": "bf684871a235078390d6c6bb03fc2d5bbffec2b095806df652a19baf5e67135d" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00147-of-00512.json.gz": { - "num_bytes": 29852459, - "checksum": "0e716de5b3b09ec287b039be0f0dd6edd7d541aa6d3f9d2be18768e1cd5f4cd8" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00148-of-00512.json.gz": { - "num_bytes": 30364788, - "checksum": "4cef624e6b7c2b73dbfb47227e31681223a5a9369c4b7daef8606b796f010dd1" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00149-of-00512.json.gz": { - "num_bytes": 30096278, - "checksum": "fb448ccc7412f5ca8667004a70f3dd6e1b5e6cb7f6facc06564bd22b1d815593" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00150-of-00512.json.gz": { - "num_bytes": 29776995, - "checksum": "1e14268cf723bc7336b33896537643d21dbefc1f05ffd5201feb5fb1130f9683" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00151-of-00512.json.gz": { - "num_bytes": 30205172, - "checksum": "797224cf74063fbcaec741535278ccce141e6dbbdd69a2191d07f89816ab14fa" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00152-of-00512.json.gz": { - "num_bytes": 29845034, - "checksum": "77eeb2353f544c714deea68d4a781b498c40d7c1e27db3aade4987b381ca29c0" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00153-of-00512.json.gz": { - "num_bytes": 30258796, - "checksum": "0fc581e92e70dda031d72a4aa0bbd65b1e9b28884f0ef5dd5e895cbecb270609" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00154-of-00512.json.gz": { - "num_bytes": 30249734, - "checksum": "ba10dd0a24bded170541e23078264b82b35bc99e402db594e2335e31905ededf" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00155-of-00512.json.gz": { - "num_bytes": 30198742, - "checksum": "fe285ac893126062bcbc20df75a9f65c57d3a7391354fa7e62b7f6a7122d6e77" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00156-of-00512.json.gz": { - "num_bytes": 30168323, - "checksum": "d21826b71bc85dbc496dd947ae9ee79d62885cffb3fa7c47409feee6ab247f17" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00157-of-00512.json.gz": { - "num_bytes": 30241978, - "checksum": "fc41765301b62849eda0b7b08f792e45f03db458fb92063af70c43d7cd0d0bb6" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00158-of-00512.json.gz": { - "num_bytes": 29959715, - "checksum": "1eded3ce0bc099c7e198e9277719d578c3fb6c425bb2110cb0ca6ce469d1d19f" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00159-of-00512.json.gz": { - "num_bytes": 30109595, - "checksum": "eccaab5b694c2f0017fe1d423637872d5587f6deb316796f7c0ff5517fa28178" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00160-of-00512.json.gz": { - "num_bytes": 30201741, - "checksum": "4ceee71372da6112101665f5bbf942a85f065feaab924c6e3f83498169bbe255" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00161-of-00512.json.gz": { - "num_bytes": 30176266, - "checksum": "6ed829daaad190b2d50b626d840edb750a063afad95315ffe7604a193183a489" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00162-of-00512.json.gz": { - "num_bytes": 30018118, - "checksum": "dcf8509a55213425a41706e5209ad411afb715fb9cd8c1a8b8edca23fab7d6cd" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00163-of-00512.json.gz": { - "num_bytes": 30236016, - "checksum": "d93cfaabcc7197637f233896b5799527f27d5b2dc60f0f0411ee51f05f09c500" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00164-of-00512.json.gz": { - "num_bytes": 30150055, - "checksum": "cc7de5ed3c774ff1dc350fbb5167dc1610c4f9a0dbc7c5d60ed4cf08aaf23ce3" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00165-of-00512.json.gz": { - "num_bytes": 30348056, - "checksum": "b41c4a3b7b4e96262fe5c87d06fbeb000dc48cc1d304a475bb4f4e1af84a9afb" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00166-of-00512.json.gz": { - "num_bytes": 30015834, - "checksum": "0a0821b7628b9b019995a9f34223e2960ded84331ce1bb55089838becb8a170a" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00167-of-00512.json.gz": { - "num_bytes": 30282254, - "checksum": "1285af56d024efe2166fa892878d471948e1d4c996922c7673e3c0f7f0f76bef" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00168-of-00512.json.gz": { - "num_bytes": 29815124, - "checksum": "29ec54ed647725ca3b9aec3bae341151a8e2b708cf21cd87b4389329298442b8" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00169-of-00512.json.gz": { - "num_bytes": 30346843, - "checksum": "1791e3f8371a63f9f849b7bf430e70d3f4011dbdef572c166cc5d49d06162fd7" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00170-of-00512.json.gz": { - "num_bytes": 30175685, - "checksum": "de8f82986addfc64b88fd3041d7ee6fdb64e6f770758146dc4c9309df348e965" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00171-of-00512.json.gz": { - "num_bytes": 30145505, - "checksum": "0dda47f679666862de6343e1109ed92866a42e8fa129ee69e9f0b73f18b6aecb" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00172-of-00512.json.gz": { - "num_bytes": 30009998, - "checksum": "2990dae6c16b7d60652439bed8b80ee4cf93972f33d8511d3d6aabaddfeca5cd" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00173-of-00512.json.gz": { - "num_bytes": 30062185, - "checksum": "e154a969bba2bf9430e0c8307561de78599fd2bd527cb1f15bbaf8f8e88cdf23" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00174-of-00512.json.gz": { - "num_bytes": 30055129, - "checksum": "e714ae153e8a927c88fe577d4c27017985d3ed7f3d0f5470f9a5f25c2e901a9c" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00175-of-00512.json.gz": { - "num_bytes": 30091082, - "checksum": "5f47c663d1e15d94fb0057d303048be990c713f3285ada2c6233137b1d84d60f" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00176-of-00512.json.gz": { - "num_bytes": 30235767, - "checksum": "20b05e4e99e5a05f6a4c29b304803b895bb8816caea6203643723ca587d66128" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00177-of-00512.json.gz": { - "num_bytes": 30071950, - "checksum": "29294e4b224df4695c9342c6f23d5495de9a0ca6a1be7217aa2211506e8ac7bc" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00178-of-00512.json.gz": { - "num_bytes": 29932121, - "checksum": "6022ed3b2ceef02324e40d3c7407622c95ead2cd3d3c41ab15ff9dd218265673" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00179-of-00512.json.gz": { - "num_bytes": 30119251, - "checksum": "42fa0aa883d9db4303a4981e4e308b2432b031fbccc98c3e1994ec775ba8023e" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00180-of-00512.json.gz": { - "num_bytes": 30175456, - "checksum": "6fb2ebd61524846f6b1f746f9c6356045623beb4b685fe265a23446037c9cd9f" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00181-of-00512.json.gz": { - "num_bytes": 30029564, - "checksum": "b779d721bb135fceaeddebb0dad1bdb43c9067a5e8595b3d544dfa7a084eb9f4" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00182-of-00512.json.gz": { - "num_bytes": 30437016, - "checksum": "b388fc0e862d7f6bb5b879ff7c69c301038faf5b542f6b40cbea4e2096a41e6a" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00183-of-00512.json.gz": { - "num_bytes": 29994048, - "checksum": "8208eeca7bc76f8b1786c95939d321ca0c7ae190b1f12dae86738810e412aa8b" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00184-of-00512.json.gz": { - "num_bytes": 30338616, - "checksum": "49859e75d999f65de99f9236e649a81989360f0328ba684671057b0dd7cf5e79" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00185-of-00512.json.gz": { - "num_bytes": 30088874, - "checksum": "ff6d32fdd471d3076a9367c175baab84a5d699ccd6dcfe00c755f0b714ca6074" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00186-of-00512.json.gz": { - "num_bytes": 30193681, - "checksum": "82508ed104fc57de3062258eaea57854ab9e1934437a88dc0d8a9921f3641bbc" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00187-of-00512.json.gz": { - "num_bytes": 30171163, - "checksum": "409d6576b25ad27455c755e5484e3f51d5d9788962efabe1c32e06bb3febacab" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00188-of-00512.json.gz": { - "num_bytes": 30060432, - "checksum": "fae94de96fa2962ef51e2ea90a5f760a5cee5de249bfd9f56d7c7b4e5c20f6de" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00189-of-00512.json.gz": { - "num_bytes": 30180741, - "checksum": "25293d5cba09980086f380d9e9ab44543adbbdcd05ed08601248b3a2b16d118c" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00190-of-00512.json.gz": { - "num_bytes": 30207152, - "checksum": "ccfee160de15df5d88f0ff5a898a0c5b2d0ef4ebd6e6832715a9ef8a9904f88f" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00191-of-00512.json.gz": { - "num_bytes": 30143987, - "checksum": "4c579619e465d9d97451801147202826a3855e772ea6dc4e9968e43ce2b8c05d" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00192-of-00512.json.gz": { - "num_bytes": 30072097, - "checksum": "9c32ecb6d4ec9feb27c5b642879b464e68ca8804db161219503f624e7ca1166f" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00193-of-00512.json.gz": { - "num_bytes": 30172886, - "checksum": "8442ddc3843c72aa169ca67801ff865ff85e4183beb38faa664f4f1d1c22a5d8" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00194-of-00512.json.gz": { - "num_bytes": 30037105, - "checksum": "2942ecacb22cb9a2953c68f21ddf3368cd47ab1f2b2d8e1f5c76b1c849b28d91" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00195-of-00512.json.gz": { - "num_bytes": 30014854, - "checksum": "9e5c6815a5734403a7062bb27b2565d433a3520a401c836ac3f16e743a1dd949" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00196-of-00512.json.gz": { - "num_bytes": 30020510, - "checksum": "792712f0073c158b5f96f7a99d97970fca3819b69739d34d7d2b7f4b8b407b7f" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00197-of-00512.json.gz": { - "num_bytes": 30072566, - "checksum": "3ece37e2d0d0b26fbd839b5d3facdfd70844945a06867fb68b141f6b1378462b" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00198-of-00512.json.gz": { - "num_bytes": 30036679, - "checksum": "c3f37a9b89987dde4578b394b5c3916c2d4fd87e0902309b4c81af19b1d2d5ea" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00199-of-00512.json.gz": { - "num_bytes": 30195178, - "checksum": "ae01bb5515097a083afd498d8530e788d99671e7cf802c4402957d6252b2ec77" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00200-of-00512.json.gz": { - "num_bytes": 30064374, - "checksum": "2399d4869f3a8bb4a9adced5ec548a9a3fde1d4fbc4e3abd9a0a3b495fb9a8ef" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00201-of-00512.json.gz": { - "num_bytes": 30136711, - "checksum": "5c922040697bad8d7807d79f34f2b667eea63ceefba89b2d413fcd4d66497607" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00202-of-00512.json.gz": { - "num_bytes": 29962983, - "checksum": "e4df518d612a8614de73d5944a31d22ad06ec9ecd26fb52e500df71fe363c1be" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00203-of-00512.json.gz": { - "num_bytes": 30178998, - "checksum": "e84a98a176451fc82d940a64cdec821e320a648780edba6466b74a1966eca47e" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00204-of-00512.json.gz": { - "num_bytes": 29988832, - "checksum": "c6dc56388bc7c57cbdee8280895ab80da7b4d49c9a0101a685229c50cad2e2e1" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00205-of-00512.json.gz": { - "num_bytes": 30229414, - "checksum": "e7e5175b6a7372377ba3a0db439911e189db459787d48588183ac1a0198c5fa7" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00206-of-00512.json.gz": { - "num_bytes": 29914929, - "checksum": "eb263433133660ebe219cd5817dea3b546ef2fba0e15396b2768d7091117cdea" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00207-of-00512.json.gz": { - "num_bytes": 29912800, - "checksum": "7f8a5f62ba5912b64af5b02bd987b4d81727223ef8eff110022e89d01961366f" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00208-of-00512.json.gz": { - "num_bytes": 29900590, - "checksum": "bc2af142244601bb7a96859dfd9885196940e675ca217cfc7c73ac9c614ea938" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00209-of-00512.json.gz": { - "num_bytes": 30242768, - "checksum": "fa51a4337faecfc790ca925802f87f10761552e16578b880ced80497f62bba60" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00210-of-00512.json.gz": { - "num_bytes": 30039857, - "checksum": "3adf7482ec6a3ad106c8edca3645a94032c33f84fcd26bd9876f2b8a1f6b5722" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00211-of-00512.json.gz": { - "num_bytes": 29846856, - "checksum": "8e931aaa9c1f069c0eca0b4605277610df9d2d0c07a0dbe6191fb7081b0e642a" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00212-of-00512.json.gz": { - "num_bytes": 30022172, - "checksum": "21c8bba1c83544c27977b22b077fd77f8df9cd06bc4eb5e9e9a532c511498d36" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00213-of-00512.json.gz": { - "num_bytes": 29877918, - "checksum": "b64ebaa088df5c6230e69f207267a038705c38f4d327970e9117979e1c13d1ed" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00214-of-00512.json.gz": { - "num_bytes": 29906552, - "checksum": "55d833a2b78ad564e6532d1acd14511e8b48d703030e3bbc92d7c835c1ed38c7" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00215-of-00512.json.gz": { - "num_bytes": 30075441, - "checksum": "999c77c136d3df83601e33c823f389b133f33c4c0b03736ceace617b526cb293" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00216-of-00512.json.gz": { - "num_bytes": 30507152, - "checksum": "0b23d4e57eaa101c78bab46151add537668d2722bf0c50470c1b434ec3389ae1" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00217-of-00512.json.gz": { - "num_bytes": 30044236, - "checksum": "6abacfd53e231a38c714d436018cef9a58f53320026c2ebb27d6caf08f02d7ac" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00218-of-00512.json.gz": { - "num_bytes": 30047926, - "checksum": "01120ef69493d84c44d112a41c69a851edaf89232679366e812f240fd26a0e47" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00219-of-00512.json.gz": { - "num_bytes": 30349211, - "checksum": "c4fc219559f0f076f634fc6812d4b13c229908c1ae45c3b74c059fb3b8124f63" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00220-of-00512.json.gz": { - "num_bytes": 30063445, - "checksum": "11f712439d54ef062cfa1225328fc4faaef5f6c9c0b0d87a0a81d25a71350e28" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00221-of-00512.json.gz": { - "num_bytes": 30115660, - "checksum": "9a344857ef4f9d141b57df38e25f717153b773436d72c23e10289ffe67c315eb" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00222-of-00512.json.gz": { - "num_bytes": 30134562, - "checksum": "227cd1847a948e388b404b5cda9289f05510d4e22f0ae5ec4d5a87a8f7f98a45" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00223-of-00512.json.gz": { - "num_bytes": 30120819, - "checksum": "e0029aa6b612a98f76e37d82107fcb90f2b57ae8d52beea172b5153b76334f20" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00224-of-00512.json.gz": { - "num_bytes": 30371365, - "checksum": "1ce5242d163ca12dbb22655eb841bf80750b552353af4f84973285d823d0add5" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00225-of-00512.json.gz": { - "num_bytes": 30319212, - "checksum": "71cb82bb95107a7e0b7777a5fcaa0f76b465ba828ac47401babcf7289eeb2335" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00226-of-00512.json.gz": { - "num_bytes": 30020940, - "checksum": "b7b8d98ade41f52ece23e896bdc4c19ad034a92ba18adb5fac85c7271afbfa65" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00227-of-00512.json.gz": { - "num_bytes": 30109958, - "checksum": "b2ec382f44caf4e8e46fef2faf6bd2e4000420e6da2eb12a5d9f6e7efb4e1564" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00228-of-00512.json.gz": { - "num_bytes": 29940895, - "checksum": "ff86264683d0fdf9d689aa30e7889c4ceed21098b7c60a220db92d396614cb1d" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00229-of-00512.json.gz": { - "num_bytes": 30080588, - "checksum": "3a5502cedd61501055eb16adb6ef861c75880524c5468a69cd346bc03e98e219" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00230-of-00512.json.gz": { - "num_bytes": 30376399, - "checksum": "6d3a4171a1febe9149f6900e3cca5a38046ca9d59214b548a4ef9de7de754bbd" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00231-of-00512.json.gz": { - "num_bytes": 30031670, - "checksum": "a2c8d9bb3eb260d5d8a7dcafc4703540332e2896e5127372d380d7efbd567a3a" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00232-of-00512.json.gz": { - "num_bytes": 30132612, - "checksum": "c9dec917eff4d72c684d6f8373ca66839061e29d25f0aa5fd6fb7de5c30df469" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00233-of-00512.json.gz": { - "num_bytes": 30178285, - "checksum": "1eb83b8eb7e72b2b3e55420436bb17521b989d0627da46f8cc61fe9f420fd464" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00234-of-00512.json.gz": { - "num_bytes": 29991258, - "checksum": "5e14e2a9e8c0aba73feb9134c694e99baf57357bb524877322ff5181eedef1f2" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00235-of-00512.json.gz": { - "num_bytes": 30045172, - "checksum": "50a118a072498b5338802cceacb97a9aa9242252e8d76d305cf5f0d928fd4af6" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00236-of-00512.json.gz": { - "num_bytes": 30403542, - "checksum": "7d7605576975232579e422a1b72625ad6f9d714d27770725dc7b99ba258e1985" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00237-of-00512.json.gz": { - "num_bytes": 30242989, - "checksum": "22d152fa02c5a959e978ea4887dd873dfef7267af0a577b4d796ff0cb52d5c56" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00238-of-00512.json.gz": { - "num_bytes": 30214634, - "checksum": "6d0af6f396fa21867e899a7678c633e47bfe79bcbda29b8072c5d32ab20a9aa3" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00239-of-00512.json.gz": { - "num_bytes": 30255546, - "checksum": "d35a93632638b6283053b121f0f30d47ea20b2747d871c3dd0beb13f4ffbcad9" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00240-of-00512.json.gz": { - "num_bytes": 30347604, - "checksum": "fd052d532fcfe811d96f8433f79a684f68f76ec42bd959c76ae3b63aec0b2c3e" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00241-of-00512.json.gz": { - "num_bytes": 30135691, - "checksum": "12c80c41dc4d6313bce4a171999ecda93ffc59f2c70cca363bce214cd12dc9f7" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00242-of-00512.json.gz": { - "num_bytes": 30229834, - "checksum": "fca5b81914ac0c5fe0b0c1a554a1e62c64af5c98740df1f8ce8f48f2a62b6a48" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00243-of-00512.json.gz": { - "num_bytes": 30053753, - "checksum": "ba41c505579524e9d244354a70060c9a0131007e0b129f03e628bb7b7b512ca9" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00244-of-00512.json.gz": { - "num_bytes": 30216889, - "checksum": "54a391c1d2de7627e739f3cd94eeccd50a80d56a40606f7c5392f6098df456cf" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00245-of-00512.json.gz": { - "num_bytes": 29887569, - "checksum": "c3263ea7e16e0036961dad28fef57ce4f0495219e59b4e800af82b67b3c6c506" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00246-of-00512.json.gz": { - "num_bytes": 29906815, - "checksum": "a3dcc92aed81708434edee84397010eae4ffeaa38b39aaf3919256f72deee625" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00247-of-00512.json.gz": { - "num_bytes": 30074896, - "checksum": "019e983a95908651bfae83e37bda5200b3888b03ab235fc8db2d5b16742f028f" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00248-of-00512.json.gz": { - "num_bytes": 30108081, - "checksum": "6f68835ec02cf899f8f44a795b1e3117956ff5bb6c8946435d9861ae7a112df3" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00249-of-00512.json.gz": { - "num_bytes": 29957882, - "checksum": "9bed6b7f56d93fa3973d4f177dde0973fa0eb6fe17d8d85279d865531613f963" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00250-of-00512.json.gz": { - "num_bytes": 29822284, - "checksum": "1848bef8d11360df55a576c64147e519327b1178f77d3ec14ab9522b33b1c423" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00251-of-00512.json.gz": { - "num_bytes": 29956462, - "checksum": "425f69c361a8671cf571df577ac0cfafb4894de494360084b7cbe9cb8869bc3f" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00252-of-00512.json.gz": { - "num_bytes": 29733712, - "checksum": "7198e831e75eff1e116513f9cbe098c071f051c545b41d1943211a1d996a3c67" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00253-of-00512.json.gz": { - "num_bytes": 30450662, - "checksum": "0452804e723c919bd3c84217bb1dfc8764112fd70c5581f84520df7592f28ae9" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00254-of-00512.json.gz": { - "num_bytes": 29944765, - "checksum": "dbbff2253d70094537de481344e5706315271fdfce7ebaddc8d277ed05ddfe24" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00255-of-00512.json.gz": { - "num_bytes": 30321363, - "checksum": "79173dd85d535cee71afb52f7775bbf7289509bc555efe21a8700d36f7e5da25" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00256-of-00512.json.gz": { - "num_bytes": 29982818, - "checksum": "bacd191568e72da06c564fc7476225ce83440de6aea6c85ebe7f5279f1c15846" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00257-of-00512.json.gz": { - "num_bytes": 30338592, - "checksum": "998287203665559c27a66e889611ed716b7a389e403b2e857086f548b2c47b39" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00258-of-00512.json.gz": { - "num_bytes": 29911193, - "checksum": "ed9829f41a71cc187d0ddfeafc9cbde8e362b52914c988708a1a5ffbd3c152af" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00259-of-00512.json.gz": { - "num_bytes": 30227794, - "checksum": "2fe86814499a3379601a179acca1d440b3c79467827ce9ef9787e1ab311904e0" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00260-of-00512.json.gz": { - "num_bytes": 30206902, - "checksum": "c4efdad05d3f5e9f27884399ab0ec82081c26486e87f0ed5408a9eb80b223daf" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00261-of-00512.json.gz": { - "num_bytes": 30035514, - "checksum": "e47675a956a626a32b1870c61e6f98c3cfe9cc571901cf477abae982b4e63c96" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00262-of-00512.json.gz": { - "num_bytes": 30406718, - "checksum": "ae19c1389e26562322f745bafbd7839e7a95b3169743d48baa7ae7f2db2a0b5e" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00263-of-00512.json.gz": { - "num_bytes": 30266531, - "checksum": "289c9fee87f12ea22ad5329f80cb379e5e9c22c5cb6639077748958228c62bf7" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00264-of-00512.json.gz": { - "num_bytes": 30100823, - "checksum": "7c65dd5d90c6df49ca2dcbfdbf1b9fbb0789cb32043795942d88c5f2d7a99869" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00265-of-00512.json.gz": { - "num_bytes": 29957109, - "checksum": "e3a1b501b2cc3f5f2667ef179d7876db602daedefd0cd741c0898679b24984e6" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00266-of-00512.json.gz": { - "num_bytes": 30196603, - "checksum": "9337dd8240f168da5f6a8b57c5c169a2a400a9a160eccc8a6e44e7b32004ff19" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00267-of-00512.json.gz": { - "num_bytes": 30304605, - "checksum": "513eea4e78c399cc045e25f13bb5f77ddb6c9b606522bed8216945c529894e8a" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00268-of-00512.json.gz": { - "num_bytes": 30312562, - "checksum": "0503c5bf6848213c5fcb81a5c94307fc010d910a8989e104ad5fedca58c76f7e" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00269-of-00512.json.gz": { - "num_bytes": 30045257, - "checksum": "59bd3011d12d7d70b5fd64bc2dd2016b1a9ca6f0d210dbb3e6c202bbbf74ced5" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00270-of-00512.json.gz": { - "num_bytes": 30027628, - "checksum": "8d3ecf4c61acafc49b624d08b6aa31340643e030f6c2248f689e8a17d355359e" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00271-of-00512.json.gz": { - "num_bytes": 30014730, - "checksum": "b2e4820a0a7287786f802b3b40602c8ca77c7813b5f50db8a336b89b89bbdf37" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00272-of-00512.json.gz": { - "num_bytes": 30145705, - "checksum": "20c73e4a9056a5201621a4799b86c323c5136af43caa63a74298a5c3bee890a6" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00273-of-00512.json.gz": { - "num_bytes": 30165945, - "checksum": "8f07a91b6b40444635d869b94558fa68e3593626808bc6122d4e17403cf76101" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00274-of-00512.json.gz": { - "num_bytes": 30097947, - "checksum": "9530522c841d8f09ccb89f4f0238f7b9048c211e85b27449fb3c09d3bd2bab7b" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00275-of-00512.json.gz": { - "num_bytes": 30296359, - "checksum": "51a358db81805a20df4f920baacf3adea05209282f800fbedfc7fa49638a072e" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00276-of-00512.json.gz": { - "num_bytes": 30311407, - "checksum": "a51253cf73fb200053eb5fd5eca398a7a070fcaa27fc99b23389d09eef7fe5ba" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00277-of-00512.json.gz": { - "num_bytes": 30372345, - "checksum": "cc4f6d9040d8c4909d4ea5b661a7e54ba4775ff1c7c55db1ff686a56d428e2a5" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00278-of-00512.json.gz": { - "num_bytes": 30379507, - "checksum": "1052defa657524e1211e67d775a32243b164eda431c4c6ed351f0c6727f21b16" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00279-of-00512.json.gz": { - "num_bytes": 30195406, - "checksum": "6f4fdc92c516ad779fd521afba7d8d5bcd40672e63028f43f70fff4d7605f5ba" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00280-of-00512.json.gz": { - "num_bytes": 29902057, - "checksum": "c26f89efd0977465f45fe321036d88e2d6ca3ee1edc4bafe4b40ad1895cfc0e3" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00281-of-00512.json.gz": { - "num_bytes": 29779702, - "checksum": "094139d741b7a47faaaaf50093ab4edbef6ad1943985c6f453ce45a67a95b190" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00282-of-00512.json.gz": { - "num_bytes": 30063500, - "checksum": "280d69bfc795f1502a9e744d53d1a189051a1e771042721f8e6f74f6559e25a7" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00283-of-00512.json.gz": { - "num_bytes": 29956350, - "checksum": "505e49b7eeab46c77a324959eeff103f8899da1efc4d0fef5c0e6c6f8879a721" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00284-of-00512.json.gz": { - "num_bytes": 30146285, - "checksum": "9b075f2cfdb9a90fcdc7f779a52b0c5dad36385214844d4fd9df1e528ae78b6a" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00285-of-00512.json.gz": { - "num_bytes": 30160056, - "checksum": "d9b9f3cbb9ce2a0a0a1a2f7ce91e98621d48a7a900c278aeef437dc6c0a7cdf0" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00286-of-00512.json.gz": { - "num_bytes": 29844025, - "checksum": "6de9ff1013484662305e414725be2d0a4a1873a941250b95b80b5dea8919cf95" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00287-of-00512.json.gz": { - "num_bytes": 30089218, - "checksum": "444ff132c4a5330653b7319d34b2c7f4ae3b960d8b510cbd7389e3881f65ac5d" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00288-of-00512.json.gz": { - "num_bytes": 30092170, - "checksum": "46dc5b3b84e4387ad718fdf96b751354d7048e898ec664e0d3bdfc21ee841ec2" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00289-of-00512.json.gz": { - "num_bytes": 30365397, - "checksum": "b42e35746112198143ac18509e4f0148772db75e19f5eea9ed0d7e2849dbba48" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00290-of-00512.json.gz": { - "num_bytes": 30275920, - "checksum": "25d99877235c4b9dacd5d1dd7e9d16bba76cdf6cb1725fa617209142873dca0f" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00291-of-00512.json.gz": { - "num_bytes": 30125784, - "checksum": "51da68b6f2751a83e2534c342b6e9d69c419fb606b44c42b872d69f5f726df3c" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00292-of-00512.json.gz": { - "num_bytes": 30201021, - "checksum": "1e0a42b5e7ea7049c3c86b96d37c5d1c36f3ba2e2dab02145a897ef056fa6a87" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00293-of-00512.json.gz": { - "num_bytes": 30124224, - "checksum": "8c744f5c6eb92c0de70649cd773c0ad147bc7a1487b2ae7f1107bce9d19da601" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00294-of-00512.json.gz": { - "num_bytes": 30074708, - "checksum": "b3cfa4c4408c1a9f39b48e18a62e112ec3c132b226efe0850f9e58e2a517aa97" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00295-of-00512.json.gz": { - "num_bytes": 29990007, - "checksum": "012f63e147d22e34249e930975a2d8958a8d0b17350a9f6e368d702189b40d5b" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00296-of-00512.json.gz": { - "num_bytes": 30093755, - "checksum": "5573859cc485ae4535b83fd408dcc6a82f644832c93e6125db9a16dd6ded338f" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00297-of-00512.json.gz": { - "num_bytes": 30078472, - "checksum": "25e694485171ba1347ccbd7916c1b87a0d46acfd13795a8aabb1cb57b5eb1221" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00298-of-00512.json.gz": { - "num_bytes": 30327122, - "checksum": "6d6832cb3b1c86b6392bc9ca52f69a0bb16bf71c3c7664d9fe668ee259a40a30" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00299-of-00512.json.gz": { - "num_bytes": 30214180, - "checksum": "9f3c3d87a525874ea117e36e0b30d7f5cc6c64564506808058a0788d74943634" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00300-of-00512.json.gz": { - "num_bytes": 29895171, - "checksum": "e99d296965da2f731ea660889ce834cd1d21edf427298bab3a059ff3ebc64a2d" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00301-of-00512.json.gz": { - "num_bytes": 30131063, - "checksum": "e5eeb0f237cf986134c946bb3c2a4b5483fb9c88b3c2b16b9db26135043036d6" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00302-of-00512.json.gz": { - "num_bytes": 30184609, - "checksum": "4ac9bf5ca6fac7f7293238852424340326347ceaa6f5dfa6fddef8003421bebd" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00303-of-00512.json.gz": { - "num_bytes": 29956412, - "checksum": "559019fe1ef1f7e77ac53ad98b3556965ebc524ecb80bbc3f26255d5ae6e3609" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00304-of-00512.json.gz": { - "num_bytes": 29974071, - "checksum": "3c54edc4b6a7e34048cbbadb55cb3b16496a4e6e7334b4ede4e1368daf4c5301" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00305-of-00512.json.gz": { - "num_bytes": 30338106, - "checksum": "1c91c0c5bcc2bec0a698318ad6f576a06db7885c20ed7f36782427b80580a75a" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00306-of-00512.json.gz": { - "num_bytes": 30178986, - "checksum": "fff99f2758c2de57ccbfbfc6388f67e624d00d4a6cccb5820a7a8f5fcf02d386" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00307-of-00512.json.gz": { - "num_bytes": 29493455, - "checksum": "5d08c6e3909e21bed456ff9d06c983f14d3a277cb399a91047a692184f87c4c3" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00308-of-00512.json.gz": { - "num_bytes": 30228844, - "checksum": "04bffac195e24383d06b0ab9ebf019959a4e7abe8e8e6a0cdfbf0a8e7c23c899" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00309-of-00512.json.gz": { - "num_bytes": 30351688, - "checksum": "3ce14d5104d1318c6a16d042735f0a71f4452897de60d17408181ec5b135bbb2" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00310-of-00512.json.gz": { - "num_bytes": 29993012, - "checksum": "afad2f39bf4cb932e50d9a0be93940b423e7abcc3d67dac15b1939e4e40f4ce4" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00311-of-00512.json.gz": { - "num_bytes": 30448951, - "checksum": "a049c31ef6304084d33cb7bdd2e21ada0c60b40b1002b2369e60d36a5098c4b0" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00312-of-00512.json.gz": { - "num_bytes": 30034189, - "checksum": "557d1e88400a6d1d8ee4d717a959239edacbdd3e18d8cd20c5c85b77174dc302" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00313-of-00512.json.gz": { - "num_bytes": 30066486, - "checksum": "e4823ea1e9a59d5db84564a5b90c28fd8058450f238c60ad689ffd6b673d65f8" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00314-of-00512.json.gz": { - "num_bytes": 30397706, - "checksum": "1b4c0653e7ccf7fda0a53d8cbd5ddd57322ac83822e9d05bbdb9eb8ac979cf50" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00315-of-00512.json.gz": { - "num_bytes": 30219107, - "checksum": "9c364c9cab4ff7acdd1818b13de2f36713df8fa6c504ba15cdf47fe8e3c30206" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00316-of-00512.json.gz": { - "num_bytes": 30098661, - "checksum": "84dd8a8739b5abc39d8180f0894b1fbf2930d6d333d7c86b646f40763327397c" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00317-of-00512.json.gz": { - "num_bytes": 30178992, - "checksum": "16e4791b4e5ab3719dacf79fedb0b88ed54346372874c37ccb71d86bc419edc3" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00318-of-00512.json.gz": { - "num_bytes": 30022982, - "checksum": "98345a826aab12bdaf5e639205d5dcdc1da8fecd7cafc1982df89ac8d4df7ebf" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00319-of-00512.json.gz": { - "num_bytes": 30360409, - "checksum": "d53a39019a1627b42ae6bff68e283d37d0bb5f48b328c2c5cdcc1a3897f4e992" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00320-of-00512.json.gz": { - "num_bytes": 30347267, - "checksum": "c343a0eedf58484055e58762802ae8cc05f2cdb0b923785c493d056a2cbdb015" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00321-of-00512.json.gz": { - "num_bytes": 29967877, - "checksum": "cc5795d254ad749ccfe613034927bdf95529545ae1f277b694dd24a5996aca83" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00322-of-00512.json.gz": { - "num_bytes": 29885538, - "checksum": "d5eaaa1eea983bd37ed34651e6c16b746ff7c92e48038b234149fa6d04d3d866" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00323-of-00512.json.gz": { - "num_bytes": 30308848, - "checksum": "a42cfaef5e088fd6b24dfc121084a6cd038f5b0bfaecb9f33997ab22a97fb155" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00324-of-00512.json.gz": { - "num_bytes": 30351634, - "checksum": "0e2e6933f93466e9c8fe966f7770fe4c34caf182c713dad3206f4132eed1d41d" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00325-of-00512.json.gz": { - "num_bytes": 30077168, - "checksum": "77cdbf7040ce7f38d735fef41813ce63aaa16fcd87fce80e6ca6bd56d350c369" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00326-of-00512.json.gz": { - "num_bytes": 30031750, - "checksum": "8d994c2dc1b766e3270dce3f0b8f6f8fe22d5c1e0e9780e1bfed52c1292b8641" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00327-of-00512.json.gz": { - "num_bytes": 29845765, - "checksum": "f6279e351d016769d6fb5482d01a15ba054d5fe6f9f1c4e92c0663cef0083002" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00328-of-00512.json.gz": { - "num_bytes": 30253188, - "checksum": "2ea84aafd94d1843a2cc4428279dbb079c6ae0aae6c00f90ee4b5ace3c827afd" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00329-of-00512.json.gz": { - "num_bytes": 30124922, - "checksum": "49e3d91126d53eada7bbd87bfe9eaae74f059c69cd70a3a3b8101f49c1aca154" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00330-of-00512.json.gz": { - "num_bytes": 30026414, - "checksum": "07442fc4f7fb1732362293bc15a6754d70ecf4743392cf89c4497b3cd96269fd" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00331-of-00512.json.gz": { - "num_bytes": 29961847, - "checksum": "f437c6f5f758a5d32c8fc949037060259162864c29aeaabf37032e79f5a1cf0b" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00332-of-00512.json.gz": { - "num_bytes": 30167166, - "checksum": "96018497eb6dec020436c1333ff81980a64fb615997855fdd8cf35fe3f658db6" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00333-of-00512.json.gz": { - "num_bytes": 30192963, - "checksum": "1c12ea6b9031049dbc84e4da6b5fdedf480e989385d758c88322c415a1cabbb0" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00334-of-00512.json.gz": { - "num_bytes": 29847008, - "checksum": "c269285f15f626b4b15a7d1705ffa08e3f4d49ce13de8174b72f9f6276a1c6af" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00335-of-00512.json.gz": { - "num_bytes": 30262244, - "checksum": "179ee564e6fc644d9ee139bdb02d470a1172221b0f6e510ee5935683500f8257" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00336-of-00512.json.gz": { - "num_bytes": 30262910, - "checksum": "317933afdd8dc8a3a355e44ee3d84bbab12a2f30c98ea1172dde7074ed4c0557" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00337-of-00512.json.gz": { - "num_bytes": 30155329, - "checksum": "c5b850399252ec41b0fd9cb2da87ce25e5a44df9f44c6ed9d8c559a5729e5a0f" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00338-of-00512.json.gz": { - "num_bytes": 29952961, - "checksum": "48083123ba97a6212e0501799bd01936f0795bdd4d9c2710b9aa67d54b29037e" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00339-of-00512.json.gz": { - "num_bytes": 30403399, - "checksum": "313b60f985dcf591f34d351b758eedace655b6c6d3946dd2ddc55f34a9a97ae9" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00340-of-00512.json.gz": { - "num_bytes": 29917484, - "checksum": "2c72290f3bd51dea2a2877d68a968dc2b75dadf99ab3cc2230e41be45f3515d3" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00341-of-00512.json.gz": { - "num_bytes": 29905522, - "checksum": "1acd83a0da4a7a4912b589dbeb68b37396d0454371b2b71af4ae18b854d482ce" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00342-of-00512.json.gz": { - "num_bytes": 30022369, - "checksum": "8756be42335bba12d06de63e247659f8d603a092ff342360dfed645aec135c47" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00343-of-00512.json.gz": { - "num_bytes": 30229313, - "checksum": "863e29987a3ccfa08e14ae987c81367a53b9fe08795184db086117a9555e058b" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00344-of-00512.json.gz": { - "num_bytes": 29924335, - "checksum": "aa9003a7cc3527fb658fd807c78890587a8b35634a1f0838bc221a6374205d20" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00345-of-00512.json.gz": { - "num_bytes": 30229482, - "checksum": "a7e88b015bcf7761217e9b3ffd413f13cac48f6afe083353436de6cbd0d0018d" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00346-of-00512.json.gz": { - "num_bytes": 30029147, - "checksum": "b862ea62ac032c203c0038c061a44edabe4644be03b876ec7322e96762374940" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00347-of-00512.json.gz": { - "num_bytes": 29808182, - "checksum": "62915b86cbbf61a76f73d05509a8e839aae0b965134ef79022377625df7ef741" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00348-of-00512.json.gz": { - "num_bytes": 30091116, - "checksum": "6c384c2c6bc8340b88e085f8bbc2616be68c96fa7b8b88306b4500367d053a49" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00349-of-00512.json.gz": { - "num_bytes": 29867618, - "checksum": "bfb19508ecf8bd4d9a8847f0edab5acde6896182c27da706a6f2863bec43c152" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00350-of-00512.json.gz": { - "num_bytes": 29723106, - "checksum": "a645c62c94de9018175f15a0b38aa8bd2484601ee189b7c27d589288eb5af97e" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00351-of-00512.json.gz": { - "num_bytes": 30047620, - "checksum": "991061a23834e6bb3dc0595cf0e8328e07746d10fbf7a7ba397c1410cb66175a" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00352-of-00512.json.gz": { - "num_bytes": 29808328, - "checksum": "6c8e377a6cc82e81d66e2be3d23c1cdd42480015a68a1db458d542b7ff64ab7d" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00353-of-00512.json.gz": { - "num_bytes": 30040117, - "checksum": "ead6f32d98a91c47fb9c21334143f02181efb0b831705baeebb9820d069598fe" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00354-of-00512.json.gz": { - "num_bytes": 29953984, - "checksum": "ba349e503d017abbc1c83da2314c0a4892a9f3e5e480173812578f44d9b5904c" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00355-of-00512.json.gz": { - "num_bytes": 30179912, - "checksum": "2bfeab794bbe0432db52cc595d25864b17fdb0744a80d6d907f6f2ffc5c56b81" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00356-of-00512.json.gz": { - "num_bytes": 30312163, - "checksum": "d0dec696d28c601d3a1f75b0b6e6e711e00809f0d5ea915f63cb6d9b7adcc597" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00357-of-00512.json.gz": { - "num_bytes": 29931515, - "checksum": "d43c75371e32d0c1e65f43acc00aac3ca43762d4c6eb6bb61759ac5fca593a99" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00358-of-00512.json.gz": { - "num_bytes": 29739788, - "checksum": "96fef1b4a5d6a080ff5d4a10bc90911dcb2ddecb4be91d0c9620e6d2484e3ee3" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00359-of-00512.json.gz": { - "num_bytes": 29913841, - "checksum": "05b065d2d13b787ddee4707be7e2be46173c23794b9e8c773d0da743f435db17" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00360-of-00512.json.gz": { - "num_bytes": 29805295, - "checksum": "826104b9f4c2634d128f15564bd4990057dfbbb4066f2a082039d243bab56935" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00361-of-00512.json.gz": { - "num_bytes": 29839676, - "checksum": "ee5ba4cb14ecee0c857828a866615c6bfe45f67b158173dcac44146a02d97738" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00362-of-00512.json.gz": { - "num_bytes": 30154783, - "checksum": "d67b49e6fa5dc293fbd3057b7ca0beb7e0bd1ff692cdad7f2dfb7abadc1f4599" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00363-of-00512.json.gz": { - "num_bytes": 30126118, - "checksum": "6940704da6cde5822d48dc806280b8d57e0593ba299731e68ca9c2a4f7cf65bd" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00364-of-00512.json.gz": { - "num_bytes": 30184894, - "checksum": "e740b4a0240e691f16a423fd658aa3c7539986695418af3b5a171a48524db74f" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00365-of-00512.json.gz": { - "num_bytes": 30386766, - "checksum": "5a6a9461ef9ca579a849f6bef4d6225504a885aa797d3b2236ed8df6f5ea72ee" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00366-of-00512.json.gz": { - "num_bytes": 30208411, - "checksum": "8e0ce2447dfadaa4d41b991a2ce1be63b409e58e88944594dc8591bf9ab41403" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00367-of-00512.json.gz": { - "num_bytes": 30266003, - "checksum": "04ea00b46a583edea7740d74d719ef7f303b7f3873365b9ff4e94f08ef80832a" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00368-of-00512.json.gz": { - "num_bytes": 29993752, - "checksum": "38b1a55dd4ff1b504d2dbc0b2ad54fe43ab16c8bdba55bd97f4a55dafa8c83dd" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00369-of-00512.json.gz": { - "num_bytes": 29833222, - "checksum": "a25c405918920ed00edf5f3007cb8895b59fb67618dfea266b048273303b9592" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00370-of-00512.json.gz": { - "num_bytes": 29988999, - "checksum": "2812e6d9865d77ca8ac2d1499ba86be1ceed868a1da2bd13fbd0967058a3516c" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00371-of-00512.json.gz": { - "num_bytes": 29866636, - "checksum": "ecd1d3bdc41c3f41f8c9d3a63c75766c173f70ff117af748a08c221ca4273b18" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00372-of-00512.json.gz": { - "num_bytes": 30296883, - "checksum": "723d2c5ebbdd95ab84c53e458d81944b6907d08c7aec67300f012880624d0010" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00373-of-00512.json.gz": { - "num_bytes": 30310322, - "checksum": "ae45d088521f2faf9852cb169962176e84bbb81d5ba157d4228d348f7fcf60f4" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00374-of-00512.json.gz": { - "num_bytes": 30340527, - "checksum": "9b09c9e1b424fd05540b720c5a85f71eea43d743dc4ebb318e839125ccac9383" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00375-of-00512.json.gz": { - "num_bytes": 30193692, - "checksum": "c3ca4bb179cadf872f25f1cdb5c3667933bb8dfb7af21068a24b1b09c961dfa8" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00376-of-00512.json.gz": { - "num_bytes": 30184130, - "checksum": "5d801f4bc20c4c6d8821ccfff06cb5dfe4214e571734feacbea3325462afa280" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00377-of-00512.json.gz": { - "num_bytes": 30259301, - "checksum": "ebf08508c24e29a8a14b72248f090d765b02ee7a31296811d0391f2a2e73c046" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00378-of-00512.json.gz": { - "num_bytes": 29650049, - "checksum": "c13e994e68b938ca069d2d412e7891cbaf2ee205d65b1c17c6acfea01adce157" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00379-of-00512.json.gz": { - "num_bytes": 30265211, - "checksum": "667da6f0650dd684aa50bc691b5783968ae8cab847dea14fc8d8bfe203e351f4" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00380-of-00512.json.gz": { - "num_bytes": 30429631, - "checksum": "7cf0e9ae00bec72f571d152730107efdd944176818600517fb2d0412a859d366" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00381-of-00512.json.gz": { - "num_bytes": 29889471, - "checksum": "f781b3128e92c54365be7771695555378067a65fb922e04062ab6f3f092ec827" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00382-of-00512.json.gz": { - "num_bytes": 30029894, - "checksum": "2d133def2bc4b840312ebe5c466c9f22729b67aa4c2a41dda2e6a9a55ddcddbb" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00383-of-00512.json.gz": { - "num_bytes": 30249255, - "checksum": "e8610abf7e2bd70b1067a1b2dbf392ac32be156945502629228969974d3899b2" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00384-of-00512.json.gz": { - "num_bytes": 30362665, - "checksum": "f217071bd0c1b1bddb3342c85064d7ebb54bcde2512997636f0638a0b3641588" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00385-of-00512.json.gz": { - "num_bytes": 30080234, - "checksum": "2db4b15c7391b6e6d3791721ee574d09101df597110feebc59e4f0aff4df6c26" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00386-of-00512.json.gz": { - "num_bytes": 29897704, - "checksum": "035daed74487c5262b8cfbefdfaefd17f2834c7b4a1d293934d755e059b58f5b" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00387-of-00512.json.gz": { - "num_bytes": 30072139, - "checksum": "73013fbd06eaf94a7c8a0f0de420f83bed56655fb2d4e5d93972e8ca1847d130" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00388-of-00512.json.gz": { - "num_bytes": 30123843, - "checksum": "5db846c3d0b36774ce771ddfa8c53a915767926a2ad48222256d839326336f19" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00389-of-00512.json.gz": { - "num_bytes": 30278955, - "checksum": "9e4c590e67b2fbd357af955e39864ffe73dda201d76759935fda80b10b463500" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00390-of-00512.json.gz": { - "num_bytes": 30013591, - "checksum": "90974ba6eff489e0f4f52187b6241120740c782945e86525cb5d1e551a54e322" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00391-of-00512.json.gz": { - "num_bytes": 29925212, - "checksum": "10fcd62813434e2557b5861fd8604f534952561065bee9dc525b1cd3f5b2730f" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00392-of-00512.json.gz": { - "num_bytes": 30016498, - "checksum": "da88b36bd3f15551d8fad115a86f111cc5c3d9a3c6fa9497214aabec7bcd6aad" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00393-of-00512.json.gz": { - "num_bytes": 30061083, - "checksum": "1ed9881020f240e1277e6513bc2abf24ea48e9cb0046d7e87a6d3669c8b42a0f" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00394-of-00512.json.gz": { - "num_bytes": 30043459, - "checksum": "a35c3de1b0c982df8471705574e6eb7cc730fff122ff17d1381f2c7b9f20d6bd" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00395-of-00512.json.gz": { - "num_bytes": 29921106, - "checksum": "f4cf52f8d6a1288773cc366469df140f885b233fb6aa1cb75387a450d88ec94f" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00396-of-00512.json.gz": { - "num_bytes": 30024980, - "checksum": "5ebe04e54e4242d52aacb4c2e107dd10e609d5a7a6ff0425d9952bed98ef4921" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00397-of-00512.json.gz": { - "num_bytes": 30096825, - "checksum": "3ac381004d8257aa50fb28f0fd2171abbb93ad825c3f43422b9dbec6e1c6f31b" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00398-of-00512.json.gz": { - "num_bytes": 30059739, - "checksum": "40c38af325f4d01ae7c74aa9cd8f8d1c96c6af851175f80d3c50d85c5f5d3585" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00399-of-00512.json.gz": { - "num_bytes": 30049826, - "checksum": "2ba0109b2d5b88422250bcbd2494cc6e11528710f38fa6e83a1f699b840b68a7" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00400-of-00512.json.gz": { - "num_bytes": 29953506, - "checksum": "010610ba3af3dbfbcf2fac93136b7066fc58eb914dce9ae999722d0cfec4d331" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00401-of-00512.json.gz": { - "num_bytes": 30271141, - "checksum": "29587bb4be2c367f6479705b5c3c28716affeefc857ac1f77e4c33e55264def0" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00402-of-00512.json.gz": { - "num_bytes": 29861236, - "checksum": "8e399149c335ec599f881fada448c9b4be22326357153c74b0de627078f1d43c" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00403-of-00512.json.gz": { - "num_bytes": 30175831, - "checksum": "0d2800836914a1e2ef4a1aaea6e70d19699fc2555582ec670223177cac05a4fa" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00404-of-00512.json.gz": { - "num_bytes": 30097682, - "checksum": "f9665e9199978b123feb962ce347b30cc1520626c32dfef0ca3cd8895a45e445" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00405-of-00512.json.gz": { - "num_bytes": 29810961, - "checksum": "8ea29cf9f7774a16a4c2aaeff1b6353de2951073676a9c411f19b0a5fb755b07" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00406-of-00512.json.gz": { - "num_bytes": 29963498, - "checksum": "90b10c91f6e0006576ec9b426c424e50fc1726c25ae8eb91bf91bb9001ade2e8" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00407-of-00512.json.gz": { - "num_bytes": 30089554, - "checksum": "cfa905514e4f19c4eb82e438f5eb987731004476f026f4bebbeeafbe519ec85f" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00408-of-00512.json.gz": { - "num_bytes": 30148002, - "checksum": "dddada59e2ef306cdf83b7c9ce3c912792237852053a4ea683224438a242c5ff" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00409-of-00512.json.gz": { - "num_bytes": 29989174, - "checksum": "907667ac304b6cca7100a9606e915c003fee43f1640d5b01405beb16eac4c379" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00410-of-00512.json.gz": { - "num_bytes": 30519580, - "checksum": "acd5cd2ecc46927046c81c9bb3459dd72a98e346ebb59c13c0db08fbb60961a0" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00411-of-00512.json.gz": { - "num_bytes": 30408107, - "checksum": "6a9c2d42717f853cd4a76fc5275e95e2a584b7465c6059f586f6a06417048a42" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00412-of-00512.json.gz": { - "num_bytes": 29699198, - "checksum": "29e76bdab47496ed61a102edd3c61c20e60ab52abeb8e6068f7aa4ad1868f4fc" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00413-of-00512.json.gz": { - "num_bytes": 30065457, - "checksum": "b4a33941d0b994b82e3be351542cb4a832742e050ebbd71481e7ba34c8dcbc3b" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00414-of-00512.json.gz": { - "num_bytes": 30342960, - "checksum": "4ba7edb3c77a45f0e4cb7e969053db6f44ce8c0a8ef262582512814b1161d9ad" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00415-of-00512.json.gz": { - "num_bytes": 30201576, - "checksum": "25cb4eb4bdf3cd1b29289a23696be8bd41c5f577294e94607bea7b91252a04fd" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00416-of-00512.json.gz": { - "num_bytes": 30021170, - "checksum": "60472bd2a2896bfb57baabb583fc6cdd402a1d776f6a4c9bb58ed556e67cd76f" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00417-of-00512.json.gz": { - "num_bytes": 30237505, - "checksum": "aea8fd33c2acf1cef890549b1f88b18a2eeb37f6d4dd22b552f735811ad0b8a1" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00418-of-00512.json.gz": { - "num_bytes": 29999334, - "checksum": "93583d771ce7f0e1d044de2919a3ffdd48b7b7dab0cd3b6dc459200dd53d8762" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00419-of-00512.json.gz": { - "num_bytes": 30194801, - "checksum": "cd36e129487272742f3e60ab6512dd79b3d1ce3c22490d2e47c00c2ae595cfc6" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00420-of-00512.json.gz": { - "num_bytes": 29903898, - "checksum": "6f18a5ffc7efe5f555b02d3a31ed43714e09e73f7462206220d70450f47cd6f6" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00421-of-00512.json.gz": { - "num_bytes": 30015573, - "checksum": "cfacef2cffd953425eaf4d7b2b6cf5d2637bf5d58c6ed2bd0002442795c7d36c" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00422-of-00512.json.gz": { - "num_bytes": 29966521, - "checksum": "14f646b15948cf586ec1abd4bf4bf45bf180913e4d09049fa779bc7a196e455e" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00423-of-00512.json.gz": { - "num_bytes": 29972805, - "checksum": "ad7d4ab443c7a8122976570891a225a44ff86d2299d70706066633a6204eb0de" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00424-of-00512.json.gz": { - "num_bytes": 30317886, - "checksum": "37c8bf3b535ea4053aa2424c846e3449f9eb27d5ff999e1e93b6cee0aa975333" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00425-of-00512.json.gz": { - "num_bytes": 30059310, - "checksum": "674ca5eaf6a88f76881c8a1c48e1e0f93794785ee5ea17fb70f49228d7f39614" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00426-of-00512.json.gz": { - "num_bytes": 30182498, - "checksum": "988d08cd18162d9a309155d2e75cd4980f76ab4c73ef8286edae94ca4628ebcf" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00427-of-00512.json.gz": { - "num_bytes": 30253874, - "checksum": "aa8c08a684ea0bbfda9297aea07429172a2fa4a161268b964421796173275b35" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00428-of-00512.json.gz": { - "num_bytes": 30055421, - "checksum": "b1ed26e826bee7fcbc31cf1c368c9a63eeedbea1c2fd0fb07370b461a03d1a7f" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00429-of-00512.json.gz": { - "num_bytes": 29830674, - "checksum": "3efdc67ad7a108416dae47886e542da5c2ab1cd7e1aedd25c1c5d4e0607572f6" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00430-of-00512.json.gz": { - "num_bytes": 29938000, - "checksum": "3221ef5e4c28d44c1da4fa04689f318217991c07aff4fdee5e1091fe8e1162ac" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00431-of-00512.json.gz": { - "num_bytes": 29829687, - "checksum": "225f4e22df1b45a7dc9fef2f5a44da8f8ee25608cbe34195e21b49c8cd10f3ed" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00432-of-00512.json.gz": { - "num_bytes": 30006209, - "checksum": "9fc53637db7b16c8cf6f824adf21d4602efab715ad78eab62c4be7981a8bbc1d" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00433-of-00512.json.gz": { - "num_bytes": 30656456, - "checksum": "6bf7b701dc18f68d0facd7cdea49a26cdcfdd7829d5346eefe555485cfa7f336" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00434-of-00512.json.gz": { - "num_bytes": 30138891, - "checksum": "793532f72aa41c1dd7c549e9597fe8e73796c53eb5fe410a73de418ec446d686" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00435-of-00512.json.gz": { - "num_bytes": 30430276, - "checksum": "0d13d345ad12999fb4e7a9675e08bb1c90980fd193ed8530e4258e07bd6ea754" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00436-of-00512.json.gz": { - "num_bytes": 30173309, - "checksum": "fbce5fadb4b49bf833f77337929d873b2b25c3b564f7622f3672dde7a044e5d0" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00437-of-00512.json.gz": { - "num_bytes": 30142240, - "checksum": "76c34800a3223f5fe0f1960f3d3c9dd9ecdc2e652493d71ef245415b5027c902" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00438-of-00512.json.gz": { - "num_bytes": 29979673, - "checksum": "4784c3787d24b9d46ad7c835683c6506c2e55c84835391e2aca0355f032a1888" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00439-of-00512.json.gz": { - "num_bytes": 30169105, - "checksum": "5012d03e637769d7494bd3cef0a8dfc8b38c995e0d5780089c15d6b1495b3a8e" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00440-of-00512.json.gz": { - "num_bytes": 30107004, - "checksum": "529beaf4ad0251e35be574b1f623571526ec91a588ebd7df43e9d1cb99445f53" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00441-of-00512.json.gz": { - "num_bytes": 30324563, - "checksum": "f5e5fbf5e329f5bb0e83f758b8fc76516d65c3f91ad97e328187eaea83e4b667" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00442-of-00512.json.gz": { - "num_bytes": 30335681, - "checksum": "b8a26ed60f87a87347886b4467aa576ec5e8c106931589a1aa821b99fdabdb54" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00443-of-00512.json.gz": { - "num_bytes": 30155655, - "checksum": "e27bfb813fd6aba96ada81b095a559f0b7847cd25f7f8973663b19cdc5b8985a" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00444-of-00512.json.gz": { - "num_bytes": 30340540, - "checksum": "705dec13ba2824d45e801bc2cf3e709d6492b1ff6de2f9ddefb5a57dbdada4ca" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00445-of-00512.json.gz": { - "num_bytes": 30248960, - "checksum": "09a6b83910369cf269c4f095607fb2f0ac0ec7e25b501f577fe13920a8573ee0" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00446-of-00512.json.gz": { - "num_bytes": 30316703, - "checksum": "8f88b794c08bb492f50073337a30aafac0d05819505b507ab283dba0cf17d125" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00447-of-00512.json.gz": { - "num_bytes": 30184407, - "checksum": "38c819df823197bea6d647c3f78bcc15024aabba814cae322c1663c45fa8382e" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00448-of-00512.json.gz": { - "num_bytes": 30238484, - "checksum": "8c0abfb8dca37a179b01dadd2227206cbe6e5b916d0111c0b00d2edc3951c7f6" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00449-of-00512.json.gz": { - "num_bytes": 30143151, - "checksum": "9731e9644e5615d5d5ebdbacc6efa6382df856c8763b7485c9a5838864c1332f" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00450-of-00512.json.gz": { - "num_bytes": 30122606, - "checksum": "3b746f616f21c91277cde8e6d0d7f792ead7874de7ecdf11830a4a56db3dc799" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00451-of-00512.json.gz": { - "num_bytes": 30128179, - "checksum": "d6cadfc64ee39c9beb93f0bf8c169ca9d9053e0f76e1c9697841438e20dddef3" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00452-of-00512.json.gz": { - "num_bytes": 29979326, - "checksum": "42de19ffc3ec821fbf5ff686d1b36d189ad9ee5c4553a2ff0d003ee1a754c9c8" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00453-of-00512.json.gz": { - "num_bytes": 30118272, - "checksum": "22f9b2d3a9f089f1015f74d1ca0aca8f2a4970595326d964817177cbe6859271" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00454-of-00512.json.gz": { - "num_bytes": 30018294, - "checksum": "17c16895edccbb8b40fcc52cbafc0c15957020eb530e071dcce34544d5958bd1" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00455-of-00512.json.gz": { - "num_bytes": 30155903, - "checksum": "8b9d49837b309c3389d03dd3bbae92395bf7086134fbc69d28d9fff60a90d4a3" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00456-of-00512.json.gz": { - "num_bytes": 30282104, - "checksum": "ab63fd2efb0cc883d303241b3488a8135a196db7edc844458cfc1483898ceb3b" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00457-of-00512.json.gz": { - "num_bytes": 29920723, - "checksum": "dbde2eeef90144b209ef5afa6d5165ad638ae57d919926a379a10fccf6850a61" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00458-of-00512.json.gz": { - "num_bytes": 30163167, - "checksum": "800307106f5861e0bc246bcaae214e6dadeee849905cac184ecfe6d0b560fa68" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00459-of-00512.json.gz": { - "num_bytes": 30248893, - "checksum": "3e78d327a9463929f33311e18116f5d1d2ae4926f7a600378875ba854cf5ee47" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00460-of-00512.json.gz": { - "num_bytes": 29840067, - "checksum": "047568a5dad00b04ca1ea4aa262c7a4af9b61e87bc4ea02ffd5c6c8c049bf8a5" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00461-of-00512.json.gz": { - "num_bytes": 30179062, - "checksum": "ed8abe7b465bc19150b831632cb7afa298d6cb4beb9b6043a35a0f8afb5f730d" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00462-of-00512.json.gz": { - "num_bytes": 30266398, - "checksum": "d7b74f5c1c1f7bb489700adcfb7e48400c4fcca7669e2d56396d9fabb5a63b91" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00463-of-00512.json.gz": { - "num_bytes": 30158800, - "checksum": "224815aee29f6d04ddbc7457c84338eef9b127a767e7b50ed77283ff166d4f93" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00464-of-00512.json.gz": { - "num_bytes": 30393915, - "checksum": "0dd019fd2c19936ce2e6410b65872f630131c5da7543c8e66fa87547fd1a2209" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00465-of-00512.json.gz": { - "num_bytes": 30148939, - "checksum": "6d74dc9d74d28c2b8ba8d43ba3d594af0cb176cfa7bf738f3933be2a9c37bb85" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00466-of-00512.json.gz": { - "num_bytes": 30268228, - "checksum": "0e201327066f28c19b082fe35e4fb3bd76c8fd2d32236d1d6e2309489152aa66" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00467-of-00512.json.gz": { - "num_bytes": 30121937, - "checksum": "7352e5a9ee66dcbeed2c9e1fbe6c9355f0e5dd1b30b592a9fd5690958945e5a9" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00468-of-00512.json.gz": { - "num_bytes": 30004669, - "checksum": "53876848336ac57c082c9d5735bc1717f69ef38688b221d5e5ab9cd9cb4ec620" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00469-of-00512.json.gz": { - "num_bytes": 30049860, - "checksum": "a5a720b38f106dd5d2a2b7647748b52b4531ac12294e3b0d8dbc92062639c0c3" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00470-of-00512.json.gz": { - "num_bytes": 29961380, - "checksum": "9611764fc4f84b92e86fa6f9ea41464f6c26b07d1c51241b627a3d155e99d163" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00471-of-00512.json.gz": { - "num_bytes": 30449164, - "checksum": "db508df549d518c3e8b99b2f0098ea93fead1e632f53d8ae2cebff1d3476577c" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00472-of-00512.json.gz": { - "num_bytes": 30312620, - "checksum": "1993b5e292c6c60a3373aabe896f1a57afaad73fdce0ec60e30696368f7c0afa" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00473-of-00512.json.gz": { - "num_bytes": 30406764, - "checksum": "913045c61fb5a145379d9fe08c91ea63092b197400c0c87bfa65af91720b563c" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00474-of-00512.json.gz": { - "num_bytes": 30078563, - "checksum": "c495119e150b083d709ca915abd760683793361ebf3e079b04efc9b7e1900379" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00475-of-00512.json.gz": { - "num_bytes": 29860761, - "checksum": "50bb5f40d2e91ab136aa63063fff860529c8961f2a38500a645b10339751589e" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00476-of-00512.json.gz": { - "num_bytes": 30199778, - "checksum": "c969cfbb7ed7716f665b336b2ed9f7b10b532c7adc6d8a347964831a39cfef0e" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00477-of-00512.json.gz": { - "num_bytes": 30130742, - "checksum": "54c8b89102cf882eda5208544a6c5d317c1defa8d997f9450ebd576e58f91830" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00478-of-00512.json.gz": { - "num_bytes": 29901444, - "checksum": "f669299d794ecc0523c64ad31af8fcce5cf3f880e87fd73f4c3f434425e9b238" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00479-of-00512.json.gz": { - "num_bytes": 30587214, - "checksum": "25d0fbd9027deaf140650f0b82a2316c37939f199fe7633b9f643684404f2029" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00480-of-00512.json.gz": { - "num_bytes": 30145237, - "checksum": "68a29728290e1199ce8d1ac060365bc443ea67c24292b2b04f1b4ca44ca7238d" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00481-of-00512.json.gz": { - "num_bytes": 30204159, - "checksum": "1605034b89e33f6794c901adac1eb200bb489f76b9bae6bc56b01e9f6ab4c254" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00482-of-00512.json.gz": { - "num_bytes": 30430794, - "checksum": "2dce9df095e89ea6645fb599f518612511a62b6c475808ad004c32968b19bae8" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00483-of-00512.json.gz": { - "num_bytes": 30102412, - "checksum": "c7c626977521b0d1f5bcc02c484b3eb4f517ba71006a4802df08a0f4cfb8ea9e" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00484-of-00512.json.gz": { - "num_bytes": 30171871, - "checksum": "519ed997f1f1f1de7864b0bddf202b25e25bed349f63593a88337262d7705968" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00485-of-00512.json.gz": { - "num_bytes": 30049539, - "checksum": "8d2314fd3239ba3dfa99962c1d0a38e05edf9194e1faebae88f6b19ecab8fbf7" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00486-of-00512.json.gz": { - "num_bytes": 29949995, - "checksum": "a7521e09cbe77098c23172427bfb931dd50f0c9d58b034fd1621687849a8d379" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00487-of-00512.json.gz": { - "num_bytes": 30345072, - "checksum": "ebc6254a4d241afb886b8df20819301121fcb234a32a1dd4ee8ae49571081f92" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00488-of-00512.json.gz": { - "num_bytes": 30300622, - "checksum": "509bba28ddf770d38554a2e846f2ce0d2af59e3662a6d6ec4dddb75fb509f8d5" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00489-of-00512.json.gz": { - "num_bytes": 29949909, - "checksum": "996e61f8e674b0a016a568630ee13a7473f99a919437c225a4198d232861e628" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00490-of-00512.json.gz": { - "num_bytes": 29995429, - "checksum": "9730024ad352eb12f74ac446ed32b9c57898658954be5dd639184fc5264527cb" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00491-of-00512.json.gz": { - "num_bytes": 30293919, - "checksum": "65b2a7de3284e892441b0fe8e850d89de842355d78fa9944358b1ee5912a948f" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00492-of-00512.json.gz": { - "num_bytes": 30115831, - "checksum": "26b535c3175bb86ef721593f81d9cf006d4c3749f156c63ccd2a2c04e1201236" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00493-of-00512.json.gz": { - "num_bytes": 30187809, - "checksum": "a0918223c5523da20bd8230de1985b0a3cbb1e239af3d62a83d720a3a528c567" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00494-of-00512.json.gz": { - "num_bytes": 30149878, - "checksum": "6e9a5e329f834e41b4a8a9a6809df3243e5bffc580327912288ad7f790b43ab7" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00495-of-00512.json.gz": { - "num_bytes": 29711944, - "checksum": "3b9ba9d667e1241692ff9a654a68e98e8e94e32244a9419b2542137b63fb4705" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00496-of-00512.json.gz": { - "num_bytes": 30114815, - "checksum": "24b78cc36bb0abc67c998320e7029b6e7bbbee267a367eb538f23956c13f27a9" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00497-of-00512.json.gz": { - "num_bytes": 30048480, - "checksum": "29c3606acf298498fc3498bd769544e2879afbd0d5c46cee298cb25058694aac" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00498-of-00512.json.gz": { - "num_bytes": 29934973, - "checksum": "8afaffea92dfad745be8aa8cd3de0ee97cbcc26fbad6c71d56683aef6a27055f" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00499-of-00512.json.gz": { - "num_bytes": 29796509, - "checksum": "9cbbd8f6d8fe92207c4cb2f0422284726deca1bde7f30cb01cce7fcd4665b380" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00500-of-00512.json.gz": { - "num_bytes": 30221736, - "checksum": "902904aa9fadaecbe698402a27b4e68b00813e67b79f84d4c696cd9c72f08f55" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00501-of-00512.json.gz": { - "num_bytes": 30108320, - "checksum": "76e848f8dbc082158fc5d3a2f7c10cd6e03585667c00efc639f2c6f47d44aeb2" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00502-of-00512.json.gz": { - "num_bytes": 30381907, - "checksum": "885bbc9788235abf33728737f72f267e60d1f5d4a77493cae76f161651d89579" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00503-of-00512.json.gz": { - "num_bytes": 29983805, - "checksum": "5134934392b13e3f84dd32dcb1c59f4d5416d6dfd925bf896f3eb61881d82136" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00504-of-00512.json.gz": { - "num_bytes": 30041413, - "checksum": "4978245a7f545d676bad6edfdfe60ffdad94de47af0fb10649fa39e9b068939e" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00505-of-00512.json.gz": { - "num_bytes": 30021620, - "checksum": "64933c28ea3f608326f1c6ef56170886767f1ab4f9ecbc4bf3263c7043901fce" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00506-of-00512.json.gz": { - "num_bytes": 30260343, - "checksum": "84667dbe68ecf1f9bbdaba0e73eca6fe0444f6594a1e9a4b46e9812ae7bce7d0" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00507-of-00512.json.gz": { - "num_bytes": 30173739, - "checksum": "dd6d44e4f344f3ab1cd61bacced7b5f1429cf6823fc9282452a539012bda028a" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00508-of-00512.json.gz": { - "num_bytes": 29903443, - "checksum": "4afc46096ac2697867c3a75896c5ceb36617c4c21a749dded58a1ea4565e41df" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00509-of-00512.json.gz": { - "num_bytes": 29862664, - "checksum": "74a720dc16b389e8122d61aa94bc12a5bc4253ca6f39679781c938e2eb556878" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00510-of-00512.json.gz": { - "num_bytes": 29744368, - "checksum": "6a302049e7a1668c5fb2e4b5afca518fa53ba1a9dc717015ecb5768e85ec4139" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00511-of-00512.json.gz": { - "num_bytes": 29896714, - "checksum": "48b89e909c0e33fd59c9623f8517cdfa90fa35a4641f999c6f68e1cc9f2a309f" - }, - "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-validation.00000-of-00001.json.gz": { - "num_bytes": 15284943, - "checksum": "42ac859dc1c4d48d165ec602909403e2066ce1d4854149ed70b9ec9cc96dc65f" - } - }, - "download_size": 15435025687, - "post_processing_size": null, - "dataset_size": 76369191765, - "size_in_bytes": 91804217452 - } -} \ No newline at end of file +{"en": {"description": "A colossal, cleaned version of Common Crawl's web crawl corpus.\n\nBased on Common Crawl dataset: \"https://commoncrawl.org\".\n\nThis is the processed version of Google's C4 dataset by AllenAI.\n\n", "citation": "\n@article{2019t5,\n author = {Colin Raffel and Noam Shazeer and Adam Roberts and Katherine Lee and Sharan Narang and Michael Matena and Yanqi Zhou and Wei Li and Peter J. Liu},\n title = {Exploring the Limits of Transfer Learning with a Unified Text-to-Text Transformer},\n journal = {arXiv e-prints},\n year = {2019},\n archivePrefix = {arXiv},\n eprint = {1910.10683},\n}\n", "homepage": "https://github.com/allenai/allennlp/discussions/5056", "license": "", "features": {"text": {"dtype": "string", "id": null, "_type": "Value"}, "timestamp": {"dtype": "string", "id": null, "_type": "Value"}, "url": {"dtype": "string", "id": null, "_type": "Value"}}, "post_processed": null, "supervised_keys": null, "task_templates": null, "builder_name": "c4", "config_name": "en", "version": {"version_str": "0.0.0", "description": null, "major": 0, "minor": 0, "patch": 0}, "splits": {"train": {"name": "train", "num_bytes": 828589180707, "num_examples": 364868892, "dataset_name": "c4"}, "validation": {"name": "validation", "num_bytes": 825767266, "num_examples": 364608, "dataset_name": "c4"}}, "download_checksums": {"https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00000-of-01024.json.gz": {"num_bytes": 319308785, "checksum": "8ef8d75b0e045dec4aa5123a671b4564466b0707086a7ed1ba8721626dfffbc9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00001-of-01024.json.gz": {"num_bytes": 318039285, "checksum": "b945059cd1a343cabe311881b7840a6f0363f570e745a0eff0e687e266f6b55d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00002-of-01024.json.gz": {"num_bytes": 319748667, "checksum": "2967dc7e587ced6ecb9ba617ad2d4c44901467969de5bf5b0f5a9e5b70555d75"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00003-of-01024.json.gz": {"num_bytes": 318564193, "checksum": "b79d9abef5741578929be0d59db9ca652a8276207ef18a944b7a5f11fef5beb6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00004-of-01024.json.gz": {"num_bytes": 318579884, "checksum": "cd9f98eac2bc6062f55d9a36bd744cc924a78ea2fd998830e0034e4456f5d014"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00005-of-01024.json.gz": {"num_bytes": 318003681, "checksum": "8ac5907a54dbc7ab9c14624448c7c3f6afed33af9d0a855f1eae955e62e255b9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00006-of-01024.json.gz": {"num_bytes": 318495137, "checksum": "8fd9b9a4b74c9414466b245ebda7db041e7bd8603971de51b5db782bd758aac7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00007-of-01024.json.gz": {"num_bytes": 318417273, "checksum": "41dd377a1ba6b72eab0260c39c626fe45ab6b649d42d57b311d3ba21a0337cd0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00008-of-01024.json.gz": {"num_bytes": 318131845, "checksum": "64da652c235f089a0b52f6db5883ef5f1e9c31edc4c950332b34dd12439c99a5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00009-of-01024.json.gz": {"num_bytes": 318185592, "checksum": "807a548efbb10153c9eff0df5733a97a1b51ab1743242530de1b02a8ea17ace7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00010-of-01024.json.gz": {"num_bytes": 319045292, "checksum": "3bd0f6f664069c3bd964ce48ceae60ba47b55b54745a4b00c207bdb3a1926b17"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00011-of-01024.json.gz": {"num_bytes": 319686980, "checksum": "5baa0c010083459ba58e34b4e93bb758caa878f7db6fba0528921329fa1a6cc5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00012-of-01024.json.gz": {"num_bytes": 320119088, "checksum": "fdee7442c06856e2c4b7665cc51978e9011b5e0a2112c30dd15bc9e53818842d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00013-of-01024.json.gz": {"num_bytes": 319474856, "checksum": "a4ab3b24087781c3577945492525696e182ffd7ca5265b958f49803a02867ecf"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00014-of-01024.json.gz": {"num_bytes": 319693210, "checksum": "62215b2451e71b117018ef73570c944aff890624b384c538950b64c37f184c49"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00015-of-01024.json.gz": {"num_bytes": 318427305, "checksum": "9893c9f413a1223e7b535527829bcd6df3219929fb1abf8f2a114dd8f6ea0919"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00016-of-01024.json.gz": {"num_bytes": 318785714, "checksum": "bd0ade8b8a57348952ca31c39efdab538f54c852941a225ccd13d0a7170724e3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00017-of-01024.json.gz": {"num_bytes": 320134331, "checksum": "4132cfff3f5126d9e783191a5ccc34e5d85938bebf0b8489657805277a227202"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00018-of-01024.json.gz": {"num_bytes": 318653930, "checksum": "4675ab1d77da3d676d9743dca15bfce8478498f7738f79816a25ed790d28fa46"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00019-of-01024.json.gz": {"num_bytes": 319468974, "checksum": "1d2f3a6aeb0f6c159295f283d302794cd3eb944cff3fe68691997bb2dc4c7780"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00020-of-01024.json.gz": {"num_bytes": 319109754, "checksum": "b5f26d832a0ec9b0489a27169d94496f5ea33c7fb046868c565c7b5a2407221b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00021-of-01024.json.gz": {"num_bytes": 318514423, "checksum": "428da5a8d4585de16f6b3f30865a5ca7a8d1ddcd3b6002dcc1283368b0c3d60a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00022-of-01024.json.gz": {"num_bytes": 318715623, "checksum": "9bc4812ba5e08c0b2d83cd3804129ba3d77cf84ba3d8828159788ee02e155a51"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00023-of-01024.json.gz": {"num_bytes": 319874293, "checksum": "38843ab4f5c60ed2b9ec0cdc65074eaca454014d5702edd809a266190689d2c3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00024-of-01024.json.gz": {"num_bytes": 318105764, "checksum": "4fa0c7ec94445ea57dcecda7864b1346275e711c9820c2c39dbb9fdb95c97674"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00025-of-01024.json.gz": {"num_bytes": 319122521, "checksum": "0758514fa2e2c133c995c00d5f4abfc14b66582a4eedd0e721bdd95c4632a755"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00026-of-01024.json.gz": {"num_bytes": 318116783, "checksum": "56a73b9a556d6794d9c706e1b1c7e729fa13b711ddc25dd403b110eb5ed857f1"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00027-of-01024.json.gz": {"num_bytes": 320171191, "checksum": "fea1eabb734cda33d72f3d959234a240080b4fd42cc70494814a8429b087f9e1"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00028-of-01024.json.gz": {"num_bytes": 319047090, "checksum": "47d1c385952d6c18c431a7294339a030c213b8832f970ac987965b621c8181a1"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00029-of-01024.json.gz": {"num_bytes": 318705639, "checksum": "3c744d3dd915ceef3a93fd18c3ff5b117fb5118d1ced2089979b6cafc81c4525"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00030-of-01024.json.gz": {"num_bytes": 318327902, "checksum": "7f6959020242fdc841adfc10c102bbe79e2ef8502a09dac8451e0cec6f2add16"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00031-of-01024.json.gz": {"num_bytes": 318990600, "checksum": "e56f29011594c765192c34298558e7227a829313196748f9a16ec34ecdb76d23"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00032-of-01024.json.gz": {"num_bytes": 320451482, "checksum": "9ea843dfd85e449439f3106d657762daff8f326730fefb342455c43cb48144e3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00033-of-01024.json.gz": {"num_bytes": 319878207, "checksum": "2633cdb7b058f126173608897f69add614659b0b21cf54ecc8a2f4a79bc16073"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00034-of-01024.json.gz": {"num_bytes": 318701510, "checksum": "853c4b9ff2d79621ed27a6be826dae198af609d9f9dbd1c2773b778241cf6137"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00035-of-01024.json.gz": {"num_bytes": 318529104, "checksum": "fb50dac3f35cb71472464f511e6b8aee72ded10b3b6896d0d1f74a18ded2b8d3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00036-of-01024.json.gz": {"num_bytes": 318849657, "checksum": "5cef5cfd50cfafd58feb452b85324a3d8198fca48789f0ce69227755e72d8e53"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00037-of-01024.json.gz": {"num_bytes": 319621215, "checksum": "f0b67abf30e2d58d291aa9bcc9c8a03668afe819549802e4e591a261c171d970"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00038-of-01024.json.gz": {"num_bytes": 318135467, "checksum": "991bad578a83294d34a1b11649af07339aa8cb26d49330afa9fcbca0b87942c6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00039-of-01024.json.gz": {"num_bytes": 320131759, "checksum": "abbbc21f81555e94484e6afe1975e13f67af19a820cd6f8d090c987a250bd4fd"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00040-of-01024.json.gz": {"num_bytes": 320214476, "checksum": "48020d2656709899abd2572b3424c0455df3c1089a69fe26b776aeb24f0da0ec"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00041-of-01024.json.gz": {"num_bytes": 319581259, "checksum": "db6fb8db7162ac87ea002c153ef0c54322f24c8f7ec263cfa290ac8c3683b194"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00042-of-01024.json.gz": {"num_bytes": 318100985, "checksum": "d499cba2383b16bb0f26b98416211eabf2599641ecd6708a5ef487692ca9e791"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00043-of-01024.json.gz": {"num_bytes": 317803029, "checksum": "dc6f1ccc3fcce79b16c5157f7125942e351d74744efc593f8372f8a408720340"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00044-of-01024.json.gz": {"num_bytes": 318837063, "checksum": "6170fced793461bd687640a658a085d02f971c2e609f6ff33b90df944fb56409"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00045-of-01024.json.gz": {"num_bytes": 319659188, "checksum": "b2f79e8600815578ec326cfc6c5242c2827cedbfac51772fdcf15ef5d027aa38"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00046-of-01024.json.gz": {"num_bytes": 318771753, "checksum": "e4b4a3e53ee66c280a5e7ee33602ea0e910903748db8c2adbbec4b48bab1580e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00047-of-01024.json.gz": {"num_bytes": 318088661, "checksum": "bf8597fc359d8e9c721fd1d98b8ff3db5c011afd0fec9640670f31c7a7dddb79"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00048-of-01024.json.gz": {"num_bytes": 317777133, "checksum": "369db8e9646b8229a23044a7257c2face97b8e05738f0413b581892876f268e1"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00049-of-01024.json.gz": {"num_bytes": 319329891, "checksum": "5cb2aa0432984b355b0ec6aad92f926b2fb75aea2a0e08b97f4c6a62838e6cc8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00050-of-01024.json.gz": {"num_bytes": 318172322, "checksum": "11a7cc48539ac97eaec87beacef9d9bbb71fc875a0bff0c9ff096044bff46a44"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00051-of-01024.json.gz": {"num_bytes": 318704544, "checksum": "ac2beee992c2b1ae8b1f162054e843e2b971bbd7cec45a0a7a7b7795fcdc7c26"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00052-of-01024.json.gz": {"num_bytes": 320806303, "checksum": "3a591fe9993c3d98a9e7949e98ca215ce164cd313fe53f3ce762c91b5fec7c53"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00053-of-01024.json.gz": {"num_bytes": 320565764, "checksum": "60e67c8e6f3bfdf8b490ecfe62c79a13c5d04d393fbac712a6cda49fd78e883b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00054-of-01024.json.gz": {"num_bytes": 320425170, "checksum": "d69305c853e9e516f5fd4e2a9afb1939d829925f71102d8aa09387ded5d000df"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00055-of-01024.json.gz": {"num_bytes": 318713224, "checksum": "e01737df8097a1526d6c31d37d7aeb1b92c0a7253b39f6964fcc897bf0eba9fd"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00056-of-01024.json.gz": {"num_bytes": 319441227, "checksum": "fe516c8c0a9e59f9f035ac5fdd13e973d25dd6635eee05d648740d3e8c1fc742"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00057-of-01024.json.gz": {"num_bytes": 319821142, "checksum": "7e058ed9072e968e9c8b92f9b50dab318515873cca6c617b544dacab5a2f018e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00058-of-01024.json.gz": {"num_bytes": 318643105, "checksum": "3479dc5a5b111b7f45f87e5a91c433907af97dbe15b9db1637bad666dcbdec40"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00059-of-01024.json.gz": {"num_bytes": 318053548, "checksum": "8208b0943f59b5914fa13d29108ede31a8d8d34bc6d603a2278ab8b80d28b1d0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00060-of-01024.json.gz": {"num_bytes": 317935826, "checksum": "71324b62706aabd6faee682205cdedcd10dad289579b534d0e53f8d9b92bf2c0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00061-of-01024.json.gz": {"num_bytes": 318870698, "checksum": "cdf0abc5804f0991871de48b249e30b666cb96f2254762a570c39904c5780f8e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00062-of-01024.json.gz": {"num_bytes": 318945246, "checksum": "5ac676e16108446bd2980f9601c787eb754811a68e92ab6403c333820a6b9622"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00063-of-01024.json.gz": {"num_bytes": 318827790, "checksum": "a26f7cfe123cfdf3db7687996d0163212e70ff7635872b0754c03cbd5c31213a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00064-of-01024.json.gz": {"num_bytes": 318914155, "checksum": "858a145617a5902ab02bc77e47ee2f036a6211384c4f2285767c7558eb93e245"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00065-of-01024.json.gz": {"num_bytes": 319794084, "checksum": "52742215df5aaca43bed5405a397571efe7c22107ee2caa8c05e3ed229796efa"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00066-of-01024.json.gz": {"num_bytes": 320294453, "checksum": "5b11cd54de0e95a75e53e4e32f72912cb01053d3fb609de6b7a45afafab414d0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00067-of-01024.json.gz": {"num_bytes": 319468309, "checksum": "4c6c69b3eba9bcd6786d7dce893340f2d7093012ead04f3539352beccd2794ef"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00068-of-01024.json.gz": {"num_bytes": 318800742, "checksum": "ce94afc3c612e9de423a412147505ad7757216100becba2677bf5eaf443c4b6f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00069-of-01024.json.gz": {"num_bytes": 319416585, "checksum": "ff3084a3e5a3960425a5c605274684c42fa638f99045527f77e74d165e52b6ea"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00070-of-01024.json.gz": {"num_bytes": 319165846, "checksum": "04c368b05f0ea42b3a51ed9bc0e817894f205c0ecd74084da015158d509ff2a3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00071-of-01024.json.gz": {"num_bytes": 318017381, "checksum": "e8320e9982fa377b07c5b3e8a4451ac143b05ab7a4a03f748034b37fb998bfb0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00072-of-01024.json.gz": {"num_bytes": 318874499, "checksum": "920f8d5ef2cae6bdbd52f724d0952e04146ff29f4aaec4dbf10bef7b66a98f40"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00073-of-01024.json.gz": {"num_bytes": 317890112, "checksum": "06a41bdb7bf0d52e2fe8e71f594de8d36d77880639ffdfb41e883237f76e8a0f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00074-of-01024.json.gz": {"num_bytes": 319201956, "checksum": "e0267d6782d30f1619a82c49c20be1c8b5424e653c093e4652a5c8ed117c6533"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00075-of-01024.json.gz": {"num_bytes": 320575937, "checksum": "42108758abc3c3197e7dca8293eed3800f3e79ceae80d3208d90c7a9fd205594"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00076-of-01024.json.gz": {"num_bytes": 320070510, "checksum": "c904b6e6041e23edeb1d88b7b69f07a339b7ff9835d0c22e0b6c354519369842"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00077-of-01024.json.gz": {"num_bytes": 319042024, "checksum": "1eb2b70ad4d12b7587eeb1ce86477817ad992c08fecafe5ccafc26af6b5657f7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00078-of-01024.json.gz": {"num_bytes": 319997520, "checksum": "070370654960e02f766c10321546b280e9933531b796c252a94999d645f360b2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00079-of-01024.json.gz": {"num_bytes": 320736487, "checksum": "3aa4f007660706563030b590cef9be992c18ba7ec1876210bc92665ec42c4be2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00080-of-01024.json.gz": {"num_bytes": 320082337, "checksum": "3b54eaf407bb593c2b16df99690446f26497530d21cf433a7d525e0eaebe9c3f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00081-of-01024.json.gz": {"num_bytes": 318008114, "checksum": "d01975cdbd4360331b1a0f55e9b7e731d7d9fc70c7cdd0f33f1c772eff7aa03b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00082-of-01024.json.gz": {"num_bytes": 317829809, "checksum": "2a65dd37027fae03819ea5a5f6c3b16d921706ad758442881dc1d15b08bc5048"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00083-of-01024.json.gz": {"num_bytes": 319265318, "checksum": "e14cf18c687f7eb304df6abef7235e263a5736c799d742524205dead2abfb043"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00084-of-01024.json.gz": {"num_bytes": 319166958, "checksum": "1dc3fa8702a4477e3a3128440b68d4cc17e6d2ce7f3c53da28d50a57b8332020"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00085-of-01024.json.gz": {"num_bytes": 320338078, "checksum": "0222db7b1ae14c9b10aacdb05d055d1432b6d035e3937df5640facd242c52aea"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00086-of-01024.json.gz": {"num_bytes": 318941314, "checksum": "55ddf7a27dc91bf8d932a5efec4aa458122ee337f2cb050e2c4b0ae8e770f3a9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00087-of-01024.json.gz": {"num_bytes": 319218368, "checksum": "c61552d76bedbfa750c599a674d6732fb224c8a1e6c6583fca7ccabb20532920"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00088-of-01024.json.gz": {"num_bytes": 318974308, "checksum": "693fae3d50068ec39ad27a14335372c3e1530138cc65931edac5268dd62b7e96"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00089-of-01024.json.gz": {"num_bytes": 318781044, "checksum": "2d90b9318432a2313dfaec542c8b91431505035cca7416a63e3197ab26ad6e75"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00090-of-01024.json.gz": {"num_bytes": 318569651, "checksum": "ee674beda8ed39395e69c899f666990c5190dfad5494867e51fa727e4d38d86a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00091-of-01024.json.gz": {"num_bytes": 319683433, "checksum": "add2489350310ce500dde6637518c747c156f95f079a34367842bf875a8fdf5b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00092-of-01024.json.gz": {"num_bytes": 318734793, "checksum": "5cfd4f25e9effaa2f7381bfcf49f9263e10619811aeaa32a77d3fdfc13517006"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00093-of-01024.json.gz": {"num_bytes": 319161014, "checksum": "bed8774909bba5ac656ebaad6e5cacca9e5ea12c80a41fd5689e6798c74f3c89"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00094-of-01024.json.gz": {"num_bytes": 320143246, "checksum": "96abe370925f6962b4e75da530b5234eec21fab820d6cb02ae59b6070ab63859"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00095-of-01024.json.gz": {"num_bytes": 319707377, "checksum": "37b68cd632e8f86f364fd61c9581f48ad7602122b7f33c55103ac5bd727f015d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00096-of-01024.json.gz": {"num_bytes": 320159279, "checksum": "fb93c7467f0361c1d4b186d5e25f4bce4f237adb33b4e0ef56f57831b4f97f81"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00097-of-01024.json.gz": {"num_bytes": 319841818, "checksum": "7f4d4a9536e37a0c2b9a1806fcb472784ff4d3840aa57e9603e74233b877fbac"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00098-of-01024.json.gz": {"num_bytes": 321001731, "checksum": "239b9fefebe3815c8d785bd48086013d1a6dcd76c142786502c674d2d874fb11"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00099-of-01024.json.gz": {"num_bytes": 319475885, "checksum": "0a610d25a547839b8b6dfc2fd964e3ca64b23f0edc52d311c89dcb5e8a44a2c5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00100-of-01024.json.gz": {"num_bytes": 319515329, "checksum": "f24d17cbd27296a15f51b9edc713c74a6997bbe82267403fdb6282404c2f4e6d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00101-of-01024.json.gz": {"num_bytes": 318803422, "checksum": "54b8b0c72ffa325abce3dd15bdcd0856b5594500c37f4bc6a6327721ba91e4bc"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00102-of-01024.json.gz": {"num_bytes": 320934688, "checksum": "24b99b4afa3b631a718a487d679026c91e2c936132df01df969e3173b49e091f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00103-of-01024.json.gz": {"num_bytes": 319835920, "checksum": "a2c68654ba81fa55bc24beb4319c8905f7b532fcb6793a6a311344d4f98a82b9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00104-of-01024.json.gz": {"num_bytes": 319402378, "checksum": "27764d82793e35b8a7be3a3fb0470d018243a89283b5501c0b76056de1879389"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00105-of-01024.json.gz": {"num_bytes": 320100928, "checksum": "3bb2499337ebe52b63a5f20ec6ca6283971937962439699bd5e483cf80fed02a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00106-of-01024.json.gz": {"num_bytes": 318707110, "checksum": "83510312aa188431a8dda8746903d70cfc7ffdf5437e44c1f74b7670b78bd52b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00107-of-01024.json.gz": {"num_bytes": 319904239, "checksum": "40d42c39dea8e4898efba1886aa3be67742501f7a51d5bc635b03a2c6c2bd63e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00108-of-01024.json.gz": {"num_bytes": 320050265, "checksum": "88ce3ddae88e8024e76614a1b701c157f66fe39c6f0852a4869c5063876f6e87"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00109-of-01024.json.gz": {"num_bytes": 318053254, "checksum": "865a124b663037f36a5738f25c82f8bea2ab54d4bbf8255ca0d1d00d76f8b250"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00110-of-01024.json.gz": {"num_bytes": 319794699, "checksum": "b17e210c8ceef98219ee12eba5dddd2001ded0d417c93955743c238360d96e76"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00111-of-01024.json.gz": {"num_bytes": 318761540, "checksum": "05be318a057bb33bf9d7faca58569cdb0880fe8eeb0fc3f57f5999d5f2af55fd"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00112-of-01024.json.gz": {"num_bytes": 319121509, "checksum": "858dce8e43b06a0c1e26ab3e4f109814b6cc50c6b0e4d146ec79fda001ad471d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00113-of-01024.json.gz": {"num_bytes": 317916736, "checksum": "2e3968e48cb15a3326457d5a6ad49838d20d38c8138c529eee51f94e6bf269e4"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00114-of-01024.json.gz": {"num_bytes": 319319540, "checksum": "b72dc8207d93848f4fcb265b3e618d0eb8649445f7b9187c5165f4adec3e0708"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00115-of-01024.json.gz": {"num_bytes": 318863372, "checksum": "85ef0bf3cb12bc2fede4158853ed2259dff5d25adf99b43e8c35d7e0b9d4fdd3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00116-of-01024.json.gz": {"num_bytes": 318898370, "checksum": "a0c82c8b48e086be7396338cdda0fed52e8c4753f04fd086b9472c1bedfb150c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00117-of-01024.json.gz": {"num_bytes": 318153138, "checksum": "531d5d03fd8099806d92fbff2a48a0d68dcf46325e732e698e9c142902d152f5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00118-of-01024.json.gz": {"num_bytes": 318966511, "checksum": "24b1c5ebbd07d50043be0d5d5c5427e042bdc53280825260226a2823e9b7546b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00119-of-01024.json.gz": {"num_bytes": 318733748, "checksum": "ce1fb1192b770e625430798aee94c93bd748ed474ff815a7f95cadebb826161a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00120-of-01024.json.gz": {"num_bytes": 319672996, "checksum": "4c2a6874921ac4a626a9c8ac4c6e91dae58f1f5b52e79124b3abf254b7433119"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00121-of-01024.json.gz": {"num_bytes": 318779046, "checksum": "029d3ab92f3e1724e3708790148e63b4c211d2ddfd04e3d194b24145e97c922a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00122-of-01024.json.gz": {"num_bytes": 320861175, "checksum": "4bb595140e5cf92147f99b58d236634ddfafbc0b160b4c88b337255482611ced"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00123-of-01024.json.gz": {"num_bytes": 318338141, "checksum": "d508261be287fa3d27e5f44524e22870269054213b61011ee8a6728a77910cc0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00124-of-01024.json.gz": {"num_bytes": 317655056, "checksum": "7612cb9fdd9f4b3a4f8958087ace120d4a73cf26bd16289bb20fc871f5744f2c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00125-of-01024.json.gz": {"num_bytes": 317524610, "checksum": "049ebe4971811bb1fdcfd10cc264b2074b3ace18536340644e718dcc3cf3affb"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00126-of-01024.json.gz": {"num_bytes": 317902192, "checksum": "d97bddf003b8f647c587fe9a9a9aed75ea604478e0b550d501ad7f07b6061b86"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00127-of-01024.json.gz": {"num_bytes": 319243191, "checksum": "6da4c882f88816a452af54ed217f84d6e4601c11a8e33bd47c49c0a1ea04f49a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00128-of-01024.json.gz": {"num_bytes": 318045852, "checksum": "ea43f63e6ef3bb5723ce75bb51f7183a525d8ccb00c93f49aaf2d9b560f7bdbb"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00129-of-01024.json.gz": {"num_bytes": 318436174, "checksum": "72ceb525367d6e8d1c0fca94d99d4fe5353ead08a5d52bf00e30e3b596fa90a2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00130-of-01024.json.gz": {"num_bytes": 319017217, "checksum": "92f1b2687bee78441eeb4e05bbec2a491469b23c3aad0d951fbbe35a3c27998a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00131-of-01024.json.gz": {"num_bytes": 319237739, "checksum": "0fd07585a82b7d71ddabbc315195c84e2fa78a8319de7dea971cfcc9b38707b7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00132-of-01024.json.gz": {"num_bytes": 318123742, "checksum": "c9f5604ca28ea2a9ae5267db50f6e3d1e576841abe840134b3817f370c057073"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00133-of-01024.json.gz": {"num_bytes": 319009751, "checksum": "7ec982de577e0eeff57dc60346ce35a7b35b3c4f037987316cfc071b0ed58a87"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00134-of-01024.json.gz": {"num_bytes": 319750057, "checksum": "2619d265d76d82f6b84e2686371e5b6d6c08058cbd5765dd2906af9f549af092"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00135-of-01024.json.gz": {"num_bytes": 319068231, "checksum": "5e1bf5b09f2cd132a7747116442d6f26ce0002eaeb9f56fb02bc00e3abee8716"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00136-of-01024.json.gz": {"num_bytes": 317800994, "checksum": "80ebbf64fbd91215da553e3a8d9442380cee6c3b09fbbf8353a0817993d15862"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00137-of-01024.json.gz": {"num_bytes": 318954070, "checksum": "3b5d2ccafe526a19c52ac0fee50109b6a95ac3c8f7f2272a9a0302c4219e82f7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00138-of-01024.json.gz": {"num_bytes": 318452853, "checksum": "2dd88569a62003383a3bf70d68143f16f234535469bdc8ab01a8764f6babb5fb"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00139-of-01024.json.gz": {"num_bytes": 320013821, "checksum": "f32ca62f6a9d2c8a72901e6f2c08880c2d1907f52beb4e8fdc30f4c02c7ad10b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00140-of-01024.json.gz": {"num_bytes": 319510423, "checksum": "7799838d8019d7cd71a505951f155bdfb862b4a3b3b77e182c706a624617169d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00141-of-01024.json.gz": {"num_bytes": 318339814, "checksum": "1601f6dbcbf4e7f1db119b232e862f3c9fe29e9abe5827177458079299ed511e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00142-of-01024.json.gz": {"num_bytes": 318438444, "checksum": "71d891be156e1b608733a3abe8f8dab7a6213c02931117b99889bc3fe8329d38"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00143-of-01024.json.gz": {"num_bytes": 319413540, "checksum": "88fb2e7c3d426a6bb5775041658c07005a469306af0d97df7d68f148b64cbfe8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00144-of-01024.json.gz": {"num_bytes": 319901095, "checksum": "2734ff57f4265653b0b1f292f513017ba791c3091cf8ac0bbf6d75d0074e3386"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00145-of-01024.json.gz": {"num_bytes": 318500183, "checksum": "da2e6747f7230af5941c6bee262a606b4f7792da359dbf7516d82d8301cdf90f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00146-of-01024.json.gz": {"num_bytes": 319315120, "checksum": "6daac97153d51addc8b1e43b686e3d641666df3a106270a141d734079db2ad35"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00147-of-01024.json.gz": {"num_bytes": 320621434, "checksum": "fb2584e0ce366ad30c8110591484b84798e9f06e8a27cd864e7800b8d5e2d225"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00148-of-01024.json.gz": {"num_bytes": 318269045, "checksum": "1c963c0ceb6cd776822352b186ae7e3d829ef334efcba0fbdd9182dde4deed05"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00149-of-01024.json.gz": {"num_bytes": 318576426, "checksum": "6a21397e0104c7fe0fcd9f1d43a8e546000596d896a95eb9b6c4ab92235e6a49"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00150-of-01024.json.gz": {"num_bytes": 318447048, "checksum": "075b113a73e6e21d7cac49391ee559ee8aaa2bb3338f709017077a4007a7bbb5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00151-of-01024.json.gz": {"num_bytes": 315388730, "checksum": "bd47e3ac0209676d8a32490eb20ca8c07ca3c45c2beb88dae18b5c8d925f349a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00152-of-01024.json.gz": {"num_bytes": 319701880, "checksum": "241d9cf003f49d95168ebdeccd8209230507d4dfd0d170fa1b57d2355240a95d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00153-of-01024.json.gz": {"num_bytes": 318370254, "checksum": "3aa86900a749224dfed8a67960c166e43c3b9ef3ac7b49d28129b496c7193e30"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00154-of-01024.json.gz": {"num_bytes": 320064875, "checksum": "3160c723cea6717fa9f5a9eb627d76107040d084a64106973099fa0e8de48758"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00155-of-01024.json.gz": {"num_bytes": 318089754, "checksum": "5b6e76a85bb1093eaba698864a54a938329b04494f9f72c3c3bbb155174da5e4"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00156-of-01024.json.gz": {"num_bytes": 320049467, "checksum": "cc013e8aa7c1cf7fc28ebecc64d893d03b092a09d725b5e626851de0b311c814"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00157-of-01024.json.gz": {"num_bytes": 319931950, "checksum": "2a27b4c29455bcd813a84aa3a54100d16cb6bfed25171aa3c552ea452ae569e2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00158-of-01024.json.gz": {"num_bytes": 319963615, "checksum": "e477f769ea1513cf607932a29d793fdf1722cdea757e00c814dad594329cfac7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00159-of-01024.json.gz": {"num_bytes": 319000491, "checksum": "ff5d09415753c2aa4b51196e8f4bd6c77ba100ab281314aede118f501565cea2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00160-of-01024.json.gz": {"num_bytes": 319069618, "checksum": "e08c35aef8a20dccad80f6bb1579d6d2ce80113c8bf8459730c69fb7048c3cc9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00161-of-01024.json.gz": {"num_bytes": 318750642, "checksum": "13eef84873b58e29894f9bf68a4de72a530c1bfc80a5654262fe71420292b8ad"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00162-of-01024.json.gz": {"num_bytes": 319847814, "checksum": "a8579c6bcc906fe018881a8474724576c3d0f7f1787f1568b79e5accbd9f962c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00163-of-01024.json.gz": {"num_bytes": 320370365, "checksum": "b97a74837ab9f659c13dcb4deb53c600584beb9e5ceed29e99974c4953f644c9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00164-of-01024.json.gz": {"num_bytes": 319894618, "checksum": "9b63afffa2b84c91b749991ddb384399f1d408bd7b6b643e7329e49531ce9a53"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00165-of-01024.json.gz": {"num_bytes": 320166197, "checksum": "5b2414477dc4e2b080b34f3b98672bfe3de6028e7ad83c323a7dd1ee08c05a0b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00166-of-01024.json.gz": {"num_bytes": 319612575, "checksum": "2cda682db53000c14fcb5d251bae4f50c8c4159348f8594c3ef020260f277a99"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00167-of-01024.json.gz": {"num_bytes": 319183884, "checksum": "5c406d7a8a404436039fde7c2019f0174ff8855caff319fa62bb7960d341b41a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00168-of-01024.json.gz": {"num_bytes": 319396348, "checksum": "df6a422d57a2e1443d10d61b13ab2c5227734195c82b43e1ead2db723cdea293"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00169-of-01024.json.gz": {"num_bytes": 319452933, "checksum": "81c81138e7163072e3779dd10ea8af7dff12b705fa008665298e08cfc2699f03"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00170-of-01024.json.gz": {"num_bytes": 317748609, "checksum": "6586ae8862b8ac925f424afb6ba779e95a147323fb83fc8c4bb0813877b17718"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00171-of-01024.json.gz": {"num_bytes": 319052376, "checksum": "8b3cd21d8ffbe963ce935ef9e0b6efc45f4d5abab703fdfed19a1309b700dca8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00172-of-01024.json.gz": {"num_bytes": 319068859, "checksum": "a42f5f5a10bfc84d51dd0855166959462faccd6a182af4c5d2115ff9995f5324"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00173-of-01024.json.gz": {"num_bytes": 319142377, "checksum": "e26514c5d6cea27c0cf7fcc1daadfa6f218ef9e62039c6d6fccfc31660c0c96f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00174-of-01024.json.gz": {"num_bytes": 319134484, "checksum": "75349aa8c734ed894965500eab2fdf59657a63e40e5a53e822ef1e5a12838a02"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00175-of-01024.json.gz": {"num_bytes": 318330467, "checksum": "a3d0d14b28a5a3cc559d6d89e2ec09e49e92aa189e44e68dbb4ea47978e1eca1"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00176-of-01024.json.gz": {"num_bytes": 318584643, "checksum": "dd68b42e5bfc656b71fe5701bacb929edae84055131f1dd65bbf3f3ad734e57d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00177-of-01024.json.gz": {"num_bytes": 319275087, "checksum": "05a8ff159006241cf938ef27b292f65906158ac25ac28919aa6761eaa634052f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00178-of-01024.json.gz": {"num_bytes": 318490550, "checksum": "a3aa38083c85baada29b207240bcca1a0d562a93971b420428d039092e58bd31"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00179-of-01024.json.gz": {"num_bytes": 319083249, "checksum": "12858fecd1dec728eba2c8c4311b17e4f2ac1fdb27c23e9adcd9258c5c4fc777"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00180-of-01024.json.gz": {"num_bytes": 319752094, "checksum": "67e968cb8d3ebec2f68eddfc539ea7402aa72c9274034494a43ea7d207b69a88"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00181-of-01024.json.gz": {"num_bytes": 320476195, "checksum": "c1bd59eb7ca799e31bf037dc7c087c1ad94e4f88a4f12427c454510d97e1c803"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00182-of-01024.json.gz": {"num_bytes": 318538551, "checksum": "dbe7205a1919dca9d6936158d5653a20d239f2e547ec73280956da4f8c609220"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00183-of-01024.json.gz": {"num_bytes": 319620265, "checksum": "46f9e603e04040b59df8da6ee01d1c30588aa7233a00526d6f0fd84c4172ba93"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00184-of-01024.json.gz": {"num_bytes": 318301621, "checksum": "880a02eabae231da388a5782a7194eef0d0211c2d1314db0c56d740647a114c9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00185-of-01024.json.gz": {"num_bytes": 320515340, "checksum": "f522147aed30ebb3ab352c92a9dd24cd2e8b93df1d4c4a6284d89ceaa2858509"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00186-of-01024.json.gz": {"num_bytes": 318374733, "checksum": "5005f1c42038769e225a626a88c10bd4f6af98dcc14deed475954b00c088bc53"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00187-of-01024.json.gz": {"num_bytes": 319116182, "checksum": "cbd7e0f486c6dac13090cd344337da1c336973e7ec75e32b0bd5b18b98f24bf8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00188-of-01024.json.gz": {"num_bytes": 318981305, "checksum": "064ce8c30b7a960b20720c133c3dd3281d27752a66def44d5133ff8f1b8279e9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00189-of-01024.json.gz": {"num_bytes": 317036462, "checksum": "acc052da4501691fdd28f269c633ed826840f2634be49b5e2c5e1273de0cb4a8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00190-of-01024.json.gz": {"num_bytes": 318061662, "checksum": "5a436e97c59b8636ca5081b71ca6fe8f8a3a99dd3f426c79edb2bf53345ee810"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00191-of-01024.json.gz": {"num_bytes": 318556228, "checksum": "2eebc89381ff78ae63f311c98b07853cefcc42fbcc210995095d568a6ff70ead"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00192-of-01024.json.gz": {"num_bytes": 317987733, "checksum": "99de46c4702c06a2303262b185b92fad82e12e189c923d5b76d9d8f96faabfa5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00193-of-01024.json.gz": {"num_bytes": 320294532, "checksum": "bccb7d8fc34d6cd6eb41e2a1c6234596b00a5517fdca7c47562fdee0e675377c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00194-of-01024.json.gz": {"num_bytes": 320852679, "checksum": "bb1e7768a57145fdbca7957ed964648d1deab5edc5dfad4722a81ad411c5e0f9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00195-of-01024.json.gz": {"num_bytes": 319016077, "checksum": "ac520468a5bd933dbac1aa5f7f21ba276bdce15abf99963ef9d73af294e81e70"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00196-of-01024.json.gz": {"num_bytes": 319289881, "checksum": "9eec5740115ab52ce98ac9efbed4fa1c5c06787fe93b4b28f6a1e4df06272870"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00197-of-01024.json.gz": {"num_bytes": 320180232, "checksum": "07a03763b84b4a86b4f71d725927d62c40925823ee454122a00fdb625ddb3a22"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00198-of-01024.json.gz": {"num_bytes": 320004709, "checksum": "a1b250b01289fdaf6dcd997ef31c59c580f81f961aa0fd88ae0d175bd07c02ab"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00199-of-01024.json.gz": {"num_bytes": 321006991, "checksum": "650e57c3dbbf4ed929da8c6c5d78f35fbac4644722a84d98f93342a8d33b2140"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00200-of-01024.json.gz": {"num_bytes": 317913111, "checksum": "42caf6dee42bd73d9e4bf0c7bb16383caa936b2e0a913489b9f0aef57b6004cb"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00201-of-01024.json.gz": {"num_bytes": 317897148, "checksum": "990974a82de2b1c27465f6d097d7a5718c5ff334271e722ab3736e7aa5b89d4b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00202-of-01024.json.gz": {"num_bytes": 319510250, "checksum": "8467066f2417af774363d4984a37968a0189adfe3a581723eab15004930e621a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00203-of-01024.json.gz": {"num_bytes": 319762388, "checksum": "4e7e20980dea2d5e77f380b24580f0df9319a0d1d73ec319e17d8cbe044e53de"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00204-of-01024.json.gz": {"num_bytes": 317418128, "checksum": "2c027c5225ea7ce3c31f5f32dda12b7c892c6fdc9c52da6d0af749171cdce738"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00205-of-01024.json.gz": {"num_bytes": 320157174, "checksum": "d953e79c60be0e2c3b072c2186a845a351392ef395fa95135f47e6b8491c6f88"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00206-of-01024.json.gz": {"num_bytes": 320459080, "checksum": "bc70c34931942ca143f7eb555e86458afcc36110aa9559151f31d781969d4458"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00207-of-01024.json.gz": {"num_bytes": 317361718, "checksum": "fad5ebd7a81bb737e12e9d4c803aea1a9e905d43a3fa87cace32a64eef01e8e3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00208-of-01024.json.gz": {"num_bytes": 319976693, "checksum": "21381c727d945d8d3b4a275e3622bce64b07ed87d7f2371ac28b5d2023359cae"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00209-of-01024.json.gz": {"num_bytes": 319550585, "checksum": "8b74e5f1780c4bf12936ac3a86be7a3d11287866522da8275aa4232c1e3d8898"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00210-of-01024.json.gz": {"num_bytes": 319574289, "checksum": "1594bd49cde9641b49a1ad9373a53e10d65440000363f7532a7d326d17c44236"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00211-of-01024.json.gz": {"num_bytes": 320615302, "checksum": "5b6f7eddfa3a9ffb0d6668d10f398b1d86482b64daa9817ca0af549433071244"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00212-of-01024.json.gz": {"num_bytes": 319395225, "checksum": "db58fa453269c794fedb595c6193dea5a85c72ff8b2d43e77c9bb371b8c86b78"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00213-of-01024.json.gz": {"num_bytes": 320131797, "checksum": "1d21d19b5e36820559590b339c049be29f27505ab4e88572edbdb84b649e0b66"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00214-of-01024.json.gz": {"num_bytes": 320153141, "checksum": "55c9b4ff1cd8cc88738196f867aba620dec3c8b27b9a485c7e75d3129d76e9c7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00215-of-01024.json.gz": {"num_bytes": 320525443, "checksum": "dfe9f44676c1abf0e2875924c094c0d788f8a0172d641d5f810258e948e37feb"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00216-of-01024.json.gz": {"num_bytes": 320100146, "checksum": "57f19f5437b0428d9f40799af14f8bfba8f6c82ebacaea8f6fc7531524a6d4af"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00217-of-01024.json.gz": {"num_bytes": 320688377, "checksum": "fad4f3143aa303c9c35165a15c6d90087c204c586fe20b0c0f45cf4238311b70"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00218-of-01024.json.gz": {"num_bytes": 318896471, "checksum": "aabd471960d6db1e93e1129410d9138d9d9efa3292af7491b3b6844c2bd3f543"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00219-of-01024.json.gz": {"num_bytes": 319298204, "checksum": "f676701589e39802779a0947585638347bb4fe55376a33c6d0afcdc40c5f8938"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00220-of-01024.json.gz": {"num_bytes": 317757045, "checksum": "f3d0994379d244054c5e2db366a081caee28d301aa6b0d9431e7d9eb1cb38c30"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00221-of-01024.json.gz": {"num_bytes": 318568870, "checksum": "8026854c8a8cc1d16b52a898b9dd8a8df7901dd8cdf285f5d937c4d5d45919f3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00222-of-01024.json.gz": {"num_bytes": 319096912, "checksum": "71f76f898864de3ae60f7c0cdbc68d53cbfa04b2f8493c40d55e1cb56727b275"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00223-of-01024.json.gz": {"num_bytes": 319350414, "checksum": "ba01faf3fe41a738c255b5da83daf53a5858144557af6c6f8d6208a049e4245f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00224-of-01024.json.gz": {"num_bytes": 319007151, "checksum": "94200d12c61f7c73a9e3a2bb089a05b017a215348d52018a34e3224578c0da06"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00225-of-01024.json.gz": {"num_bytes": 319502985, "checksum": "0b7ce650e555baa546bb329d7f0567a3dc0a7ec9d49149792032a86321a73d6e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00226-of-01024.json.gz": {"num_bytes": 317983607, "checksum": "40cf6d4b3deb05cd97ebed01405d08ae67be6e896736e4f371d15e5404567599"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00227-of-01024.json.gz": {"num_bytes": 320199564, "checksum": "e65ee475e3b6682b57bfa3f7b9c1cdabf36a7282fc793865df63dbe6a6a3d1fe"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00228-of-01024.json.gz": {"num_bytes": 318852183, "checksum": "8b27f2fbb0233802229fc776cfcb0b6b43af3149d217d0ab00cca0f1286482e4"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00229-of-01024.json.gz": {"num_bytes": 319407418, "checksum": "f2d5199a0022134ae127c88f0ac20d1b2b8a88014a774b5432b41085c83ecb5b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00230-of-01024.json.gz": {"num_bytes": 320787790, "checksum": "e1b040895ac6068dd1aa892ec93d733096afc4adda698379006ef89926491255"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00231-of-01024.json.gz": {"num_bytes": 318220053, "checksum": "648a6349206c50c17d4e3562fd6fcb0a723b4cb40005890173d5de0c7ecc2ade"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00232-of-01024.json.gz": {"num_bytes": 319702777, "checksum": "0a44b7cb4f354e1eede683a697aba4051c1542fd030dd59767065f5f0204554e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00233-of-01024.json.gz": {"num_bytes": 319154465, "checksum": "4070448b7844776db6754bd33791900bf9ac8dbd81e4cd774a3055ada67f6fac"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00234-of-01024.json.gz": {"num_bytes": 319846160, "checksum": "b1e8c73078c347fa062ed408e81bbdcb2f714675bab2c082016e822e91ef63a9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00235-of-01024.json.gz": {"num_bytes": 317722912, "checksum": "d8aa694e870157b2b5411f496db46dc71dfeed01a42973a65499596921198abf"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00236-of-01024.json.gz": {"num_bytes": 318593592, "checksum": "e0c4ff6c8a12128da88777074d0b097664cf2f2395913c4d82b0eecd501946f1"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00237-of-01024.json.gz": {"num_bytes": 318902831, "checksum": "adce772ed699d7e908ae1fe1ddf1d9875305c7875c93cedf1b3ea0bbc21ff922"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00238-of-01024.json.gz": {"num_bytes": 318696723, "checksum": "926f9fc42cd248077afec1f4b88603c646fc5ae47c4ee3e9b8a5f6b8b6ff7f46"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00239-of-01024.json.gz": {"num_bytes": 318321822, "checksum": "439d756b0ffc97ebecc6c48a7dc90da77de7ada05a6eae929db98057ea15bef1"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00240-of-01024.json.gz": {"num_bytes": 318992553, "checksum": "1f57af6ff9477263806c0827c0dd8e494e103b6f54eec2cd5f8f8327b01ee39b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00241-of-01024.json.gz": {"num_bytes": 319345185, "checksum": "493932a44e09f4b311ac5bdb519111fad0982708d4b467688f2b1105316544eb"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00242-of-01024.json.gz": {"num_bytes": 320108156, "checksum": "de5603f1b276f1373011c8884f06af017c71b03c5de3b3bb89cd6d550a0d5902"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00243-of-01024.json.gz": {"num_bytes": 319855563, "checksum": "7c1b74de8ae3699c567edaa6e2d1a1f1ae82f4810e769c710a23cd2dfc536c60"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00244-of-01024.json.gz": {"num_bytes": 318966332, "checksum": "d3ada80bad9fa776374878bc7504138e14c161bc9798ea8114b0d187d4c815f9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00245-of-01024.json.gz": {"num_bytes": 319541864, "checksum": "3fe5f26e32795c49743d1b2497c333be57248c9db2ce12fb93e103d1a9595347"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00246-of-01024.json.gz": {"num_bytes": 318530369, "checksum": "a0bdeb2dcb5dfb46f843c4086230ba918f2d3ec125654cb924ea11e7c75cafbd"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00247-of-01024.json.gz": {"num_bytes": 319496627, "checksum": "0c4099f832ada6b24ef6c1d15267cd3c179f5b3d79e3d813d944e3ebea908c99"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00248-of-01024.json.gz": {"num_bytes": 319132981, "checksum": "608b1cd27ad345f6511fb677c00d56b6e827f288877d68aea1bcad3b02dd040e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00249-of-01024.json.gz": {"num_bytes": 318529093, "checksum": "8fd580be09f913cc3809e3b0e467e2faf657a5db6f71b75aa931043267b9b0f3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00250-of-01024.json.gz": {"num_bytes": 318248903, "checksum": "faeac675c3634b0834939046e60cdfad6a13558d7a6799c5bde25567898d86a0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00251-of-01024.json.gz": {"num_bytes": 319184870, "checksum": "038972e03db75417fc4cb25e54c3aee01e4f022eb0fab202142f539e4d866e28"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00252-of-01024.json.gz": {"num_bytes": 319631399, "checksum": "2fda0c2cec4624c6068556e16630c3551ef3110759bed59628913a9debd547a3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00253-of-01024.json.gz": {"num_bytes": 318275716, "checksum": "b5da4bfa564fcc6c49a573b90e679d60c4e222249858f4e58fdb3727a5f279ec"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00254-of-01024.json.gz": {"num_bytes": 318638865, "checksum": "279eb2978fe94e1570318a247b82487c04d7494ceed74dccb1d7a5734ea84e5c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00255-of-01024.json.gz": {"num_bytes": 319640339, "checksum": "aa0a1ef845d0df7d81d2588d53f29205a4e3858a0888c1b7d9c83eb2fe1d32a7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00256-of-01024.json.gz": {"num_bytes": 320353593, "checksum": "407133ea3b32a9e004b992a1bccade0440a39d0bfbd12993ea78c6526c0864a8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00257-of-01024.json.gz": {"num_bytes": 318165587, "checksum": "72b7a72b8402b22cb51db44c9e7859460366c7c9d33e16a4c038ad07f7ad8f3f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00258-of-01024.json.gz": {"num_bytes": 318003534, "checksum": "e5f9f2f74b7f9958dc9535f04a8965749ca4bd68005a6efa36f480fb487ca930"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00259-of-01024.json.gz": {"num_bytes": 318990454, "checksum": "7cb3c284613537fc6b1a85d7187dfca30b37a7a1a5708094f17486e3184e2d62"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00260-of-01024.json.gz": {"num_bytes": 319514850, "checksum": "0067e36b7156196e2451cdf78dc8832352f2481a4740afbef9046104b6810bdc"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00261-of-01024.json.gz": {"num_bytes": 318747661, "checksum": "b1e4597420035c355abe15efc576751169e2b5e4c38e073c178346a7202d5ab2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00262-of-01024.json.gz": {"num_bytes": 319868329, "checksum": "374f4b951e545968da45b5055af2aa0b128c1d65d6c854f5b8f7e02d22c352e2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00263-of-01024.json.gz": {"num_bytes": 319268788, "checksum": "7168e635a32859a85a152b29bcd1f699257ee4e340517e218ea9b8dac3922210"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00264-of-01024.json.gz": {"num_bytes": 319270640, "checksum": "1da08b65c83e79a0f5b7215e5a4ee58f21383b69f09dd9a3ba95381ba3d56d25"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00265-of-01024.json.gz": {"num_bytes": 318744354, "checksum": "0c908e81d59b2099eda038731b387a0ad86fa3d168eb2955413dde9cf29d947b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00266-of-01024.json.gz": {"num_bytes": 318518406, "checksum": "115e375464931638de4af669b7301b6112d18b23835f2db2b092f47545b1a855"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00267-of-01024.json.gz": {"num_bytes": 318921711, "checksum": "6d66c715137885a46f2472489b21751284ec8ecfde6dca6be3ec1ee75f6cd5af"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00268-of-01024.json.gz": {"num_bytes": 317786222, "checksum": "588865d8f9d3da5a70c958997060ce4792e175c8fc5323f1887787070c8c160f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00269-of-01024.json.gz": {"num_bytes": 319004956, "checksum": "163ec7497602931de2eaffad320704e508e491937a2965e39907a086f640d975"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00270-of-01024.json.gz": {"num_bytes": 319175186, "checksum": "794e0e7ceccf28457a8ed5b0724337545661da16feafd0a53e4823b2cb1c92ae"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00271-of-01024.json.gz": {"num_bytes": 319785821, "checksum": "9c9ec0348f7d4ffc61e5f19f1f60c8382b33ca2fe4b852567cbc3c16024a4627"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00272-of-01024.json.gz": {"num_bytes": 318933435, "checksum": "883d85985237948018b13c20f4d4ee567c6ee36a135b326e8117d73dad4fe37a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00273-of-01024.json.gz": {"num_bytes": 318456664, "checksum": "fdca13067e8e118e538b8de538e164fb5397724045a5b1b02764510c8de90969"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00274-of-01024.json.gz": {"num_bytes": 318418161, "checksum": "27556558fe8a91a4aea4800ba9b7e844336a7638c5b96e652fcdb359f631b04f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00275-of-01024.json.gz": {"num_bytes": 318437784, "checksum": "6ad4e6a3e1cee04aee3051a66531e3f4aa97f7bbb7602c6aa5f46a727b319f2b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00276-of-01024.json.gz": {"num_bytes": 318470946, "checksum": "145a4d85ddf1e72fcdb8477dcd2f70a5554d9cd9349e02e058d3e7837204b6ff"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00277-of-01024.json.gz": {"num_bytes": 319580624, "checksum": "7116de0dbc5c7f6621f7c107dded9d85788937a87f2d56efca32ae9f25fc6865"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00278-of-01024.json.gz": {"num_bytes": 319619699, "checksum": "8dabdf2d26035d30c22204e6f46f292c58f4a4c3b0b77a1826a43341d4282df9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00279-of-01024.json.gz": {"num_bytes": 319344020, "checksum": "c2b7d5bf62be1772c6bb80f597b28d948cf3cdefb10b6df6f777f0ab7d8fb015"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00280-of-01024.json.gz": {"num_bytes": 318997864, "checksum": "025457720b0045e7bf01f9b4b847f28ef94af9ca250675efeee73eeb340a3f36"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00281-of-01024.json.gz": {"num_bytes": 318718146, "checksum": "2979c0ac06570a9ee437521778c514bd8755193b9f1ae6a5a671ef885243f019"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00282-of-01024.json.gz": {"num_bytes": 318434530, "checksum": "a17bca50ec20c364adb899a9073bbe3a1505f81803a58190efc5d4f3f78b58be"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00283-of-01024.json.gz": {"num_bytes": 319317663, "checksum": "9034f524fc5c2e246b22e2dee00b47e0c4da0316bc60d0a11d966c28db917f9b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00284-of-01024.json.gz": {"num_bytes": 318957832, "checksum": "f08b96047e711831dfb8a44d90cb712d3e78c98dd28ec6b937ee83949bbef5b0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00285-of-01024.json.gz": {"num_bytes": 318643283, "checksum": "c5df1f2e2dad46d71f8aadf856a5139020da8afc2ee010d53c0372ea09b2362d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00286-of-01024.json.gz": {"num_bytes": 318064839, "checksum": "16f7fd6abcbc69750b8131bca3e38ddc40bd7c86c48122ad2a9a77cb9cfd552e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00287-of-01024.json.gz": {"num_bytes": 320328448, "checksum": "41e82bd357b47a28f28a4a203d5b54263aadb3c9a08899f78302c727c56d8b38"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00288-of-01024.json.gz": {"num_bytes": 319559271, "checksum": "970b9df224b58ca50b3023d92f6be0c37dbda479155c29c535e457ef6f2bca0e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00289-of-01024.json.gz": {"num_bytes": 318786822, "checksum": "36a6515e7f516335d3fe057bb6ed9890a2aea033e08edd8588b3168b3445b2f1"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00290-of-01024.json.gz": {"num_bytes": 320634782, "checksum": "7d19fc82b9a5aa0e0046cd17cd2c46f356f8a4a7d203d5e03e1f319156f05cb8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00291-of-01024.json.gz": {"num_bytes": 318746713, "checksum": "86d610d4590bca69281348dbfaaec9e704fd6194141c50c71e84aad51ce26b91"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00292-of-01024.json.gz": {"num_bytes": 320049630, "checksum": "d045df646213e29d4e7de4ec8915eb3b65bb962f35b0d74abf00889bd5aae8ab"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00293-of-01024.json.gz": {"num_bytes": 319966146, "checksum": "c66fff1a64b495211bfdcea650ff76115f8c857b9154c1b869062e702714b9ec"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00294-of-01024.json.gz": {"num_bytes": 318805332, "checksum": "ef3d9204ec85a1e65ae48af7924f614403d297a15f232ba41eb0e4fe223e507f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00295-of-01024.json.gz": {"num_bytes": 318898465, "checksum": "2a071fc28b1216f2dc0579528d9b04e597b5cdac9fd14719e312092242da190a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00296-of-01024.json.gz": {"num_bytes": 319406630, "checksum": "ea71e9fd444860d70d3728f7e2213a4bccf3aa31a164c9acfa8df7a0b6619786"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00297-of-01024.json.gz": {"num_bytes": 320312971, "checksum": "ddaeba8aad38b7e9727c579cc44f15b3c82d292e2901b47b785e9c8d3d5cdb9d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00298-of-01024.json.gz": {"num_bytes": 320660744, "checksum": "814460ccfda29b45edaee5f44e3c980889aee2ee52e4e5323931ea489fbe938e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00299-of-01024.json.gz": {"num_bytes": 319848186, "checksum": "3b91fe32d3a731a5be3bf778eedfe13e8a7e26ba9eda51c278c5212aa7925681"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00300-of-01024.json.gz": {"num_bytes": 319647278, "checksum": "1e0424631f7f354bc63b3e71c5c6516c85343dafd3896acb9560eaf93b672799"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00301-of-01024.json.gz": {"num_bytes": 319080252, "checksum": "46c21af013f611729cc06ec033dbae80151987f9098e57fb98e2631f6fe76c8f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00302-of-01024.json.gz": {"num_bytes": 320028246, "checksum": "d1ca8ad6e5bd6cb18db1f1be9154dbc8ba9df7ca02db4c1f8a7df9d40820d8ff"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00303-of-01024.json.gz": {"num_bytes": 319388787, "checksum": "bce87161f77464adfb1fc04fc2993211bcec502d7172b86f726daf7096b04f82"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00304-of-01024.json.gz": {"num_bytes": 318627831, "checksum": "235b8085cbeb7b13f8e1a5f6d2225a9461b7bcd76e21466a189c2411ff4c4107"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00305-of-01024.json.gz": {"num_bytes": 318148428, "checksum": "f13f124e0ea150da13ebeb3390c311b3db54018de0d640579307bbcf2c46068d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00306-of-01024.json.gz": {"num_bytes": 319451712, "checksum": "de5c3fa2cd6a47551ab43268484d017602e2c3e1f66f43f1a1d8f95bac52cad5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00307-of-01024.json.gz": {"num_bytes": 319026244, "checksum": "88769fbf393671db352227a64cb8ba6b4ba60c5bddb4a14294b1ad9a65a750cd"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00308-of-01024.json.gz": {"num_bytes": 318447454, "checksum": "555bcfc0ba4db0551ce5ffb18057027ee695af166856125aeb79f7ce013851cc"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00309-of-01024.json.gz": {"num_bytes": 318147676, "checksum": "bf28e60a7970c548190cf0f4fe56f27ea55a1ad8313fa353a8013f0a0e7919f1"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00310-of-01024.json.gz": {"num_bytes": 318930650, "checksum": "45a68c0ef70ecd10838d604d51fecd26e5199f5372022b9c2af461a71c24c6ef"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00311-of-01024.json.gz": {"num_bytes": 319955339, "checksum": "fb3c4e93166f1cb2ccc8a7b68da0246f0827d3a81bb5614c8c84f1c01c6d53c7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00312-of-01024.json.gz": {"num_bytes": 318554567, "checksum": "0dce2ac88ba7ac5340d551add9fe7b1a30772a6cc082347c536427b48daca598"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00313-of-01024.json.gz": {"num_bytes": 318978931, "checksum": "c5f99dab085fb705769a514626c9af8a26cf846fdaee4b403a3d6f84c892cb66"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00314-of-01024.json.gz": {"num_bytes": 318158197, "checksum": "79de4fa2aed5e3efa71e75d13f08d7c1869aa59f42a819f4429430b3db6c1b27"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00315-of-01024.json.gz": {"num_bytes": 319744521, "checksum": "5a47a89a1537662a91853bbe2a5b3e243f5de74489f820621192cacef192593f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00316-of-01024.json.gz": {"num_bytes": 319861527, "checksum": "1cd34f17f3ae3c8bf8e1636714a9ff600a26799d5ec02ba42abefa5db9d00e5e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00317-of-01024.json.gz": {"num_bytes": 319286030, "checksum": "a3e34af81264a72b523b63fdc0268f450675f7993fa0885eb2b4c747b0d6703c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00318-of-01024.json.gz": {"num_bytes": 319054871, "checksum": "02fa8cf278578108083bc9a3c5cf07b0a9d243f2162397091ede6c85a1df31e7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00319-of-01024.json.gz": {"num_bytes": 319943810, "checksum": "93ef0d7f1610043a6f7634af73e89ee9f3d7e87828ad34558a4d688e6fa6b6dc"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00320-of-01024.json.gz": {"num_bytes": 320037211, "checksum": "06fbd99a3d64df293db2655f321117f1afcf1cda51e421edef9335a25cb1a902"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00321-of-01024.json.gz": {"num_bytes": 318584237, "checksum": "a224e4d902f7368f91d6a72fc9f5730996dc37de576bc2211eb632e3690f1b38"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00322-of-01024.json.gz": {"num_bytes": 319686632, "checksum": "57fba28c7104ff659f8a0f330ae89c68d3a392dd14a78247fa357a3bcc8b94dc"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00323-of-01024.json.gz": {"num_bytes": 319834993, "checksum": "e61c760cd3c42f71a1a7bb6adc4e0bc970bbf864b69e2a4a5d56bf0a14d4e0be"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00324-of-01024.json.gz": {"num_bytes": 319243057, "checksum": "61d21ab1e7729f172ade5ab6c0dcaf07eaeaee6e047ca1c24722c06ddd919678"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00325-of-01024.json.gz": {"num_bytes": 318569583, "checksum": "2192a891ecc2a6aa9f6ea64f1d76ce763e0a3963ae03c95275ccd626171835ce"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00326-of-01024.json.gz": {"num_bytes": 319175980, "checksum": "d35e4d5f8e924ad97520db51a2c361bbc02097721195932b6768e7460df092a6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00327-of-01024.json.gz": {"num_bytes": 319892298, "checksum": "ce967065d3915d466982b5258e07ad2c46b02d7637057e0547586657ea0f53a4"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00328-of-01024.json.gz": {"num_bytes": 318004026, "checksum": "0676d556f46b1f057669d3378c6fc335db6e3ac67a02e11dce3823658730f4c5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00329-of-01024.json.gz": {"num_bytes": 319066225, "checksum": "b00bb4bda957e1287b98c432165448b3899f9155363f7b61bfd0f0181181acfc"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00330-of-01024.json.gz": {"num_bytes": 319268288, "checksum": "d14d1883941966ef3b35203d06e6fa1bb485dd77118bd7b6c811b0d06fa72fae"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00331-of-01024.json.gz": {"num_bytes": 319131311, "checksum": "4d5d41c2b2242b299fb67fa8c9327db8b4f612bdf4ee9af4d4e45aba8cd1e409"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00332-of-01024.json.gz": {"num_bytes": 318827508, "checksum": "68cea08d4805b392bf4c2894a4501ee3fbbe9aac4b1b6533e686ea749ced2dcd"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00333-of-01024.json.gz": {"num_bytes": 320572240, "checksum": "06f211ae2fe1c4eef5e41caceda8ebbc289261057911fcf2583a59c730b7951a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00334-of-01024.json.gz": {"num_bytes": 318121862, "checksum": "46c62769e04ce8acde4562ba24d72e245babacdfb50600da4e6217948ad71d24"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00335-of-01024.json.gz": {"num_bytes": 318692168, "checksum": "dca69a6976e7387a12c8da16b696ed4f604254693a3280be0f90fa694700b595"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00336-of-01024.json.gz": {"num_bytes": 319479902, "checksum": "c52969fad97f1dc0e1e115428e7dad1ac6cb6d804db0cd34f0fc7846b1b50c7f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00337-of-01024.json.gz": {"num_bytes": 319987407, "checksum": "2c570f02aa6a6bac96be1e02663996c87f9a94c160f22101ce8ae1d549ae1de2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00338-of-01024.json.gz": {"num_bytes": 319051086, "checksum": "77132df95b147c471ead74bef16ed4fa11e15209f518dd460110132358816834"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00339-of-01024.json.gz": {"num_bytes": 319473192, "checksum": "7f3ac20a72d395c02ed3cb50052821521dc2d8d97303d00e0d0982e2c29e7659"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00340-of-01024.json.gz": {"num_bytes": 318423485, "checksum": "d1127da89e960d939cfc06cf1985df415b60d4bf02b12b7fab02b796100feaee"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00341-of-01024.json.gz": {"num_bytes": 320087690, "checksum": "f753423f82157e95506566d3653d32af6a181e69ea0e10b4d4eb24b626d3ca49"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00342-of-01024.json.gz": {"num_bytes": 319767100, "checksum": "db7410e6a6ca74163098681038f497faa373e1d81434b45c1a2f273d467c0a2d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00343-of-01024.json.gz": {"num_bytes": 318389429, "checksum": "7ea1e432a1ffbed8f4ad6cb985c5cf1b2584d8eb7d2fa091a2db3f104a3f7210"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00344-of-01024.json.gz": {"num_bytes": 319117212, "checksum": "c7317a81a6224dec9be07b41134ac7a7db4039b7c98b2061b20bb59b82ed0a1e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00345-of-01024.json.gz": {"num_bytes": 318504232, "checksum": "1498efe8280609d9d66c324e332c9433c6351bb7b99c5891a8f27d6841410407"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00346-of-01024.json.gz": {"num_bytes": 316721169, "checksum": "0cbc6b494d653878c9d52a37572064b88356058ed291aa773e5f47259fbfc722"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00347-of-01024.json.gz": {"num_bytes": 319007736, "checksum": "6265505e19a42a01a159297d33b1a91cd0e042a31ba6a1a867404a143ae565a4"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00348-of-01024.json.gz": {"num_bytes": 320167918, "checksum": "cc8b29deb44c8348aa4d05836f89cbae995c946f38d9cb8e7fedbd4762168ba0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00349-of-01024.json.gz": {"num_bytes": 319901226, "checksum": "2a0f2188b43ffedc8b95a8276c7647147587c5e544c9e6475e790f4b5e362992"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00350-of-01024.json.gz": {"num_bytes": 318999223, "checksum": "1fde48c503998872aa71fc524c7408dc84cbc1faa0d885895d5c57708a15fced"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00351-of-01024.json.gz": {"num_bytes": 318935410, "checksum": "72d577eabcd814a7ff61b894b3fe9089f483a793e692d3ab20ce4ee59921f975"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00352-of-01024.json.gz": {"num_bytes": 318655907, "checksum": "8686dc0e4ff7b35cbc4fa6f3abce50c06f8b95378031c132a117e1d458cb4616"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00353-of-01024.json.gz": {"num_bytes": 320619683, "checksum": "cd5816469ef54bfeb0db6b55a78e0d34eb2e1f82448a41f67dfb70061c3ea91e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00354-of-01024.json.gz": {"num_bytes": 319352400, "checksum": "bf082c093423d562da4984b1f0428225d853a05b5f8fb3696273f36ebb5a235d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00355-of-01024.json.gz": {"num_bytes": 318868462, "checksum": "3b8baeca48e55a2cd268d6aef75f7eed96ef10fceca593a5179d52a2b0121f8b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00356-of-01024.json.gz": {"num_bytes": 318903295, "checksum": "4c9a9926a4bad6721807d99cc02a9b6bd28bb0a6254aa1c15527b745c56a06a2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00357-of-01024.json.gz": {"num_bytes": 318881446, "checksum": "84b4c2e05bc162fef4824e97ba7a03b1cecb41eda08a3e0aedd264b66e859a30"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00358-of-01024.json.gz": {"num_bytes": 318521100, "checksum": "aee99528ffd0323fe81e4ed26ed1b9295baa2a3910771dd2a42f4f378fd82569"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00359-of-01024.json.gz": {"num_bytes": 317796778, "checksum": "7b01f2d5ae54f60c2aeb7b96bd366d21e558e2dac48c83a78df9850f37e02f1e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00360-of-01024.json.gz": {"num_bytes": 319502919, "checksum": "5b54f9a050e6f9008a1806101ea553d90eead56c949a5f3f46c8ccb88812081b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00361-of-01024.json.gz": {"num_bytes": 318595505, "checksum": "49f4164d66187d46adff7f9bbac97b232ab7906d812e571c2e0bf028895e7f47"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00362-of-01024.json.gz": {"num_bytes": 318851572, "checksum": "17accad3c0706c54530f128260cacbf986cbbb20427d4ba8d3444a3702a22c55"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00363-of-01024.json.gz": {"num_bytes": 318555337, "checksum": "2327866e541aa6aa73f7289c3ad82a19ff154d39657d98cb78a2f481a8765920"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00364-of-01024.json.gz": {"num_bytes": 318641145, "checksum": "6f52354d804e8d4a1af1f6c2c6b759ae115c4f23a63f1206a73e7e25acfbdd02"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00365-of-01024.json.gz": {"num_bytes": 319212614, "checksum": "8f1834eeacc9bbdee95b1f0a4078eb9488bd1a7c5693489bff7943869674cad3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00366-of-01024.json.gz": {"num_bytes": 319336585, "checksum": "a9cf01b76104eebb4ef8462a924f61c262fa197a7c68a50e48d925cb81586e3f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00367-of-01024.json.gz": {"num_bytes": 319161263, "checksum": "5ac822027d50c3196026fbaffc7d968e1ca702b947688a6f4d268b942b5067b5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00368-of-01024.json.gz": {"num_bytes": 317911640, "checksum": "f9acffbe3c6617e85911ff9dcecec2378b3469ab4546a6973cceb460f9003cea"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00369-of-01024.json.gz": {"num_bytes": 319585031, "checksum": "9234553649cfa5265c5a9ccc88486402f88eb81275067c51d9deef16bbe7211f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00370-of-01024.json.gz": {"num_bytes": 318345879, "checksum": "2fbb410346d31a33e8532602f4e3340fcc75c96be803250e9f0f1a6894ca0052"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00371-of-01024.json.gz": {"num_bytes": 318996184, "checksum": "b069b0c8a830ea841e82077548706f286308ef0420e163ff6d8312c8853af172"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00372-of-01024.json.gz": {"num_bytes": 317989343, "checksum": "bfd62e448d4d9f89353abaa384007b0b72bd860402ade3a9d938051a6446530b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00373-of-01024.json.gz": {"num_bytes": 319770759, "checksum": "e4e176250aceb7362ce38d496556a46409e9872e69f45166afe71aa750de8fcb"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00374-of-01024.json.gz": {"num_bytes": 319212902, "checksum": "28aa4510c3ddb9ee0ac56aab3792bfe5e899531919ccc0214a4b68bbf2ba18a9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00375-of-01024.json.gz": {"num_bytes": 318968029, "checksum": "35326b1f2280e07dd754e89dfa29989d0dfa5c78995d393b36a752d8364bfcd7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00376-of-01024.json.gz": {"num_bytes": 318685188, "checksum": "0060dbaccf7f2f956fb8b57891cb176914ddac1bc485dd86c2fd110c46d174b9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00377-of-01024.json.gz": {"num_bytes": 319291982, "checksum": "99fc38654197e506868e099c15b2cb15b93238dafd33f81a7d069b3e01c3b085"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00378-of-01024.json.gz": {"num_bytes": 319259094, "checksum": "9b8d97f9d57dd97373c4f57eae2b9c01a58e49017ee41d3969e94fb4dbabc260"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00379-of-01024.json.gz": {"num_bytes": 320228224, "checksum": "82913f2d182d2a57f6c93e9b229862cb72feaa6331d04cd4419113e1eb9d52cb"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00380-of-01024.json.gz": {"num_bytes": 319738339, "checksum": "e0de43f754ab97d103a02c708d1cd7e771ba079bd9e1f7c532a80a30bd5182ea"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00381-of-01024.json.gz": {"num_bytes": 319210620, "checksum": "df74823f78564b544677410508e675e2811905c56afe2a60d19d3e049dd65394"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00382-of-01024.json.gz": {"num_bytes": 319810275, "checksum": "f5d5291a695fe2cd228213fa2bf090bf6513c49c6911826aa43ecaefec0622ad"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00383-of-01024.json.gz": {"num_bytes": 319190426, "checksum": "a861ae79a66b72d6cd5e0a030daae52cffb85ba1272c36ae2be04a9b7c0287c4"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00384-of-01024.json.gz": {"num_bytes": 318501845, "checksum": "b8d0f5078ae82980f0f64120530bbeb20f627be0a8629d68885acb867091417f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00385-of-01024.json.gz": {"num_bytes": 319530458, "checksum": "7da119f3f63e25ff63cacd8ba0d77987b2d576be1f4b86e7e45aa3f2d194624b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00386-of-01024.json.gz": {"num_bytes": 318938980, "checksum": "c21f3de56fab26d7fb60bdb47c216b22793f67b8fa6d382520c79b88d1896f05"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00387-of-01024.json.gz": {"num_bytes": 319207426, "checksum": "e28b0884092f75836eed4d73ed24b7403d7b0530fc389386a68887420b0c2603"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00388-of-01024.json.gz": {"num_bytes": 319835376, "checksum": "b4f0db632cc9af66e8aea109c80d73a6281207e29ece131d5bf8b57ff8f81262"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00389-of-01024.json.gz": {"num_bytes": 319346837, "checksum": "413a8d8df1f6cf3094839b57231da5323f33f7115768c65d83f0af1574f71b6c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00390-of-01024.json.gz": {"num_bytes": 318632301, "checksum": "a3e8664fbb3ec2af5a217225dbb7fcf3e93b427e5da1a88e35c04c319d61e4c3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00391-of-01024.json.gz": {"num_bytes": 319066082, "checksum": "e22eed3415c90510e97768be5a685e0a8035e2635ef773c56e9ce2718c278658"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00392-of-01024.json.gz": {"num_bytes": 318356286, "checksum": "ddbf325390648d9d86f1e7901b75c99fe8db538d203de8dfb4c304282f82cd74"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00393-of-01024.json.gz": {"num_bytes": 318048288, "checksum": "974fd05f356c86be2f9109b0272eee69c5b2eaf0b16104cc573846c925d13b4b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00394-of-01024.json.gz": {"num_bytes": 319444683, "checksum": "0d27d6f8c3b935cef23ea60abfa82bd6a4f5e2e061080419dc9c6bc455b9f868"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00395-of-01024.json.gz": {"num_bytes": 318353166, "checksum": "24d9956bd857484ffbabb3ba6f6ac688f48a94b50228238c7c9153a5c6878a7c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00396-of-01024.json.gz": {"num_bytes": 319960396, "checksum": "9425f4f18e1690ded866c4b5313cbac8a6210092dc42f720200b7143b69eabe5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00397-of-01024.json.gz": {"num_bytes": 319030577, "checksum": "dee166674b835b9849d281a87238aa136e14d26edaa72d0ecb6b7e82d556a72e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00398-of-01024.json.gz": {"num_bytes": 317664320, "checksum": "f85e08272f73ce4aa602719d59205db54d230a6b7247830d78f91eac63d753be"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00399-of-01024.json.gz": {"num_bytes": 319623875, "checksum": "85dea0672a0362a08503b70623907c8c92bd105f788fbd7f3816212a9181e7c5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00400-of-01024.json.gz": {"num_bytes": 318840274, "checksum": "a104345698500611cd1a71a6647555300d315490918740a8c6e3b8dcff315407"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00401-of-01024.json.gz": {"num_bytes": 318336377, "checksum": "808327d156e183e102fd75cfbdb7b5a1fbde3740168f59b767ea380608305b67"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00402-of-01024.json.gz": {"num_bytes": 319270185, "checksum": "b6a5f7c1ade628091fe86744a6011147ec32795ad694ccbc82929791b93aa307"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00403-of-01024.json.gz": {"num_bytes": 318038520, "checksum": "108904ab05b3ad23318f8aa0f7ddd00d97aae1872fb157eea73273e011cbec04"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00404-of-01024.json.gz": {"num_bytes": 320933185, "checksum": "cd0c068c0831218849149eaab8f8a98748823911c745ca0ea33ae839bd625e04"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00405-of-01024.json.gz": {"num_bytes": 317694827, "checksum": "d99909ccd59e2ec183b41a7c6d1bd5677798bd7fd784ab681546a7bf8292f353"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00406-of-01024.json.gz": {"num_bytes": 317937468, "checksum": "c7f2bd7a366b8c389e41fdfad4891068c86039e1a5fc3b8a0b993253badf33d2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00407-of-01024.json.gz": {"num_bytes": 320226074, "checksum": "765db6f9f0c8c3d9bbb0499f0010928fe4f90d5915dfdd3b6d09d3dc78ad07a9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00408-of-01024.json.gz": {"num_bytes": 318613788, "checksum": "165e78c858dfaf010307392474d4917846c9d21658558912e5ffc915803bd2fb"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00409-of-01024.json.gz": {"num_bytes": 319212414, "checksum": "5f7d5952aad1ae31413962983971b2b422d77c262ededd2ce1c1e186aeb6d87d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00410-of-01024.json.gz": {"num_bytes": 319023647, "checksum": "24588d41f40e3fe389575b97d41ef761be46bc9a9b3965c5e3f994760f7a4070"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00411-of-01024.json.gz": {"num_bytes": 318408922, "checksum": "b35d4ada5a000f51169557b00e508706d51a7becd33370014ff07c8b8dac1af5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00412-of-01024.json.gz": {"num_bytes": 317166932, "checksum": "d3ed1cae269ebefe4716843bd7954bf7e44ee889f72066afbdcd95f4e1f06703"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00413-of-01024.json.gz": {"num_bytes": 318519121, "checksum": "07fc61a7e164301113201e78c99d40289d88e0b463048e14aa5fe69c7490ccac"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00414-of-01024.json.gz": {"num_bytes": 317417235, "checksum": "c5a7222b2eb8e8fe690f29a0fff7e214ba94e4d9dae62f67281fe25dd385b721"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00415-of-01024.json.gz": {"num_bytes": 319690993, "checksum": "37052fff729bdff124577d5ba041906b2ea7420c5cb28195e6cfca0e41d560c8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00416-of-01024.json.gz": {"num_bytes": 319466518, "checksum": "6e8ce2b9e6e8208ad7e43ce709454cb0b96572d793e0b11c15892f5df18f6137"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00417-of-01024.json.gz": {"num_bytes": 319694381, "checksum": "20892d7a33c31d7967ae0cf595a2108de96a61c0bbd773aebc5d3d083f6ed93b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00418-of-01024.json.gz": {"num_bytes": 319048918, "checksum": "fd795ae8d53e632bb3e89a2becc5b801e10db781b14f2c0ed50b12def5376c8e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00419-of-01024.json.gz": {"num_bytes": 319791424, "checksum": "5a8e56faaa0892249e5694ae01e2e4dcd22d9750a9aeea5ca390117c77b8de2d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00420-of-01024.json.gz": {"num_bytes": 318060925, "checksum": "795ee64f4c9e2e35d9dc0c91ea593c9e41a3924162901fbf782dc7112f8094a8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00421-of-01024.json.gz": {"num_bytes": 319328927, "checksum": "2670b7b6b53e9082c90e4a4e915f72673831ff15e9f55918a1244e0c19c8f963"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00422-of-01024.json.gz": {"num_bytes": 320065363, "checksum": "34df2d1afac2ae4699524492d6b93e4a2a1e551cb4a4ae35fc19353930afab8b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00423-of-01024.json.gz": {"num_bytes": 319349887, "checksum": "a2b19afafb45cf30493ac2a3eb013e136e7213f63bd633374ca0d9fe2780efe9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00424-of-01024.json.gz": {"num_bytes": 317515288, "checksum": "ec2a84fb16dd16f9547f0c3314a91968324f2c537118ca36e982b235e23527ee"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00425-of-01024.json.gz": {"num_bytes": 319092219, "checksum": "1ac0b93c0faae7d446add3af3173637a4b0d638dbd5285b0f4e1bf3abd0d1542"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00426-of-01024.json.gz": {"num_bytes": 318421245, "checksum": "bade501dc71c0b4968a9a7c833751cee5d8f7067a45dabd53aa03534df48886e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00427-of-01024.json.gz": {"num_bytes": 317847935, "checksum": "7aef554aa2b120c4d787395e28aceba743e309f2540fab283e077a1429a2f7ef"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00428-of-01024.json.gz": {"num_bytes": 318822008, "checksum": "cd94547fe1953a1cc074d97558a70d1e55834606379a8f5e6e60e1b15b56fd35"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00429-of-01024.json.gz": {"num_bytes": 318507684, "checksum": "4d3c9245565a808058293558603c657d6e9a0c87b6d2d4b871b856cea2eb3a19"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00430-of-01024.json.gz": {"num_bytes": 319042136, "checksum": "9c5a4fe50db5d0822923fe29a5aa8ca6cb09e3629472b1bf61f670388b6c2076"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00431-of-01024.json.gz": {"num_bytes": 318925124, "checksum": "8f18b35bb952da090ade742753e30861ba39c6c54c8ff2d76b358ca7be475ed6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00432-of-01024.json.gz": {"num_bytes": 318680251, "checksum": "7968c370d0efa4601ab8b5ee68e480b211fb969593608bf7e00a0153f00f99b3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00433-of-01024.json.gz": {"num_bytes": 317822797, "checksum": "f62d7e74434d52c36b22f6a8cd56ed3937ed6aa03f140d0fbdf5e360632d51fe"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00434-of-01024.json.gz": {"num_bytes": 320094364, "checksum": "55d7678c7e197e165b4e09bf3f8ac159853120acbe5801ed6ab3ab0f801c11bb"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00435-of-01024.json.gz": {"num_bytes": 319008936, "checksum": "09b451c8ee06bc06507b3e75a60c544a6b70f27e3d07daa29c59803f785faaf5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00436-of-01024.json.gz": {"num_bytes": 319023456, "checksum": "6fbcb93f9dfe65e12b7efeecc8af7823471787438b1ce90e5f48b68b2dcb1d14"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00437-of-01024.json.gz": {"num_bytes": 319484997, "checksum": "9e70c8c1ccbfe93ec9296811ae496a518dcafbf38c81b7972f885e297da9e726"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00438-of-01024.json.gz": {"num_bytes": 320319141, "checksum": "eaab759d8c603e8a2ad3ebacd99e30338fb904ba307aeaba0d2e0e63679cfadc"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00439-of-01024.json.gz": {"num_bytes": 318410397, "checksum": "7a03a92bf97b6750941c1070f933c68f1b2a3e13fb68b3a21a4726676ea75d34"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00440-of-01024.json.gz": {"num_bytes": 319447470, "checksum": "bc899e436da7b3bf13c1bfa2fd2bbf9d90b42a0c00f2971259a14d858ca3e5ef"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00441-of-01024.json.gz": {"num_bytes": 317582955, "checksum": "4d777860c2750e43038ef709d77bdc403b3b3bcf0f08e3c4562952c9ac70b113"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00442-of-01024.json.gz": {"num_bytes": 319592118, "checksum": "d9e5dc244bb6f0b629b2a929aedf506dadaf5eacc80f0997816b95279552fe8d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00443-of-01024.json.gz": {"num_bytes": 318104403, "checksum": "56133bbd7cf96dbe87d48898b886a024af69ca405d7cea1799bbd30f185e9c1f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00444-of-01024.json.gz": {"num_bytes": 318547808, "checksum": "8be0270c3cc96dd7f7b3aad08bde81ea245feff4a09923277fb0d38a7c095604"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00445-of-01024.json.gz": {"num_bytes": 320463920, "checksum": "e02316fcd355914e4d08ecf37036d4727ae9ebe45bdc5c98279aa3437c2c1eb0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00446-of-01024.json.gz": {"num_bytes": 319583221, "checksum": "80c9b8c47665b2cef6c291b0eefdac5b14be1d7cd4a4c06c2e14cf48b42da92d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00447-of-01024.json.gz": {"num_bytes": 319546881, "checksum": "a18d5aaca1717ec33fb1822a633268003bf88093dd7b48db080503c3d01b6ffb"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00448-of-01024.json.gz": {"num_bytes": 320234711, "checksum": "c41595d2b9cbf0e23fd65df1cb51499ee262d345d79d2625388cf149c3c39f8c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00449-of-01024.json.gz": {"num_bytes": 320043698, "checksum": "3bef99334be9d39f41296f8f134c88f04fe66502da2d2639f0d6d2485338e607"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00450-of-01024.json.gz": {"num_bytes": 318033740, "checksum": "9cd05b1b70ffc3c004b4b4a2f21f91abee1395f3a485efd1aafda550193df9fc"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00451-of-01024.json.gz": {"num_bytes": 318549622, "checksum": "b2ef6cc4ac7c4c69fb1661d7ed9b2ce4da261c72f9e49dc3c934180501ef3a24"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00452-of-01024.json.gz": {"num_bytes": 319317230, "checksum": "89927f1fd79a5b1439988fd37e0377175176d9ed22d14611f67a81e185a336b3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00453-of-01024.json.gz": {"num_bytes": 318952561, "checksum": "427f55bbcfb6c1a0ef12f96cb122f362b975169770ce1d392b763c4b4408cb34"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00454-of-01024.json.gz": {"num_bytes": 317545286, "checksum": "2fc3b172ea721bc92b0f7614e8fea61b0781e6f4f3e6b7263cf0190beef3ec52"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00455-of-01024.json.gz": {"num_bytes": 318975631, "checksum": "c96f688ecb19bdb1592b0124021fb80d48965303442de76751d82fa03ab8f6d5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00456-of-01024.json.gz": {"num_bytes": 320016575, "checksum": "61d2be7a4b9e34cfb994ae2c120ed5a51a6669564046637445a46b9872812416"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00457-of-01024.json.gz": {"num_bytes": 318236935, "checksum": "a74dd51c3c490458ea0e61196d7e0085aff80d50cd149a673f54f661b364a671"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00458-of-01024.json.gz": {"num_bytes": 318495925, "checksum": "adf9cd717f2c79504dace22b5929d4c4064353e869457c20cc81a0b2db390c89"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00459-of-01024.json.gz": {"num_bytes": 318956821, "checksum": "d7be5bcb738a75586125e56a25aa234618528accda620eaac421beab6288b992"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00460-of-01024.json.gz": {"num_bytes": 318968681, "checksum": "6181280df5418fd9ebb52aa26a631100b6c3da0750dc5fbae152a6a44fccb942"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00461-of-01024.json.gz": {"num_bytes": 320810761, "checksum": "5e943c458674371dffb2466274b8f2a9df9902a370901ef97992bdf920cdae0a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00462-of-01024.json.gz": {"num_bytes": 320154899, "checksum": "76b3d1b120cbb7cd71d004440e0c6bd9f9c4395424c568e8362973038017a90c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00463-of-01024.json.gz": {"num_bytes": 319247449, "checksum": "9de2c86d85289113b24c2f7eb4771ec1391511930f5f26a12133d41faf0ce908"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00464-of-01024.json.gz": {"num_bytes": 318150152, "checksum": "85fce3104ef0b247798c1de8d9d616d3de754841fb6c49a01cca5b9da5efa94e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00465-of-01024.json.gz": {"num_bytes": 320342803, "checksum": "ddf312f0b8de8f53ed556483fd998ae308d4829d18195a48869db6bf1866c332"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00466-of-01024.json.gz": {"num_bytes": 318619029, "checksum": "01239a1ff6ffe9032da320c5a7d1a93125d0724851e3e10746821c9452070887"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00467-of-01024.json.gz": {"num_bytes": 317677227, "checksum": "41783d20189a4bcfc33f543597a5473900e692ea13fa522f2724e27e810b4e9c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00468-of-01024.json.gz": {"num_bytes": 320038217, "checksum": "7131b6f4dd423f2efe55c3f598893676300b31651cce7eed32ce633a015f8ca8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00469-of-01024.json.gz": {"num_bytes": 318359701, "checksum": "925bc76c045f25532414f29820adb0cf1a56c54b406333a6f348c29e5efda9fe"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00470-of-01024.json.gz": {"num_bytes": 319329235, "checksum": "9be740483aa7bbaf94dce550f2c20404c89326f6ec4ebe1b7070f85f93507038"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00471-of-01024.json.gz": {"num_bytes": 318792779, "checksum": "0e3d9492f15dc9867bb0dc803bdf45608fbe67255014b4488902d7bf2e2554cc"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00472-of-01024.json.gz": {"num_bytes": 319552622, "checksum": "00484bbc10bace3dfd93b57fc53d6f5fac26b7dd54fd5b5428d75eb9e6dbb0e2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00473-of-01024.json.gz": {"num_bytes": 319466828, "checksum": "5db5d585798e8ed8e4a3bc540871f1185f67125f397a12942d21b24e6b374519"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00474-of-01024.json.gz": {"num_bytes": 320014669, "checksum": "db07fd0e972c1a474806c1b4464ad4cefdd2e8fc15806ba0d259d4f9e594c3f1"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00475-of-01024.json.gz": {"num_bytes": 320379280, "checksum": "e6e36a9eed8be84c928980fffd8177b177182726c9e13b41a47343d431f76a7b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00476-of-01024.json.gz": {"num_bytes": 318820301, "checksum": "0543ed2d0b3aaba0b0fccbf0311836143bd19175c5eed9bf0f024ffb9ce3c50a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00477-of-01024.json.gz": {"num_bytes": 320577830, "checksum": "a62fd62ad771dbcfb7af73841e15a49e9d7239c53dbbbd84de2282131bca9c99"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00478-of-01024.json.gz": {"num_bytes": 319593908, "checksum": "beae9334a8e93e4b036c4a9b3c5b3a75fff17264177184d243d9e6da286dbe2b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00479-of-01024.json.gz": {"num_bytes": 319728825, "checksum": "ae5b475c7be35d98b77d6c4aed5d61cbd1c98544c9a6e73a53ef2911757ab7f0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00480-of-01024.json.gz": {"num_bytes": 319903674, "checksum": "51e0611378455d909e8b0f292eb62038848aa7afaa4f93c9c83061258b211a95"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00481-of-01024.json.gz": {"num_bytes": 319998409, "checksum": "68c640304ac952f544ea88c88d7c994c8d2955b95036f8352a67b57a836fa1bf"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00482-of-01024.json.gz": {"num_bytes": 319047238, "checksum": "74cefa57158d0008a06ae85b2a7a1c04d57a79b7ae3f7b4b3426dbe9918b36ca"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00483-of-01024.json.gz": {"num_bytes": 318775875, "checksum": "e99faa71222017521f1fc9999bbb0832df5c91f8b9f6e2ef501d3f827d3a1e85"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00484-of-01024.json.gz": {"num_bytes": 319190491, "checksum": "4518faae7c9d51a51f0b02cd895cf27e7c87a623b787346c844a8d9f0b52d6ce"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00485-of-01024.json.gz": {"num_bytes": 318974502, "checksum": "1bc8b207583b9f36169e0e9facd258de8eb73dee8bf831051dd1ab04b7726c6f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00486-of-01024.json.gz": {"num_bytes": 318599424, "checksum": "0b1d9900e1921483b85305491f914b6b78fabcd0686a20695e61b89b7380a894"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00487-of-01024.json.gz": {"num_bytes": 318958015, "checksum": "c0c789c5f3b34d170d2aeb72642c70d2fa5eca567e7850d0c89b3d170f3bbf64"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00488-of-01024.json.gz": {"num_bytes": 320205671, "checksum": "6eef7a1ea80be43e84cb0c974215a477c909844899ac694afe1af2e8f4ac171c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00489-of-01024.json.gz": {"num_bytes": 319193967, "checksum": "eccf5d7f682a76e11332f07e7d54a080f76c0be58a98a853a9fe90c815a22087"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00490-of-01024.json.gz": {"num_bytes": 319833603, "checksum": "afe99e32ba36134f23b59a2ee43965bf185432de947740fc19e26eef41027aef"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00491-of-01024.json.gz": {"num_bytes": 318912982, "checksum": "e981151b23b233bd3e5798f78658b5f52a73f69db39c30615f615069cf0c4984"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00492-of-01024.json.gz": {"num_bytes": 320057824, "checksum": "0cc5f7df318e0718fef93d24e7ff904b3e8e2728c4fc0b1d13893c81d8e6e2c7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00493-of-01024.json.gz": {"num_bytes": 317967559, "checksum": "93749543b04a5a7093177d2a03acfc0bf6f26d5b53864ae35839a9421fb48169"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00494-of-01024.json.gz": {"num_bytes": 320426917, "checksum": "e461f56b461a4d5ce353c60889dcb99e10818985d3788440c6119bb145876277"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00495-of-01024.json.gz": {"num_bytes": 319528392, "checksum": "e530f3030ddbf7191bc4082e8209f63eb48733d7085d79a8469ce3611ccb79b9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00496-of-01024.json.gz": {"num_bytes": 317570766, "checksum": "ddec34b528bd5314019d12089e600df27e781d78f43b6722b9c0202ccf385755"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00497-of-01024.json.gz": {"num_bytes": 319154838, "checksum": "e7438a08000fc7a158f887755cc496edcf51c8bdf2bc4a888ddd2c829bf8fa3b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00498-of-01024.json.gz": {"num_bytes": 317955368, "checksum": "ad133d808ca5b6181bae1921ab1261d79630c09bf9d6c904db036f22e6f32e6c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00499-of-01024.json.gz": {"num_bytes": 318286671, "checksum": "cb40879ea08db5a9eb6f2c23756574bda34deb9acf039b992f0ab90fdbb01594"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00500-of-01024.json.gz": {"num_bytes": 318510936, "checksum": "21e5f7468a907f38c3dc0a5c19f09921476f9186beff967e829329f191dad6b0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00501-of-01024.json.gz": {"num_bytes": 319611074, "checksum": "38829434c8539bb9fa9ea32bfba3c6732c5021ffb60c16fc502fe61de83906ce"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00502-of-01024.json.gz": {"num_bytes": 318630954, "checksum": "22d1ca1edae179d2587495fcdf1d3e515c6f547cebafc54996c93a121731fd8d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00503-of-01024.json.gz": {"num_bytes": 318253198, "checksum": "e95689993390086880e630ec4540e0629551076c0cad2c70f5aedd3aebfec181"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00504-of-01024.json.gz": {"num_bytes": 319497151, "checksum": "0cd7b986d247e010fd76fa2ab2b62d5f9eec292b28c1e7bd3e4c577042b598af"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00505-of-01024.json.gz": {"num_bytes": 317498965, "checksum": "f1504912fc53cc3690e26ec3babf736ddbeb8f7d9196dac83f757699310b30ad"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00506-of-01024.json.gz": {"num_bytes": 319684193, "checksum": "9f6defbac132e097cbf7cb7d181cb154bace6af48964fe09d111bc610fdcd2bc"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00507-of-01024.json.gz": {"num_bytes": 318394726, "checksum": "a58f39d0bef19abefc089342d8bb6d75dbb2c663f67127673ec395404bcf15ae"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00508-of-01024.json.gz": {"num_bytes": 319013108, "checksum": "176443b39840826bfb1db2cef2541449a6fd0c465ff9bbf0cb2479f07fb8baa8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00509-of-01024.json.gz": {"num_bytes": 319832758, "checksum": "cce5a142cd7a121eba8c182d499442f4b0a397ea1484c33ccd79b1acbae832fb"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00510-of-01024.json.gz": {"num_bytes": 318762241, "checksum": "bfc910625f0fd6074955906bb86e789b0d0adcd1f8956cb8da276933dceac256"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00511-of-01024.json.gz": {"num_bytes": 319240643, "checksum": "ce53021b90d1c86e2d46293e7053aa174387d7408bf0cf907898be69b1a7befc"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00512-of-01024.json.gz": {"num_bytes": 318353376, "checksum": "e9333c6f73c30c9cb7f31794025eb9129455fac2edd64f8b3f22f879124c6a85"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00513-of-01024.json.gz": {"num_bytes": 317653011, "checksum": "d9450c6f541e82922b37d3b7cc25611707b44884f27825db4dbd65466b59e8b5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00514-of-01024.json.gz": {"num_bytes": 319391160, "checksum": "20b77f5fc2a939fc291f901e8774acfbf04ffaacb08192b724673eadc9f83c12"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00515-of-01024.json.gz": {"num_bytes": 317994258, "checksum": "32ca1f60d0deb395538a93ce5044a48fde05864f2c26af42dc53405b6dc05031"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00516-of-01024.json.gz": {"num_bytes": 318786801, "checksum": "eba4f34749eef4da2b0729abbdfa2ada77bd65383c01213d4f86625670430a65"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00517-of-01024.json.gz": {"num_bytes": 320010732, "checksum": "617765f971b879182db7debf879025f8dad4fd8846b11728ee1230767c031c04"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00518-of-01024.json.gz": {"num_bytes": 318681019, "checksum": "6987893764c56b84fca014532824a05d4187db5c313be4f7bdcb363b7e8cc8db"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00519-of-01024.json.gz": {"num_bytes": 319951543, "checksum": "ba151c4734db52e7c220dbefe380825ac6d66a9c6abb901b8096a87d97a2deb5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00520-of-01024.json.gz": {"num_bytes": 317948056, "checksum": "7e53ed26c3c068b0dedd026219b7cdab79775545ebbf31b5dadadb45364c9985"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00521-of-01024.json.gz": {"num_bytes": 317993802, "checksum": "4d1d4a5583430e373bd2cfd191e59cd8911953fbd73fa924e0c15be76499b54b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00522-of-01024.json.gz": {"num_bytes": 320189449, "checksum": "71d851498785e312acf93861a43169794d4d576f5fe8b960303419316c8c898a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00523-of-01024.json.gz": {"num_bytes": 320443871, "checksum": "587867d619115c2accb69322b197239b79f12de41ae80427fd369813ad8d81af"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00524-of-01024.json.gz": {"num_bytes": 318192840, "checksum": "7324c02db00b06d0f41d6e5ebfa4e4dd6554f5f4849d6de187ebb84162d0446d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00525-of-01024.json.gz": {"num_bytes": 319294602, "checksum": "24ae3495e5b59883967c62b8fb3a4fa7525d33c40957fd5fa3be413d66c24eb5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00526-of-01024.json.gz": {"num_bytes": 319783465, "checksum": "27cd95e7bc6a3f156f1f8f26dc5e490818fc4810562e3964a19fad401cceacd2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00527-of-01024.json.gz": {"num_bytes": 317240081, "checksum": "6b84920fe7e28c01a03800512915c7a9e47816267ac652f9ee0314e3428bca72"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00528-of-01024.json.gz": {"num_bytes": 318320694, "checksum": "fec06589f714ffe1343cb6781898e29e5d0cb789deba3aa4a4ccf86514d3f690"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00529-of-01024.json.gz": {"num_bytes": 318391515, "checksum": "a98c34c04c1b6f0ca3acc9e10fdf4bd0ead2ea7271832ce4972df8677590918b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00530-of-01024.json.gz": {"num_bytes": 318473966, "checksum": "1677d541c7bc10971c711f1eb030faa2e85e0967112ba57d7f04712908e4f040"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00531-of-01024.json.gz": {"num_bytes": 319463272, "checksum": "92b5d82a058554d3396a2b54504f45fa88581cb2951140c0f0bde67ed11bed0c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00532-of-01024.json.gz": {"num_bytes": 318228175, "checksum": "291bb3d7613f7f00b6910a0de78dbab0d87602243c9c83014de341c131200853"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00533-of-01024.json.gz": {"num_bytes": 318966937, "checksum": "a0ce39eac6d6ecad3478373c264e88b2ea20b77fb2049537c229ad3da2769c85"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00534-of-01024.json.gz": {"num_bytes": 318968162, "checksum": "387db79d4aacf8fa4c512fb78023ff94a43d5d597d5a8c2ec6198e62e4b8c98b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00535-of-01024.json.gz": {"num_bytes": 319253588, "checksum": "3ff8f4a926fdfb6201a94d75c17ec5afe662a339a65019eb5e1193c1238bd388"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00536-of-01024.json.gz": {"num_bytes": 319662526, "checksum": "0c805e83d8cfd979701df5714713d062e14853d7e2b0f77c0b414a626686cd33"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00537-of-01024.json.gz": {"num_bytes": 319177095, "checksum": "f9a0ac216e316075e5c2219449a954f989eb160ead2ca07ac9f3813274e18f2e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00538-of-01024.json.gz": {"num_bytes": 320109104, "checksum": "a425ef4dddefb40bac5a8cd3191161a41737aea5088a614410d10d83bbab5e37"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00539-of-01024.json.gz": {"num_bytes": 320600564, "checksum": "3580ea8da9c4aff1296e89136c5d7f1a37d021e0b10f3ebd1e05612c092faebb"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00540-of-01024.json.gz": {"num_bytes": 319993281, "checksum": "ad8dc83bfbe7c8976f08708c5f0229cd4e1a2d80e272b225a8d208133b129dfc"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00541-of-01024.json.gz": {"num_bytes": 318256020, "checksum": "c7452669237323fdd09ce97624791a0261f3ec07d8a5f98e71a4b1252a2805e1"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00542-of-01024.json.gz": {"num_bytes": 318843744, "checksum": "1e5a11c25f82ce717302dbcd9acc1f8b916d83eca88d345d8434b1f88768137b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00543-of-01024.json.gz": {"num_bytes": 320482002, "checksum": "bbf96edf50c913d5162ee154423242e7c8faf490ba229f325bac98a5e3eb9477"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00544-of-01024.json.gz": {"num_bytes": 319059260, "checksum": "22c04506b5744df8c71727fc6527fa2bc495a10a237c71762c66d09625d34097"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00545-of-01024.json.gz": {"num_bytes": 317874034, "checksum": "84a78bb62eb6f72de7a75325870d9ecd419f77c4f6728d29609b2f7ab1b8bcf7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00546-of-01024.json.gz": {"num_bytes": 319891407, "checksum": "28631c527dc398c9626fc60b39ad94ed880b41c71f55b9c7c670f6a1837f98d8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00547-of-01024.json.gz": {"num_bytes": 319361268, "checksum": "273b8598405def0165ceaf9723d1425c9b74368fc22a414616c7ac9327930225"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00548-of-01024.json.gz": {"num_bytes": 318360761, "checksum": "59990568c0ea055fab27f2b9cd028e1c7177df0479712d1e2d8372e9b017ccad"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00549-of-01024.json.gz": {"num_bytes": 317320452, "checksum": "fd1e361f28cf099df6088e26d06d79f7f62bd8bd89b4524b9baa80ea49a1a4a6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00550-of-01024.json.gz": {"num_bytes": 319017444, "checksum": "4424833afcb143f6fdbfc2f5fa2508d6226a4a1df391969b2a751d2d0070158d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00551-of-01024.json.gz": {"num_bytes": 319118159, "checksum": "77b78f94a8bc8f905cf8b1997df1fc3b8c6d77ce65fc28bef68c6083275a832b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00552-of-01024.json.gz": {"num_bytes": 320058125, "checksum": "e7b71167c4ad947232b6acba26e4d3cc9214c25b50b853b5745333bba942f50f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00553-of-01024.json.gz": {"num_bytes": 319220671, "checksum": "ce7891f3820ce065e3bd7afa006e90889428c80bd8e771d66fbbf023bb2a9eba"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00554-of-01024.json.gz": {"num_bytes": 318858928, "checksum": "015a707235f46f179a08d3f6674b6d368dc9612841e2bf39f700f11fef8e64c7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00555-of-01024.json.gz": {"num_bytes": 320490725, "checksum": "041dd2e902ed04dfa143476da03d5fd00c30ce1259c0658150af5b77a5a092c0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00556-of-01024.json.gz": {"num_bytes": 319863694, "checksum": "22e3d9e4dbdf2b1b822a7bc8c889f4747aa16c71f4c91436d028a228bffe4b87"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00557-of-01024.json.gz": {"num_bytes": 318940362, "checksum": "4cb8b113ad9687b7dee590242c5f50fb3ea3a8775c67492a8ce0cb5c15fc26d7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00558-of-01024.json.gz": {"num_bytes": 319797786, "checksum": "ad157a34c6a8d496859f55b00c79fcedf7305d8502ca86a511026f39cdcaca59"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00559-of-01024.json.gz": {"num_bytes": 320156705, "checksum": "816d84753b71fae446428587f41de5b3490e88321f1fa0cfa2ef1fd5eef851e5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00560-of-01024.json.gz": {"num_bytes": 318346216, "checksum": "0b1b3d26316f2c0e973ff19820793bcfffa957c3869f74f62fb40cb6839227e4"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00561-of-01024.json.gz": {"num_bytes": 319571572, "checksum": "4f92594382c897bf94211f1446dbb38c2cc1fff3647acba731dfe0ad89ba4061"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00562-of-01024.json.gz": {"num_bytes": 319453711, "checksum": "2a6ba0c64806add776081f417c8d1afdb324dd8b9aebb603372afd7fc2c4cd6e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00563-of-01024.json.gz": {"num_bytes": 318990092, "checksum": "e3032365b9b86883c24bfe387d810c2d9fd1d0a55ff88acd1f5b5357246b13ba"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00564-of-01024.json.gz": {"num_bytes": 319491917, "checksum": "da6196ab8650fc9f8fa391b821ff070070946412277bd423c40d9fa1de325f93"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00565-of-01024.json.gz": {"num_bytes": 318756269, "checksum": "edeb5b13aa0d65354d78a5ca5d1698732e95f1fcba249c42825a0351d4a34f79"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00566-of-01024.json.gz": {"num_bytes": 318461036, "checksum": "f179addbca50d8612612b0e09138d7ecc89ba7ef2d6e857d7ef0b10223dc71d4"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00567-of-01024.json.gz": {"num_bytes": 319625728, "checksum": "eaa1d0ee28eb17c6ebe3d85c8af8b7adac28a720b2975f86ac83f3f4d2bffbcd"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00568-of-01024.json.gz": {"num_bytes": 318428567, "checksum": "3677e88545f2d76b601995cc3e2b6b12fcf65e350ed7eb4137ab4beef3d475c4"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00569-of-01024.json.gz": {"num_bytes": 320114923, "checksum": "2d8810d8bcfc0fc19d82313be6516b2fef4cf68f56b0448af48b512c98e1ae8c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00570-of-01024.json.gz": {"num_bytes": 319148416, "checksum": "8e5356dc0fa2b4e5fa16b36a1586f16920306af1227c765e5d2f0818e74d30d2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00571-of-01024.json.gz": {"num_bytes": 318223973, "checksum": "c87cf8b88e8e4fc0a664f4b3a381b78b317680253a83a672cb86e02adb43f2aa"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00572-of-01024.json.gz": {"num_bytes": 318322508, "checksum": "2bdc857dfeab99c8f83f0267ed5ed7529bca8ee086fce268534bc0264ff738f6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00573-of-01024.json.gz": {"num_bytes": 319203246, "checksum": "564fc77dec25ce0d47f4e3d8d04bf114dc06119b28b3ab00d6092a799d496e51"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00574-of-01024.json.gz": {"num_bytes": 318397937, "checksum": "dc3f206e1b5da963184da72e47959844bb164335c76e3261f3a189a4b7b022cb"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00575-of-01024.json.gz": {"num_bytes": 319183651, "checksum": "7f0c46955e37d5d52b305f71b4ce4fca5368d72e8698e8b832ac0177f868e145"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00576-of-01024.json.gz": {"num_bytes": 318690625, "checksum": "b37d0fbd439bdc05021a71c192ce5e61ebce27448a17819bb53156d9d5f27e17"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00577-of-01024.json.gz": {"num_bytes": 317926085, "checksum": "3092d1ad70fb2d262ecb33f3fb6ea554af3ddd26498ba42b644c383f6d4bd1a4"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00578-of-01024.json.gz": {"num_bytes": 319190472, "checksum": "d9833fd591a618a167b31b7aaca420f3e719ded98987dbc0f46fd4bfd12564c5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00579-of-01024.json.gz": {"num_bytes": 318958744, "checksum": "a11217af10c85ad828de38847eeddcde6af6899563585d581c20adaed3c9e7dd"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00580-of-01024.json.gz": {"num_bytes": 319893900, "checksum": "71e8be705bfa8563e33392d1c14decd84f52d6a0139b98344f1a0ed9bdc94198"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00581-of-01024.json.gz": {"num_bytes": 320109861, "checksum": "c5f13ba973803ef069762d22bc37ee02a4348af379c75848d93b2685fc4280cf"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00582-of-01024.json.gz": {"num_bytes": 319238177, "checksum": "da815527ca68b5c2ed604d00ccbcc7c631c60f33e3132f79212634a82c266844"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00583-of-01024.json.gz": {"num_bytes": 319375634, "checksum": "a332b791df0801f0b7227117f0ea3971563e8e420ae24dd94b38d532c1ab0573"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00584-of-01024.json.gz": {"num_bytes": 318596018, "checksum": "e6496d31f42921eaf9f85047e7c2eeb5fef46e01e99760fa676da96481d7d5bd"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00585-of-01024.json.gz": {"num_bytes": 320156294, "checksum": "08b978ec05d65edd22c301ddc6ab44174eeb7bef5c5997a84342b6faaa47a79b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00586-of-01024.json.gz": {"num_bytes": 318716838, "checksum": "567ce600ad99e543507fdf27b9009fe1782bc867f44f3dabbeb93fab1208f337"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00587-of-01024.json.gz": {"num_bytes": 320247814, "checksum": "8f5c82f5eaac4a315d8615c9700cd81f3b9c2e1a17376d3b2482f8694dfe2492"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00588-of-01024.json.gz": {"num_bytes": 319546079, "checksum": "bae91422f87091b3974ca92781a14fae8f10c5c41de9c9132f745b3dcb8bc468"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00589-of-01024.json.gz": {"num_bytes": 319771959, "checksum": "babb615d77f80e5ef99aeed3889a26cef5c9918a7fe68b70a503815e69b0b189"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00590-of-01024.json.gz": {"num_bytes": 318926571, "checksum": "61f2ed732f3b2b5e24882f47b4eb84fea28bf89d112f6f173cbb50523a43c4b8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00591-of-01024.json.gz": {"num_bytes": 319669791, "checksum": "3aa2e792ec775a52ee78447b81204867e58b0a46727bab4b7974977aaec2889d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00592-of-01024.json.gz": {"num_bytes": 320393142, "checksum": "1419c263fb74409cb0e39ebd87b1c020ee6863a3a6f2f427be27d3c76b84043a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00593-of-01024.json.gz": {"num_bytes": 320977171, "checksum": "4f16f33217c35a2b155d5b6fe8014c2e52014e63c419e7d3aaf71a35246c1323"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00594-of-01024.json.gz": {"num_bytes": 318211092, "checksum": "c9301ddcafea22d085ae48f551f486e73089a76c7990871f787064c61e4e60b4"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00595-of-01024.json.gz": {"num_bytes": 318978629, "checksum": "349e104763320eaae96ac3bc53c5fa7a73e7dec93b8cc3afaad108a97e7c170d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00596-of-01024.json.gz": {"num_bytes": 318573003, "checksum": "0eb6c25cf57764ec3aa7f74d6d967c52003f872f2f3b140fe6d5ac6360241a8a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00597-of-01024.json.gz": {"num_bytes": 318931514, "checksum": "b42b7b984aad729185ca9b3a6ffa856b2a79165ce2feebe519b10f8ff42c4ab9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00598-of-01024.json.gz": {"num_bytes": 319002677, "checksum": "8306c5971408767b3735288fd0ee7ee7d01d9af4ef4cbec2e57c97b1f78e6d63"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00599-of-01024.json.gz": {"num_bytes": 319637870, "checksum": "844df34f2a263011f9d1d85eaad5a1d95243769e9cec5a104807dd55e1fe431c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00600-of-01024.json.gz": {"num_bytes": 318099852, "checksum": "b05e66568a4472feee31f20918e9813aeae2d881f47b5281ff29fbcfedf4d5b2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00601-of-01024.json.gz": {"num_bytes": 319136069, "checksum": "8dff2d56c9915d73e6154533e5de0ca9d867c5fdedcfeceb3e0ab22f3ba509cb"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00602-of-01024.json.gz": {"num_bytes": 319369121, "checksum": "45b2c1757260395afeb168b545892b315fa0bf14b3d144bfcab1fdaa6d79086f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00603-of-01024.json.gz": {"num_bytes": 319499076, "checksum": "46edc9f556ccae692900b222b8e4843360dd5dbe0798a8ad9cb51c07a451dbb2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00604-of-01024.json.gz": {"num_bytes": 319132921, "checksum": "0cba8c8738ea7ff9a08bd1bab215010b03c6c83fe35206d83344d78005bdee6b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00605-of-01024.json.gz": {"num_bytes": 319315562, "checksum": "0dc0d37658fd672c8d72775bd8855dce9037cf9715feda35a76afb1f0e87bebb"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00606-of-01024.json.gz": {"num_bytes": 319223528, "checksum": "f679e437a3acda1a81013dc0f3fa93fde6c3309905e8142f8699a76bc04b7114"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00607-of-01024.json.gz": {"num_bytes": 319326218, "checksum": "7fe91f86f751b9aa3abf1c5ed0fdab89a76c7fa4eb7ab8b809ef29b0cf4a78d9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00608-of-01024.json.gz": {"num_bytes": 319393715, "checksum": "a5daf706100eb797b5b0770fe0c790856637b22dc849aeda5b445ae5fa63cb3b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00609-of-01024.json.gz": {"num_bytes": 319554192, "checksum": "4434338fe97d398d9565ae940c62539e868fa261be361ede1b5b0feb004160f8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00610-of-01024.json.gz": {"num_bytes": 319786301, "checksum": "6b0d0e0457a721af6c67a31f5016432011e717302cfdc7ee39feb253fbae4754"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00611-of-01024.json.gz": {"num_bytes": 319356910, "checksum": "bfe201b1775270afef3a09fcfc074920cbb01093eef90d46f26b6b813d603994"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00612-of-01024.json.gz": {"num_bytes": 318780229, "checksum": "29248c4732fdfda2ba97ed38192ab391457e20fd70f713ef4a7cf084f9865846"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00613-of-01024.json.gz": {"num_bytes": 320190496, "checksum": "f5cb9be2442797d967b9041e48771196a6c0595933ef2102840b704e355f4d62"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00614-of-01024.json.gz": {"num_bytes": 320245862, "checksum": "89b74d0daea02fb69289ad259bbd0ddb1a64c5d6380848f7d51669be952f8a0b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00615-of-01024.json.gz": {"num_bytes": 316874605, "checksum": "78600c8703d5ebf80c99c089bb7a7c1cde843a66d706fd219eeac304f80e8525"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00616-of-01024.json.gz": {"num_bytes": 320237707, "checksum": "630ee29d4dc4cd5062eeca7877e5c1b204b36eb0b3aeacadf036cdb75c1ce840"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00617-of-01024.json.gz": {"num_bytes": 319739365, "checksum": "d418fd284d06b1d2d9daebea3047ed06286640ac75d23893f1effc2ee9d7aa14"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00618-of-01024.json.gz": {"num_bytes": 318634299, "checksum": "f5d75d129ab6c0f052028cf0139c3cf20eed3a9c5cdb151cd88ae42d5d1a32d2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00619-of-01024.json.gz": {"num_bytes": 319086471, "checksum": "c558908f6e08b0d02f377c9aed1655d80106f4cfe26e955774bb420d19b2f74f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00620-of-01024.json.gz": {"num_bytes": 320665446, "checksum": "977f959e5b5eaa24081ce025d137647fffd65f1a54d2c45db9805a232e0c0364"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00621-of-01024.json.gz": {"num_bytes": 318576410, "checksum": "d07f3c31d7ec1c71b5ab9539a2ed49f6d5f46b48ee2e51800b9e28cee588a163"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00622-of-01024.json.gz": {"num_bytes": 320053075, "checksum": "58b897603eb83f789a1cfc6bf40a091093cbd8a0c20702018c411adc7b07a437"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00623-of-01024.json.gz": {"num_bytes": 320045187, "checksum": "3665d7579b3c57eb21ec9e55850e39307cc6f4ef8aa8b9937076ad6f142063a3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00624-of-01024.json.gz": {"num_bytes": 320136842, "checksum": "35db069ae090e95c5a4d3db44eae73bcb29463c120584d7f6ccbe235983c5fef"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00625-of-01024.json.gz": {"num_bytes": 317314201, "checksum": "7f6ddbbc8815e8bd10c99361fd8113cbbd84ebd92799eb6958cf98af825d2aa3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00626-of-01024.json.gz": {"num_bytes": 320219970, "checksum": "4e2c46d1e3a94957717bbbf1e1e4300bd27ac17e588d426e0ba688983e83f4e6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00627-of-01024.json.gz": {"num_bytes": 320083102, "checksum": "851ce6dfa6a4d1a4e3b8bf439e36db9ceb59eefc60558d429e2fec80655e1775"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00628-of-01024.json.gz": {"num_bytes": 320386844, "checksum": "86d8927f16d0790a07d6c68e745501188d13887df4a137e937ae00497d07c055"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00629-of-01024.json.gz": {"num_bytes": 319476643, "checksum": "c48cff721137b641fe9d5bcf30462c7e4e3a3ae631b7b4e39979c8c77f0890ae"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00630-of-01024.json.gz": {"num_bytes": 317961579, "checksum": "cde626b34c6c8455227fbb18a577877b518f529b6c8e16881cfdf334f2875cd9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00631-of-01024.json.gz": {"num_bytes": 318952266, "checksum": "0401582821f7b15f0b406f7ce00c56351b8e86a3c3282bdf4dd45b2f6146ea22"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00632-of-01024.json.gz": {"num_bytes": 318261820, "checksum": "be48396ef18ce0f3650eca86eb36039f90b51737f9848086494f34fa28d60e70"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00633-of-01024.json.gz": {"num_bytes": 319748854, "checksum": "9d5c342d82fcace21de2900202c3f2af47229aeae9d487a8b77b7f5b86c05f74"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00634-of-01024.json.gz": {"num_bytes": 317806530, "checksum": "00a70705afb91f6570d17257057c15b45386597b917061686f131bd41ddce421"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00635-of-01024.json.gz": {"num_bytes": 320313573, "checksum": "22a1286582d65975ed94f0ba25bf87e94d52a55214d0a51979a3e0fd9f95e3cb"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00636-of-01024.json.gz": {"num_bytes": 318151690, "checksum": "026c699ac6fa30f9e156a957026d8fa8df72daee3407c8fdc5e0bd7d6a3b50fe"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00637-of-01024.json.gz": {"num_bytes": 318665365, "checksum": "9bd931dfc074bc99df31d7fd31a5ac1dc8c8bc75f8e87b763545cd824edcdcbe"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00638-of-01024.json.gz": {"num_bytes": 318521250, "checksum": "4b30ad531f7502ef7bc6398ab286e5c6c63d340c22792da9258ea95b496d1c0d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00639-of-01024.json.gz": {"num_bytes": 319997068, "checksum": "2bfdf36396e49ff625138d29925f54eb12b18d35f6d0bf5ca9e79194977cfb43"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00640-of-01024.json.gz": {"num_bytes": 319355927, "checksum": "d0d0ed7304b5d79318b5230a1ab48d3ed03183f1eb11d96070604a7008cd7b30"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00641-of-01024.json.gz": {"num_bytes": 319002081, "checksum": "1461ecb6b92819bfdc12808a5442d70f94538931f856c91dea602a23ba86ab98"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00642-of-01024.json.gz": {"num_bytes": 317689465, "checksum": "aa0af0169cf13db1f8133e8d76afeeae5f71d63d179794377a55b6c2eb938dc8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00643-of-01024.json.gz": {"num_bytes": 317523344, "checksum": "5c060166e776f8efda48882c118dc0fd5e058d9ef40be578bad31e477114a16e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00644-of-01024.json.gz": {"num_bytes": 318876813, "checksum": "ad98ee119742cb8a6efa1be46e9670969397c7bde10049886d7d6fceb82387ca"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00645-of-01024.json.gz": {"num_bytes": 319981258, "checksum": "8930ae8e14c124218793d2fd1bbfb1b624e918cb092b21c6ca74347abd9dea4c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00646-of-01024.json.gz": {"num_bytes": 319624889, "checksum": "a40705c4f9a4db4d2d698cf96e43b99fa0790b886506300eb4986a26de7063e2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00647-of-01024.json.gz": {"num_bytes": 319240920, "checksum": "7129182faeac82b47127458e92903a209acf8272166024e8313c167d6f358456"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00648-of-01024.json.gz": {"num_bytes": 317305623, "checksum": "3124091a6c438fecbfc948b1a35ffb1462287ae06866b02a6dbb1a6651ccf1e4"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00649-of-01024.json.gz": {"num_bytes": 318998755, "checksum": "fdb286cfe9e9091a57b31be61a56a425fae07d6b44f0b45f8743d7aab0e980dc"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00650-of-01024.json.gz": {"num_bytes": 319612451, "checksum": "ff88c4310f049344b8a3f701bce12d08ef5f9b037e82fef7f1f670b3d51e59c2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00651-of-01024.json.gz": {"num_bytes": 319098081, "checksum": "9c3b1843082aae39b057bbc7364e69cbc39bbdf91d5bff4f52b12cf1a264adf2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00652-of-01024.json.gz": {"num_bytes": 317107981, "checksum": "e6199d12a893ae5d05c5388ae7a679df419ef6a050c8e3ce3c15fe534943a774"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00653-of-01024.json.gz": {"num_bytes": 319623884, "checksum": "333ac93cf1f1f4da0f72c5e57b675052453b42dffe1e4d45ec680f4e3e075d97"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00654-of-01024.json.gz": {"num_bytes": 319055728, "checksum": "1efe352f2f2eba826231a5bff6c79390630b44039b226a5041a087e116b60f5e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00655-of-01024.json.gz": {"num_bytes": 318539829, "checksum": "613c741cfb738017b3fa233512296d9127d661738721d3fccd806aad54d19d84"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00656-of-01024.json.gz": {"num_bytes": 319970377, "checksum": "51fa9b217b6bcf664c472cc2b258813e1f1d7a0f501c29b822221bccafa4e201"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00657-of-01024.json.gz": {"num_bytes": 318548629, "checksum": "c542c6fd2f3284d64f8d53b71ab8308bbba59f7f13e9d9eb20bbbaf13ad4782b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00658-of-01024.json.gz": {"num_bytes": 319845984, "checksum": "b3d8fb6ed2258c463367108e2942742e88eac657c859cc8d128035110fc87e7e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00659-of-01024.json.gz": {"num_bytes": 318887872, "checksum": "02feb4e03020d767a4468251786d4857d5dc833969626bee616c7882bfda9ce5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00660-of-01024.json.gz": {"num_bytes": 319854892, "checksum": "a997d9187a185a29fb3bbeb1e696d32898efba8f5e9d6ed816493669f0c5ec02"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00661-of-01024.json.gz": {"num_bytes": 317599289, "checksum": "86d9189ebc534c99da5a4407624a623561b159f758fb04373a270887d0b45709"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00662-of-01024.json.gz": {"num_bytes": 318138720, "checksum": "9c626f7aebcc4fc9afd533b6c8a372d884d01f508ce49c01ddd830e4e9e8b2d0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00663-of-01024.json.gz": {"num_bytes": 318110835, "checksum": "441d4dd0d5d2ea7b6098a3fe006b9d7afd526188824a3325d44538fc5655942c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00664-of-01024.json.gz": {"num_bytes": 318996945, "checksum": "08ab0739c3565643b6a83d7091936f5d75a4d8418c956146114aa0315f205dd0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00665-of-01024.json.gz": {"num_bytes": 320612903, "checksum": "1ab7bc2d0f7c6704c97848a9325015f06228339bc52cc1fb593d9c56145e7c48"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00666-of-01024.json.gz": {"num_bytes": 319241006, "checksum": "8b1213325ceb2a2c89dffb891a31317e903d08fff911e4ba1ae66fc3bcce9973"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00667-of-01024.json.gz": {"num_bytes": 319650665, "checksum": "14676f97937eb3d0734e5f121c5f63002ba2d2c62b6c41b4b46d2fcab9ea9614"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00668-of-01024.json.gz": {"num_bytes": 319198651, "checksum": "a406fceed5b7d17ff6d5773679c3df50e747215e39926228ddc9a60c6bf9d152"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00669-of-01024.json.gz": {"num_bytes": 319363200, "checksum": "1d3267d77f43d3d720dcd79c40bc3e8c0cd777d421b1b7d0e69e140199e34552"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00670-of-01024.json.gz": {"num_bytes": 320079826, "checksum": "85111c229b8fcc8428b3c13676bde8268f027fe06e1f576a3adcd82bce1603bb"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00671-of-01024.json.gz": {"num_bytes": 319494773, "checksum": "eeeed8d9f63a5c16ab9d62454fae5bef1896973cfa69cedfcfaac4565a793b27"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00672-of-01024.json.gz": {"num_bytes": 318304853, "checksum": "6793ec3ffbc147c36e471e1c06a664ac2143408c9ee46305694708eee0fb38cb"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00673-of-01024.json.gz": {"num_bytes": 319031236, "checksum": "3c886ff71973805a59312d8d43ee9e616bcfafd76c03a64d53ab548036b1fa90"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00674-of-01024.json.gz": {"num_bytes": 318647345, "checksum": "fd7f4efc0c8af611e7e137680342843d0471ca072421ab3c172a169ba2f5d217"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00675-of-01024.json.gz": {"num_bytes": 318313871, "checksum": "3b797b2ad717749a24866a97acb95aace0dd4e91ee7d51dcf1fdd46a9232b794"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00676-of-01024.json.gz": {"num_bytes": 318858652, "checksum": "2ccdf652fd413dc624643d35a76223e8a44e6241997841ec2d13ae11b56400fe"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00677-of-01024.json.gz": {"num_bytes": 319236091, "checksum": "bbf069c696f09e5467b17ba98479948a85101efa776094084e37581e72c01123"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00678-of-01024.json.gz": {"num_bytes": 318996096, "checksum": "3e3dd21861c713bd38d1803c32da1c0bc2496899648b4cffe1fa2e61b35ca056"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00679-of-01024.json.gz": {"num_bytes": 319915466, "checksum": "6ed56468a31564cb25668ceb5df325ff7138dd231afa85f676ac7af5e81e0642"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00680-of-01024.json.gz": {"num_bytes": 318537417, "checksum": "959ce407e7a892495c477b9e0071dff496fd20db9cfb04dd035ac59dd5b2f309"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00681-of-01024.json.gz": {"num_bytes": 320181225, "checksum": "0aa77d778f24bfdc8566b390a7a1ef1d7880a42b98b3e82e9b37ee3ed821a8e5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00682-of-01024.json.gz": {"num_bytes": 319087756, "checksum": "a4da802570ee7bc27e752069612b633edf226078f48d5f55280f73a6dc934127"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00683-of-01024.json.gz": {"num_bytes": 320019766, "checksum": "587497efb7bcd4ca85ec0559e372ea285c1b95e3889d406f142cfe454d8e0e2f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00684-of-01024.json.gz": {"num_bytes": 318814245, "checksum": "6e904f73976ca18aed3375d1c1b308d749b9a4405a333dd0a2cf85360822e205"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00685-of-01024.json.gz": {"num_bytes": 318586686, "checksum": "c51012772c5bae73821b67f72c035f22a40725d42bcf51e439bbdfcd84393ef2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00686-of-01024.json.gz": {"num_bytes": 319648436, "checksum": "890b7408abd0cc04a84be3a3992d05714dbd30a9d33a8a9b05316a980fe51313"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00687-of-01024.json.gz": {"num_bytes": 318909835, "checksum": "b54b20c21ae9834b630a8aac057d47069cf137577d30b91fd1475f5824b61561"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00688-of-01024.json.gz": {"num_bytes": 319381735, "checksum": "422091d5ba0d44c64bb0c84ab4757318414bc01455a97f53190eddda89c2f3f4"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00689-of-01024.json.gz": {"num_bytes": 318995026, "checksum": "ad5080fbddc914c649027d5e2214f1d75e0cf0617eb3ca0b1fdb8ed9129f99cb"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00690-of-01024.json.gz": {"num_bytes": 320745318, "checksum": "d45492346bb4bf519e657356ecf1805b6b592683b98c20c93da2f07c50b06092"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00691-of-01024.json.gz": {"num_bytes": 318575084, "checksum": "43a07e8a98bc99f381558c938fc83acd4a37d565459c0f3f83aaadda816f66c8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00692-of-01024.json.gz": {"num_bytes": 320651368, "checksum": "21a790ef1dcc9c6ffa071d1a2e21e330d6afcb45368dde9cfae8933c6d029742"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00693-of-01024.json.gz": {"num_bytes": 318429145, "checksum": "85558018ee61e33c4f3e05acc2029e69447a5717be880e9a0aa8fa715dbd0c05"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00694-of-01024.json.gz": {"num_bytes": 319562061, "checksum": "894f4c906a33c644ea80c3a00155ced807a62e1bcd9f6e254cb6c88efeedd142"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00695-of-01024.json.gz": {"num_bytes": 318298964, "checksum": "06eb05f651f1d2fff495c48475894420334070df10c051c7253b7afb0bc38291"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00696-of-01024.json.gz": {"num_bytes": 317473664, "checksum": "59ea4f951335553945a644f7628403ba1a99a27e0d93fcfe5db18cbc3dd48ce9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00697-of-01024.json.gz": {"num_bytes": 318839008, "checksum": "f0203b0f2caa3287b8f7a64288af52bafbf033bcdf31dae54e501e4da47b9935"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00698-of-01024.json.gz": {"num_bytes": 318288032, "checksum": "fe2a581cd174429a81424e407aceb1d81b61d9796d74db4590327778fbd5016b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00699-of-01024.json.gz": {"num_bytes": 318696527, "checksum": "edf3aabcdb28fa2feb532b3bd55cd167c2200a6d8e19f05152be194e48acf87b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00700-of-01024.json.gz": {"num_bytes": 318900366, "checksum": "67d89417d1440afeeefd59a0993e4d12fb5731e917ec7f4e65d9319541b4b9e9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00701-of-01024.json.gz": {"num_bytes": 318901212, "checksum": "64d302459e6871325282fd890d2922cb1fb25b47d677ce793bc065acc8d1bd07"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00702-of-01024.json.gz": {"num_bytes": 318913325, "checksum": "f0bb360189166a0bd717bad85edf06943333b1854687839864aef3ee02814795"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00703-of-01024.json.gz": {"num_bytes": 318730274, "checksum": "c4e027079b9cf9b1adae3e285c5cc5dafeee5c74cf3621c424b6df9801d508f5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00704-of-01024.json.gz": {"num_bytes": 320112232, "checksum": "37540f6a00523cbf429764893aa15aae6a57e53c89cf51d82a815feef02b1210"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00705-of-01024.json.gz": {"num_bytes": 319643559, "checksum": "9dae018569fa4bf33674f67ba03732a2f85cfceb53ec2cbb9457eaea607b8dfa"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00706-of-01024.json.gz": {"num_bytes": 319941519, "checksum": "03926405dc629f0664a3d27c700a4fa2f606496f0b52a9bbf2fd2d75faae2f46"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00707-of-01024.json.gz": {"num_bytes": 317628508, "checksum": "fac92295e4c85f087d27e0a6f231d782be7b2448e99cfc42c09c0e1e20964c3f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00708-of-01024.json.gz": {"num_bytes": 318863059, "checksum": "39d4880d3e47e65ab6351e94b015810d66295a86a9f08534260ccbef41fdaf04"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00709-of-01024.json.gz": {"num_bytes": 318412651, "checksum": "044fc99a1307737bc8d6d8a9b67997010309fc695eda6e8dd42e5b6bab2256d1"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00710-of-01024.json.gz": {"num_bytes": 318631334, "checksum": "0b2c93cf298051864b8660e57182b38408ad738cf930afc09afdde26d952f819"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00711-of-01024.json.gz": {"num_bytes": 320587866, "checksum": "f1f6bb9770b76742d0131495879fa38ed8aebe8a0b38463e7834f0697f174ede"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00712-of-01024.json.gz": {"num_bytes": 318191204, "checksum": "b6873a7d375aa29ff39ca17c3bbc7e328292b1671b59a35e7b01c0e992da90f6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00713-of-01024.json.gz": {"num_bytes": 319472539, "checksum": "3bb12a0a806ecb8a5eeaa00188c655f399460609b8a19005a7141bbcb3a7a694"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00714-of-01024.json.gz": {"num_bytes": 320196397, "checksum": "ca6e1fa6f27c9dbadbbaa767fd21dddee7c84ca96bbb6735640ba2631668ad0e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00715-of-01024.json.gz": {"num_bytes": 320075706, "checksum": "1a773eec7d738c0e1e253bfd4533f0c43c0d133e564c3458159e0c47d767689c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00716-of-01024.json.gz": {"num_bytes": 318736413, "checksum": "c17a6b2115e56cc3d6bbbd94e8565fb14287057f80199528e6cba20adf557bf7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00717-of-01024.json.gz": {"num_bytes": 317351537, "checksum": "cdba391e16c3bcb5569d978a8d11518103e7687714710ef4eba4f7c0821d67d5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00718-of-01024.json.gz": {"num_bytes": 318017965, "checksum": "a25c494e4baead0af0afe6eabaa054bc15f80b6ca0ac8dadb1b354d72ffbe63b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00719-of-01024.json.gz": {"num_bytes": 318124432, "checksum": "94f5dfbec85a8c5b22ff1368a16ec2eb7fb4be25c0c8f004096156ae40bfa2bd"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00720-of-01024.json.gz": {"num_bytes": 318235852, "checksum": "c0248326e698599dcad01eca25d747c138881c61b5636ba765b21f9cd0df996a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00721-of-01024.json.gz": {"num_bytes": 318817834, "checksum": "c11df487a966e748cec522fae4ed76abf3e8cc9bcd28c301117fa52ddb83dc6d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00722-of-01024.json.gz": {"num_bytes": 318553851, "checksum": "63d3d0c3f5dcdff29a0a6ef41e3a9df3fb505c73c8554839e3032293a78bae2e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00723-of-01024.json.gz": {"num_bytes": 320174720, "checksum": "29c97bb8ff301080547255af29bb5019a2c1fbc74f0a2711e626461d5a5f0b54"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00724-of-01024.json.gz": {"num_bytes": 317805413, "checksum": "65f8932f3c77b0fee5f2224643a71ff95246720368fe66d45c22df25ea4b9c2d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00725-of-01024.json.gz": {"num_bytes": 319460597, "checksum": "dc785a8aa3a1f4ed77512d51a9139dfb24b356b5499ae67dd5b860101b1e0e4b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00726-of-01024.json.gz": {"num_bytes": 320934004, "checksum": "45d857536d3535d08cddb6cf50d08d89cc28138a5be082465c3a8c27c02ae2bd"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00727-of-01024.json.gz": {"num_bytes": 318393879, "checksum": "e4a02e43eeabbecb81b971f4201212104b6214078cafd9500d5b5f323595f060"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00728-of-01024.json.gz": {"num_bytes": 318826577, "checksum": "cfaa0d0c8dfb333899c73e0c2aa00dfdadd00e5b4a3d477e7518c4141899c8a7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00729-of-01024.json.gz": {"num_bytes": 320390067, "checksum": "528fe99b0c8dc917ac0f02a555603f9ae81e690b4ce1040f65ebbad3390c0426"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00730-of-01024.json.gz": {"num_bytes": 318156386, "checksum": "786e6913b4417a87cd4cb1882e181d8b2e1eb4b4db5b4b9ad2120b5efdf3e2ba"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00731-of-01024.json.gz": {"num_bytes": 320013543, "checksum": "f28fc2794c280fc1de263b9b2a81e42423f8dac3af7c4fbd3b3aff888821ca9f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00732-of-01024.json.gz": {"num_bytes": 318753697, "checksum": "69491eb25dbaef78235f769422e773de7a2578e678ecde29dcaa663f4ebfa78d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00733-of-01024.json.gz": {"num_bytes": 318640706, "checksum": "dfde8960d738b873bcb75abe1661fcaa096d70c76aef21846b173b8adf049bbc"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00734-of-01024.json.gz": {"num_bytes": 319447398, "checksum": "145add76dcd73916b548e7e3b161757c1bdc1f22a0f127019f24827afd6f85e2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00735-of-01024.json.gz": {"num_bytes": 319868149, "checksum": "dcd4ba95672630f89e75b70dc08cb918bbe896f5d32ffeba7d3e4921b27c1f4d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00736-of-01024.json.gz": {"num_bytes": 318404586, "checksum": "4710b1569342b7aa7ca610d8b8cbb2248a1c5fcd8c6ab3b7f875657dff4779cd"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00737-of-01024.json.gz": {"num_bytes": 319915151, "checksum": "7091dc758fd14c206514663eed0ae446178ff38e76c4cb7e711c63d419506e49"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00738-of-01024.json.gz": {"num_bytes": 319709793, "checksum": "afe1a96ced49662b14bc60b4ff8fc1f610bbc6f3c515bb73f2fade7a0ba67678"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00739-of-01024.json.gz": {"num_bytes": 319789716, "checksum": "9e2332cfc994483d4b913c6556ca9c1698b95e81033b7bbc5a4f5271e5cce708"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00740-of-01024.json.gz": {"num_bytes": 319102226, "checksum": "61ddcc3af919b753638dd46f18f790d7783cdc3090dfddbbeb40faa93bed340e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00741-of-01024.json.gz": {"num_bytes": 318717589, "checksum": "aa3038c23a37561f2ba92e95ffeaa3e3641c1a69f8688b724116edd128e9ba52"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00742-of-01024.json.gz": {"num_bytes": 319456536, "checksum": "ea9d23abfed6e3e8ab900291a3bc1faa27751ff94e35378f8c4eb07207036a9c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00743-of-01024.json.gz": {"num_bytes": 318641730, "checksum": "6efcec6cd087be4eaa98491e463d0fb9c1253aca275971de08c56a20be9aa579"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00744-of-01024.json.gz": {"num_bytes": 320264992, "checksum": "71653351253c8f7fa18673a3f956bddebd158978708c5a4c9e9b5318f598e1f4"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00745-of-01024.json.gz": {"num_bytes": 318665967, "checksum": "347dfd824d6f4afe58c6f418ab5d332909038c880f4dcda7f774d3d7a588c3f3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00746-of-01024.json.gz": {"num_bytes": 320005833, "checksum": "812bc3c082e3a65c8c77fc7767bb435f9be9a999961d84eadc9e0c602e5ce168"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00747-of-01024.json.gz": {"num_bytes": 318575441, "checksum": "a4414d376c69ae8dd5e60b206315cf920d5a797c6ef7c08fe0c4b4e28b4eb4ef"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00748-of-01024.json.gz": {"num_bytes": 319266882, "checksum": "f08aee694b85d5e7120652350bfafaa05495e609aa6d2fb0b913ed8a718d7dcf"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00749-of-01024.json.gz": {"num_bytes": 320205042, "checksum": "b3402b16a5cc817d89a19fd3456a50b5b6d5f3f555eea725167558cc85366d12"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00750-of-01024.json.gz": {"num_bytes": 319198252, "checksum": "6b95232f6d53cff8045bd5ebaa87d6e6c511a74dc646d2a960eb87e801ff4f2a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00751-of-01024.json.gz": {"num_bytes": 317855407, "checksum": "badc9d82efdbc8db5dc328e8aa5e80155c52f00b105b136d8c5c948fe237d61d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00752-of-01024.json.gz": {"num_bytes": 320283992, "checksum": "67c32eb497533d6fd20b206c38483d171275029ff525bba3da13b0c62e1ef073"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00753-of-01024.json.gz": {"num_bytes": 321030653, "checksum": "5e95b1cb54d7d7f12bec1559ababcab0c364a0af99e10a42a08357647ef5d3cc"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00754-of-01024.json.gz": {"num_bytes": 319059779, "checksum": "32cb59ad16dfda8a5b52615498fe2e6d85753fa44ab667af2f525a2467508da5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00755-of-01024.json.gz": {"num_bytes": 317737268, "checksum": "0ad2fef2fe37d59b163e29c2287938a768ee87acc34752394809295d0710c602"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00756-of-01024.json.gz": {"num_bytes": 317293218, "checksum": "db737ceace329fb1f8fe1aca38db048a1dedcb5226a4132485f26afecdc6c3c8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00757-of-01024.json.gz": {"num_bytes": 319529375, "checksum": "8b823e97964894189a13df393e1b3978342fb24bd81f07af6e54b7bfa2992796"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00758-of-01024.json.gz": {"num_bytes": 319297548, "checksum": "3f31d7ad99d88dde757a651b12db909a30cfcae5796fe3f85722598d92344ba5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00759-of-01024.json.gz": {"num_bytes": 318154496, "checksum": "a4b780127d6f22aed49d155e234e21a847a60626143a8e7dc6e31a5f204e79f8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00760-of-01024.json.gz": {"num_bytes": 319386997, "checksum": "020e68dc60004d0661de8a22fe2b9fa7f481fcecaef8fb06efa43093a2a9cc52"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00761-of-01024.json.gz": {"num_bytes": 320035555, "checksum": "8d7b5a97770a062276ca909a3bd20365cbaf3931fcbeb8b7e479f5ee03b47053"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00762-of-01024.json.gz": {"num_bytes": 318099583, "checksum": "b8fcbbf9b55cde2ff66ca046884870e1e5f2d2a729a8eedb253c16fe0d7658e0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00763-of-01024.json.gz": {"num_bytes": 318354409, "checksum": "ce2d9e44161b13f6226cfb9f93ad42fa0edd18eeaee923c8ab31c25aec1fc976"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00764-of-01024.json.gz": {"num_bytes": 319181291, "checksum": "53ed1ef77f24bdd7c189aae0905d63be97f48aa3233fda139e59af53baab242a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00765-of-01024.json.gz": {"num_bytes": 318147738, "checksum": "26b9b9ea2f94b322c03d1b83b25ab4e9a1a203fe9923728c5dd91f22d5f8fef5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00766-of-01024.json.gz": {"num_bytes": 317964368, "checksum": "e59fec52abde3fb4cea58a5a4e511f4cc61e21062bfdd1e3ffd60131a847e0ea"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00767-of-01024.json.gz": {"num_bytes": 318750919, "checksum": "0e5eff983e793a3d7cdd1ec85a45d58e5e6ecf7a12cf83a01888e148ab08acf9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00768-of-01024.json.gz": {"num_bytes": 318978892, "checksum": "171509b0bed8854b6de92fe146993be80ab31e0aa56953c7b0a66eeb738ff70a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00769-of-01024.json.gz": {"num_bytes": 319386097, "checksum": "704e7daa85c0e3ac974d51a6e2cf6df2ee053613fd2b77b5fe16d10b29a50a4c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00770-of-01024.json.gz": {"num_bytes": 319623528, "checksum": "e787064473427fe17ba95d9326d009e9723148fb314a7a9605dcb6698854dad5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00771-of-01024.json.gz": {"num_bytes": 318911381, "checksum": "c54aaffd8162b30280e974e81e9d0669357b74394e0da2d1ca2ce613f5715e4a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00772-of-01024.json.gz": {"num_bytes": 319386949, "checksum": "2f9c83681632482df6c65e4c70718c83f500305ee1d061626cdef35bd794a412"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00773-of-01024.json.gz": {"num_bytes": 319962599, "checksum": "f47c487ba09051c9a4bf320d69db9546e98948e3de68050ae2ba025c71e09146"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00774-of-01024.json.gz": {"num_bytes": 320370991, "checksum": "69a1eacfdb6f6fd49ea2b729a7ab291b96fd5bd42f993e2306d044871b069aa7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00775-of-01024.json.gz": {"num_bytes": 320433220, "checksum": "d35934fb537d1283d40897d05c1486f629776fe9e4ef127694ecfd0221f860c5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00776-of-01024.json.gz": {"num_bytes": 318809986, "checksum": "9079970aa1618b6be51caeab7a2cab26e61c30aa53af361a6184ef6249bf65a1"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00777-of-01024.json.gz": {"num_bytes": 319617796, "checksum": "5e200e354ece1713a32a3e1ebcea33412de814dd5843df3523afa1ec9a4d5275"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00778-of-01024.json.gz": {"num_bytes": 318039278, "checksum": "b79309eb335c0c860c85d2b724df52c3613f61b92ab6cd6276c2be8c25a7b01e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00779-of-01024.json.gz": {"num_bytes": 319078058, "checksum": "fc6053d53255e4d4a4c22c42049ce3eabc224320a51c94c1116f3201f87b377b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00780-of-01024.json.gz": {"num_bytes": 317637428, "checksum": "e38c933003910b02beef64af2d330f32af6e6f3b7346fa121e89045c136c13af"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00781-of-01024.json.gz": {"num_bytes": 318792407, "checksum": "b6795b4db199f7a7a92ef195aee3753e5e00df05fad2d8401b2b9feb56d71a76"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00782-of-01024.json.gz": {"num_bytes": 319081289, "checksum": "dc20640bded03596eeec689f1293be55e72d138cf0c576df9768c7631931ceb9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00783-of-01024.json.gz": {"num_bytes": 318663257, "checksum": "ac2b4ee9ab8f25ec010a17358d2f3f1fb9d8d50c9f4b73357429277710e6564f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00784-of-01024.json.gz": {"num_bytes": 319687102, "checksum": "fb93dee8a974f2ea204c240ed4c24e1b64f91ccb421070be305487e4e53ca083"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00785-of-01024.json.gz": {"num_bytes": 318909034, "checksum": "2f298b358cc619fa72097e3dbd9ac91e7dc3f7c5f9c4f2ff6881c988921d2a6c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00786-of-01024.json.gz": {"num_bytes": 319213094, "checksum": "60ebe35e0f23ccc61fc0eedc891ea9deb43001beb8205d31360a05b5d58e31f0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00787-of-01024.json.gz": {"num_bytes": 318335621, "checksum": "a7b0aa4dafdda2f3dc3c1832b71d4a92af08f99a70a315b4cf9f60c1768bf2c8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00788-of-01024.json.gz": {"num_bytes": 319444037, "checksum": "874dda510a01a2f78e51d917d309bcf1a0f21e7e1ca46661f93931a6200b3d01"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00789-of-01024.json.gz": {"num_bytes": 317955670, "checksum": "ec949a05ec7750dacfdf692c1ba118a33454097fdcaa56626fb042eb93933811"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00790-of-01024.json.gz": {"num_bytes": 319033823, "checksum": "0939164a602d7c7140c619130977b6814639122d0038aff7bb840093def5172d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00791-of-01024.json.gz": {"num_bytes": 319366402, "checksum": "fd6ea942b3402b5da4acb1a03bf59b17df402e90c47dbb66fb198ca2f4b5e1cc"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00792-of-01024.json.gz": {"num_bytes": 319218667, "checksum": "9e8af5aaa6d5ed915eae334c6101948fbcc7bcf6c8c6beaf80fd1adecd67b078"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00793-of-01024.json.gz": {"num_bytes": 318865241, "checksum": "675330d6736a677760d854dcdd9a174eb7c1d426f94e34836a048c2139befac0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00794-of-01024.json.gz": {"num_bytes": 319384084, "checksum": "fd4c2623d9cbaed3fefd6bb88c2d88b58fe8f08e9e8ef0cea6bb22cac68dabd2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00795-of-01024.json.gz": {"num_bytes": 317654308, "checksum": "157533ddb56290662e25cb60842327daec23e377e116496338c9313cbf6991b3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00796-of-01024.json.gz": {"num_bytes": 319298258, "checksum": "fd90f055499095efa9cb848dee62406d25820f929554b0e07674d4c95db574b3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00797-of-01024.json.gz": {"num_bytes": 320048871, "checksum": "e089a95e96a081dd76e38acf9506bfc7b86c682892d3a8774e9784019db39306"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00798-of-01024.json.gz": {"num_bytes": 319291246, "checksum": "e29133ab6f83c84a69752a451053dfe20887ea884e09cc373afd89bba7458664"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00799-of-01024.json.gz": {"num_bytes": 319175282, "checksum": "8f3f3a67946615bdf499d64341d200477280947e5be8538748e28db768115947"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00800-of-01024.json.gz": {"num_bytes": 316687275, "checksum": "c9a17dc92658ce5d062af25e5c8610a7fbae501627cfc7324ace7ca6a8d75d8d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00801-of-01024.json.gz": {"num_bytes": 318710698, "checksum": "4b7d1e130fd8ba536da073069221f68d567492b2bff27d8769fb4ef124cec3a1"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00802-of-01024.json.gz": {"num_bytes": 318914381, "checksum": "9f186b8d08f5d3090b7c9eb8a6954cf3202caec7cbf5c308221333cd115af561"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00803-of-01024.json.gz": {"num_bytes": 319111424, "checksum": "117b0590a976805001a879c49c42db55579e5bb9a5d4db9ce20e42746f59d574"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00804-of-01024.json.gz": {"num_bytes": 318186018, "checksum": "ea376d6cc1043dee9a00e1eca1c431aa59755d8966162701817f9cf274a758c2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00805-of-01024.json.gz": {"num_bytes": 320382848, "checksum": "1e69e7896202206f9f804b2497c4d99cca5c1d139efc782b8ede2cb88f68b48b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00806-of-01024.json.gz": {"num_bytes": 319508172, "checksum": "9da7e230c7abed9beaed9d6090efa8ae1029a418dbbf6d04bb4386aafde3dbce"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00807-of-01024.json.gz": {"num_bytes": 319995091, "checksum": "2e3ba0dbe85c004c6a23b4caf340282e0d0004ab574a14bedc9c83c67cc2c0c9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00808-of-01024.json.gz": {"num_bytes": 319880961, "checksum": "f53fd08fea0f874d727422357521176c6810a54abf4fcc7019357b50f1928daa"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00809-of-01024.json.gz": {"num_bytes": 317100774, "checksum": "dbeed220f330b489cc262fbd7cbe84f04ba8a5118ebbd8f48bc7a4f5f63ae7b8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00810-of-01024.json.gz": {"num_bytes": 319625750, "checksum": "fe5dced88ccd54b258c6740d8988e10b128a869ecf28e7096e689c59fa147d4b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00811-of-01024.json.gz": {"num_bytes": 318375975, "checksum": "e4bcc5571fdc4f51b733d975e78ff02939d3463264a02d7e651271ab91c81df8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00812-of-01024.json.gz": {"num_bytes": 319663092, "checksum": "b1e41c198bc69d026ab997fdeaa4e687f7a8ddfca751add9bc85f00481708a63"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00813-of-01024.json.gz": {"num_bytes": 319094357, "checksum": "c07287aedf6854f581aaf83b75c4939aa4b10181977d4c4be97c20989ab8f992"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00814-of-01024.json.gz": {"num_bytes": 319521327, "checksum": "c96203ba5461ef92a7a2b0d4e598efda943b5b3adf42a7268c26f1c224410c01"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00815-of-01024.json.gz": {"num_bytes": 319098749, "checksum": "72f2e65c5b482be0d9e3a3d8f5cdb703cec7a515e927bc4411e2f6ff5085ed5d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00816-of-01024.json.gz": {"num_bytes": 320377295, "checksum": "df95ac17a25cebb854088cca345f60c2634d07f088e45e251d7f9afdb334c0c7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00817-of-01024.json.gz": {"num_bytes": 319007451, "checksum": "bad1cc25de4f66ff36c69284e6b615f68bdc25e45f08e04e33ee463a0c6ef0b5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00818-of-01024.json.gz": {"num_bytes": 319609737, "checksum": "acf1b390f1c492d97bf027f06898f1dd5cf8cc6def41f4d43b38a0c99f4a85e7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00819-of-01024.json.gz": {"num_bytes": 319164157, "checksum": "3d973eb401876c57e9cd1420fc938da9dd7b08f97d4596c66a8c159e2b56b1b3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00820-of-01024.json.gz": {"num_bytes": 320181073, "checksum": "101d5f0079caa840b934c14800ba5cbb7fca22e9e6915b98b4dc5f37c57f5b4d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00821-of-01024.json.gz": {"num_bytes": 320949305, "checksum": "34ba423c93c4262234e6e2005aba0436daa99b05570cff0a58e9d27b65d76896"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00822-of-01024.json.gz": {"num_bytes": 318392521, "checksum": "4a586e220fe34f544dd068f4e1c310459cabd5dbea9a991c21c09f70079eb4c9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00823-of-01024.json.gz": {"num_bytes": 318526893, "checksum": "3b10a8e32a3a8f6541400d697516fcd3fffba3554e8d8a96451f01fc6b729d8b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00824-of-01024.json.gz": {"num_bytes": 318640792, "checksum": "c921270db8004d309f91e3209340c476191793d47b3cfa9d19fdc602d43dfe65"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00825-of-01024.json.gz": {"num_bytes": 319524026, "checksum": "a6eb347db464976ba5d1aaa4fa64e103ba36520dd1e9c103644caf187be471a5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00826-of-01024.json.gz": {"num_bytes": 318469810, "checksum": "dc5f88e6161ac06165f3cd4cb91a00cdff75d2f900e8f53d62bacfd833e352b0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00827-of-01024.json.gz": {"num_bytes": 319391185, "checksum": "66a240be851d6622adf7801d9634a456e83e9edfd135601c0dc1aab48902d7cf"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00828-of-01024.json.gz": {"num_bytes": 319625277, "checksum": "2e989beeeb2a63bfb87a5a401619a8e4155a961b44441cb5f627c29f25962dd4"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00829-of-01024.json.gz": {"num_bytes": 320001237, "checksum": "0653e4052fb7a4ef503bdfbbee332d650492e99c130a85c04250e18d91cfd30c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00830-of-01024.json.gz": {"num_bytes": 319240468, "checksum": "bd56e55e75a8237b5292fa65e5ecb0dfbabef6ef0dec6695b13522803210f40c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00831-of-01024.json.gz": {"num_bytes": 319174603, "checksum": "ca9d6c643127a390823655256a45462ee6e75aa2485141f6530a3bdf6ce4f572"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00832-of-01024.json.gz": {"num_bytes": 318909883, "checksum": "e91c35d94e183515e660cd8c874c12bbf22e1fd683312446f02287b0d032fb68"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00833-of-01024.json.gz": {"num_bytes": 319095835, "checksum": "971d9a4f8bfce564d42dc0a80009acfa7d2f47557ac19836ab426defe1877714"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00834-of-01024.json.gz": {"num_bytes": 318319786, "checksum": "159412a58fb8deb59e039fa0102bdb746065cbc6b4d1d3da892930fbf8b0f178"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00835-of-01024.json.gz": {"num_bytes": 319959334, "checksum": "814518d53b3023e3b8ac22dad9d65dd50d455a4c7db1490022f447f793f4d24f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00836-of-01024.json.gz": {"num_bytes": 317642779, "checksum": "19ad4fbaa3ff5c638b77980300b8c162c21a8237b87d054a30c46aee67d0ad94"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00837-of-01024.json.gz": {"num_bytes": 320687986, "checksum": "190de7948a4b163047ecdfc856e5f78bbff52ca883edfad26b32fbc0b57ffe36"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00838-of-01024.json.gz": {"num_bytes": 319802866, "checksum": "ccb4d342791a187f3bde225e008ff8cf70465f7fd3eacaa8bbce1ec4e52c2622"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00839-of-01024.json.gz": {"num_bytes": 318621894, "checksum": "3ff5cf5b33996a663df5783f3f41a5b5b2f6e08a2cf91e74cad3bf82291192fa"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00840-of-01024.json.gz": {"num_bytes": 319757379, "checksum": "8292e0854c01ca79ef03dcc1752ddc1f0df747ad67551b7c0fa5208b6aa3f822"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00841-of-01024.json.gz": {"num_bytes": 318779722, "checksum": "9eee9e089bd396adf5a276eddca9f6352e07f8c33877f85c1f65968aa0c06128"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00842-of-01024.json.gz": {"num_bytes": 318692591, "checksum": "caf3f40a144b43af08687e41a1eb7d08da1b78cd1600574566e11f29fde9cd34"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00843-of-01024.json.gz": {"num_bytes": 318944616, "checksum": "e74d624534091173546755ca236e5912cc8acf8cfef5f9c197b541ebe76f0818"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00844-of-01024.json.gz": {"num_bytes": 319392887, "checksum": "e47d3f44f996398b54f18729f4e81d88d04b19bc529847e86277a6a91ae74e6c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00845-of-01024.json.gz": {"num_bytes": 319215311, "checksum": "de7cffe64f422b02668137272943537946c15539954b564345d6722c4eb06345"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00846-of-01024.json.gz": {"num_bytes": 318129297, "checksum": "1d5ea0ab8fcb3975735aa421d646cea4544087f60a79ec209b63c93b6318523f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00847-of-01024.json.gz": {"num_bytes": 318134095, "checksum": "6fa4c50808df2aa8efebae3bbf832ba2b0be2f7113633fef720cffb3c50143a0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00848-of-01024.json.gz": {"num_bytes": 318521356, "checksum": "3aeb657aa448af82551c653802c669c985c00b7daa593de07f80733ae5dee84d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00849-of-01024.json.gz": {"num_bytes": 319541694, "checksum": "1cc016f58a4a2c54625214f028df05247ed319b8c1868c96c2efe8147a73d08a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00850-of-01024.json.gz": {"num_bytes": 318861613, "checksum": "eb5fbe6eeb4b0281604df264a5b04a3a0db96ff0d04f252375a788a0d3345c67"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00851-of-01024.json.gz": {"num_bytes": 319356648, "checksum": "ffe1397f1d412979cc66820555ef27345f3a2a48b8bcfe682d48301135e8c12a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00852-of-01024.json.gz": {"num_bytes": 319662372, "checksum": "fa78ed98d602276520e823e17adc7f796320d95e27e08d84d06e66e415b79161"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00853-of-01024.json.gz": {"num_bytes": 317625507, "checksum": "b10cff62fac5191b9cb5e2025227adb838088773e79bfec0937a34bb857e1b1f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00854-of-01024.json.gz": {"num_bytes": 319665550, "checksum": "15441b2a7c09a477389a8fbd7401c549dc8281f2bd44251b1546077301e24624"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00855-of-01024.json.gz": {"num_bytes": 319059897, "checksum": "f6127845b162181dd7157dd316021a4e6b5d41393c66d3e577491cdb74657f2e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00856-of-01024.json.gz": {"num_bytes": 319243991, "checksum": "ec9f0884c5ddf82550105f969222d3ee8b0d4907a0a2540ea6c8c67c2d2e9179"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00857-of-01024.json.gz": {"num_bytes": 318546680, "checksum": "840205fa73336ff51d75008ce8c530164ebcef3b50f1ad8deab879a67acf8d5e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00858-of-01024.json.gz": {"num_bytes": 318306547, "checksum": "e9b3819e9dc98d66a61f8f4e8f6ecb03099c79ae87a175fe1ae484174b173b44"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00859-of-01024.json.gz": {"num_bytes": 319088302, "checksum": "eced8de72f8755fa0dfb690c626cefcacf5fbbce97029d4589058913c31b9339"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00860-of-01024.json.gz": {"num_bytes": 319704792, "checksum": "90a169718609f16abe120c4b63a20adc0bbedba51de14b004d34dabe530339f0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00861-of-01024.json.gz": {"num_bytes": 318444445, "checksum": "d020840f09fa426ee15d19f05e5afd9cf674048e0dc4438dae0b6f02c7227d9f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00862-of-01024.json.gz": {"num_bytes": 318606300, "checksum": "e02bf9d3f1a398972f7d78b9b1aaff9a92146554a1358ea1b16ce7873a9f8fd8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00863-of-01024.json.gz": {"num_bytes": 319273730, "checksum": "c977f143cbb5e61160ce76f1cabf7bea6c158abb7e159ec3362aad1cc7af0ade"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00864-of-01024.json.gz": {"num_bytes": 318143165, "checksum": "bdf20dbde61f0663feb70be419c39c60acdc7ecbbe1430d47bf79ae2e114f168"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00865-of-01024.json.gz": {"num_bytes": 319041356, "checksum": "11c9c068ec5c1b612494c1473b7cace67a55ee66155559b19035df180ee260a1"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00866-of-01024.json.gz": {"num_bytes": 319758401, "checksum": "ab4436f283af0ef2d33b93cf026907cf68255beee9d9dc1d6c542dee9c3f48a3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00867-of-01024.json.gz": {"num_bytes": 318991336, "checksum": "56beb5edbca3b66981f5f8e65f2a13a0f6e99e68ff50cc263cc529a4d8ebf371"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00868-of-01024.json.gz": {"num_bytes": 319984390, "checksum": "b9368d2ae0eff869c70c1a1214126c1d084f56887102d3d46e450b2c934102be"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00869-of-01024.json.gz": {"num_bytes": 319462888, "checksum": "68ab404e0ca2247686eb264a0d7feeb9d2460162434f5babb2b1da82d865343e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00870-of-01024.json.gz": {"num_bytes": 318426018, "checksum": "2d60208a558f6ba92d6c6307e1ab626acd7ff3b7bc25963b09e87e464751c42b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00871-of-01024.json.gz": {"num_bytes": 320233396, "checksum": "ee2517922079c713605dafffe6bc0db0a947abf64ff92c409aa1015b92cdb099"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00872-of-01024.json.gz": {"num_bytes": 319570251, "checksum": "83ca4f125bd628cb28210fb874db717635009e36c60b42237bda48fcb611a53f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00873-of-01024.json.gz": {"num_bytes": 318755978, "checksum": "d94ce49fd17da5f70d1a89bc9e5323daa54f0b8417e1ee5d991467c80c068ec7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00874-of-01024.json.gz": {"num_bytes": 318986904, "checksum": "f634915d1b529d9d728fd96993bb151dc07016767cd44ceeedddec73eaf37074"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00875-of-01024.json.gz": {"num_bytes": 319116193, "checksum": "6367b1216e1c6ab18af66471d866f39caeb9a538209134a9e6bbbcb81bc51db7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00876-of-01024.json.gz": {"num_bytes": 320829257, "checksum": "c9ad4ab8c6e5995aaacd72ebc6654b43b4756804bf3cea808610f9b618f98fac"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00877-of-01024.json.gz": {"num_bytes": 320082625, "checksum": "835ae7d54732c309bc9aff231268474af66653b06ad6ca17b54dab6f4a7d30c5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00878-of-01024.json.gz": {"num_bytes": 318964554, "checksum": "49c761449d5052dd6c408268c77196bffc5125eb5189390f73ba0ce8550f0175"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00879-of-01024.json.gz": {"num_bytes": 318699617, "checksum": "521e1c5fa967a6f29641e7c4c2b210acda0736b32f318e24aef0e587895ed492"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00880-of-01024.json.gz": {"num_bytes": 318723630, "checksum": "dee1814b24f9bbc3aa3430cd80302b08b863eb1b92698158960b6be216845843"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00881-of-01024.json.gz": {"num_bytes": 319839271, "checksum": "9e57ea6a0e3d8a7798a0cb3e6344e1711e8fd879e2e396294718ff360fc7c4df"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00882-of-01024.json.gz": {"num_bytes": 317773196, "checksum": "2e5e5749618e53668222c7d310929e2177772dd7c14592e61dc86f163e353c8a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00883-of-01024.json.gz": {"num_bytes": 320262049, "checksum": "f80afaa4495a2d41ad4d7380b79040569179b24ef5c2df17f75ce8e135d786b1"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00884-of-01024.json.gz": {"num_bytes": 319146213, "checksum": "77338479b420dab9316a4737fc243de84b5e88392cbbb46fa0619045a42432cc"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00885-of-01024.json.gz": {"num_bytes": 319022605, "checksum": "3a67fee2fb77e64aa13fd595d7786b432203f36712ff723ec5999a341834b38c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00886-of-01024.json.gz": {"num_bytes": 318624429, "checksum": "2afe387f2500c57294acf1403a8c27f27f6c7c2d228dee0f1ed70a02c438f838"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00887-of-01024.json.gz": {"num_bytes": 318733911, "checksum": "3fe087b3441f74730ab137ba9486650cfedfe2d724573c3d166565d7d1e40938"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00888-of-01024.json.gz": {"num_bytes": 319926754, "checksum": "dd2df1977458cac34ef1e52059bbc28738e541761d7ad11c0ffc8ef3ca061190"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00889-of-01024.json.gz": {"num_bytes": 319085344, "checksum": "4172244cc3fc4a4e9e09f04f8097cbc678aebaedb9d1fb97b1daae16b0b8ef45"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00890-of-01024.json.gz": {"num_bytes": 319838671, "checksum": "8ffaf34eb8209e7ec250303298f9eebd2833fedcf80414c20331e8dbed42251c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00891-of-01024.json.gz": {"num_bytes": 318169092, "checksum": "daaf74ba5d12a7415da94be0f4454336aa3d86ad5cd300dbe30cef596835ac8e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00892-of-01024.json.gz": {"num_bytes": 319662776, "checksum": "6d99c0419a6c9633620fb0aa7b7610cc5d06696e839a1a52953fd7db7a18e053"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00893-of-01024.json.gz": {"num_bytes": 319541919, "checksum": "5f246aeacef0dc8d40a036bb1eeecf278f66d7215a134fb746d30f3420d18c18"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00894-of-01024.json.gz": {"num_bytes": 319528897, "checksum": "9975fd5d23d25938f00de3fc9240d77c27b4784c2f443b1914652a06d3b59fcf"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00895-of-01024.json.gz": {"num_bytes": 317548307, "checksum": "7af9e2abfaebd4afe05a0e28d3e6e3126800a8b9b7ad49de360e42f2eb2c8506"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00896-of-01024.json.gz": {"num_bytes": 320278601, "checksum": "1941689d6a0e449423faad6e41714f33d5b23cdb1bb73961a888a87678fc74b0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00897-of-01024.json.gz": {"num_bytes": 320161831, "checksum": "3d951cb1ae4a9b3c6ff70555139435febda83d24bb04ea27b229a05424b470c2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00898-of-01024.json.gz": {"num_bytes": 319341305, "checksum": "3227b97aa9ff57b62be2a26fd8131e9ea45f7731673acb43432e529ea4978a25"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00899-of-01024.json.gz": {"num_bytes": 319658969, "checksum": "c746f8bd5fffac933640ff39db0b9d7b022edb28d7a4b3237d8c69fd919b7b48"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00900-of-01024.json.gz": {"num_bytes": 317494627, "checksum": "0327f0c57a668b2b34e72f4c53d4cfaeed787d879843d0bba27b5be58d1ee5fe"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00901-of-01024.json.gz": {"num_bytes": 319683481, "checksum": "886449092779ee26fccd11e0c89c36e449346dc6b1f0a7cb15b6b53c897790a3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00902-of-01024.json.gz": {"num_bytes": 320228529, "checksum": "6960d8539df78e98858ba8cebb2e637b6c2ef20890b5f2af1cbf4621b52c364e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00903-of-01024.json.gz": {"num_bytes": 318961279, "checksum": "4ddb3c9e9276d220f1d4dfc32bb61a090e895e9e3c9f53c169db99a024e7cd95"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00904-of-01024.json.gz": {"num_bytes": 319926290, "checksum": "69a941cbbcb673efdb254c162854fcfff6fe1132182210235b91d1d21ed4d2ed"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00905-of-01024.json.gz": {"num_bytes": 317982280, "checksum": "1d9613f366b91102d018e57894df520aaf1910aa98e06cf369d9676e498610c5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00906-of-01024.json.gz": {"num_bytes": 319012210, "checksum": "4855989c814582f5cc0a5e9b8f9d1f642ae33de81625d4bbafaafb709c1cd260"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00907-of-01024.json.gz": {"num_bytes": 318515420, "checksum": "8f34dbaa454215922a29fea975357e4e705381a65e4dcaf8b0d8c200f9a277bd"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00908-of-01024.json.gz": {"num_bytes": 319286320, "checksum": "536bf0610a2c14d1d59aea0b52fdc29cec19cd7eaa4c3a5e5fec04dee103b29e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00909-of-01024.json.gz": {"num_bytes": 319938295, "checksum": "3bb3943183f579c15d0d30440f6c82d0c9c64d6ded398dfc7c67502d73868781"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00910-of-01024.json.gz": {"num_bytes": 318423425, "checksum": "adbdcf170531c725b54c1e5713676b789589b2fb77310f3e64a0cc30b83602ee"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00911-of-01024.json.gz": {"num_bytes": 319578185, "checksum": "a1342a95ce77013820c36e7d038ed47ca4d40cdf3584a66abc310132435b25fd"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00912-of-01024.json.gz": {"num_bytes": 319154715, "checksum": "4973afcb1d7b4816e3a3df1b9ce1e48a0eea4fe8ead5f83ea753e46a934e5ddc"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00913-of-01024.json.gz": {"num_bytes": 319011218, "checksum": "c9a158f69a123859569e1cdd475355afda32d7e5c48001591f0b6c20dc17d572"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00914-of-01024.json.gz": {"num_bytes": 320027387, "checksum": "61f6c0f839908e7d3105a6926c501bcacd293d1ba50c3b8639ee227c9a8270b1"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00915-of-01024.json.gz": {"num_bytes": 320280632, "checksum": "a74fb91d8f7d79b09017a7f996b6ca5d59e4ecad9fec354ac977c0076d53fc66"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00916-of-01024.json.gz": {"num_bytes": 319278877, "checksum": "cbbb8dc274fabb4435db5fef5da1d91671e1a4c7f3f652742324f9632b01c5dd"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00917-of-01024.json.gz": {"num_bytes": 319616831, "checksum": "31e62cbd6209fb7831078e4a262d1b25c0590f9425c62b2b208d4030ed5722d4"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00918-of-01024.json.gz": {"num_bytes": 318635363, "checksum": "95e5c2f51abc9ef4c0422e91b77f79ff83c8cc38e585df621fbc0dfef48a84c7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00919-of-01024.json.gz": {"num_bytes": 318885096, "checksum": "ea5960d4fbc7d5e7097edbf2c9c706e6b7c7e9d3e36633be9bd68c4038955f10"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00920-of-01024.json.gz": {"num_bytes": 319228627, "checksum": "73b721ae576dcfa83bd963e49530f73d76b788a669e3abc1c02189900c80cf02"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00921-of-01024.json.gz": {"num_bytes": 319557114, "checksum": "710c65cd504e87b5019c01f658e669d1e023473d879913a9522760d33546cf24"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00922-of-01024.json.gz": {"num_bytes": 319356053, "checksum": "f0b54b3c6b51a356debc9414df0438ee525ae5114cbb7c8176634b7493095022"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00923-of-01024.json.gz": {"num_bytes": 319766600, "checksum": "d5b80091c8113c283d91ff5826b46068b96c423c0dc74a646e2c8d1c5d815cea"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00924-of-01024.json.gz": {"num_bytes": 319733540, "checksum": "56a54c7d4114c21c1657df0d295839c2bd4904cd1b651104e2a155c2bf1b5aca"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00925-of-01024.json.gz": {"num_bytes": 318944357, "checksum": "4d396c29cd1d9ba16016fac37c333c0a872f6cb0e9faae7966e53f6e5c879d67"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00926-of-01024.json.gz": {"num_bytes": 320276135, "checksum": "39a64c261a76d5e13f187f12c886b22e2db08fba968bc9d0c1cb0d3c241abda7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00927-of-01024.json.gz": {"num_bytes": 319181837, "checksum": "86db529dd52fb67173588fcbc9f0e52c99ad6dd34e44865150bc6c962de5b3c1"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00928-of-01024.json.gz": {"num_bytes": 318966114, "checksum": "d232df8033ddaa7397dbcfa8ba4ded9421ee9bfc091c725b311fd963b29f13eb"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00929-of-01024.json.gz": {"num_bytes": 320087917, "checksum": "fca6bfe8fe17c867681c58df081f2186dcc6bf22e46ce3783f85b918644c0b6a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00930-of-01024.json.gz": {"num_bytes": 318921677, "checksum": "b8031359e758cd835c44e81303e04ef7b2137d2e1a9472d7e04552c353d883c7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00931-of-01024.json.gz": {"num_bytes": 318978028, "checksum": "bb5f2ea8a2e56c69813bdc08cb243c0763126e7b5f6c5cb57e7f4767d2126f89"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00932-of-01024.json.gz": {"num_bytes": 318627424, "checksum": "f6fd2065ce202d5347243a2b396707bb606be20c1829989bd7dff6d9fb7adec9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00933-of-01024.json.gz": {"num_bytes": 320226802, "checksum": "b303d2ece81c1f7b882703b915765212796518010aea6a108a441dd0a84a6128"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00934-of-01024.json.gz": {"num_bytes": 319908526, "checksum": "e5b05714922d132073122e83933853f52f0046c9f51f985cfbdbd310e8d677de"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00935-of-01024.json.gz": {"num_bytes": 318941663, "checksum": "4296055a31409a778c516afe25a8108f23dfffaf13cac33e5ed834a37c46b37c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00936-of-01024.json.gz": {"num_bytes": 318430860, "checksum": "4634630c012ed184b264ea01c97f7bb3f1af030f2466f1d99d20bb0472f74511"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00937-of-01024.json.gz": {"num_bytes": 318008229, "checksum": "131cc9a2fef4ebe81749f1844b7c4b194b97de7db4f5253ce59207e68d8b4df8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00938-of-01024.json.gz": {"num_bytes": 319099506, "checksum": "fff55e3b2ff8b53e56ab99def626a7334ce67d2414351b2e83d84298052dd9b6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00939-of-01024.json.gz": {"num_bytes": 320457851, "checksum": "8431e38c86516ed88d5c028f4a1dad32b02bcccdc03f9687d18f8312e493bcb7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00940-of-01024.json.gz": {"num_bytes": 320607829, "checksum": "a68c577555781adc777c09c68f623431469d67e9b66af7b0813f09a512b7d777"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00941-of-01024.json.gz": {"num_bytes": 318923471, "checksum": "807ffde4034b6b95a5eacb71f093686586ca11e417517894cca99dfe7b12563d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00942-of-01024.json.gz": {"num_bytes": 319880902, "checksum": "d03d04f619a8f3afbefa6d67986f50d5ee264c45de36c0ba67b069e343e002ad"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00943-of-01024.json.gz": {"num_bytes": 319079341, "checksum": "e482c4dee03a34a1a5756e6def26134c9a3f18ee386f5569d6cbf16d3875a429"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00944-of-01024.json.gz": {"num_bytes": 319436318, "checksum": "6241f9f35640598c05bc5cd00d8cc024dde59c0065c8935da229a8a583de32fd"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00945-of-01024.json.gz": {"num_bytes": 318998098, "checksum": "85f192c1ee9734da0f1dcad31c2b8111076977582e139ecc1ba959bf2df6b262"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00946-of-01024.json.gz": {"num_bytes": 321951470, "checksum": "44bccedf6a8db115bb6563d6775ff03c67511ce4e23a2de77e79edcb568c9fa1"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00947-of-01024.json.gz": {"num_bytes": 318689631, "checksum": "36f0bfa191ad7d51452d51249c724150f8c3774142df3720f176f2772f42f3fc"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00948-of-01024.json.gz": {"num_bytes": 320347661, "checksum": "f4a7afa90b6d81a4cdc99100b75b4d3174c4d5d670042766c3e0418b7a97ef80"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00949-of-01024.json.gz": {"num_bytes": 318054841, "checksum": "f39d0c9bfc0a562ede67b8cfc57e6974a8a999e2bbc1b6940f107169b4f06e4a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00950-of-01024.json.gz": {"num_bytes": 319722042, "checksum": "bf376260e5a838b3b901ceb22f922829619be710718446ee95c24400cbc73495"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00951-of-01024.json.gz": {"num_bytes": 318315382, "checksum": "987cd895f63bb74c9d4ce229ee853c7bce53c75c324366a0d06377c36030e39f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00952-of-01024.json.gz": {"num_bytes": 319247792, "checksum": "d218dda02748a22821c2ecccf1cbb136dc8772a25ddfacc7ab354fc089470e87"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00953-of-01024.json.gz": {"num_bytes": 318411551, "checksum": "698768f3d7959b33fa74a3827e995b0c184bb3b4c46eba667d7dc3365fdd07f3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00954-of-01024.json.gz": {"num_bytes": 318809810, "checksum": "651d9ff43d5a3f7f5945ccf26b9410018248bf64956f3485c50b0df9034fb2ee"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00955-of-01024.json.gz": {"num_bytes": 319761211, "checksum": "29fa5c68fb8d3719e5f5f17568ce888522de64499554b5f0f4dafafb4ee5b40b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00956-of-01024.json.gz": {"num_bytes": 319255736, "checksum": "333a90a9c13f71e41a7cdd4784684bc142c79ef99155b9d62d062db318798b93"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00957-of-01024.json.gz": {"num_bytes": 319504417, "checksum": "730c90615fca09c81d9644cfae40d325851bb9bbc1af696caaadd67d8282ab5b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00958-of-01024.json.gz": {"num_bytes": 319066016, "checksum": "bb565af6529720ba2a3e989769b33d978ef49cb2aae49c60f2ff98a981414280"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00959-of-01024.json.gz": {"num_bytes": 319887940, "checksum": "8992783693dd0ad5ce07427f6b5739c818f13952d90bb61312ec98f9c813f313"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00960-of-01024.json.gz": {"num_bytes": 318051437, "checksum": "4773edbc822ff8d51ec13af6c371214aea7545047d9babeeac0b29180d52fa0b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00961-of-01024.json.gz": {"num_bytes": 318373291, "checksum": "ff33854746566f7d3b4ba9eadd1329ece48c034345fda000d9af73cb26d197af"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00962-of-01024.json.gz": {"num_bytes": 318572513, "checksum": "a6d07f7caf55fda0df74a22b454d196fb2e29312d433bc5506b00448c22b579c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00963-of-01024.json.gz": {"num_bytes": 319488084, "checksum": "453f666c6578376508b1fe8bd3fb8ea5bf030aca5cfedf383cd23b27de15228f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00964-of-01024.json.gz": {"num_bytes": 318905670, "checksum": "74f64ed6583e6a4df4b3c3f8a76263a2d63905d51d5680d9683d86f5039d5b56"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00965-of-01024.json.gz": {"num_bytes": 319452844, "checksum": "88016c1a0663b89dc3d76689c827c82a6d128401ae05f7b70c8727d75302cd47"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00966-of-01024.json.gz": {"num_bytes": 319334588, "checksum": "dd9300bdc27513dd62578e1cf3c8302647b49c61185c282a684011d788c43d17"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00967-of-01024.json.gz": {"num_bytes": 317872396, "checksum": "90747ee63ac7d8176fde1f2afce8deb7e39bf19e682e17d0fcc1711d09d5f1d8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00968-of-01024.json.gz": {"num_bytes": 318988069, "checksum": "2cc785d650013d35d5d31b1e85c5530b197687c69117881362bf6b98f47c22fa"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00969-of-01024.json.gz": {"num_bytes": 318324244, "checksum": "83750d93c788ad32a256862b8173db3549eedf52ac131f09f662f1fe0f46bd13"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00970-of-01024.json.gz": {"num_bytes": 319494164, "checksum": "e0e46e185851ec569dc13a18519988ad926bdcd9bf448eff00aebf6df141f5cf"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00971-of-01024.json.gz": {"num_bytes": 318714665, "checksum": "941c9bf116353230417950d292c38b12b00935184162227eaec01870ab7f4510"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00972-of-01024.json.gz": {"num_bytes": 319518275, "checksum": "de30e19a155a6f4303afb0311416aa84cc3baf5a09cef55b8e2adc2a4f478f6e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00973-of-01024.json.gz": {"num_bytes": 318092574, "checksum": "f70bf6727f1f308d93684ca41e9c2c68dfbd737a90da6375b58f162e8470fdea"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00974-of-01024.json.gz": {"num_bytes": 318555677, "checksum": "109fe184ac9498ac571cd9c6cb38ae5ed566b0e98e8b7718984656a70cc6b224"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00975-of-01024.json.gz": {"num_bytes": 319045215, "checksum": "03c4257851857450f7397ac3d627a60ffc98708ad5aac6e1f73e6ce818fe7be8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00976-of-01024.json.gz": {"num_bytes": 319172031, "checksum": "7d98fa662aa9d0ff7ed50cc72195bdda2147212b34a3d22f0f757a4eb158d5b7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00977-of-01024.json.gz": {"num_bytes": 318650530, "checksum": "bb8ccc07ecc6fd39ae97136418efc543efe5541e85910a7f333ee5cebaa3b595"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00978-of-01024.json.gz": {"num_bytes": 318609909, "checksum": "40b49f3fbb2fce73bb1851304b290fc7fb400d13c2448ac7e5e559dccfda7ce5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00979-of-01024.json.gz": {"num_bytes": 318881197, "checksum": "b29f96cfba574428cb66f54b20c4a848bc83438256167afdaed576a3931117a0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00980-of-01024.json.gz": {"num_bytes": 318506081, "checksum": "a15996adaaf41e5615cb5c7fa2ef1b4e3003836542d0851d1c6907522f534fee"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00981-of-01024.json.gz": {"num_bytes": 320000305, "checksum": "38e282b433c4e3dcc9fc2b056f6ddbe4eb857c5137f7c51301d53ca259d6bdc2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00982-of-01024.json.gz": {"num_bytes": 319959158, "checksum": "97d5e58088a87a15b71db975d5e09b69daf497b7dff3ef809e1b8292caa27905"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00983-of-01024.json.gz": {"num_bytes": 318921242, "checksum": "f062e04f89132576ac1969fdaa43db761a0ff7e4269a6f173d87fa011a4c289b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00984-of-01024.json.gz": {"num_bytes": 319577980, "checksum": "e52a6c08d5243717f21120b4c3ebc8fcf77168928945adf68bc665392a6e8d11"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00985-of-01024.json.gz": {"num_bytes": 319812101, "checksum": "8b4f5645ae0e0b190af4ca5335c57735ae919d3c6402438af506c7907f1d1494"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00986-of-01024.json.gz": {"num_bytes": 319582409, "checksum": "3654109968d918aa4d8db17cb7057111c42894cfc7eee093df13036cfb3ac6fa"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00987-of-01024.json.gz": {"num_bytes": 319957581, "checksum": "4b9e6febb461940b993c50945a2ed06736c6786aa8f758565ff545814ebfddcd"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00988-of-01024.json.gz": {"num_bytes": 320346479, "checksum": "2891565dd75fd4354777b4f4f393983180584ee9c64b5d9b4557dbf26a3c4cfd"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00989-of-01024.json.gz": {"num_bytes": 318546717, "checksum": "929d0236c9fb77d638e0a18aa97b00004316bbb0ef3c4323e39f61aaf7c0af53"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00990-of-01024.json.gz": {"num_bytes": 319606761, "checksum": "6ebd2552ecdcce7b194d4f6d5b5e66ede9d65da4e4999ee8ec4705d847e473ac"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00991-of-01024.json.gz": {"num_bytes": 319117521, "checksum": "1b3496964d0a895b347529ddb7b712d211c9419317fb41cdd6e20bba43f39f05"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00992-of-01024.json.gz": {"num_bytes": 317781551, "checksum": "9f9cfb5f9152b9a60121b03c24d944129c1ee43e862112fe3896e2772fef99a2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00993-of-01024.json.gz": {"num_bytes": 319341839, "checksum": "fb329b7470ae127efe1be4adc960b06eec4f55bbcbe1f3f0f0b794d70a8aca14"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00994-of-01024.json.gz": {"num_bytes": 320357337, "checksum": "bbe9a60c3c2b3b5b11a5d531d1d85f0a90ebe3dbc79189b3825e169ae302932f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00995-of-01024.json.gz": {"num_bytes": 317824612, "checksum": "26643091ae3425b63036453ffca7ed82c85c24b6a24264197e6516b68a39a4c4"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00996-of-01024.json.gz": {"num_bytes": 320453890, "checksum": "db33809437e62bf1f086f40e4d66ad0133db7c7d406b2ce52ce5d9c9b0809961"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00997-of-01024.json.gz": {"num_bytes": 319469732, "checksum": "3447b74f09dc4d63dd04d6bbd4382147071504338e6ea428b37c3a5174877537"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00998-of-01024.json.gz": {"num_bytes": 319562604, "checksum": "270a1c19e6321541398836d3d982c2e396db99abf94317912714251d1f68e8ac"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00999-of-01024.json.gz": {"num_bytes": 318895764, "checksum": "d68f8f4d85d91679c20e972b2b1955d41a8f6601873bb311a2621f4b3f3152a2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.01000-of-01024.json.gz": {"num_bytes": 317697031, "checksum": "68b47464ca3e97e9d3f4075b656f804c1bab667f231701db9cce1f0b0a921088"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.01001-of-01024.json.gz": {"num_bytes": 318915840, "checksum": "582216879b058ccd4d0ca2edccaa2db49b64459371f8798a1d9c66c06a0cf908"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.01002-of-01024.json.gz": {"num_bytes": 317811256, "checksum": "6864299a7d0174f92abc696dc293524291623891b86cd69132348fdf78760a4e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.01003-of-01024.json.gz": {"num_bytes": 318605529, "checksum": "4ef35b7546266f99eae5f332cbe3e284801c5d7b39f840297d67e71c036edf62"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.01004-of-01024.json.gz": {"num_bytes": 319379897, "checksum": "040dfa80eaf8355370d8a50692bc3ad03a1d57272af340d70031a4398f37b9ee"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.01005-of-01024.json.gz": {"num_bytes": 319515177, "checksum": "012ac70ef2715181ec1fb578a2366d68e786d3a9ea41c59c08d7c494b89b429c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.01006-of-01024.json.gz": {"num_bytes": 320078217, "checksum": "46030d85d8333ae224320fa54e487f3770de7de280cd0001344136b0bd87c431"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.01007-of-01024.json.gz": {"num_bytes": 318526753, "checksum": "dd432d865ef3dba4b5af30e42b11ace96900bd7b97af053ea892292e75bd142c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.01008-of-01024.json.gz": {"num_bytes": 319407137, "checksum": "165cd3a688be6f9f5a4cedde198a9dda4f9d3dbc1d275d1e99411f3ee96a0d62"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.01009-of-01024.json.gz": {"num_bytes": 319763066, "checksum": "e44e86d497f8471e53531374b0e6ee61aac54996b6af64a4af0f5620673f9f7d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.01010-of-01024.json.gz": {"num_bytes": 318653930, "checksum": "61115f16e718d3a2b66574cc17841aa5d02739762138abe3c9a7f325cf9f2e31"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.01011-of-01024.json.gz": {"num_bytes": 320037079, "checksum": "65e18df845f1e6cce1bb92a45f71274dca94d3f0ece1d556116085b5c0e6338f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.01012-of-01024.json.gz": {"num_bytes": 319753418, "checksum": "cd5a8ee1bc7d9ad58e98aa6fe56d60501115592519a19efcf9fa370668c6327b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.01013-of-01024.json.gz": {"num_bytes": 318657671, "checksum": "986ead2c1b37f4094aa6f7a7882824ff013e6393323d5290d7f3e9215589d07b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.01014-of-01024.json.gz": {"num_bytes": 318028602, "checksum": "3c82c0611fb1fb0f635eaedd2bbe7cfc9d53d1ae967a9cbd0416def046e4b104"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.01015-of-01024.json.gz": {"num_bytes": 319164504, "checksum": "5eb5cf76022b12d8751a2fce5c4d4831066785a68edd7b3cd3dfc10017f91621"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.01016-of-01024.json.gz": {"num_bytes": 318474894, "checksum": "a99d827be814e27d948264d6ae55c6a032a664f3ff0ef6ae94bda90f7faf29bc"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.01017-of-01024.json.gz": {"num_bytes": 319516762, "checksum": "7eac25ebb9383a4592023634b852d88a128604c494972a8fd9e2b183fbb303a2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.01018-of-01024.json.gz": {"num_bytes": 319433935, "checksum": "35adb751748043a36f22b412d3ea0e01166037cd96216f516abc547e9d2609ea"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.01019-of-01024.json.gz": {"num_bytes": 320305440, "checksum": "54c4d52564221e48dc5354cb51d447658707ab8edaa3d6d8fec5ec379a29d462"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.01020-of-01024.json.gz": {"num_bytes": 317445661, "checksum": "edf1c6ab9900d75b91738fc7e9e3db8cdde3f9ef2234ff249833b5cdb04c65a2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.01021-of-01024.json.gz": {"num_bytes": 318134525, "checksum": "1c5e670ec9d815637e9bdbd75289c7ef7f3ecf384e32f403ae8a9fe2595cc983"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.01022-of-01024.json.gz": {"num_bytes": 319809162, "checksum": "9def881764ca614c88ceabb41032d3e145f06c843a7ceebd87dba6b93c974a6e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.01023-of-01024.json.gz": {"num_bytes": 318155801, "checksum": "552a6a2be423c0ecbb767611074200c5b85c1cf76c8640c79e3be5e967b293b5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-validation.00000-of-00008.json.gz": {"num_bytes": 40471190, "checksum": "1f25b6af12da84115301d4ee93ea5246c8fea5bb4a2008472794d95b917cc97f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-validation.00001-of-00008.json.gz": {"num_bytes": 40675053, "checksum": "db4c23d7a336032de37dfe2f3ed39653c8afd94004d4e8d9c73c03222299292c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-validation.00002-of-00008.json.gz": {"num_bytes": 41175078, "checksum": "4bf6b248b0f910dcde2cdf2118d6369d8208c8f9515ec29ab73e531f380b18e2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-validation.00003-of-00008.json.gz": {"num_bytes": 40728516, "checksum": "082b72c1ec600502df2e4403df6884390c85627ffdf37a5b700397c9a1ac6b8e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-validation.00004-of-00008.json.gz": {"num_bytes": 40920200, "checksum": "37c2ce46864db0b6f1fe89220ebf4ef811ea10485c8336f1712227bbbdb530e1"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-validation.00005-of-00008.json.gz": {"num_bytes": 40921460, "checksum": "00b164e59df49df5dc1df170db99bb0d9207a6329cb9272ed8b6ef7a55058359"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-validation.00006-of-00008.json.gz": {"num_bytes": 40549809, "checksum": "86896a9baffe0ab9df39a2901f0e515009989ca1fec9a42583d718ce16166b5a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-validation.00007-of-00008.json.gz": {"num_bytes": 40446172, "checksum": "0bf87534c7050091c60466df50f174c3147d052ec7dc645da9574c902445beaf"}}, "download_size": 327104523018, "post_processing_size": null, "dataset_size": 1658004128680, "size_in_bytes": 1985108651698}, "en.noblocklist": {"description": "A colossal, cleaned version of Common Crawl's web crawl corpus.\n\nBased on Common Crawl dataset: \"https://commoncrawl.org\".\n\nThis is the processed version of Google's C4 dataset by AllenAI.\n\n", "citation": "\n@article{2019t5,\n author = {Colin Raffel and Noam Shazeer and Adam Roberts and Katherine Lee and Sharan Narang and Michael Matena and Yanqi Zhou and Wei Li and Peter J. Liu},\n title = {Exploring the Limits of Transfer Learning with a Unified Text-to-Text Transformer},\n journal = {arXiv e-prints},\n year = {2019},\n archivePrefix = {arXiv},\n eprint = {1910.10683},\n}\n", "homepage": "https://github.com/allenai/allennlp/discussions/5056", "license": "", "features": {"text": {"dtype": "string", "id": null, "_type": "Value"}, "timestamp": {"dtype": "string", "id": null, "_type": "Value"}, "url": {"dtype": "string", "id": null, "_type": "Value"}}, "post_processed": null, "supervised_keys": null, "task_templates": null, "builder_name": "c4", "config_name": "en.noblocklist", "version": {"version_str": "0.0.0", "description": null, "major": 0, "minor": 0, "patch": 0}, "splits": {"train": {"name": "train", "num_bytes": 1029628201361, "num_examples": 393391519, "dataset_name": "c4"}, "validation": {"name": "validation", "num_bytes": 1025606012, "num_examples": 393226, "dataset_name": "c4"}}, "download_checksums": {"https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00000-of-01024.json.gz": {"num_bytes": 396728190, "checksum": "06fcf4d9bf6ae45fac94245952f000c924d2a0b5cc8841c916b3ee949333410d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00001-of-01024.json.gz": {"num_bytes": 395686133, "checksum": "8a0b64c5efb1db1ebcc0a664c801221049f5812652dc1a727a0e9f8d0df0cd0e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00002-of-01024.json.gz": {"num_bytes": 397762165, "checksum": "087fabf9563297a6eab8bc39b68c0c6d15169032001d3a17c9bd964080759f2c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00003-of-01024.json.gz": {"num_bytes": 395307518, "checksum": "1e5b89200528320e354f60be0868a3ab6dbbe667a6b16b48e4739b988a6360e8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00004-of-01024.json.gz": {"num_bytes": 396280504, "checksum": "8291badbe84854960c0ddac3d6c226cb519268d1b3fd267bd72cfb4f10800de1"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00005-of-01024.json.gz": {"num_bytes": 396636600, "checksum": "c74226ceada7d78e3e7a2ad931d0a99df93f4cc4377ec69d4f1fab4164c3d845"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00006-of-01024.json.gz": {"num_bytes": 395364336, "checksum": "4e52e99dfc4e55c41226978b4dbf48fac2f886b9b0446bc3bd576f32bdd7cfea"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00007-of-01024.json.gz": {"num_bytes": 396428805, "checksum": "283ae93ecc3f8daefa9c47651ded763dc5f339ddc619c8cb5e32dce9cb9cfe4c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00008-of-01024.json.gz": {"num_bytes": 395030041, "checksum": "d3fc7fffdf9c2172d233bea3bb7dc485d753319e6196672d0186b8ba04a1d903"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00009-of-01024.json.gz": {"num_bytes": 398255693, "checksum": "61e10cef5c2cab162fb1d26f97fd9d76b30c9ee989c01ef8597d2a4e35b303da"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00010-of-01024.json.gz": {"num_bytes": 397825333, "checksum": "f72040887c2a2c17564c2c6a9a4b5ff95fce6a0eed4f0800cdeff8277af651ff"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00011-of-01024.json.gz": {"num_bytes": 397877458, "checksum": "ee34ff11164e10a86f76593205cb13986c70ea3d3a8849174a6dfb5b4ec91262"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00012-of-01024.json.gz": {"num_bytes": 398317059, "checksum": "7a3ef558efaca3e5d19e9ad02b47dd61f9639dd806130b62d66e9c3341c0edce"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00013-of-01024.json.gz": {"num_bytes": 398518794, "checksum": "f5a6c18992ab2b59a9c02469d20768bf5757624e03bcaf92957ce736a3a9edb5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00014-of-01024.json.gz": {"num_bytes": 397026214, "checksum": "c174b625c1534c69814f8e4879169b58af96f801dbb433113740af0d78535abd"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00015-of-01024.json.gz": {"num_bytes": 395621683, "checksum": "4e8e52a602d4eb4b27104780f4a36617505505fb66a82f36e90631a4e668f5b9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00016-of-01024.json.gz": {"num_bytes": 398138551, "checksum": "a3e7a95b16f09e09e45f1c3bed3524415581e21b065d8efcc66cece705dee4d2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00017-of-01024.json.gz": {"num_bytes": 398720813, "checksum": "79cdb89052e8dcecd1f1319e47f4c4ae1d350ab81777a9ba8077cebdb558e795"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00018-of-01024.json.gz": {"num_bytes": 398538940, "checksum": "8da6aac3a794ce326b5a3971fb75a2ee848f008940d4f1bedd724ce7c5874278"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00019-of-01024.json.gz": {"num_bytes": 396834319, "checksum": "b57c93502949dad9001e89847947f6c65943927eb519e16de4eaf5590b235faa"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00020-of-01024.json.gz": {"num_bytes": 396402861, "checksum": "05e14c7e21df3d4af7be7a597fa22463868464d6475282376536e12e82367401"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00021-of-01024.json.gz": {"num_bytes": 397560852, "checksum": "756d15d8b07414dffd7cff3efde606aa62cf8f73b85d8e1cd17408d6a339414b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00022-of-01024.json.gz": {"num_bytes": 397210987, "checksum": "60aa08d9c5d813d5f2448d910bc23a705cdd0828a9403c18ec223e53623889cb"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00023-of-01024.json.gz": {"num_bytes": 397563062, "checksum": "bd865213ffb2b40c2cd3eb16724b68c0f37e29f68215990dc84d91852c7c0d72"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00024-of-01024.json.gz": {"num_bytes": 395799120, "checksum": "08ff3615ecea3eb5b55703e123475c95afbecfe7107eedf05750147c9ffd12ef"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00025-of-01024.json.gz": {"num_bytes": 398336372, "checksum": "e3e30b97e585fd881b3a1b006775854a11a2b967d992e7eea886338d8beefb13"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00026-of-01024.json.gz": {"num_bytes": 396819084, "checksum": "fddc9e1a8405c5e05e63ce98b19c7833c0fd46392b4b55532b317e7f81426590"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00027-of-01024.json.gz": {"num_bytes": 397912380, "checksum": "d3e597b3a96b993840e47adb761cce2f2ae1c96aefcbd6c250198dedaecde15a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00028-of-01024.json.gz": {"num_bytes": 399078461, "checksum": "abd6d2341b6c61cdb89b80a8b9bfd938bb6d8a423a89e6a9f997c22c6479d537"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00029-of-01024.json.gz": {"num_bytes": 397303107, "checksum": "ee35a3af1056cdab79b644f6352150aeb6fb19a630cd6bc893a072e35fbfbad2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00030-of-01024.json.gz": {"num_bytes": 396602401, "checksum": "1d04d4bc295aee2ab80b24f587f8c483599db7d5a8157acc99a1d8b001f8353e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00031-of-01024.json.gz": {"num_bytes": 395941329, "checksum": "cf1dd244555511245c0e6a5b1dc9c24f747b8377674aa3690677ce08ebb8c26f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00032-of-01024.json.gz": {"num_bytes": 398049663, "checksum": "c83e5572647eba5ab14fdc4dcba8efb6981740b99b8f634e2c6b1942a051c249"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00033-of-01024.json.gz": {"num_bytes": 398044404, "checksum": "b76815aadcf4ad802071428864ce0b406cabd73dfc2be5e20b44885ec6a85419"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00034-of-01024.json.gz": {"num_bytes": 396885224, "checksum": "da00d92418fbdb9799d8f16977b3a33f67cb98a31808544cb68cf3b42ea9adf1"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00035-of-01024.json.gz": {"num_bytes": 396185021, "checksum": "265ad43ce00666c83fd441d35ff29ba1ebf7d62442cc3e3c176091b4c725ea9d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00036-of-01024.json.gz": {"num_bytes": 396702503, "checksum": "4733156df48f2dd0f2e859fef28f56d12a84e8012085ca9318073ae647b0fcdc"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00037-of-01024.json.gz": {"num_bytes": 397582277, "checksum": "7d62d03c3496ee2e17ab6b9635710efef9e4cefb88ddccdc16ed720a414c38c2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00038-of-01024.json.gz": {"num_bytes": 396186761, "checksum": "670affddf8fcca6933af3f5b30efd1bf490c3e38c3e90f2e8e9a464994d613f1"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00039-of-01024.json.gz": {"num_bytes": 397056953, "checksum": "4acbd97f9c8fd9a930a6f4284a11cfe37f6cca3b5858ae3c2cde747dae35e0d2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00040-of-01024.json.gz": {"num_bytes": 397809786, "checksum": "d350e48a36bb1ba3125f72a07ed8024d26eae6d89ecac686ac0bdf3d5d89e1a7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00041-of-01024.json.gz": {"num_bytes": 396944358, "checksum": "817a58dc40440b8b1f54d129db08ae9124e0293e5a0e45f034fbffb2140d90c0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00042-of-01024.json.gz": {"num_bytes": 394327995, "checksum": "6bd6bc1269c2dd81db466ae9c41f76b8b8cf71cc7bd6e131452fa1a1318ff459"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00043-of-01024.json.gz": {"num_bytes": 396476043, "checksum": "f3525d9c861d984ea0cdacba7fddffaef058d8f95aa99ef1f09f9f0792fde5e3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00044-of-01024.json.gz": {"num_bytes": 396893614, "checksum": "292ca2b6b9ba41567fe7cc60e5424aa1f3e431ac874d06ae8eb98794563a7d35"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00045-of-01024.json.gz": {"num_bytes": 395885483, "checksum": "ea2c8fac41ededba7da8bf2bb48463d83f148e5c0970a689876d4932ab18a3c7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00046-of-01024.json.gz": {"num_bytes": 396963386, "checksum": "97672d9bca357cd2721f51301aa37d37a271dd3ca7487244c057570b995da66d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00047-of-01024.json.gz": {"num_bytes": 395856712, "checksum": "52c517670ba4eefb262cb71373d6370f86ddeb0aea7391a47a22d52a55bff7a8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00048-of-01024.json.gz": {"num_bytes": 396091027, "checksum": "49f5b68e29c55eb50da941eab1cf446c7d8c9d0b30290318977edb39ef0b887f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00049-of-01024.json.gz": {"num_bytes": 396892998, "checksum": "82a51eb6f301c00d927ca7920338247038cf4e9e0072d74c02bac897701f5859"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00050-of-01024.json.gz": {"num_bytes": 396308050, "checksum": "d72f92ecd27b716cd90cc4abe562d25fe6d49740b4a3d1fb9beac2526a61988e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00051-of-01024.json.gz": {"num_bytes": 396137777, "checksum": "a956e4d086077f7ab309ff10b0eaf4833e4d3ed74435293e96588f4361e1536d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00052-of-01024.json.gz": {"num_bytes": 398302544, "checksum": "5a54f7faa07661ea6a5f0585ca49ad66c8f7025fd9627b3af832dc886d50f78e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00053-of-01024.json.gz": {"num_bytes": 399616791, "checksum": "7f8fa496d50a0b7c399faff4c1864e24717b3f9c86b2552536c8f91e3e0cf9d6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00054-of-01024.json.gz": {"num_bytes": 397332881, "checksum": "ab862f26b4fa38b6c16d8cfd0d63a9f0973827e45915e85aefb95d4e182b7b9c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00055-of-01024.json.gz": {"num_bytes": 397075146, "checksum": "cb67aa9229bec8b88e496829aa0a60ca1c3ff4a2293632cf7782b69aa71aebfd"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00056-of-01024.json.gz": {"num_bytes": 397827600, "checksum": "2f63e3ec40d32237d4a50c873b966d7fc2c16ef5c04a2bcfc33328b128654e7c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00057-of-01024.json.gz": {"num_bytes": 397533583, "checksum": "7c90bf39bddf8ad0c6a8bb3dff02caea8bbc2abbd76047c5d523930d2a00dbc9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00058-of-01024.json.gz": {"num_bytes": 396411363, "checksum": "ee6059f3c8a2df34858a0110a06ec4e9673555fa56c1a2b40930337ba5b1b39c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00059-of-01024.json.gz": {"num_bytes": 396735510, "checksum": "d9dbe2421edba1820294e757d88aa25455db42ce8992f8933b51cd84cfc35a36"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00060-of-01024.json.gz": {"num_bytes": 395694553, "checksum": "b05d6502fc95587fa7047fac64978d6be13761dcc6954629332812e5937c2731"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00061-of-01024.json.gz": {"num_bytes": 397740757, "checksum": "39303faa5dc33995dfec683b44fc24066ecccdf6b5001b9c0644d8e9899d45f5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00062-of-01024.json.gz": {"num_bytes": 397358263, "checksum": "fe27dd467cc2c34abe5b0bb34473ee68859f2198eeb78304e1d2e54460a67383"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00063-of-01024.json.gz": {"num_bytes": 396826654, "checksum": "1da2c414bd03e5547d8c9c7447e42b8dcff5f6ca8ba35c53076f2895e8ea63f6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00064-of-01024.json.gz": {"num_bytes": 395781869, "checksum": "af96de4d6b5bc1ab0527efa33a73d7eb788dca15829acbb7291ce72ad05e6c66"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00065-of-01024.json.gz": {"num_bytes": 398192274, "checksum": "7f46ccfc1703fee106e932bc9a1bc5dedf7de944172cfa34ec9b31413bf0bbda"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00066-of-01024.json.gz": {"num_bytes": 397133438, "checksum": "dd3b67d8578927d7474dae76bdca35f35a2aa125fc50873e4a9f6e73d7a81831"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00067-of-01024.json.gz": {"num_bytes": 397204214, "checksum": "4cdc87a7c9fea33e15d638e5c921f45149212769bfba5f59f0a5943398ca0d55"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00068-of-01024.json.gz": {"num_bytes": 396489592, "checksum": "64d175c23574998f8c5d28ce3d3f3934144b1fd4f6527ede1aa3420c28bb90d0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00069-of-01024.json.gz": {"num_bytes": 397697351, "checksum": "3329857f531c9fa22d98bd567638f0564f73062da1478ca84385246f71baabff"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00070-of-01024.json.gz": {"num_bytes": 398449973, "checksum": "bd13494aa03a95d943a01f3436f62c46ee3390b30f6ff0fec0636f3c0b09fa1b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00071-of-01024.json.gz": {"num_bytes": 395498960, "checksum": "5e69529ae82c305acbf1f58a7021b4e3fc67285a871dcbcaaff0781d0e721070"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00072-of-01024.json.gz": {"num_bytes": 396170387, "checksum": "9b9c7e11b9bb2cf6ea0fcdfd58754f522a95070feae74c29559522e12e1b41f4"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00073-of-01024.json.gz": {"num_bytes": 395915819, "checksum": "87a2069589fee8de23730b8b994ba59d63d5128175b5326ba0a8c8ac9e01a3dd"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00074-of-01024.json.gz": {"num_bytes": 396986018, "checksum": "e073efb3f00db65c1ee14e8bfa6e8c807f7827d0f3dd4d4026f823bc6f61b1cc"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00075-of-01024.json.gz": {"num_bytes": 398555103, "checksum": "a1793748c7979e241ca34291c843ca3cc90dd7643f04810b6cd324220efbd6e7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00076-of-01024.json.gz": {"num_bytes": 396357420, "checksum": "7b1cd69788ca9a7e614de70a8b908183f41f316eaadf3b0236a7c4e126db9844"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00077-of-01024.json.gz": {"num_bytes": 396666167, "checksum": "aec828d3c2a1f7fa970de328a8fd1a85a90493dbcbec4f50816ccbc2275a1fac"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00078-of-01024.json.gz": {"num_bytes": 398167446, "checksum": "e14bdf5af810574aca7c6f3daa67e503f24ab1705435a62129c66c248667ee97"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00079-of-01024.json.gz": {"num_bytes": 399696096, "checksum": "b63756f81b8b19ecdc9bf227045df10840cbf973b60bd8ffdf28f58a53cdb028"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00080-of-01024.json.gz": {"num_bytes": 398755610, "checksum": "dfc118f680b79260e7ece75f27c0459484eb8458f2422df9f1918f726b54ccb6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00081-of-01024.json.gz": {"num_bytes": 396606787, "checksum": "17d6a503947f5132728f53ea62fd093f55bf2dc6a32316a5c0413353cf13eff3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00082-of-01024.json.gz": {"num_bytes": 395714484, "checksum": "8ca41818ee6a0ffd5b00714779289c18cd97d620258c5d3d741c482b72344300"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00083-of-01024.json.gz": {"num_bytes": 396807173, "checksum": "12d87c0a948f32f788497858751c3ef22f289136e6ae58518a97a2e976f5cdc8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00084-of-01024.json.gz": {"num_bytes": 397241529, "checksum": "7c3da4ca4d2b2077f0ab7be511038255732fc88d954f2f17cb0f3ab144216206"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00085-of-01024.json.gz": {"num_bytes": 398357369, "checksum": "26df55183e78f8d69fb16e21d07edf98659b69bcb3c48f340da6a5bc44007f4d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00086-of-01024.json.gz": {"num_bytes": 396997317, "checksum": "09f0641e9075cb88800d0eaae3f7b99b047552edbc71d1fd2d8594f645d22c2a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00087-of-01024.json.gz": {"num_bytes": 397978000, "checksum": "c9437ef5f58a46b8a6d8efcae37fa658da3f2c4f1cad0f9cf47fbcd09bb82f8c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00088-of-01024.json.gz": {"num_bytes": 398468913, "checksum": "be187fc14017f666b84ed7049c169c1a28654441c2f523eee8b655b3b9d9ba8e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00089-of-01024.json.gz": {"num_bytes": 397071121, "checksum": "637c3f964ee2c750a0a175f2e5d24b786a37d37701f10616b448804d68b72f4e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00090-of-01024.json.gz": {"num_bytes": 395753807, "checksum": "8eef7ff1a8080aebe5226cc3539baac46ab64d93f8e3ffb6e8b7ab3346e151dc"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00091-of-01024.json.gz": {"num_bytes": 397039764, "checksum": "a2904ae5bf69b393a697afd62ae9b8a560c1f076e8a141e6f3feef29cb5d1352"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00092-of-01024.json.gz": {"num_bytes": 397058578, "checksum": "eb4d7e2712a9983bc1581133fa8eaa2e1d28b314861833bd8d810d615ec1ed81"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00093-of-01024.json.gz": {"num_bytes": 395855981, "checksum": "5c9a7573a5644d89d46666306d333ff1e4af3213f287cb9adb48ef87a023d479"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00094-of-01024.json.gz": {"num_bytes": 399516118, "checksum": "de7ae1508815e48ba031762c084cf6946b084871463821407090d23c197c6474"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00095-of-01024.json.gz": {"num_bytes": 398236235, "checksum": "616cef1f21ef078ffb9fc2b4148735668debdd15a8bc1be281183ba3659e9fcd"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00096-of-01024.json.gz": {"num_bytes": 399526010, "checksum": "eb754381b8a6f3c74dda5ee5852958f7b69c707a3908cbaa9410c972e002a0cb"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00097-of-01024.json.gz": {"num_bytes": 397935028, "checksum": "6d6d2ca80708b7c6ad4240a042dddc2170060e8976c2e7b4ace446d2f2395076"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00098-of-01024.json.gz": {"num_bytes": 398645934, "checksum": "568db6971230fb42df8973ecb5a2a6d77204aa8cf0bdf47b386c04370da8dfd1"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00099-of-01024.json.gz": {"num_bytes": 398110916, "checksum": "9bacb381e3b06976619e816e40ac2ccd3bcf3cb9ecd30c294b388cfb75c8bf77"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00100-of-01024.json.gz": {"num_bytes": 397631228, "checksum": "7d515ac0f767736600a216ebe7280b9751f16e70df969ba601d1aaae15f201e5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00101-of-01024.json.gz": {"num_bytes": 395102356, "checksum": "87c5c81e154e136f3e090ba91682ad54fe678653f86f6f32002ae5ec3c9aa743"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00102-of-01024.json.gz": {"num_bytes": 398926159, "checksum": "2df85a9ac13812c3870180901dbba99b52e53fc045da019160a3f06d0dfa5e95"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00103-of-01024.json.gz": {"num_bytes": 398383820, "checksum": "8134d12e84ed4a58a5f8f6eff8a4349f7d6ded6a1d7539b5c23193571569d6c7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00104-of-01024.json.gz": {"num_bytes": 396628542, "checksum": "208f0cb3365b0243d70e7b4e52ff977e9b11d8e451adea521a5bf6e10cd40ee0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00105-of-01024.json.gz": {"num_bytes": 398737797, "checksum": "855ac7b8cb621a240319ef00197d2f20338d17db71a1aec68fb66930bc17c59c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00106-of-01024.json.gz": {"num_bytes": 397281064, "checksum": "544d5d91d066f2450bfe622ce55bdfe16a300aee9c05aaffae8a645966bc695e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00107-of-01024.json.gz": {"num_bytes": 397919761, "checksum": "f4af405c0f19c9139d93b3073f3fe328be998c9dc6f74afc7e21ad068964b92c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00108-of-01024.json.gz": {"num_bytes": 398810219, "checksum": "bdfce29353c6caa33b178bdebbf7e48526c391bc6c71180e3fa378b723879563"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00109-of-01024.json.gz": {"num_bytes": 396605124, "checksum": "ed6acc172bc9af0e31170f5533001a8fcd344e6732a4b3a714b7ad43740f25f4"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00110-of-01024.json.gz": {"num_bytes": 397491755, "checksum": "428b6c91f12c4f7032fa692bbe887f1a4c02635eb88b91d876da4c71f3da5e4e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00111-of-01024.json.gz": {"num_bytes": 395754897, "checksum": "a723863559edf291fd8a6c2736cc1cefed70dd3c8625b967df049ce0d373f68a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00112-of-01024.json.gz": {"num_bytes": 398567649, "checksum": "a90ddc9ccfbca20b9c75bd2b7d63ee6abd03236a0f0dd2827eb9f7350d9c3931"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00113-of-01024.json.gz": {"num_bytes": 396706569, "checksum": "479052b6b9edcc2bbda40b982976e7e28d84fad7b2dce46b017f4e3d1f61e0d2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00114-of-01024.json.gz": {"num_bytes": 397384355, "checksum": "a95984e4c261a3057d1bc51939aefd9413853111e19030b19c5d26f778be00ba"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00115-of-01024.json.gz": {"num_bytes": 397702826, "checksum": "5eaf7fc2c9d4b2ee3e216c215da7f4fc7558e89d6993033b95a940a78061ab05"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00116-of-01024.json.gz": {"num_bytes": 397252590, "checksum": "268033cbbdf3be9790cb6010791693f1b490af06f9fef91b0b307420a4e30a08"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00117-of-01024.json.gz": {"num_bytes": 395506730, "checksum": "cb80908eee1054ddaf7e2e5d66c9a41505025c2b6dc7fe6aa287db0a9f3829ff"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00118-of-01024.json.gz": {"num_bytes": 396452136, "checksum": "d75bf895c88ff2e9c4031c1f65b067222cfbb1a937d685ab4dd33369f5f5ff7b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00119-of-01024.json.gz": {"num_bytes": 396777389, "checksum": "2c00362f4d99cef2bae2f13f17b79ec56a5ef8aca18ffd56a12fea2308e5017b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00120-of-01024.json.gz": {"num_bytes": 397730478, "checksum": "e31296949f7ce2e2a74fd2443552cb64b9f3cddcca691097a56992f51033fd11"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00121-of-01024.json.gz": {"num_bytes": 396593647, "checksum": "c2f0f81e3c835848a47532d8fd1c215a624f47740196a7bb45b5099916853014"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00122-of-01024.json.gz": {"num_bytes": 396576172, "checksum": "72edb7581a623e20f26cae4885f3b9d7f329581921253ca4d7ceedfbca17b7b9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00123-of-01024.json.gz": {"num_bytes": 397378329, "checksum": "4f045ce7bd077b7f878012aead8c51073022448de66d2e35a755d4c8c4a6f59d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00124-of-01024.json.gz": {"num_bytes": 396545003, "checksum": "dc7949657328520d31a27d8e267c2ab07cd4e8639036d4b1bb59454c309f862d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00125-of-01024.json.gz": {"num_bytes": 397630505, "checksum": "530bd95e5ef9a1d5989c595e60e0ab11583e0f42d16b2bd37c49ed09a67af207"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00126-of-01024.json.gz": {"num_bytes": 395483747, "checksum": "d9df071edec6959ba842509f72ad43be3ea3f529b60d48f3dfbf390908887a5f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00127-of-01024.json.gz": {"num_bytes": 397295159, "checksum": "02b61f5bc7d1d241484c4f04fd517960ae755a69f35192bdd5bb471baeba5614"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00128-of-01024.json.gz": {"num_bytes": 396276865, "checksum": "0c7d618df232c36ba018269ddf3b2863cd6d63bb7fabeaae33fd508715bd8ce2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00129-of-01024.json.gz": {"num_bytes": 395314703, "checksum": "03443afda032187d2dc2e696ce6eaecbf2219e6dabbdd593379e97c0e00e3112"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00130-of-01024.json.gz": {"num_bytes": 397411481, "checksum": "8969873d5efd3df0cef1742e4bc67f2df7a5b5d9e641f7a12e77c7e8e96a1bf1"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00131-of-01024.json.gz": {"num_bytes": 396925311, "checksum": "31adc39ea4eda8667662608bdad6bb32bbc82b1ee1ad53ceb4df50924a933bdf"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00132-of-01024.json.gz": {"num_bytes": 395826124, "checksum": "d2f035ba2c388fec2d847bd43449c885eadd0bcab5fb8afdf031a53e72c4ec32"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00133-of-01024.json.gz": {"num_bytes": 398892794, "checksum": "b7ed60983058a5f9f0ef72602789f50359f415ecbe60dc967e7a869866d833b6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00134-of-01024.json.gz": {"num_bytes": 398206890, "checksum": "9ba78624879aabb72bae0b4119fa2625793915382031ed897a0b4c3f2863b8aa"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00135-of-01024.json.gz": {"num_bytes": 397161888, "checksum": "9fa6fee55f5e8f887dcc64d94cc65ada6f283a580edc7926cb159b80d0084ea8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00136-of-01024.json.gz": {"num_bytes": 396185585, "checksum": "81a1fcafcedfdd9bcb32d2467d9c963cc7d8b2f32e13e52ee04db41b0d3f5483"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00137-of-01024.json.gz": {"num_bytes": 396933735, "checksum": "c7558304b614e1cff13b0f6e967fc5ef77e4953a1eea1f39ed925c33076d7723"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00138-of-01024.json.gz": {"num_bytes": 396371698, "checksum": "3e896da8bf296403f7b4061ba0b24d3c3978993de4854fabd688cfce9fbf7bba"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00139-of-01024.json.gz": {"num_bytes": 397289537, "checksum": "1a5ffa3aaf565ccf4db7444983643ad06e386938a0a2d313aecdb972c36111e4"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00140-of-01024.json.gz": {"num_bytes": 396983259, "checksum": "4047916916fd9dd7b76a8cbc595d52803344467135f744b23bd10296004a47d7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00141-of-01024.json.gz": {"num_bytes": 394947050, "checksum": "7edfc9e5870d80d470e3797e8bef5183e9d170eab410ab50957e946dde2e8199"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00142-of-01024.json.gz": {"num_bytes": 396852755, "checksum": "4affc3a24616858fab84211e3825e90a1ea7d9c8f2cfabbe9a5c9b24c21a116b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00143-of-01024.json.gz": {"num_bytes": 397579248, "checksum": "d5aa9ba68e9b30576bd640f647d4069b6c56db276cc5229573440e4a38a7f1e9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00144-of-01024.json.gz": {"num_bytes": 398800367, "checksum": "fa104e63eb7a8a6b066a5f00bf05b3ea095bad35a902bc728251f096173f1417"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00145-of-01024.json.gz": {"num_bytes": 396709510, "checksum": "b615ecd58821b1697c82094cb3435375924263827c342ab1b87e53907d4aa63b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00146-of-01024.json.gz": {"num_bytes": 396042389, "checksum": "6004c782f3235490865b6634b2c4840a989745b70ef2da674e75c62aeedf8a6f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00147-of-01024.json.gz": {"num_bytes": 399840661, "checksum": "5e8b46726f7ff2c3dfd381fb252f1b4bddf9436fd9ffd10fa300cb0fbe76998c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00148-of-01024.json.gz": {"num_bytes": 397098215, "checksum": "0851cb274aff2ec4f781c82af11c94f8938a797aca5097fb0089299cb4c75aff"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00149-of-01024.json.gz": {"num_bytes": 397540697, "checksum": "7cadf4ef9b0e29d9e8f68474464dc072b78e909a0f03c74e61b67912ff9b551d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00150-of-01024.json.gz": {"num_bytes": 396347701, "checksum": "521e4f67d12ae47b8f2a02b6f77e0c85cdf9a0efbcb45602d09ae116110ebe66"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00151-of-01024.json.gz": {"num_bytes": 394890490, "checksum": "2255bf3e1940ea28da9656028dee26865a9ee682cbaab4d5aeb34c081062f8fe"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00152-of-01024.json.gz": {"num_bytes": 399584675, "checksum": "f8ca4aaf5706ffb0f5518c7461d9045d18c645df068aa436137299e5ca77df82"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00153-of-01024.json.gz": {"num_bytes": 395606567, "checksum": "24f0e81dc3140f063ac89173fc262b01f2420133025b114f29632262cdd2e7fa"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00154-of-01024.json.gz": {"num_bytes": 397925578, "checksum": "5f40a87b15b0acebbd324e7c5cd2c0f31f911558d57f774f278634db94f2d5f7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00155-of-01024.json.gz": {"num_bytes": 395428741, "checksum": "36281c154f187a09a83822878da815cd9b7f659a41cd90ac64653b437e798c72"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00156-of-01024.json.gz": {"num_bytes": 396799274, "checksum": "0fb66965107e54c9fed0013962763e874b940b0e174d775b21fa5e688fa53b33"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00157-of-01024.json.gz": {"num_bytes": 397321211, "checksum": "014d1443a4940fe95089bf87e245817d3a90c50e3e371a703098f5b9c3f6c759"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00158-of-01024.json.gz": {"num_bytes": 398736992, "checksum": "f912d27d68318fc0089fbaf8e0481ebe8dc5d2963cb89ed315f3bec637460bfc"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00159-of-01024.json.gz": {"num_bytes": 397250687, "checksum": "1bfd02a301b09bfd53058522d0613e1fbecb788d3173eb30b58115cd1cbdb477"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00160-of-01024.json.gz": {"num_bytes": 397492158, "checksum": "149a7bd76e9ea41185d99d21df870ddd4f32857fdd628cee927d6bee7d6a527d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00161-of-01024.json.gz": {"num_bytes": 398383574, "checksum": "0c385b4c9b33574cdc75070309a0aed46aa7b2e3b8754a7692035a3c5a04f916"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00162-of-01024.json.gz": {"num_bytes": 397126197, "checksum": "5c012b2a6bbc9413914ed1420b6150a5549cd74185bf2788d8809005034d433f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00163-of-01024.json.gz": {"num_bytes": 398201223, "checksum": "79448c338e86cea2609399705268fc6011cb21c4f0aff82e3fb7660391ce85c4"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00164-of-01024.json.gz": {"num_bytes": 397914908, "checksum": "dfb89631dce146ab4713a03f184e864472eb133b2cd04db8b4bccab688e9e287"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00165-of-01024.json.gz": {"num_bytes": 398142696, "checksum": "74acc88d6612aae7bdf5187d3b9eddcdb04cf60f1cc350661ffa50219a747f9f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00166-of-01024.json.gz": {"num_bytes": 397533050, "checksum": "757d23402b3a155cfcb6b30bdc305c8014c9b64ba4e067753664670c2c5e9534"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00167-of-01024.json.gz": {"num_bytes": 396241119, "checksum": "521bd7a9dcfa0390c35e50a3d0cde3ea627ca538dfc419a97ed83b251d8a3005"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00168-of-01024.json.gz": {"num_bytes": 396041761, "checksum": "dc540ec27d5999f6a4c71f075ae1ec64ea84415c720cd2b6ef3fdac925e576da"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00169-of-01024.json.gz": {"num_bytes": 396350882, "checksum": "36d5d35075a82038dfdd5abd29a839f4e9ab79d51f0bbc635d3dcf3f5f1e2732"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00170-of-01024.json.gz": {"num_bytes": 396885157, "checksum": "db9a3f6a7e085007eee381357ea9e4d5d6f702580d38220860967ec441ba3525"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00171-of-01024.json.gz": {"num_bytes": 397266368, "checksum": "7f8098cb6532bc888d3c1f0ea5072cf8419ce1689b9ffe1c370ca20071e7e1c2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00172-of-01024.json.gz": {"num_bytes": 397140430, "checksum": "90ae7e2551b1f3bf2e5ccf4fb3fac8fa3512add5e299ba7c90319611baf8c840"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00173-of-01024.json.gz": {"num_bytes": 397069631, "checksum": "a86f5ab72e1a9b1d491988154fd6400e6ee8c74378a9e64276df438a3c4edf9f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00174-of-01024.json.gz": {"num_bytes": 396743897, "checksum": "451cfe8e14c17113a2f6673ece27e01f8d54bed1b57d1b20cb84f125879939ec"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00175-of-01024.json.gz": {"num_bytes": 395780705, "checksum": "3252e9781545bc3f9f19ac6e8fdb87d81cdc5a94838798daf6037c9f4f473db4"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00176-of-01024.json.gz": {"num_bytes": 396205053, "checksum": "49d1648d37150b90632a6459828eedd82deb2fce7f108bf4e1b050f2f9ad1668"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00177-of-01024.json.gz": {"num_bytes": 396248718, "checksum": "99346ccda762ae85038a10baba937ef8ef668a0beab483c4005dce77e331768b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00178-of-01024.json.gz": {"num_bytes": 396634813, "checksum": "8d3bb1610ce79cf359d75f32e7624b6203140ed3eb276362b040615e9ffd4b54"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00179-of-01024.json.gz": {"num_bytes": 396524113, "checksum": "971e5c9499425294cf5945436b2ee419379a75bdd72d4cd6a33b1d17c17de298"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00180-of-01024.json.gz": {"num_bytes": 397938782, "checksum": "dd6b3e60219788b82ab3fc63a9e65f38f64aa2f7b294135ec2d16b36350f1f40"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00181-of-01024.json.gz": {"num_bytes": 399155769, "checksum": "c6a806d627a9d197789bfc6257a92b0223ca51e724c3c2ad10fe2397dbe30848"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00182-of-01024.json.gz": {"num_bytes": 396136228, "checksum": "2c48e3237253eaad9afc121e6946a9e1856bbe82c5a7cb287b05cff3e6ea8e8d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00183-of-01024.json.gz": {"num_bytes": 397083292, "checksum": "52645e03ab47da01bb40226eb90042be914f1170688ae940314871e16cbb1037"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00184-of-01024.json.gz": {"num_bytes": 397402964, "checksum": "1edbdb41edeabc108f0147e18b439a75e390e0a843ed915f1cbf73a7c7f7867d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00185-of-01024.json.gz": {"num_bytes": 398411052, "checksum": "ef071e52174a19597e567696262470906275c2cd1cbbb0b1e98864999ea2d463"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00186-of-01024.json.gz": {"num_bytes": 397122443, "checksum": "0d87080bc08f7f8a1952a7df57ce2bdbf61e40c05b61937c8c19ae0ecd952b1b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00187-of-01024.json.gz": {"num_bytes": 397244868, "checksum": "4aed75ea9f885fc3dab599c19c7bb98f7d57ce2b2ec11ac8ab3258fa479fc0db"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00188-of-01024.json.gz": {"num_bytes": 395677432, "checksum": "342882e436ea826cda9fd38c0caca68bb35444a2a07596f8de0e53a3e2169f59"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00189-of-01024.json.gz": {"num_bytes": 393653750, "checksum": "22ed9e389f6c8410c9bde898d97ad798c236c2da4d0b2c76b86d013f8686da03"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00190-of-01024.json.gz": {"num_bytes": 395437920, "checksum": "b3f9ba5834d4f0280d6defd3bd50fdf961bee6be4c71ed47046cf4e115acab01"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00191-of-01024.json.gz": {"num_bytes": 396944861, "checksum": "4e7ed636a60edc44b5ba709dcd83bf4263ad8d5a06a02827d3d27191bf3731a3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00192-of-01024.json.gz": {"num_bytes": 396611165, "checksum": "4fea34466d9b470bf0bc44455183b2c61994c4e71e4bfb684dff3b5e3870d1e4"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00193-of-01024.json.gz": {"num_bytes": 398283211, "checksum": "4c4e6d31f455831330971ed1e0c33221203401b817adbda5b53de16f8299a9ba"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00194-of-01024.json.gz": {"num_bytes": 398915952, "checksum": "dfd0b1ceb2a437da8cd38c9c791af809e94f2e36ab4399b2a45a5b916f4ccaa9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00195-of-01024.json.gz": {"num_bytes": 396352694, "checksum": "0ccd90ced34b3ff28c21d015a87eca3f31eae2bf31f11f25ac073139f9d50c22"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00196-of-01024.json.gz": {"num_bytes": 398582922, "checksum": "f22e59765cec074a0c687c500f4e6348250d0e418d12dcba211e39c133aaf290"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00197-of-01024.json.gz": {"num_bytes": 398839554, "checksum": "95fa68cd75d77a1b5bb526dd5ef16a2f04a3520604f734baeb6e2d95608b5973"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00198-of-01024.json.gz": {"num_bytes": 396202192, "checksum": "f0e6343e8105178b38f75eade6774aa6e85b62a271622fcfcbe2745f1cae11ec"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00199-of-01024.json.gz": {"num_bytes": 398029364, "checksum": "4c58736410c8d3c7174ce011e2f281cb16e4949d756ff4ace86b4a9d4795c04e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00200-of-01024.json.gz": {"num_bytes": 395867629, "checksum": "1cb798ee6609e670053987d881d130d5b73db19d9f37fecff7a6da41152aba05"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00201-of-01024.json.gz": {"num_bytes": 396858169, "checksum": "7357eb22b2aa75c55885252c62d12e08cf8f7ef285c0052cf1d706c3f0f74fef"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00202-of-01024.json.gz": {"num_bytes": 397955766, "checksum": "8901d0f27c4c11916cda7cf806cd00000771b6351954c8503bc312cca5ad3a10"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00203-of-01024.json.gz": {"num_bytes": 397737882, "checksum": "ed51917fc8936701b681cfc49ef95b2dab451ca597e76b34ba90be9405a1a0b8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00204-of-01024.json.gz": {"num_bytes": 396094006, "checksum": "88692bb8da78347cb97c0e0849d1a10a97b1686cde1f75626236b89bd507e2b0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00205-of-01024.json.gz": {"num_bytes": 399027636, "checksum": "fb17fe19d1f0fcaa43fb31a3ad9b105b3d93fa287351c7f93fb599edb7f40bc3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00206-of-01024.json.gz": {"num_bytes": 399406254, "checksum": "668d2a9927080b686a4d728236e4cfc780b262f9045dfe9575cfc48cb69d6adb"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00207-of-01024.json.gz": {"num_bytes": 396291803, "checksum": "928f451dddfe42bb2ca791dbc61c36ddc618006ef709eaccbc2beb665c8427e4"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00208-of-01024.json.gz": {"num_bytes": 397807368, "checksum": "11e8627b758588056b61d31de07c50092222013a38ba802b7a9ae34b6b8b84a6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00209-of-01024.json.gz": {"num_bytes": 398085408, "checksum": "d49d31d1719698ab7a2b9ee91d887f3192c8fc1b6108152a75b39de2a0ad25a6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00210-of-01024.json.gz": {"num_bytes": 397670254, "checksum": "049b3294c3e22e6db6c115979a4a55f0650966c600ca17250e91b241cc97bbd4"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00211-of-01024.json.gz": {"num_bytes": 399643598, "checksum": "7772f26fd90f47033670e7f1d3f6fe092116486bb9a991577f9560b54ed3832c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00212-of-01024.json.gz": {"num_bytes": 397390768, "checksum": "7a24e4a70f43f6227fe6491fcc7bb6b2a19cae203521c803bedf8882c995d7e6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00213-of-01024.json.gz": {"num_bytes": 398657925, "checksum": "21d0ee8d1a01957b56ac503aa88c6f3269b4e4692762a3f929fe0e7069be8c0a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00214-of-01024.json.gz": {"num_bytes": 398282324, "checksum": "ede2d9824d8f99dd578a36ea82caae942ebcafd99f308cf5d0ff8aa4a56f0a05"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00215-of-01024.json.gz": {"num_bytes": 399178235, "checksum": "82516fa361dec02c7ed59ea2d0510d9ee4187609b449dca649a04141b12bc037"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00216-of-01024.json.gz": {"num_bytes": 397630870, "checksum": "4a6d5e60354b7b93f005010c6fc55c0a81596e98a116cdeec99e1ab4e58fd03e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00217-of-01024.json.gz": {"num_bytes": 398628848, "checksum": "02dffb623b628a3a3ea38084fe6bb840aafab8419feed3d1f2bd3598cfa80aab"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00218-of-01024.json.gz": {"num_bytes": 395087998, "checksum": "e1e9a7ac7a922d6a9bb90f82cb48dff11ab7208dac08511e9613cd2726ca67ec"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00219-of-01024.json.gz": {"num_bytes": 397622792, "checksum": "955afc7d45a080ae137e9dc25ba3d85629a6a14c3d9bbe4065aa37d710345b7a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00220-of-01024.json.gz": {"num_bytes": 395112655, "checksum": "a3560918bec20087e9908009a362957ecb06401924789e20b36c26e363db5ae7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00221-of-01024.json.gz": {"num_bytes": 397132000, "checksum": "d8459bb5b6fb6b341b24fe517cfc5dc099765ad70c3383bae913229e06cf99e0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00222-of-01024.json.gz": {"num_bytes": 397138513, "checksum": "20d3c6219921dc9c2928d637000e488635fd9a12b5636de5a6a7e52c1b67d781"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00223-of-01024.json.gz": {"num_bytes": 397167661, "checksum": "43a18accd194646893324537991e0162f6f98a9cec5ff59fe8fb510d81d707bc"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00224-of-01024.json.gz": {"num_bytes": 397905941, "checksum": "a516485cbefdef2e31a493cd8827a5f936f10674ff3525b71d414e17f48241c3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00225-of-01024.json.gz": {"num_bytes": 397218123, "checksum": "791c85c78c5e7f3557855a1fc71acd860521710515b89f92e54e02960549f46e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00226-of-01024.json.gz": {"num_bytes": 396619135, "checksum": "52a36037696e6245efad80e00d1f123c36dbd79e7ff52b1fb99f579e712d2b30"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00227-of-01024.json.gz": {"num_bytes": 396654998, "checksum": "e31123ab579fe95bd50afa10d52a51e9c15a4af28c06583fb5aeac4e3418f129"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00228-of-01024.json.gz": {"num_bytes": 396899165, "checksum": "86481361fff334dee3183fac8ab3f346e44ab3e6e7b35bbd7e6e062b2d2fa0d7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00229-of-01024.json.gz": {"num_bytes": 397489378, "checksum": "bbb717711fb4c78ebe8a0476296a21a50285ec41d9fb9f08d5d66d899577e04a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00230-of-01024.json.gz": {"num_bytes": 397462301, "checksum": "054414aac29b5c8faee71a918f2586ad3fce8ee44c71e7a2e2af4b91e0169523"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00231-of-01024.json.gz": {"num_bytes": 396097584, "checksum": "8136e320fccba75a493954fefbb560f92532be44a6e0990404edae659d48ce1e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00232-of-01024.json.gz": {"num_bytes": 398984795, "checksum": "3d9362aab157beef3b5fcd4a0a0236d59de635a565b1c86423f45b26e8b437b5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00233-of-01024.json.gz": {"num_bytes": 397258012, "checksum": "e1a532922477d17f7cbea7db72c2391d26b4db580e526ebd5a90be23607a8d31"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00234-of-01024.json.gz": {"num_bytes": 398350453, "checksum": "c464829565bcaafdba165b2d886be4580f3c0a516b5417853ffc4fe30049cffe"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00235-of-01024.json.gz": {"num_bytes": 397147353, "checksum": "573a6a1d33ccc6c5b605d381f04d73989504bb6d24514b938e92c3d4f61501e8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00236-of-01024.json.gz": {"num_bytes": 396963006, "checksum": "21318462014bc185d0da7cbd342fddd07521401ca2b73e47eb5cb4bd42a82bbe"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00237-of-01024.json.gz": {"num_bytes": 397087111, "checksum": "49459c97b078726bf8377748d4bb2066bdfa47e2717315a9b3c8075cfc4b9b10"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00238-of-01024.json.gz": {"num_bytes": 396984031, "checksum": "befb46e9f928876edc580c60ea4242f63cf6df77c6c107fec6e4280d279e348d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00239-of-01024.json.gz": {"num_bytes": 395915197, "checksum": "dc5ab17e04e4f2678771094af67909dcaa8be36a6cb047cfa66e75f986c91312"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00240-of-01024.json.gz": {"num_bytes": 398321096, "checksum": "25b92f7a499e9aaf0496a57f6292a7f65941b34dd6c78f14b08358d180070029"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00241-of-01024.json.gz": {"num_bytes": 396626980, "checksum": "1ae21ee5585ec718763a3c7bd70d9338aaf77d0e02f92a41f6ed213d1eefa5b4"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00242-of-01024.json.gz": {"num_bytes": 398220596, "checksum": "c29f98174a0c02a817d5cfa3ebb2a92d5f49df8a34fa40abd360f1b39b4bde05"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00243-of-01024.json.gz": {"num_bytes": 398250083, "checksum": "819387c95ea7183b1f9e1e78d077de65023c4809198ef3a0c946f46f8b6c19b4"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00244-of-01024.json.gz": {"num_bytes": 396943969, "checksum": "7a0b0b984d7afc4181827705212f917cf4ac12412f640a2c8120513763cdb390"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00245-of-01024.json.gz": {"num_bytes": 398365865, "checksum": "a424157137a5eeca89819d600deea2a1619ea8f5ae1ed395c88ac600a85e3afa"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00246-of-01024.json.gz": {"num_bytes": 397285385, "checksum": "73029f721bdaccd9d126e871973e70a551f48f077f5903656b305ea9885c4798"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00247-of-01024.json.gz": {"num_bytes": 397132841, "checksum": "b223cf1270d2c728592ec65b09599bbdef8d64f7df2eb525e114f86268500daa"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00248-of-01024.json.gz": {"num_bytes": 396316645, "checksum": "94102d9bcc086ed5b203bc0c6b830dd245c9bf6c695b23b19922b2a98eeb6a52"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00249-of-01024.json.gz": {"num_bytes": 396644237, "checksum": "36be793f4d76070ba1c696b3274e6dbab43f415c8fbaf752145cc99af6558680"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00250-of-01024.json.gz": {"num_bytes": 395860541, "checksum": "313febcf026d2cd1495fdd3d5ba3b492ce5d5749153e189672b6d9dff3e26a61"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00251-of-01024.json.gz": {"num_bytes": 396709140, "checksum": "7e2480b3d5869ba35007c40e18585f3fa208cdf8e004078cc8de4fac36773507"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00252-of-01024.json.gz": {"num_bytes": 396508847, "checksum": "25df46ae56c0d4a6f945922e31fc697d12e0b7c525be9bc2b8eced802641488d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00253-of-01024.json.gz": {"num_bytes": 396364816, "checksum": "6b2125b9eab9bf893e7f8913a6beedbeeef5de53893fbd6172f706e33bab5177"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00254-of-01024.json.gz": {"num_bytes": 396122930, "checksum": "7947e5152c5305863e2d664622e3de49f9386b4384eb09630c5bfcad21fb458e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00255-of-01024.json.gz": {"num_bytes": 396929803, "checksum": "a1ec8c609ac969c24e2524f0f3dc31ef43ca0147ffe66569d3135e4f28394325"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00256-of-01024.json.gz": {"num_bytes": 398432943, "checksum": "3fd0373f5a8974a3499c436d96ea73be95f5619b8388dc316f51aff01e9ecad7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00257-of-01024.json.gz": {"num_bytes": 396003748, "checksum": "516cf3626076f083962983b2d6c596ef355609492f2e81c6c3cdec01acf8c5d7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00258-of-01024.json.gz": {"num_bytes": 393890690, "checksum": "700760a7764f890c8aae337e7ee458c8467eb9048347edd237e341dd2bd5d236"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00259-of-01024.json.gz": {"num_bytes": 398130606, "checksum": "d868f8ef5e1cc971ffd00908bdc7eace32ec151d7405d7cac5fac22df9ea10c0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00260-of-01024.json.gz": {"num_bytes": 399765969, "checksum": "7d5eb3b88eb8a0291ae70c1997458cf5aecac645397e50a67fab3d1193064353"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00261-of-01024.json.gz": {"num_bytes": 397418895, "checksum": "ca607c9e13d7cfb73a29ee3131f77e6bef3130d8627037cef9f57ed459185f0a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00262-of-01024.json.gz": {"num_bytes": 397925991, "checksum": "ca789394ab4398c41490ec6147a41ffc8847155ea9ff74d7ff8b3402ed0634e8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00263-of-01024.json.gz": {"num_bytes": 397082336, "checksum": "aac81d1bf0ade80758c14d01842b9b06c89ebf2fcdb9a06b1472bf2f70bbc348"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00264-of-01024.json.gz": {"num_bytes": 398101079, "checksum": "3cf56a2989b5c3f26ba94124cc534f5c9ae9770bdc6a3431dd745603b480ab19"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00265-of-01024.json.gz": {"num_bytes": 396949669, "checksum": "d4f252a6c2f43833d6d89bf69337449b4cae5dc88fd08fb20b35fe7194a50ddb"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00266-of-01024.json.gz": {"num_bytes": 396242007, "checksum": "71c745968d8ee4a0d64f38930a76e65d68ea094ba3e0b963d5d6878f65f51b34"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00267-of-01024.json.gz": {"num_bytes": 398342031, "checksum": "706a560c862979594265925c3200d4bd0981a9eaa279841f2cba673634f7074b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00268-of-01024.json.gz": {"num_bytes": 396399468, "checksum": "eb3dea553c37f220b3b9b5f377d5a4ef94243b3c0b6b46981e3e5b7ba5b4a935"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00269-of-01024.json.gz": {"num_bytes": 397181296, "checksum": "4f0feae035dacaeb720ca3b6ea17685144895a0d78cfa358e30983f8d6c4ec76"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00270-of-01024.json.gz": {"num_bytes": 395712883, "checksum": "6e0f6de1e5a5c6d4bf23d0539ee72ecc2b4285da2b0f1ec2cdcc443d2e22aa88"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00271-of-01024.json.gz": {"num_bytes": 398066980, "checksum": "4c5cd1ef1917ed762d7d8c5c54e1da05db74e45721697df8b0626e0aeac96966"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00272-of-01024.json.gz": {"num_bytes": 396667308, "checksum": "77a33c37a5d88e419e2b31cf560d53f129a38e5bc2306b5baccc187b7e94e589"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00273-of-01024.json.gz": {"num_bytes": 396020214, "checksum": "b18e40c00b8e0e02dfac40ea0519964e231c8a2f28bc1294b044fb090f41a9fb"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00274-of-01024.json.gz": {"num_bytes": 396300833, "checksum": "34c8945a6ebac564fe87881d6968d05363a89985f297692a3df7104128b9c26c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00275-of-01024.json.gz": {"num_bytes": 395206463, "checksum": "1e41d7e2a6117224dc23fbaae8e9d20df9d7744adb4687d2b0e570bf8d9e47f2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00276-of-01024.json.gz": {"num_bytes": 396667995, "checksum": "45973b91c2f1140f79265a24f484fc6d6653f43f83d5bd2d18954892dfa4dfae"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00277-of-01024.json.gz": {"num_bytes": 398134029, "checksum": "b7da91889b6695cf01bceddfc139b23f9465bda5cad54088b84a1f5a4d7a4f9a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00278-of-01024.json.gz": {"num_bytes": 397422615, "checksum": "e794a2903bda1f3c082e8f590383c714a518c202ecb99eda5513d6b320f70e86"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00279-of-01024.json.gz": {"num_bytes": 398776175, "checksum": "a5528d3e33151138ef9bdc2433744f1797de2b20673a570de5bd4d81b306354a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00280-of-01024.json.gz": {"num_bytes": 396208086, "checksum": "1be2d8c3d0eca510fac7b06a5401b2b8873bc6dfbf85a3c736301756f9681309"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00281-of-01024.json.gz": {"num_bytes": 396893734, "checksum": "1db3e9017561d38a91c417ffef875b7a948c4f64c51b90b0983c71bc9d950903"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00282-of-01024.json.gz": {"num_bytes": 397411883, "checksum": "4e23d39fcec2c310cbde3fdc5d9c185046086877ac03bbf9d772b092614f93da"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00283-of-01024.json.gz": {"num_bytes": 397906911, "checksum": "850eb5e60b84bca4d2f10b2e511fdb2661e3d08444a07db1782ad85c754fe808"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00284-of-01024.json.gz": {"num_bytes": 396043261, "checksum": "fea24050c6aec13eb706a6f3854b4debde62b1b842f2992fc027820c66218b0f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00285-of-01024.json.gz": {"num_bytes": 396961329, "checksum": "6052f82887cd2362320f72f6545d2e5b5a775e9bef95783c9b9995ecb7a5ecc4"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00286-of-01024.json.gz": {"num_bytes": 395697481, "checksum": "f4361838b5b679c8306447364166c1c3083af392b4c8793399c122af09c7312a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00287-of-01024.json.gz": {"num_bytes": 398773520, "checksum": "9add91f23f31ff8c5d8d84e6a0af75fc6fa08ceef8ccd9b633d8c49aa1d0104d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00288-of-01024.json.gz": {"num_bytes": 397684645, "checksum": "64dc94555a122353c3a3c9999e67d17b0e4b682096ba80be2258c791ce1c2b9d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00289-of-01024.json.gz": {"num_bytes": 396655864, "checksum": "2472c76b1cbcfc3cb82126795673126e8f532119a03722a304396ceee9b7db3a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00290-of-01024.json.gz": {"num_bytes": 397415313, "checksum": "960b71edbdc6a6a62a0d3cc1069bbbfb11893cc017aba543e10c9a23cb759d1b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00291-of-01024.json.gz": {"num_bytes": 395617977, "checksum": "96e582d7a750bee597331f373ec2e16d3a9686f48a49d39765d39550c8cbbad8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00292-of-01024.json.gz": {"num_bytes": 399332500, "checksum": "cd6ec4941aa5babbe274684945bf899447ec2459b8f7076ec8c74d2b3fe794c5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00293-of-01024.json.gz": {"num_bytes": 397021546, "checksum": "d0d0c4d80e75c5d02103b49027d9e2e6f7db74c12f8b53f600d7fe420b2d0a7a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00294-of-01024.json.gz": {"num_bytes": 396272726, "checksum": "caf5708a6989f867ec6c4c56f338aca9f3a43a1806a27ef473d9b0f219001cb4"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00295-of-01024.json.gz": {"num_bytes": 395233811, "checksum": "a7b5f904e34c0b370238e6beb19149d4bb96d0cce43a1eca3bfaf181952ede53"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00296-of-01024.json.gz": {"num_bytes": 396480926, "checksum": "4fcf284d98c2f7b63e47573e9d084eeec2516fbfa62be42c3ff94e1cf518e313"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00297-of-01024.json.gz": {"num_bytes": 398883718, "checksum": "c1cb458076497e7dee645f50281d1af2fe5dad556d28a2cbbd73abe6537c8a9d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00298-of-01024.json.gz": {"num_bytes": 398733629, "checksum": "4a612c715025292e62860fb0018e9fa2d3fade692342746d044be6297e25a034"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00299-of-01024.json.gz": {"num_bytes": 398155026, "checksum": "d33f4043fad9551f92084a45b7f54d920ded9d6fec271cbbf85f71b021f9ee4f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00300-of-01024.json.gz": {"num_bytes": 398612975, "checksum": "61b1181b796a2f40db3cb6954f2890397c3722c486dccd4075d74679cf61a70c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00301-of-01024.json.gz": {"num_bytes": 395385748, "checksum": "95a78e9d3cece0620430c85822fedf4021ebd88ece57d6714933c268d3b6af6c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00302-of-01024.json.gz": {"num_bytes": 397620059, "checksum": "321aed402a5e779febe9766294ad040a3f8dcf57bae68648c03d3c59023aafa3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00303-of-01024.json.gz": {"num_bytes": 396549027, "checksum": "4198f6a2b5bdaf90ac4251f013908123a5964429870ccd6b245a9069278c4e17"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00304-of-01024.json.gz": {"num_bytes": 396596460, "checksum": "74a6440e93d18d0d6d0622ab7d8832d7ccc91c03297faf20c8090d16f7c042d6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00305-of-01024.json.gz": {"num_bytes": 394881271, "checksum": "654deec494bba4eece19c27140426049574cf529c93ccb422fcc09fe4496af15"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00306-of-01024.json.gz": {"num_bytes": 397760377, "checksum": "e0840cbc94db6cfc35df66d413a11261756392dd59b0fdf89d9ff166ec76f3e5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00307-of-01024.json.gz": {"num_bytes": 396671816, "checksum": "31ceb8cfcd09fda621a9a483b09dfb43f5436e867363f6736ea3f710a6af10fa"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00308-of-01024.json.gz": {"num_bytes": 395961013, "checksum": "8c1e5acc3f964eaa5aff300731a74dde84ed0671cd764b121ea638fb08c3dd0b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00309-of-01024.json.gz": {"num_bytes": 396035179, "checksum": "7d555942b1bcb2518aa5ff9c0549d98fabe7bb563cdc6c73d3f11e6a0bc502b4"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00310-of-01024.json.gz": {"num_bytes": 397140669, "checksum": "859eeb7a9d2ed03d5299bbf7f1c3e719236477950d7601112a458ea5a2adf7c9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00311-of-01024.json.gz": {"num_bytes": 398170419, "checksum": "1e7661637b0a4445119ba403e4f8ede129c829fb7d1907ca7660870b536b8b29"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00312-of-01024.json.gz": {"num_bytes": 395605627, "checksum": "87a3ccd2ac9deff1ac4a5dd02bba269a48692d4598c5899630e8d2e4136dbb99"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00313-of-01024.json.gz": {"num_bytes": 397081206, "checksum": "c6952116cf573a6e20c849cf1b7d8d0edf3b9d00fc7e717e7bacde915c4c52a8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00314-of-01024.json.gz": {"num_bytes": 395555727, "checksum": "762066fd85c596ee01b3b8070708517cc5759bb1e3c4bb65f4645fd62b550d13"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00315-of-01024.json.gz": {"num_bytes": 397871218, "checksum": "814f19cc5e81144f5bfd7037f5f522dd5c44faf150c10337c675174a5965a5b9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00316-of-01024.json.gz": {"num_bytes": 398577523, "checksum": "27643c7c3c0a1a78c9003b936ea27785709a2df80d09817278a179eecaedc352"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00317-of-01024.json.gz": {"num_bytes": 396388623, "checksum": "5f840180e2017c41c6b1c865784788dc3b002478a9ecb43c3859174af788ba5b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00318-of-01024.json.gz": {"num_bytes": 396173471, "checksum": "2aeab99fbc84a2640a05081e2c7438451e75f76cbece3cbe5d82e85463a61966"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00319-of-01024.json.gz": {"num_bytes": 397912127, "checksum": "fda805ed19f4b996b048386f4bd73924dc965a069e85b8b4452a54a1372375fb"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00320-of-01024.json.gz": {"num_bytes": 398765416, "checksum": "bce244d024c076911c1c6dbd35609be5442c8b0440690e2cbb342ac64bdc494b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00321-of-01024.json.gz": {"num_bytes": 396005962, "checksum": "763584ee096223b8aeffb1576ec6e4f3bea674ec4de40fa163c2f2221b3701d9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00322-of-01024.json.gz": {"num_bytes": 398615672, "checksum": "5c12ec1d0c450fb7515c586f24311bad145050dfc64180d65bacbd346c2ce9c4"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00323-of-01024.json.gz": {"num_bytes": 397861187, "checksum": "93326f43273fb963593e0b1caab1e9588387291c23d5c14b5ae40b46b199998c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00324-of-01024.json.gz": {"num_bytes": 396679008, "checksum": "6ebfe6e28851e6d79cfdbf370602373fc2136e88936eece302ecaa8ef8251827"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00325-of-01024.json.gz": {"num_bytes": 396358086, "checksum": "51190fbfd48479842ec3c7d910b5519e01ff797ca0143c39be142c1650c5e893"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00326-of-01024.json.gz": {"num_bytes": 396490692, "checksum": "f4d9bbfd1bbc6e939fce9a2df26e45c79be73dbe2650fe79af395bdaa39cd121"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00327-of-01024.json.gz": {"num_bytes": 398354656, "checksum": "c70c824b6c16e5fad922ec9b8d363d97bed90501522b641b0eb0f66b8c086325"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00328-of-01024.json.gz": {"num_bytes": 397326336, "checksum": "7e6008433a0e5bc6eed28a13b9dba17246e7d65ca96c31092086c3546a3a397b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00329-of-01024.json.gz": {"num_bytes": 396390524, "checksum": "f379d844a35172424554bb82a65c790c354b76c0e7abfd868225d1968017d1a5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00330-of-01024.json.gz": {"num_bytes": 398259199, "checksum": "ea15be4a83c3de66c42410e13e5ef9c93baf86099a8eded1c1d10b0cd5ad0f29"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00331-of-01024.json.gz": {"num_bytes": 397618860, "checksum": "7b6aad6224ead9ee3a0c860cfd991301ef5e97093b23c76d713e73f4911d0e44"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00332-of-01024.json.gz": {"num_bytes": 396743573, "checksum": "bc5333d383020d2296aa0f6ec940ab586a367efe50d1c597f9db55ca72fa66e0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00333-of-01024.json.gz": {"num_bytes": 397460128, "checksum": "095b3a85a9598009638622ca21cb00142efa0d68196c8c3a8bb922cccb465e8c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00334-of-01024.json.gz": {"num_bytes": 396900262, "checksum": "6f005575f4843b84f4512e1b7c1b748edf497e4e9f55eaae47f9b4637161ccab"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00335-of-01024.json.gz": {"num_bytes": 396106895, "checksum": "66bfe399d0859f71c20db01de53ca7bf997b33afcd3d181f181d9f265a2c2fa2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00336-of-01024.json.gz": {"num_bytes": 397732616, "checksum": "1f1e0435de870b98b119e91edd4a0d32d078dbb810f919a70b85360cd860f0cc"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00337-of-01024.json.gz": {"num_bytes": 397834763, "checksum": "1db4bcdaa6fca612c3f1b38dad6d5402679ca21aa6a545850d61bcda10103697"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00338-of-01024.json.gz": {"num_bytes": 396712179, "checksum": "810c104a8862699c490fc8625a7be4115872fe2de4d8c061e095dc5a81eb4d19"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00339-of-01024.json.gz": {"num_bytes": 396838831, "checksum": "9bbc616d5c4aba46475957a22544dbdb0557f8de31cdf919718fbfe55bc70ac8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00340-of-01024.json.gz": {"num_bytes": 395587861, "checksum": "48c8411ee2b5fc8cffe1589ed204d0ac8a12b5b3bb1857373f84bae984d49e8b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00341-of-01024.json.gz": {"num_bytes": 398093153, "checksum": "4ff8ba83e489580da2401aaa23ca3329befe8fc08b6f299b612950c358688604"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00342-of-01024.json.gz": {"num_bytes": 397248009, "checksum": "c72e063f95d10ce661b4bc97538eccf6da6ad493b7e54da555a46e4a47aabbed"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00343-of-01024.json.gz": {"num_bytes": 395939409, "checksum": "249eb2080c55402aab34a31a442b06bcaa25d2df3f4319ea1a5f50dc6bb709b0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00344-of-01024.json.gz": {"num_bytes": 397608807, "checksum": "8cc57604fcc5fa920b0d16df6e8d8b7f4ca88c0c76c86f9ac81f42a615b330e7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00345-of-01024.json.gz": {"num_bytes": 395751274, "checksum": "13fbc76e49a8b856f7563b945bef10d786a86caff63b4cebea50416ca34932ad"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00346-of-01024.json.gz": {"num_bytes": 395516794, "checksum": "61d43da2e3e7770016ba7235eaa74a1e6a180e64cd2cfacefed5c34e8b72eca7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00347-of-01024.json.gz": {"num_bytes": 396180000, "checksum": "4a0ca2103de168d05d0090c8800d47f216cc167a9cfe9e736403aedf040c5e46"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00348-of-01024.json.gz": {"num_bytes": 398461180, "checksum": "a56396961496499ac289a85d126b916132e787d0dc4fbd9961aca7dbbc7cfcff"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00349-of-01024.json.gz": {"num_bytes": 398049366, "checksum": "ca012572c575f6a8e6ad6453296ff93f22118995c17928e76b655da44ce5810b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00350-of-01024.json.gz": {"num_bytes": 396532962, "checksum": "bb35d17862201063b46d8745dc182756d1bb09e809c4c355452ab1967e655491"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00351-of-01024.json.gz": {"num_bytes": 396576223, "checksum": "19ea45ab2fe5487d2a69cca7c9a1db7a09c8d5dfdf130412bbcd241cc60a61c5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00352-of-01024.json.gz": {"num_bytes": 395956381, "checksum": "bb5869b8649fffadd5f1945ca9a79588e84081a8fc45b7e4cb5507149b5be2d9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00353-of-01024.json.gz": {"num_bytes": 398903623, "checksum": "cb16a7ecadd28a8b5622c4e581f463f0ae2fe20a3e6582fa6885d76e7523715a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00354-of-01024.json.gz": {"num_bytes": 397316693, "checksum": "42aea18548695c458ddc229d8c837356845609aca3bb64ce6e07b185443b9468"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00355-of-01024.json.gz": {"num_bytes": 396240550, "checksum": "1577d76807548d83427293b9f534a3261fb72a345569f0491a1fd2691047bd92"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00356-of-01024.json.gz": {"num_bytes": 396132315, "checksum": "b6e17a39292e082e517082b23b381305ebe889c2530fb5eb74a2683d36d07a86"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00357-of-01024.json.gz": {"num_bytes": 395948117, "checksum": "524ebed10c881f52f155db5d6690806f5a97aa8f811deadae916323b50427ed5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00358-of-01024.json.gz": {"num_bytes": 397397242, "checksum": "8e23d852bc3a0dda4684d5fd511003ad6f18232e5f54e32638c8db62e9d18c6b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00359-of-01024.json.gz": {"num_bytes": 396141321, "checksum": "345c34dafbc59f5e93355c8b2e6fcde6bf59bc9e1ebbf5cb962d54228e6d3204"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00360-of-01024.json.gz": {"num_bytes": 397258644, "checksum": "51db06055d95e2b43fddebf8c2b7d76b7572745f129d89fe005f8e5d3f12b758"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00361-of-01024.json.gz": {"num_bytes": 397913411, "checksum": "2c0f6054fef084d3e7cd10e2de0b1d3a48dc716af1e9146548195df128bdaba9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00362-of-01024.json.gz": {"num_bytes": 397722576, "checksum": "664b390b20498eb6e78fc09604b3a947fc1847a01e3eaae4c7861d1dde3b90fb"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00363-of-01024.json.gz": {"num_bytes": 395416894, "checksum": "c57529884c6d4977a279a097c0dfbcc31d52048cdcf64950182c743583d7989a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00364-of-01024.json.gz": {"num_bytes": 397028679, "checksum": "ed4f252d63c679f6e3f35847e0871c3360e072b0d6963f662d7e808b6615457f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00365-of-01024.json.gz": {"num_bytes": 397574891, "checksum": "68e8e44a531d98897245fee90ad349f4fdee891b2f68dfda78a1dedcc9474326"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00366-of-01024.json.gz": {"num_bytes": 396905692, "checksum": "9e88b888d85633671e009ed7093763b934a42054ed6a1252222dc64781a20e22"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00367-of-01024.json.gz": {"num_bytes": 396802011, "checksum": "2abaf3f3946788258b8543fa2ccccc0c20e6980b9d26a38decd356e67f575fa1"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00368-of-01024.json.gz": {"num_bytes": 395630737, "checksum": "b4960e3395d8a1bf8350f57e5f6280b00443a4c6b85e6fd47478fbbfc1733caf"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00369-of-01024.json.gz": {"num_bytes": 396228047, "checksum": "08e8210426e6c6ef9746675592a3eea4a92eff9aa4bb7ffc6bf6ba54bc411f72"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00370-of-01024.json.gz": {"num_bytes": 396548482, "checksum": "10e0305ac4d1e410d749637e0c03386d969563f8eb73bbbc376fc1d21025e4ee"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00371-of-01024.json.gz": {"num_bytes": 397344482, "checksum": "03df0f4aa5c377f6b45db3c3b863240bfb1211ddb226bc055433fbcd9ee8e873"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00372-of-01024.json.gz": {"num_bytes": 395872223, "checksum": "9b70549213cb01595179928cdb020daaf7bcd2085c5e947d111f3cc66e406d2c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00373-of-01024.json.gz": {"num_bytes": 397399096, "checksum": "945c204cdb107669a8d1252a91323eb300c902bdd6c6a8167a90805ec02cba9b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00374-of-01024.json.gz": {"num_bytes": 397755002, "checksum": "8353d4383f73caceb5d112f260b37d1349dc7898af2d05b98ffe17d22aea97ca"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00375-of-01024.json.gz": {"num_bytes": 396534763, "checksum": "a3de41388a6d8ce3b605c6586e47b74a565dd2f54175551987bda0a0ff95036f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00376-of-01024.json.gz": {"num_bytes": 395594630, "checksum": "7cadf813f2b31a1bfe44fdfc84aef4eb65e889c2616c56b189890734c22b731f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00377-of-01024.json.gz": {"num_bytes": 398241040, "checksum": "15df154b52cb4d9314dbc4ac26ca4b4df7125b12131d538fd480f8a6b3fbdfc8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00378-of-01024.json.gz": {"num_bytes": 397217224, "checksum": "208ce680427f62d78dad857bee91122a79f968589b4e44f2f89919e91f4dea30"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00379-of-01024.json.gz": {"num_bytes": 398504097, "checksum": "0052fe7f27e720423b6143f401b8618428d913b22fc2af2950874785e2ef7528"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00380-of-01024.json.gz": {"num_bytes": 397494149, "checksum": "15c4f07a2629c7bd79b243c97367e3e18de02b5ab09eccc0f85b1eba0e0b071a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00381-of-01024.json.gz": {"num_bytes": 397190859, "checksum": "77c71b4a79ac2f462040ea0e8408fdb8f719fac0f09fadb760ed00b709e9dea5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00382-of-01024.json.gz": {"num_bytes": 398126420, "checksum": "aa44d029398c33f733065c489ab3ded9395f6e53263407173b6e9c27b6fb9c45"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00383-of-01024.json.gz": {"num_bytes": 399108296, "checksum": "f507161fbe96f8abe9dedccba2458448719e6b153bcc1256ecee6b4b9c82256e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00384-of-01024.json.gz": {"num_bytes": 396156787, "checksum": "83c236bbc8508fb81992c837751a4d8ad4b9bc138dd1f4bb5c1fcc68203e12da"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00385-of-01024.json.gz": {"num_bytes": 396878483, "checksum": "df45b4749951a46695f88789fc536617ee3470083e55562292f606e09185e4a6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00386-of-01024.json.gz": {"num_bytes": 397495799, "checksum": "a8240c9e7266e47bda8880e38ac8a5afa8541aed4b989d6642b31497716a51ac"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00387-of-01024.json.gz": {"num_bytes": 397062301, "checksum": "e6fd54ea6f17d5570fa4cc97554813a7a33bd4e44cbc456b27b0c87c1af22c60"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00388-of-01024.json.gz": {"num_bytes": 397074091, "checksum": "fdc2a134df4a669deb839f26947c86b7e7a4bc7596a6a1c25562cb97fbb6b089"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00389-of-01024.json.gz": {"num_bytes": 397056868, "checksum": "e7390f0007582a3460fa67375b2628c85a1aa85954796d8e6584fadcb35761cc"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00390-of-01024.json.gz": {"num_bytes": 396404332, "checksum": "820a97060abd3172852f38e1636706c8389adad8495de56f4c3a2c3ba6008235"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00391-of-01024.json.gz": {"num_bytes": 397125489, "checksum": "68732c5ab9f4b6945e79ce2a1b45b97a97822d6a107aa79aa9135f29d91173ab"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00392-of-01024.json.gz": {"num_bytes": 394992472, "checksum": "c9d1e8cfd481631a76544e5880ceee9990e7553c88c5978a91b48ec8aa47717d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00393-of-01024.json.gz": {"num_bytes": 394778146, "checksum": "7a5ec4f0878f676a3ac2c417f512186066d793f28d611f97135c3626b3b60fdd"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00394-of-01024.json.gz": {"num_bytes": 397024190, "checksum": "44e32db5a39684ab1789cfe97b6e9cbd3c539390e7a4c8ec9298e7177945452b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00395-of-01024.json.gz": {"num_bytes": 396537190, "checksum": "601ec281240753ac5793ec7cb83802a788c4d88e56dfd83e6c875cf2ef9bd8f1"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00396-of-01024.json.gz": {"num_bytes": 398049705, "checksum": "b1024b69e191b2c7073f5f4f3ea51e8710be54db8603ce8aaabbfb919ea6694d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00397-of-01024.json.gz": {"num_bytes": 396670567, "checksum": "11357bc600f9b0c443f124c7fa4046d10cf03e19016e5ba8cdde884d2ff76c9b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00398-of-01024.json.gz": {"num_bytes": 394706629, "checksum": "778eca6d845b9a7d49e22941b959a95e5e4d2d9714720f27b810230d136acfde"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00399-of-01024.json.gz": {"num_bytes": 398257272, "checksum": "27c2a30af83975d32469e85fb2e27953a3aa9f97514f621063325cb9af1829fa"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00400-of-01024.json.gz": {"num_bytes": 398732278, "checksum": "aff9a39748526a03d3476288cdbce122c3683baf113362e9085895609d03c3c8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00401-of-01024.json.gz": {"num_bytes": 396372632, "checksum": "a6af262bb962eb1c45d2003ee1bb2be1a3a12cb3e53d4ffe58b4b68dd852957f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00402-of-01024.json.gz": {"num_bytes": 396783625, "checksum": "db9aca12012da21fc5a0619a47e9c3075959786d6d6d74f6a244af1cb33c402d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00403-of-01024.json.gz": {"num_bytes": 396950960, "checksum": "b3566f7b9251f6aea9343d1344151f10fc104464f92e8f10a97742defffc2244"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00404-of-01024.json.gz": {"num_bytes": 398481154, "checksum": "897904040b5887620b9996cf89656f5bff329a430a8c3dfd6802d0c879675376"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00405-of-01024.json.gz": {"num_bytes": 396065216, "checksum": "45e0108549ab06d9a8ad5c45dc53250798d0e58f7e940080a754106801250009"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00406-of-01024.json.gz": {"num_bytes": 395637879, "checksum": "bda70f3a19b19e2ffdd1c3a26b959945b447acd450cab49e72ce727d2218af5f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00407-of-01024.json.gz": {"num_bytes": 398356109, "checksum": "1df9e8b4715d9a3f02a0b06aef6095f81d38acd1be0b4fa402acaac0258c3116"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00408-of-01024.json.gz": {"num_bytes": 396041456, "checksum": "e89ebf354280543204e78f4308a8f8751cc26094524628cd8e9cb691d9911b82"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00409-of-01024.json.gz": {"num_bytes": 396254329, "checksum": "15729474174d6a5adb5935f25afa6de2f03a8dd2f73b780e23795ede92f5762d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00410-of-01024.json.gz": {"num_bytes": 397850848, "checksum": "98f1b8fc845e0005b76d7eac70a430ce98e6989569344ea92266f8391b1396fe"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00411-of-01024.json.gz": {"num_bytes": 395527322, "checksum": "52b2e31f2adb61c8e703c6758016cbfc650f8104dcd5f78867c81434be155ea6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00412-of-01024.json.gz": {"num_bytes": 396155992, "checksum": "7b6b4192f9bec4fdeaf9d6dcabd9cbba6b4c8ebb42d26730fea21bad139823c0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00413-of-01024.json.gz": {"num_bytes": 395766377, "checksum": "775d1fac6b1708ba0384d922640b2f372b3ee146fc79fbe692ff69a7c6c699b1"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00414-of-01024.json.gz": {"num_bytes": 394860848, "checksum": "0386d8a8e0cc9d5d613b1f84085791de57ad05751d94d25681d86dff5cec1afb"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00415-of-01024.json.gz": {"num_bytes": 397566065, "checksum": "1957b0d185943b1952dc66e78f0a7d449f49f8f55fc0978bf77e8dde10f4714d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00416-of-01024.json.gz": {"num_bytes": 396297306, "checksum": "3f8796934edb79d172e682511a5ed7666aa09ff541ce55e2c66406bdb6eeda9d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00417-of-01024.json.gz": {"num_bytes": 398314475, "checksum": "8da08075b966c04aa7859275eefd34c78cd2b9edc366684733d027ad6d619ba7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00418-of-01024.json.gz": {"num_bytes": 396296110, "checksum": "efe43733ebfc7b65c646aee68b883cf40124c1446a28e70ff2bfa9e1bb1377cc"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00419-of-01024.json.gz": {"num_bytes": 397614415, "checksum": "c0f02d78715de9c3ea0c684dad36a506386081fed2011ec298ca0ee623c7792e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00420-of-01024.json.gz": {"num_bytes": 395133656, "checksum": "6237f5797a35dcdd89a0b70cac4dedcfb3fe418560f8dbbf6cad685f11c870b2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00421-of-01024.json.gz": {"num_bytes": 397061849, "checksum": "ee37899a6a49269026633ec79577491ff4b11e219e0236dcba68eb168279067b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00422-of-01024.json.gz": {"num_bytes": 396539584, "checksum": "e5914a4b97c27da82eaee2f4f67a165de946bb38a00d6126b1527f5eb1200417"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00423-of-01024.json.gz": {"num_bytes": 397715346, "checksum": "b99e628f8790a7baa8ee7828e31f2ec72374f9a8390c1d64c9b8092b10d9c7fe"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00424-of-01024.json.gz": {"num_bytes": 396335469, "checksum": "9cb3b9eb00760bb68f3df4b66b96f1e5798c338231500472fd64c49cd87c6599"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00425-of-01024.json.gz": {"num_bytes": 396714466, "checksum": "f28d4901ccde8eb7afcede9732ab94fd18c49e0e3731659ef587058d6ea2ab28"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00426-of-01024.json.gz": {"num_bytes": 395566563, "checksum": "9ab75a89a425ce974fd36e936476a30db913c2d7c9ca6e5522b91ffbcbbe30cf"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00427-of-01024.json.gz": {"num_bytes": 395379035, "checksum": "5e1ca658bea5ba5506afbb9ae5a5da4d35cdc3a215478c68e11652a7d5d918f5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00428-of-01024.json.gz": {"num_bytes": 396419259, "checksum": "d740b37b576bcde0e1c8eee27c3bfb3b58c1a0d3c5b471001804b2a37f277ac9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00429-of-01024.json.gz": {"num_bytes": 397116774, "checksum": "d1c10b0ba72aa2d4cb4640d1263c32868190942b1e93b4bb4e9798e25f10ba67"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00430-of-01024.json.gz": {"num_bytes": 396634586, "checksum": "11dec038b4c1c35d32d000915812b6ec8da9abbbec2e15f7493551198b6a1ef3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00431-of-01024.json.gz": {"num_bytes": 396704705, "checksum": "efdfdef444cf68fc05090107033ffe2ac906b6efe2fc138e90f47cd4bd0b6204"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00432-of-01024.json.gz": {"num_bytes": 396264701, "checksum": "fa649c2e2dbc992408c3a60327e5d5ace4697c84010446bb286e544eb6c604be"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00433-of-01024.json.gz": {"num_bytes": 396887722, "checksum": "3d5fd3fbf209dfff2057143a3dcf7eceeccb1e85967a9a85a992f465e3522335"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00434-of-01024.json.gz": {"num_bytes": 398856291, "checksum": "ab6dc5343b052da901f4671c1cb3173850fbc6bbfac2623ca14936b2b83d9667"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00435-of-01024.json.gz": {"num_bytes": 395888569, "checksum": "26abd1e2263af02f998705501bd02ead2edc3d7f68fadc7b198e7fcf4dffc454"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00436-of-01024.json.gz": {"num_bytes": 396976077, "checksum": "a5dadf6ec93e8dcd62b0e1de3cb03c866147bafe0da8e631341663ccc03bb801"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00437-of-01024.json.gz": {"num_bytes": 395809168, "checksum": "7f98e98270f9b88570b5e498511ee65d07428db604af349ef9107dbcf65ac4e5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00438-of-01024.json.gz": {"num_bytes": 399136723, "checksum": "0e03ec507b90b38d5b6d7dfe27d40e127efdc9a0bae349bea2e743375ea29b9d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00439-of-01024.json.gz": {"num_bytes": 396435416, "checksum": "5f868ba66ea32a23be4a926fda0a86d0d2ab4948326e1ebac615fa16a2a6864d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00440-of-01024.json.gz": {"num_bytes": 397487165, "checksum": "d30005787e7472313982cf2860e0a0764900b82a7bf616da27e6c1c3298eb215"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00441-of-01024.json.gz": {"num_bytes": 395968030, "checksum": "181461b447d88040130c3348ae7d22f220e0f97ace030d6f54301a9a3d483fc7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00442-of-01024.json.gz": {"num_bytes": 396909150, "checksum": "0854cd3454047e0c6a0746ef21e0cbbb22fbdf4349c2e668f4fa1e49add183c1"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00443-of-01024.json.gz": {"num_bytes": 396271897, "checksum": "2493db29dd3cadef3719576c34213496eff807df5ae8cf538f13e84d403fec77"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00444-of-01024.json.gz": {"num_bytes": 395540084, "checksum": "5e717d9e0c1b6f728df0f206e422a0958a537dddf31fffa4d699e5bf4b3c2b16"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00445-of-01024.json.gz": {"num_bytes": 398750991, "checksum": "b8af9d413da48fb5f9a9174b12ad253b2eb2c1ed7709cab710d66710841568e3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00446-of-01024.json.gz": {"num_bytes": 397575547, "checksum": "2bad5a914cb9f2e5e99d76afbf85eef66c18e7c1cf2e11c5d455792ae86ab441"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00447-of-01024.json.gz": {"num_bytes": 398035036, "checksum": "d834925674a33ed5eb8fcb335fd81b95e4ab882010e434e3fb9323e0f23be2bc"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00448-of-01024.json.gz": {"num_bytes": 398658613, "checksum": "16f3ac40180e47b9b97998f5d1d7c0e9336e2fee5612a3397fd161937f7a2b07"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00449-of-01024.json.gz": {"num_bytes": 397934476, "checksum": "09dd3d5a529f62b10d1ec97f37ed142315190fb437be3f50987ee955b11f7672"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00450-of-01024.json.gz": {"num_bytes": 396444119, "checksum": "8a25c11e0adc5fdf50944767fbfbf01a9c35b3c0e07205c7c06288d1f68b4c10"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00451-of-01024.json.gz": {"num_bytes": 395963541, "checksum": "f3ac2e295ca4b3ca1f55c8b500ea2588f1519163cec381297ad4bef390fbbe1c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00452-of-01024.json.gz": {"num_bytes": 396594911, "checksum": "25a57709e934077c2972f0f8a1a9db7afe9b7558ab023bd6ee5224b2f8cd770a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00453-of-01024.json.gz": {"num_bytes": 396745507, "checksum": "75c1a4803bb58efe5df885bccd13596d46dd1f3ea30899a7e83812167b990bde"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00454-of-01024.json.gz": {"num_bytes": 396193342, "checksum": "c151679573ea5f5b52e26e8b50da7e14760d1ec15c63a5b864b648190efd48f4"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00455-of-01024.json.gz": {"num_bytes": 398096160, "checksum": "7f86270b13ee4133adaa06de809f26ef581229407813fca05db521d9d36880dd"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00456-of-01024.json.gz": {"num_bytes": 398965570, "checksum": "d5b292189c5d318e0ad622eec1e764993084d0477147f51f29acd637935fec5c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00457-of-01024.json.gz": {"num_bytes": 396672892, "checksum": "8b490f615b3ed701390ed671d5645dec4aa3fc576a032da8f9d434087c1eb8c0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00458-of-01024.json.gz": {"num_bytes": 396911580, "checksum": "8bcadc16baaa4e36fe17ffc0862c264230385e18bbd861671ad5fd8cbb86404d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00459-of-01024.json.gz": {"num_bytes": 395969213, "checksum": "b8ff8371a01d7bd1782044058ee0f53d4d1275ebca0870ba16104c1c4b12f07c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00460-of-01024.json.gz": {"num_bytes": 396928338, "checksum": "23dde1fe55277467d6d2385684b71e90e9066e6a3c349a1da30a1487e87c8539"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00461-of-01024.json.gz": {"num_bytes": 400009637, "checksum": "34b98d46d207c5b6ea7416fab6f3cfcb1444cdc19376464ae9abb9296fd14c3b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00462-of-01024.json.gz": {"num_bytes": 398107677, "checksum": "2031735c0f38ce43e37a5bb1b9728fc37c758fc4af71758c3d3b9535716a3253"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00463-of-01024.json.gz": {"num_bytes": 395503017, "checksum": "7820184904183fad9a61b6c638df9de11d4624bb3aca08885b842255172cecee"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00464-of-01024.json.gz": {"num_bytes": 397493281, "checksum": "b39b1b1e6686014a3c62e74912ec3b915dfc161b62e2d1108410354e6dec760a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00465-of-01024.json.gz": {"num_bytes": 397080149, "checksum": "a65cc7f590cc498da334d5a8653e818421e09e5e6ce2e8bc2a29ac67a02c3d43"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00466-of-01024.json.gz": {"num_bytes": 396633690, "checksum": "15d891873ba02923893cbc8c42adc0468bb39161f898a810037cc2e9f82e0796"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00467-of-01024.json.gz": {"num_bytes": 395045117, "checksum": "711686ff5478ec35ccaaf1549b7a33b941e322585f702257dfe2d31630245ba9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00468-of-01024.json.gz": {"num_bytes": 399486439, "checksum": "59c4599c8610f4c54778daedbb358f5e26fa527f8f94c3364b70565ebc90571e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00469-of-01024.json.gz": {"num_bytes": 396170105, "checksum": "4263dbb03135c2d8b16fb323208f98fe1a1ff1223e76a7ba085f881411a0ab95"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00470-of-01024.json.gz": {"num_bytes": 397479432, "checksum": "2db90de8f4d2bde9af453478ed4667166f636af701bb487095311f99b28e59bd"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00471-of-01024.json.gz": {"num_bytes": 396679096, "checksum": "caea3c4744adb89f006d9b0d9ef93241a55c1fc165cb0cd62b6d07fa3a40cdc0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00472-of-01024.json.gz": {"num_bytes": 397080237, "checksum": "34995676d953f4c95f8bd4f54fba8f92b86189cd73298ab77ee2702611b86e5e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00473-of-01024.json.gz": {"num_bytes": 397881706, "checksum": "c0fc6c68ae509d8273e7ca0efbe24f1452a57dcb000f44f550fe9600fd305e62"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00474-of-01024.json.gz": {"num_bytes": 397705270, "checksum": "50aeb620f8c03a2e4f2346a0c79a4509adfae084ffbeff0b86d8892b858a821d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00475-of-01024.json.gz": {"num_bytes": 397201717, "checksum": "4fa508d23abd417bdb0b0e7a61f9aedfb770609214cd85b10b4bde7ced7f12b4"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00476-of-01024.json.gz": {"num_bytes": 397522775, "checksum": "27da6164865687041e4f53d9ecec2edc877b147da5b424acbac2c69480132a08"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00477-of-01024.json.gz": {"num_bytes": 397323156, "checksum": "e40115fc4901a3930494652ce9ee7abb0c3f41abc6d6c58c81fa75a0ee752db8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00478-of-01024.json.gz": {"num_bytes": 397380721, "checksum": "79a16b7016aed0eec375ca383eb316765687f12421f786b2e133faa5690ef197"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00479-of-01024.json.gz": {"num_bytes": 396828680, "checksum": "08185ce3c3e5b01552be7d8f08ed5b27a6b1b121bb2d7d70a78b7074fee02fa3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00480-of-01024.json.gz": {"num_bytes": 398678311, "checksum": "37a5804dafb2f4aff9e393af5b127c3577ab8a5dd23f1e41f2304b25a4c428a6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00481-of-01024.json.gz": {"num_bytes": 397654112, "checksum": "47ce12535b753d8936ce3b569675e76cb6f638bfb74a93caf201f3ffc409d71a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00482-of-01024.json.gz": {"num_bytes": 396387301, "checksum": "1d07828a199bb1e1c0c8342ba99e484093557188370d1ced90803c2615d24b7b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00483-of-01024.json.gz": {"num_bytes": 397178863, "checksum": "b6499612fac654798010e11c27ee8a25fc05d1dbed8aaf2338fd0ea377dc4732"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00484-of-01024.json.gz": {"num_bytes": 395826769, "checksum": "ce197ad5a226249bbba53c34b9f3c83508b542853748c3094a5b98befb537f2d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00485-of-01024.json.gz": {"num_bytes": 397100006, "checksum": "f483044a4a0418b695e0b989f0fd03bfa79df01b649991f2356443bcb29d0820"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00486-of-01024.json.gz": {"num_bytes": 397658615, "checksum": "297beef7b85dc128a6a58d834c5fd1b24bd7fe84c7a317500461720c742235f1"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00487-of-01024.json.gz": {"num_bytes": 396904673, "checksum": "06751938694fad1645ed575208e8e2c1efebb7165b4feb2d0ea871dc348741f8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00488-of-01024.json.gz": {"num_bytes": 398019631, "checksum": "eb58bf8b011fedf15835841317e445e9e757c9939b4453a013233f020f98a697"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00489-of-01024.json.gz": {"num_bytes": 395822836, "checksum": "b339e33e7affbdaf691852d3668ff79adf8476a3c33eb86ad9f4ad4a6ebbf3dc"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00490-of-01024.json.gz": {"num_bytes": 398410737, "checksum": "4d8356cf804474538772c5520e77e75ac750dce3e6b103c9feab49ccd46a58ff"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00491-of-01024.json.gz": {"num_bytes": 396607853, "checksum": "1757097fb884d03aa288a05870016b1c2b9f1700ac5913d85c9821cf2e367702"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00492-of-01024.json.gz": {"num_bytes": 397612443, "checksum": "92e98e431a378e0402d81299c49209c66d39b0ba7ae63711f8d6ecf542f5fdf7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00493-of-01024.json.gz": {"num_bytes": 395595466, "checksum": "d839e1763aa6ebc7cbcf1b870d947ba45b0b4ac95b0adbe4941a0b121690a311"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00494-of-01024.json.gz": {"num_bytes": 400397068, "checksum": "31caeb5f0ef694c06ce434df44c01f4a91fcd48e4acb4f1bf167eae6e59a02de"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00495-of-01024.json.gz": {"num_bytes": 396458630, "checksum": "26291dfcae5145cdc306317ecf95851a3f693b4a7c6e132e55384ec69d85ef3c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00496-of-01024.json.gz": {"num_bytes": 395037560, "checksum": "b32344b92f81006ad9e2e471f5ef8133e87924c5150145b13d51c3d7a0f68c46"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00497-of-01024.json.gz": {"num_bytes": 396247929, "checksum": "0396f0bb16b06ff130e955f260233ec868ada1daef6e8cbd480ce388628d49b9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00498-of-01024.json.gz": {"num_bytes": 394798084, "checksum": "28d43d4e7bbce4e20167741ea2bbc3f17981aa51f9c040cfc41c522e732c6d32"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00499-of-01024.json.gz": {"num_bytes": 396699883, "checksum": "c6f6deff919b375fb08c74e159c25aa66362e4cddb0700f9b1e0e2701293ae70"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00500-of-01024.json.gz": {"num_bytes": 397014521, "checksum": "7ee22957fdfad0880f132f47860612331afce7a48975b9312233ba8ddf537bed"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00501-of-01024.json.gz": {"num_bytes": 399063718, "checksum": "ec94186b620037002819cd40347e6aaf67cb847848483790cd687222c9addbbf"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00502-of-01024.json.gz": {"num_bytes": 396938850, "checksum": "a218de10cee75c4bb5a7102fbe208e6e65142ba5f960ecdc2b56b6f85fa30840"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00503-of-01024.json.gz": {"num_bytes": 394631309, "checksum": "8189de9454986f63253fa1ad44c63d5c2f692ff4bc3a848c7c2fd02e08f4e1b9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00504-of-01024.json.gz": {"num_bytes": 397884411, "checksum": "b7b268545c27573840bf8a6abb7361c209f92f9b5f0f8028fffd49b0c773854b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00505-of-01024.json.gz": {"num_bytes": 395784113, "checksum": "b9f1610be9f045c15e43a7343bd2918743a71585a7122a4e781533dd39a73132"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00506-of-01024.json.gz": {"num_bytes": 397939195, "checksum": "f07b77d1be71c5922321e8683140f9a63a90903f1fbd1515d908807e12fc4597"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00507-of-01024.json.gz": {"num_bytes": 395925741, "checksum": "23e9927e9e83fd03e9d99c3fac05f1bf63d6c296a2b02d1aa208798d27d8dc1c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00508-of-01024.json.gz": {"num_bytes": 397426015, "checksum": "f4b8a74c610cea50a6b144337f65fcfed11fff21df6683503f25d4b82e29a4e4"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00509-of-01024.json.gz": {"num_bytes": 399072341, "checksum": "c3069ae9658273cbaeaed1730f171837c8d3042e31d1093cf0f519f601309a41"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00510-of-01024.json.gz": {"num_bytes": 395859781, "checksum": "e5863648f64423397ca1a7838df18aeddbb3d5d3a2551321fd99a480508fa86f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00511-of-01024.json.gz": {"num_bytes": 396948832, "checksum": "a2209ec05a794f083cf163c102c6ddd8d5e5627674686950e17e586128a81e60"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00512-of-01024.json.gz": {"num_bytes": 396585426, "checksum": "1c6fdb002dab490e6ddd7fe6023b2124bb944b7ebe95ee3b7faca9a92f4b5de3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00513-of-01024.json.gz": {"num_bytes": 396789970, "checksum": "83b02c0cf9ffea9d021adc102269c30a33ab3a803d331ba8d39aaa9b3b7acb43"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00514-of-01024.json.gz": {"num_bytes": 397131474, "checksum": "783f25460641cd3532c3bb3920c7d3f0c68b5e674d44cba33b1ed755608cf8ba"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00515-of-01024.json.gz": {"num_bytes": 396127068, "checksum": "61e5b9947f77d929442f23fe84465d88044631aa1eb6438a0b86372cba7286fa"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00516-of-01024.json.gz": {"num_bytes": 397526020, "checksum": "539b032f528d1ec3a8e8420514ef2118f05482297b052f6d28876a8bf776a080"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00517-of-01024.json.gz": {"num_bytes": 397748661, "checksum": "03b85a51aa7bcde672cc017fcbb0f11976cbd1447fc0ccb4f4bc822b2b04b27b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00518-of-01024.json.gz": {"num_bytes": 397915751, "checksum": "80dec6dc7d15459c113c16f23978c38cdc1157ca18468d8a00e0d2192bb2ffd9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00519-of-01024.json.gz": {"num_bytes": 397847480, "checksum": "7125e7915fd03c6312cfe448e4e7a8629249765c13d8558b17c240c2aef713b4"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00520-of-01024.json.gz": {"num_bytes": 396232144, "checksum": "27974f9766c18fd0b652c94eafa3493243c8e1b25b6e850e857ab6246b193b48"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00521-of-01024.json.gz": {"num_bytes": 395111538, "checksum": "61406e92a8f9a6ab800b3dd25cbac842e3487a4c7db7b1bb2070a41d627367a0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00522-of-01024.json.gz": {"num_bytes": 397690206, "checksum": "b2e29801d120132a5fbbd3662a54290e46ff5e178b3146ebfc2169facf72e7e4"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00523-of-01024.json.gz": {"num_bytes": 398274007, "checksum": "79905dbc45756c9f1c225120709d39cbf3caf435e322a531a4add690a1d0440c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00524-of-01024.json.gz": {"num_bytes": 395689218, "checksum": "1dc3086cb869abb13862970186f6a77cb29b687cd49518173f639c148d937f6b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00525-of-01024.json.gz": {"num_bytes": 397979085, "checksum": "6958bbc6029c00229fb0059d016a6b7a2bd21cfdc69392893423d2657c35c7c5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00526-of-01024.json.gz": {"num_bytes": 398473877, "checksum": "895f42c4e7569f0db3832af13e56499f65fff74e93fc0cdf60c1c4b4b08881c9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00527-of-01024.json.gz": {"num_bytes": 395879939, "checksum": "e84e72048b56878b1ff904ee83d92c208e15b16663b99a9d763edc23c2e0e55f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00528-of-01024.json.gz": {"num_bytes": 396472889, "checksum": "badcc3cda339c61936591e9333787ea032c42d7ff2288fdaff791bdc8504ce96"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00529-of-01024.json.gz": {"num_bytes": 396983038, "checksum": "ad20643f9d50c7c508fa136ceed0039ce39708e0e7a5e743c1981f1000bc3c4e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00530-of-01024.json.gz": {"num_bytes": 395774249, "checksum": "9453fa3fd296150b436f0146171ea8317512c6735ee9434622a83765a5d9e310"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00531-of-01024.json.gz": {"num_bytes": 396171120, "checksum": "3e3c230ab6beda13e4dd4747c7c6291e57b1ccb4a96ac2edb46ffdb4c3cb05b5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00532-of-01024.json.gz": {"num_bytes": 396200411, "checksum": "e9b52c3dad233fd1c4310cf5f76c2e6d0788ed084abcf931f99ab7002976d75b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00533-of-01024.json.gz": {"num_bytes": 395580851, "checksum": "e135cc4420d9f4d17ab523f7db8c559021a46a9a6bcdd21a6c4075047465906e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00534-of-01024.json.gz": {"num_bytes": 397459281, "checksum": "bb4f32ee1c1bedf4582b0f4f9ec7644be73fa25bf18cca7506e3c26e98818bad"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00535-of-01024.json.gz": {"num_bytes": 397344480, "checksum": "3766ddf8313c5cee08a575fa96bdde06a5b293f1964e58293ea583d72bd18e20"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00536-of-01024.json.gz": {"num_bytes": 396588089, "checksum": "56d236a4250f9488d80b93c0c005962d018da256ea5632c7e16ae26c54188749"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00537-of-01024.json.gz": {"num_bytes": 397606873, "checksum": "d7ec24ef99de2769937b89e0ca7e291eca2bd0438d501d9228d5ab035f49d83e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00538-of-01024.json.gz": {"num_bytes": 397608864, "checksum": "1a60378a0f1a200b11f85577bbd0f373ae47022eab16fad53da492ca1ed35bfd"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00539-of-01024.json.gz": {"num_bytes": 398377669, "checksum": "787d263107eb09e852b015c17d1d0f54d8b93e78292c0c1e60cf99f27535c608"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00540-of-01024.json.gz": {"num_bytes": 398516980, "checksum": "dce03ef0813ef66e27df8730da7e341b49bf7e684bffd3a9cf700905501d1d72"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00541-of-01024.json.gz": {"num_bytes": 395557685, "checksum": "e4035222d65124bd3e33372b76b65c2dad9e696701607ceeb5968d483595645c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00542-of-01024.json.gz": {"num_bytes": 395725875, "checksum": "4e7ae0b1c0c4d514e0208e21336d095fea5970475077d6690a917faadb2b72b4"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00543-of-01024.json.gz": {"num_bytes": 397625187, "checksum": "a96ac467b6ace74a08f7dbc4bb8e3fc57fae36abc8975d6b60a7b7353ca9ca88"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00544-of-01024.json.gz": {"num_bytes": 397078230, "checksum": "337470c84cde5d02bc6a89003a6796de9e63db269e7800637ef2d220d75bd3ae"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00545-of-01024.json.gz": {"num_bytes": 396145060, "checksum": "da65d66aa4cfff77c754f8017eedd92cb82494b9425c2d5c5491d64603b2231e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00546-of-01024.json.gz": {"num_bytes": 396093007, "checksum": "399f7b70d1c1b45ce315f396d5fa0db2c69e41c522b0514e19bcc6802b953b1f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00547-of-01024.json.gz": {"num_bytes": 397457696, "checksum": "47fc8fd82271e6b1fb074512da45dc005e22cb7f0aca3b7b621ea87613aeff9b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00548-of-01024.json.gz": {"num_bytes": 396246097, "checksum": "3108770b39746852d7c048d9a8777722480505bbf4592732c7d1f231e2505c55"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00549-of-01024.json.gz": {"num_bytes": 393096516, "checksum": "9bb2b88775593afe4060349985ff4417a37f1ba9b4ef33399c58644c01a92b89"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00550-of-01024.json.gz": {"num_bytes": 396631619, "checksum": "cbb55d645d145ecc2ff9b96524463f82d5548c0bdf42381fc6faaad256e7ead7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00551-of-01024.json.gz": {"num_bytes": 396806780, "checksum": "ece03d7f12daa39473b6b8d5faed08a3f751efb9b1ee99f69c5188633d4a0f43"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00552-of-01024.json.gz": {"num_bytes": 398608968, "checksum": "7fbbde9c39d67d8d7f9f16c0848188b743c6ff5bc44e6339d5fd88c32e1aafef"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00553-of-01024.json.gz": {"num_bytes": 397696672, "checksum": "85f9c5c5fbcfd06f715b520a1a3a63a014b1831d2f65de5f02cfea49a18ddf63"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00554-of-01024.json.gz": {"num_bytes": 397122204, "checksum": "78e3d43c3d2b71d8483788a085cd5706648767de7a2fc4aab707d6a05257ff00"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00555-of-01024.json.gz": {"num_bytes": 398704893, "checksum": "113e5fd99ada6ca96c086487b6e4012bad711d1d482d580e22d3af5b9d118572"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00556-of-01024.json.gz": {"num_bytes": 398099675, "checksum": "c7a816f8f2f74b4554ac17ffc41e67ebbcabb7c8b0c94292b4569bea372bea3d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00557-of-01024.json.gz": {"num_bytes": 396538561, "checksum": "7af6d2c9886481a0d393e026739b5ad7d0fc358ecc216d2fc124160402d4b50a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00558-of-01024.json.gz": {"num_bytes": 397660839, "checksum": "c1033428189671d4e1ba55c822040f307748c6ec31b80be3e4ed8e7a4325066b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00559-of-01024.json.gz": {"num_bytes": 398754128, "checksum": "69c9f88840166363f2b7ddaef05ac9d10441fd184d8451abfde76eb105572342"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00560-of-01024.json.gz": {"num_bytes": 394988981, "checksum": "a2dc4fc315a0db8f1a868d631d2941ab2806f44c2ae698e94bb7e8308bd67c70"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00561-of-01024.json.gz": {"num_bytes": 395801300, "checksum": "dc1b2b4594e3fc7f8795f7649d1c524405edce56d617f1e214692565de8c8937"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00562-of-01024.json.gz": {"num_bytes": 398322250, "checksum": "c23404fef6a6b5b887cc2dddfe341e983939ae36078d62842919a3739c96b43a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00563-of-01024.json.gz": {"num_bytes": 397584845, "checksum": "c909fe429772c8198f904496ea6cf239d669c6c787889cefcb7623e08a988db0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00564-of-01024.json.gz": {"num_bytes": 396436964, "checksum": "8e7cb1863057a3b9929af4da29b4e1cca1f71c254f5eba91a657d9e8c1fd6dea"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00565-of-01024.json.gz": {"num_bytes": 396486039, "checksum": "23ba56e78c4edc4d58fd7fbfcf784b29037204a641e43a9894c95c68bdb982fc"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00566-of-01024.json.gz": {"num_bytes": 395358745, "checksum": "71259a300ff096b49e3461c91824a8185037ca85ef2018dff2617f335ab304b6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00567-of-01024.json.gz": {"num_bytes": 396405726, "checksum": "d9b56ed523376681dd81cb9831727467461bdfb87c80d3932937338370093033"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00568-of-01024.json.gz": {"num_bytes": 397509797, "checksum": "c650aad13a48d5b0c51162ad19c9eb3135559d0a3318dba701a90e8138a8cd24"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00569-of-01024.json.gz": {"num_bytes": 396514261, "checksum": "d71e4126c2deffae8ee55077cee9dd2b70ce27adec767bce06e02afb23b42416"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00570-of-01024.json.gz": {"num_bytes": 397072833, "checksum": "519a32e1bdf7f5b97e1a438242a79218317e04e44021dc61aa65c526d35ce8ed"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00571-of-01024.json.gz": {"num_bytes": 397170114, "checksum": "919a9659156cafb26b87190fc00b9d33c4fd536dd35544cbef8e5ddc018ae365"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00572-of-01024.json.gz": {"num_bytes": 396475017, "checksum": "3d7e4e548f01c9ad5fc99b4342cbf9a9004737058dd93aae8b7d95b2c00856bf"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00573-of-01024.json.gz": {"num_bytes": 396749955, "checksum": "032f8e37328c9f0fc046e5a6ff5a79cbb744f3100c4cbea78e397c449471bb10"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00574-of-01024.json.gz": {"num_bytes": 396036505, "checksum": "8e795341527712be32a69307ce8cbd2d6195c6b2fea596d326a279734505198e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00575-of-01024.json.gz": {"num_bytes": 396722381, "checksum": "45a43576cfc61842bde146eaa566b4f22a128c3c2eb8f30c59a6b6cae4bcd4e7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00576-of-01024.json.gz": {"num_bytes": 396163377, "checksum": "38429d2d6176ee42ddd495e052c01735a9a7f0076cde107d24a0a9c7a26bf2a1"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00577-of-01024.json.gz": {"num_bytes": 396813305, "checksum": "eae77c319bba236feaffc9f74eaa38e911fa48eb06f4794c9b1a6d17edab91a7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00578-of-01024.json.gz": {"num_bytes": 397797226, "checksum": "1dd2b3d7e99fde8903bc12625568ec4fc6fe653737b3af5e9c71432e311cf5f0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00579-of-01024.json.gz": {"num_bytes": 396012631, "checksum": "d9322e66701b4ada3788b91a07e87b03af6c91eb4cfaaefee23c0330987a1840"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00580-of-01024.json.gz": {"num_bytes": 397943129, "checksum": "23deb32e1b0f07a55a5cf1572cb8e313ce716c748a07f58bd90cbae97290d0a0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00581-of-01024.json.gz": {"num_bytes": 397614648, "checksum": "6193f8b848c7930fc04b9f2429dbccf36f1b291271b3eaf646c655433bf3ff9f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00582-of-01024.json.gz": {"num_bytes": 396659280, "checksum": "40997ef02c7040356cd1c5acd8e6a5121e00b31253713cad4f529ab2922affc9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00583-of-01024.json.gz": {"num_bytes": 397686445, "checksum": "5cd21271e4ae036f8d1e0c320330a6c93a8b1ffbb9293a80c56c2d7f123f9ee7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00584-of-01024.json.gz": {"num_bytes": 395500815, "checksum": "c25befb7c735b2340b092a04375d2109c1b876d2b0057dd8d4ed4beac87118ad"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00585-of-01024.json.gz": {"num_bytes": 398413461, "checksum": "073f632e95c218fdf17274fc21915c94f56bdfbb58a6b1a0550de249ce4d2129"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00586-of-01024.json.gz": {"num_bytes": 396849745, "checksum": "647cbe9bd7709c0d8a01485096fd88ad0fc09b27de324eae141a8d841536b71b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00587-of-01024.json.gz": {"num_bytes": 398567154, "checksum": "557af97a8d2b2656149bc25ee5b362116d173e6a48911b860ec10d512b4b763d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00588-of-01024.json.gz": {"num_bytes": 398086388, "checksum": "9e9afa15ee3534e497c9fc7c8cd967388183193dade3d1ec82a8e2b0e82c5118"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00589-of-01024.json.gz": {"num_bytes": 397335823, "checksum": "ed8a1d0b9c55f465b5d4a4e5ea022f6d17aaa8b82569be7cfec55629c1bf26c6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00590-of-01024.json.gz": {"num_bytes": 394931693, "checksum": "3fbe539fcf64f0d914c19b383de9953b0605d4a69f48801145f0db1972f9c6b6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00591-of-01024.json.gz": {"num_bytes": 397828770, "checksum": "9165de8866384d3d03c3876c39c96706e33a24b9f95acc09999c2dbfb85cd9cf"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00592-of-01024.json.gz": {"num_bytes": 398782493, "checksum": "433a9cb730d7ab024b56ad662a3ea53633f7ff26c625051c4c02f252beeb87a6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00593-of-01024.json.gz": {"num_bytes": 399264489, "checksum": "4a7e5f40aa8b692cfa0519d33a868e9a05e579ad430204bc13c48b533eadc5ce"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00594-of-01024.json.gz": {"num_bytes": 396629833, "checksum": "521d5e90550dbc97ab26a18a0b75da81e38ce2083ff5fd93340fded2e54e1ca1"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00595-of-01024.json.gz": {"num_bytes": 396916313, "checksum": "30c9be1d99ce0a41b214fdbd5115988c82ca317d4aceb30c19fbca05e0a409e0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00596-of-01024.json.gz": {"num_bytes": 397013253, "checksum": "b16bd9d7d893b4a71056575fa0799bef96120c03cfc6e2a88c292469a67f2614"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00597-of-01024.json.gz": {"num_bytes": 395980036, "checksum": "3bd15089b6fff342df2b3109d7ebadca35cead4f44ca5b1b55e55d8892aab82f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00598-of-01024.json.gz": {"num_bytes": 396295935, "checksum": "6252d951a9570baea9767cf3350a6d09ac5a5fc34ba80eae3b5c40adb8361ab9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00599-of-01024.json.gz": {"num_bytes": 398608239, "checksum": "b265a385cdd5e64d1fb2ffce739e72f2fe2cc8944621f20e2084dc52b91cdd9d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00600-of-01024.json.gz": {"num_bytes": 396563743, "checksum": "43d12028cbe738e8f450911f6a55dcb00f8742cefc2a2c4da5f9e9220b0572c1"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00601-of-01024.json.gz": {"num_bytes": 398256993, "checksum": "9368dcfc581e6d572d899ef25b129bc0268901a2fa009500174a0985bcf330df"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00602-of-01024.json.gz": {"num_bytes": 396202546, "checksum": "3cc57d7afd161fcd411f73da8369d98db4c6d8e30643ee01450adef21e8ea3ea"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00603-of-01024.json.gz": {"num_bytes": 396338425, "checksum": "cc21fc5b8ed6e5115bd8924954d685ed52cd5b773ab63d37188343443c95851a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00604-of-01024.json.gz": {"num_bytes": 397597307, "checksum": "d24f6d807ae35037e695e19917ed446f74448166fa464c862e31fe7ba2bea196"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00605-of-01024.json.gz": {"num_bytes": 398278313, "checksum": "99166183c752aed8d0f2cc9c010f1ebdd4fb93d40e936fd6c082eb3542baa956"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00606-of-01024.json.gz": {"num_bytes": 396590468, "checksum": "657ce79340c15524a5897459a6cf712fa4127def2445f7eb3de21c9b46db3794"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00607-of-01024.json.gz": {"num_bytes": 396603228, "checksum": "3705441435f18d1e4aeea9e794e1216fcd29b48213763a554808e3d3697951a6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00608-of-01024.json.gz": {"num_bytes": 397280580, "checksum": "be0bef2c16e9bdd0387276402dc99fe5a9a0a7a105a44e88bdb783139f2de474"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00609-of-01024.json.gz": {"num_bytes": 398284528, "checksum": "3a7c7a8cb01f6d7589152a1483682a5fa99e119490f3e70d8a02f582f2e2b19c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00610-of-01024.json.gz": {"num_bytes": 398872039, "checksum": "c349aac5b64227397ec2870992ac9e4fac9fe39f1fd4e0a7b8c727e171655e14"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00611-of-01024.json.gz": {"num_bytes": 398736440, "checksum": "63ca5eb2d27632b3b4dde8e40f9925e71e21ef737262bcda7a99324a67e0fab5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00612-of-01024.json.gz": {"num_bytes": 395170895, "checksum": "3b4bb3e14ee981a9edb9828ce40b86b5d83dfafcc1a5e0e02642cb40924bd6ed"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00613-of-01024.json.gz": {"num_bytes": 398443337, "checksum": "e95adbd7d55024b7e62145860f217a6f04f5fcef79ac23e92dd9e14f9a0b2a30"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00614-of-01024.json.gz": {"num_bytes": 398854661, "checksum": "def8cb789f8f79fa169e855816c5e4bc7d5c253e565502691a9abb826d7436d4"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00615-of-01024.json.gz": {"num_bytes": 395505189, "checksum": "6775ca6aa4f834289396a438906b90936ed0ff6390213dac2b0861f40d7761e7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00616-of-01024.json.gz": {"num_bytes": 398999454, "checksum": "6cd5efddacb09cc80ec1eb79f93b562044787903b3cb1c879be2acec64a9dbdb"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00617-of-01024.json.gz": {"num_bytes": 398570431, "checksum": "26d1f587377446e8b1499be7a3b6776d437baa40353fb04c591203a420eb0cc2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00618-of-01024.json.gz": {"num_bytes": 397064982, "checksum": "e59a87fd1cd3d87fff4b15c3a9331521d7587ac7f4a7fd51ec3906b484ef9ad0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00619-of-01024.json.gz": {"num_bytes": 396676338, "checksum": "8077c3a15d93579d0fbf00bd9d117bf4f50092c5be3acf46c7d4433ef7be9dfc"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00620-of-01024.json.gz": {"num_bytes": 398186471, "checksum": "ee3fb91d7797ebf1daf8dcb81563b7dae7b161d97732efd35e3eb6ebea732ee2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00621-of-01024.json.gz": {"num_bytes": 396467968, "checksum": "386adb83129a7306ef4da37c1cbedc39b3971e7633d516d406a982f307577e67"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00622-of-01024.json.gz": {"num_bytes": 398293882, "checksum": "b708cad0e04c56174d0feec84d7224a4490cb8db023d38e57398cad89b78568f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00623-of-01024.json.gz": {"num_bytes": 397396780, "checksum": "c50c4568c6f103b3e6a3702cbd915ecb530df954df808156bc38a98f36a0b944"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00624-of-01024.json.gz": {"num_bytes": 396971282, "checksum": "11351ef83c9fb883d6c0f484af5c10f0d686b7ac4a2f08fae9ac3d9837df0a0b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00625-of-01024.json.gz": {"num_bytes": 395882440, "checksum": "dfa97ea7949c9bbf7af43d43ac5c8d0034bdbd1ad572895159b7c7846ab89676"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00626-of-01024.json.gz": {"num_bytes": 398292846, "checksum": "fbc9c23dc286ad6fd7f01f344de97ef5789733af581de278488869bd36f3b246"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00627-of-01024.json.gz": {"num_bytes": 399890427, "checksum": "f43bbde36b8bd34ed9998b99b42c85434b8bbc8bbaa1cf5b38cec6393099c23f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00628-of-01024.json.gz": {"num_bytes": 399589466, "checksum": "c50058a4937912b678d33d34ff91e2287e8701365f4f71fce61f9002652556cf"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00629-of-01024.json.gz": {"num_bytes": 397355095, "checksum": "051c4631d0587b6f65827410ad2f2121c05c849a009274415bc5e7f72db42d44"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00630-of-01024.json.gz": {"num_bytes": 397860559, "checksum": "07b48a86a8a3245fe5b78f6943c8970c839942b8d86abf173507225b0d1520d0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00631-of-01024.json.gz": {"num_bytes": 396161304, "checksum": "70a03f0308105de5266c4a40803b51f99888b362b71409719b7f71f73761b590"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00632-of-01024.json.gz": {"num_bytes": 395620184, "checksum": "c6923984c419f08bb4e6effc27dd25dd986513034338debc9b238592dad9f607"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00633-of-01024.json.gz": {"num_bytes": 397572527, "checksum": "900fc701703234031e825a1eb2d11b364f1dda97eb0c7943e17ef278695f7bea"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00634-of-01024.json.gz": {"num_bytes": 396215174, "checksum": "0cc838e395581933123fc57c6690afbdd2be1b67d213336d9b8c08b3876f8458"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00635-of-01024.json.gz": {"num_bytes": 399176005, "checksum": "5a3daa1bd0be8c997da56257f063a7d1c7b2b271648a46615b26ca4beeb42863"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00636-of-01024.json.gz": {"num_bytes": 396035356, "checksum": "9d21ce1c8b5a7c1330cc95b1f45286fb8578d5dcec0686724ff6e25a97f38a7e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00637-of-01024.json.gz": {"num_bytes": 397214839, "checksum": "83cd34e1ba09c268b515fda7699e12bfa2531fb7e60e2f861946ffdc01e54a04"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00638-of-01024.json.gz": {"num_bytes": 396292535, "checksum": "82a7bae9a7d35fa707bcb6d90f7b244f1509e112dfdbd604c9be1f8b8ce7150b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00639-of-01024.json.gz": {"num_bytes": 398009954, "checksum": "b6d7ebd102c67960413caf5fcdc5b4aea728b6d3d6369ab8dd3cd6bee6c769de"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00640-of-01024.json.gz": {"num_bytes": 397558496, "checksum": "151c55d019fd84fdc0eab73d24984e5d88ac964c86f89a361a03dc776a22b5b4"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00641-of-01024.json.gz": {"num_bytes": 398031508, "checksum": "e0e87304a8ac408adca2badf2564ec52caf155295ea303a121c30f3b1ce797b7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00642-of-01024.json.gz": {"num_bytes": 396594124, "checksum": "73d08c99b6b96d96b82d88267b2a392a7dda2084ba5142b8eefd0d23212702d5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00643-of-01024.json.gz": {"num_bytes": 394552252, "checksum": "ebccf3b935d63c30f626d317af250b6bd0f04ef5e1cced829287ba64fbb0d25f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00644-of-01024.json.gz": {"num_bytes": 397586341, "checksum": "674c0965a9a880c057b6f2dbb785a4a6ae048954d44ba4f5266dd5e65095d06e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00645-of-01024.json.gz": {"num_bytes": 397950976, "checksum": "7ac8d4dacd682a2977818f01d860c3dfa5a5e5a78f7d2d95be0353a675452e93"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00646-of-01024.json.gz": {"num_bytes": 397511840, "checksum": "452a9cc03facf9151552f914f9a8a3507a96fd8ea40f7d04951a29ecbf6aa1e5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00647-of-01024.json.gz": {"num_bytes": 396692070, "checksum": "5a795a238203444596c711bcedc634e653e5240c9a800a9884c51f878340b494"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00648-of-01024.json.gz": {"num_bytes": 392707626, "checksum": "9cc366c37950624df6af318ee52a97d32a40e278fcb519cbe8545b04bee3204e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00649-of-01024.json.gz": {"num_bytes": 396283284, "checksum": "4ddeec31a30b5c563838b17e1115ad30041e08c70a94f299ea324ee4b71fd82b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00650-of-01024.json.gz": {"num_bytes": 396349662, "checksum": "f5bc63114ec9d73d6cea7f8e38a95031ae2bcde849b27440afd840a3e72aac13"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00651-of-01024.json.gz": {"num_bytes": 397187042, "checksum": "7199c0242b2654509af187c9c8bbfc22cc5067aafa1ff69949b1f0e5b718425b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00652-of-01024.json.gz": {"num_bytes": 396263026, "checksum": "c9e62b6df7213ea5b71913fbf736403f33c51e5a868bf1035cebcc39d80635bb"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00653-of-01024.json.gz": {"num_bytes": 398689010, "checksum": "f3bcc9eca4d71043e920db6399a032f916c23b1da329d2ef86434a74f8e7b318"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00654-of-01024.json.gz": {"num_bytes": 396938678, "checksum": "fb41df26e1f68e1e9d12ae8740535ca66e80910320be2270d680fec40d6fe9a7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00655-of-01024.json.gz": {"num_bytes": 395995226, "checksum": "018b40ddf6d88c4c346c8018439d16f6ca66ee0720970e84ddc34b1010ae35d7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00656-of-01024.json.gz": {"num_bytes": 397860049, "checksum": "8f3847e9bb5a8145e2959b340f86cc06f85e6646f32d5d785c5c90ec11a9f404"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00657-of-01024.json.gz": {"num_bytes": 397142407, "checksum": "a1ae8735a39bd099dac2e50c22e312f1a010f2644774ef53c995f3437c0a5524"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00658-of-01024.json.gz": {"num_bytes": 397827609, "checksum": "f6154377cfff2453392fb899f81514a7c0ffd40dbc35d8842d61a115d0aeef35"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00659-of-01024.json.gz": {"num_bytes": 396861858, "checksum": "4299633524667921549573c469a73e33abae89d107375d5ccc6a6d987c2a2a26"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00660-of-01024.json.gz": {"num_bytes": 397773823, "checksum": "44eaf6c1739d8a9c13c54750c473ac04aaf9d2223d8893cd8094f1769b1f6f8c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00661-of-01024.json.gz": {"num_bytes": 396311257, "checksum": "18edb60444b660c7cc68dbe59ac71989be0e20ff13639725a5f05e4d4d512514"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00662-of-01024.json.gz": {"num_bytes": 396176936, "checksum": "7b60541181fbb92f361fbdf0bee80d086c75279610aab792a7b3877d49a3e1bb"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00663-of-01024.json.gz": {"num_bytes": 396274985, "checksum": "59e057ee5f5e8c7267138c18c5c88f3ca24d30f86c484e4bb0c0a4eb5169c4a4"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00664-of-01024.json.gz": {"num_bytes": 397483935, "checksum": "585f45d3ac3f88c3bf1c86e01daa46537f8f5c5165521412de0e67393cb6da33"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00665-of-01024.json.gz": {"num_bytes": 398831104, "checksum": "e403d2f4ff6e74abc9639749f93f77cc868453908c10821fea7fafdbcc981a06"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00666-of-01024.json.gz": {"num_bytes": 397668116, "checksum": "f9bbafa396a466b24630a259a01804b2857c1dde2fa3cec60b2967a88ad9f528"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00667-of-01024.json.gz": {"num_bytes": 398123165, "checksum": "ed693d5ecb9dfcaf545e831b5769b877e927125794cae61a0ec7821c3c85dfe6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00668-of-01024.json.gz": {"num_bytes": 398152096, "checksum": "51c33c07d503743704f564bc6a372c2f6f8f13a1ddd00b0b9a2c44c94cc57444"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00669-of-01024.json.gz": {"num_bytes": 397927981, "checksum": "d356b5268ba39e38ffccd20e95803f3218407e0a1ca3b4d1165ff82796ec1bae"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00670-of-01024.json.gz": {"num_bytes": 399074605, "checksum": "bb96ea8154ae01275a9197709820e670c4e6212c740e92a7f1cfb7c618a49bea"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00671-of-01024.json.gz": {"num_bytes": 397864381, "checksum": "afca3dbcaefdc368e996259fd595b77fd98a885ec005a93069a01b83227c827b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00672-of-01024.json.gz": {"num_bytes": 396077133, "checksum": "3da96ebd1b28b55b03bbab8e85f78295cffdad9020f869cb456da27058ffa090"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00673-of-01024.json.gz": {"num_bytes": 396943842, "checksum": "6a4c344a8af68a95e20d58b64fff8fe616c2a406cf26f642cdfea65fce5883d1"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00674-of-01024.json.gz": {"num_bytes": 396975969, "checksum": "e6b0f7727d78143fa180abb76e617b37660b35f6323f19bf1dcbc78fb9374508"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00675-of-01024.json.gz": {"num_bytes": 396692800, "checksum": "e4ed97b19c6d83e618a3fcaff75460d828ca419b1e62842a1493b0ec4c9703e5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00676-of-01024.json.gz": {"num_bytes": 396514400, "checksum": "a5672f1561ab85f071395de43e702791aaacff77a9f67f6ec9e14b12aba675b2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00677-of-01024.json.gz": {"num_bytes": 395939125, "checksum": "3dacd3bb90b5e645d1b9a962d8df87f571b0fcf227996068535bb98a68f9191d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00678-of-01024.json.gz": {"num_bytes": 397022852, "checksum": "c1a0ef31342161369b7fb709be17e3c86191c1a52cb04b704fc58190818302c3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00679-of-01024.json.gz": {"num_bytes": 398325372, "checksum": "47ddd1056ad977407f61b2eac3ff803d17b1aa8fa0719279bf911caf49bbb7c8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00680-of-01024.json.gz": {"num_bytes": 395502228, "checksum": "cbb93f322d684ed558cbf8d92b9f83958ba772fe4177093a334b4596343f3cd4"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00681-of-01024.json.gz": {"num_bytes": 397981781, "checksum": "9ec2dec493733846a1ec9f68ff5130cd461d7ab9c07b22d4aae94463bcf03146"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00682-of-01024.json.gz": {"num_bytes": 395265758, "checksum": "7731cb9a2898c730a650e5d1b358886ed562228928aefe55d991cfaaa61a9a99"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00683-of-01024.json.gz": {"num_bytes": 398783283, "checksum": "6f2bb48070e809ac17fc90e1117d63bd8c7cd0079d9e44c9f262c4ce60f5d373"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00684-of-01024.json.gz": {"num_bytes": 396160769, "checksum": "fd07413637b97b68cb3a7a6cb86c4656017b7841728e806485ae196294e79f8c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00685-of-01024.json.gz": {"num_bytes": 395594461, "checksum": "939925a9169da729891fbeef926f420b80bcc60e0f170bcf9a2095449a22d424"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00686-of-01024.json.gz": {"num_bytes": 398275260, "checksum": "13836c45719ba10f2d581cf17cdab1daa4cc207a49db2b4786b451605842ac4b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00687-of-01024.json.gz": {"num_bytes": 395256765, "checksum": "0c0d0e6c1e3cb9a024c184a8510066a005c031a15af74d117d0e736a358a91d0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00688-of-01024.json.gz": {"num_bytes": 396635904, "checksum": "2462e084563f8b8de68c6e826289949ff8ebf8cfaf323344c07ab93e56373539"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00689-of-01024.json.gz": {"num_bytes": 397749444, "checksum": "d03746220f3374c80102ed39d8f6ae0daec40fc1b23312c08ecdee82a65ac6df"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00690-of-01024.json.gz": {"num_bytes": 399380060, "checksum": "217d032ecce8d0b7e448befe83aa051a3bfab8cb0e167d043b6abc833f5e9b4a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00691-of-01024.json.gz": {"num_bytes": 396975651, "checksum": "354fe9bc07aefc55cbbf8752f53ad69d45761da928bc8deb6fee1de9e244e93e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00692-of-01024.json.gz": {"num_bytes": 399720848, "checksum": "21f88940b6cbceefd66ea5e8d466467806370ae24a5833ca308cd840daf5ff8d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00693-of-01024.json.gz": {"num_bytes": 396787846, "checksum": "c8d28980ffa1eff4459d2fbf0043a1f8eeaf840a3b1d1ea4989b2192c7a82041"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00694-of-01024.json.gz": {"num_bytes": 397945967, "checksum": "1936570da24c4bab9fe0559826f1cc509c4ab6eb3679e26d697efa6e7e5c8a81"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00695-of-01024.json.gz": {"num_bytes": 396349049, "checksum": "8e497506f84513272a8a0694e7d4efb004b1e3b515887e3b5762f59b6c659dc3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00696-of-01024.json.gz": {"num_bytes": 394901418, "checksum": "9e1d6cc187ff67ee734bbadc6cbd57eae05634a448edfde184fa8d6fc3259836"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00697-of-01024.json.gz": {"num_bytes": 399142528, "checksum": "9584496113a8612620748aaba35e185b8f47b7c96b4ff0dc7bfdd6024a3faa14"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00698-of-01024.json.gz": {"num_bytes": 395923784, "checksum": "83a3c57b3870ed9beeaf3ec8ab694e0be458106f3128b14b2a44a036e89d32b1"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00699-of-01024.json.gz": {"num_bytes": 397137494, "checksum": "0befea64fe749d79592e337bc359bcef70ca8816d0126ebf89d4b8fbfbdcbec6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00700-of-01024.json.gz": {"num_bytes": 396554785, "checksum": "34739b543636aeadb6dcce3e7c97ca49026cc9897c13add6b592fe60e5c40338"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00701-of-01024.json.gz": {"num_bytes": 398091188, "checksum": "c9bcc7c9e91de707ee548e67452d6970af2e19bef91f966b19fa71504e5305fc"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00702-of-01024.json.gz": {"num_bytes": 396039798, "checksum": "fcda5f8ddc5ed163db84aa70c565f8181731af9a29918a2ece0436d3146d7125"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00703-of-01024.json.gz": {"num_bytes": 396889704, "checksum": "c80445d442a766d2e87ecf5804e87bf7f8b23c2238476fc2b51f657400739306"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00704-of-01024.json.gz": {"num_bytes": 399465260, "checksum": "0bb73674d579523fcbe079fbea7190138911711f023404ae46ea7b685fc09c73"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00705-of-01024.json.gz": {"num_bytes": 398579507, "checksum": "97d6fd9cea2a47913c6ee9d1e34c3440858f25f3d670cc81c8f83f2346fce6e2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00706-of-01024.json.gz": {"num_bytes": 398761590, "checksum": "2f4836001b8b80066ae09b6e385ed0048770c13ba2410e0f0309ab4b9200e37d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00707-of-01024.json.gz": {"num_bytes": 395576626, "checksum": "8e0c0c635a7a7c32d4fdb1a7906ee95a9f334a55b2ff3881cdc7d5e816a9c817"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00708-of-01024.json.gz": {"num_bytes": 395930921, "checksum": "e6978b92f333230972e2b4c31cb86b5286fb899948c7680c7a9cbe75a9d60296"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00709-of-01024.json.gz": {"num_bytes": 395734676, "checksum": "13071a3527071f06570c6cfa485073f2f3980c83cac782db6bf66a75dd865df3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00710-of-01024.json.gz": {"num_bytes": 396501107, "checksum": "6562cb3675a42a58b8c8b2a232043adf532fe49420e30c3c237a6d8889a8de30"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00711-of-01024.json.gz": {"num_bytes": 398422179, "checksum": "f38b59c4739d3c15e5bf5dbc0965d1a5dcc0f49a3c89eb7a6822003aaa1ae7c3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00712-of-01024.json.gz": {"num_bytes": 395905103, "checksum": "500b4914f3c42d5e24ced7d36dbd3143c49e4fd5dfc3d53a172d1a55ae738889"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00713-of-01024.json.gz": {"num_bytes": 396009909, "checksum": "4f50bfa762db1435a89195fd180615e9f569c1668e128d343c87c40ac5cf60ef"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00714-of-01024.json.gz": {"num_bytes": 396963447, "checksum": "fd9eea7dfb93916a3798a8b69d29fb5d4bf0fec448b8a24427f729e7a41205e8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00715-of-01024.json.gz": {"num_bytes": 397474378, "checksum": "3c61bcf6f24e21d2584bb4ae008230540d9a375e35f3c4ba1668621b80d85c5d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00716-of-01024.json.gz": {"num_bytes": 396285471, "checksum": "c554e562a369d9696219ea8b0e363907c50f626d7c410a26515e07de801da74a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00717-of-01024.json.gz": {"num_bytes": 394827995, "checksum": "f8b4678c21d93c19d50cb576f0910050d24dfd606238bbf8013c45f98defda12"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00718-of-01024.json.gz": {"num_bytes": 395517823, "checksum": "1bf63affd6914d98e197b6e1ce526cae7754ecdc750184154d3cb8e3bdd21a9d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00719-of-01024.json.gz": {"num_bytes": 395561934, "checksum": "c04b162d984ff2ada9f39aa6c0fac04a1531fbde05175f856d2e3ca2797a448a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00720-of-01024.json.gz": {"num_bytes": 396227762, "checksum": "25da2ac7c1f3cbc361807f67e8826ffa95f4caa25f81f66832cbd0a08f1a51f5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00721-of-01024.json.gz": {"num_bytes": 397716450, "checksum": "28180c6396deaf34e2a197f5cad1b53ba1c9532db8b5c21dd7d81332b2793181"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00722-of-01024.json.gz": {"num_bytes": 398022279, "checksum": "9c3a8038a7f9431b90f67ea0d3b77353d0508b09865f49af575b6aaf5e32d6b7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00723-of-01024.json.gz": {"num_bytes": 398064523, "checksum": "4b18959f604bd5f379a73b52947261cb8d63f2243f5afeb5807a13669ef4a800"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00724-of-01024.json.gz": {"num_bytes": 394747045, "checksum": "615f13a1b2a6942931519b7a7f6aba286f6045aad65b041c2c6643ce906de1a6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00725-of-01024.json.gz": {"num_bytes": 396726374, "checksum": "4099a416eccbb56818efda68bd027c993c1a5fa1a8e722bc268041fd3f804cfb"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00726-of-01024.json.gz": {"num_bytes": 397361407, "checksum": "152d5e2bad0de3b6b48fb26066891b160ea79c4c382ce6aec6047196e3b08ef6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00727-of-01024.json.gz": {"num_bytes": 395542925, "checksum": "ce1d46b0cd7d9e4075db3feab71d2f72939817ebf45819e73ec277c9cc07307b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00728-of-01024.json.gz": {"num_bytes": 396647931, "checksum": "c859626b14584c1bab396c867ad5eb11ff3af39628206b03612ee2d2b3058497"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00729-of-01024.json.gz": {"num_bytes": 398272080, "checksum": "758fbdc5bf6d66a36d69d31141742b2a917bf0341494b844f22ab82cd54e7ead"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00730-of-01024.json.gz": {"num_bytes": 395977662, "checksum": "56a7fcb59ece26d4b19be0bd5e6c2d0f05e4b1b23e8ce7b4fab064a29b229c02"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00731-of-01024.json.gz": {"num_bytes": 397530948, "checksum": "bf0f4dc8796a737daf80b977a6e3656cb1e244fc40d6df92852da45e53e6cfdd"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00732-of-01024.json.gz": {"num_bytes": 398314575, "checksum": "1862bcc85d48f59283eae56836e5598f20287ce36a185252abb24bcfbd1377cc"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00733-of-01024.json.gz": {"num_bytes": 398547748, "checksum": "476389cb582df3c214f3f5a45268bdb47b581a432c08723bd811daa5f5990083"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00734-of-01024.json.gz": {"num_bytes": 397380175, "checksum": "2b6fd36a8f8bc3edfcd8a486de44d2f3132f7b8f4bb2d4c93453dbf1a1b6667a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00735-of-01024.json.gz": {"num_bytes": 399584382, "checksum": "3e0a067fef0b40edcd23ce6680efc07253660b8c00699630bb7629b9d803a198"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00736-of-01024.json.gz": {"num_bytes": 395312038, "checksum": "e4f92413c837d269481ecc0b5d0fc87548bd2ae718ef7f9bff18674ece289bc7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00737-of-01024.json.gz": {"num_bytes": 396820243, "checksum": "e61680c57505f027ef8cbd28a45e706936befa2ab40a24a63e638019a1717b63"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00738-of-01024.json.gz": {"num_bytes": 397691872, "checksum": "d3acc0c9c76ef2df89f49896744dac53f488f830d3d42f0c481f2321ed60fa67"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00739-of-01024.json.gz": {"num_bytes": 397912166, "checksum": "18d281ed9831f28c4c54256a844ab2cff7a5b681da1b7c8eab2565b106381aa9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00740-of-01024.json.gz": {"num_bytes": 397093867, "checksum": "6a65230910384587f5e7f34b52c2a6d9a86a8b1f7a23d26f890b6e810c051815"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00741-of-01024.json.gz": {"num_bytes": 396371058, "checksum": "26eb40e98075ab716b4edec76d1723a679e648258d6812119b46f7522dfa9b07"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00742-of-01024.json.gz": {"num_bytes": 398346941, "checksum": "466043ec98eb806916806cff7495f0bae89cfeb2835204ea34328030b92a27f2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00743-of-01024.json.gz": {"num_bytes": 397366055, "checksum": "d98d31aaadf95dd0d1cf0548db515c8e77c95bbc4b611ae9ab5650429c171889"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00744-of-01024.json.gz": {"num_bytes": 398722902, "checksum": "a43c80ab3bd8d12d12b4ea41d9054b90214fd3ea2ef957f317d6ed6fa7b60e34"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00745-of-01024.json.gz": {"num_bytes": 397562514, "checksum": "1e6dad94e0f90bfa0fdc5557c58873aaa95fa9ce1c7b70a1fe76817289cff78b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00746-of-01024.json.gz": {"num_bytes": 397731351, "checksum": "21fefd6cffa9032c9ca7cec91cd775c83bbd37419ae236eeec9589f8bc4be0dc"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00747-of-01024.json.gz": {"num_bytes": 397781450, "checksum": "b84c74bf1caecf92777fb85129bb009eb3a27fbab1b97af567f36a8bf100e704"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00748-of-01024.json.gz": {"num_bytes": 397425031, "checksum": "fe9bb225f6d03b44e552ec985c844e5012e90c4ad99f699ec4ed4297db91349d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00749-of-01024.json.gz": {"num_bytes": 397925850, "checksum": "3913b2955fee02e2ba716d843559bc4bf4e85a2884ae4495446a379f857a30e1"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00750-of-01024.json.gz": {"num_bytes": 397089489, "checksum": "773486144d3008cb3207c3c8b65fe6081c9e64dda09728d3586bc82e6bb73fca"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00751-of-01024.json.gz": {"num_bytes": 394819424, "checksum": "d728b117a7b74150b03ed7d562514c2e45ccc03b0bceb120eddfa8333166a923"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00752-of-01024.json.gz": {"num_bytes": 397199683, "checksum": "6c10c3f4e3737db6a70375bd605139de61ae8b09a1aa91dd1cfdb82c183f0cb3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00753-of-01024.json.gz": {"num_bytes": 399197199, "checksum": "101c4ed5426b586a4aeeb7dbd377306eae9eec2eaf934e79d25583abff70b15b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00754-of-01024.json.gz": {"num_bytes": 396415619, "checksum": "732f4dedcf1266bcabf15a6a1cdead617ea37d428d8cfbccb5a9dd7521133075"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00755-of-01024.json.gz": {"num_bytes": 394564662, "checksum": "a23f1bb1de23554efff68e730d85802a6491936fb54e256744af641f97ec155b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00756-of-01024.json.gz": {"num_bytes": 395577258, "checksum": "2f4275994a103dca517d4eb3656009c8138930079e00303c7b8746ab6094fd19"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00757-of-01024.json.gz": {"num_bytes": 397161772, "checksum": "ab16360173283b22a7e19d181fbf55a6a8d07f0d9007b51aa159c1e81661f5e1"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00758-of-01024.json.gz": {"num_bytes": 397545456, "checksum": "ff5a6292bc557aa9895de39697e8aea5843fa5a00c83c7983eaa36640d446ecf"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00759-of-01024.json.gz": {"num_bytes": 395470957, "checksum": "66a64accfa6c281d2bdfa7b6846397f56c2d4f8a22ae8925a07af853e42f5521"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00760-of-01024.json.gz": {"num_bytes": 397328304, "checksum": "46778c90bcc6da96cf02e66956a1bcabcb9a95bad538cfc0d5190db473a278a9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00761-of-01024.json.gz": {"num_bytes": 397706141, "checksum": "4825f25d6e1d13c70e6e65ce13ccd7b1922344c48ee2806952f3ba1b6e26d3ae"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00762-of-01024.json.gz": {"num_bytes": 396983663, "checksum": "25e1645f05d342b5f872ca809b36d516c7336c22035bfa86cf295d0865e08789"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00763-of-01024.json.gz": {"num_bytes": 396355038, "checksum": "d4c3a92808f0bfb042423cd4166abc57d20603ef07a0f0912058a718a38f26d0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00764-of-01024.json.gz": {"num_bytes": 395434042, "checksum": "aa4384f587fd64c24fad9a27defb0345eb44cc536b3d45c710017d225c191ded"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00765-of-01024.json.gz": {"num_bytes": 397204482, "checksum": "cf419554f6c4f6201ebe92e7a232013e5949910f3d54f5cf3d1d65845685c7ca"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00766-of-01024.json.gz": {"num_bytes": 396420917, "checksum": "32076dd8004ebe35f46d6e790fd6330ad1d7df2b7ae3c4ede325b0da73a673ad"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00767-of-01024.json.gz": {"num_bytes": 396840905, "checksum": "08e5fd0fc1578a337f3dafdb3c718ade437256119e1968e9f958a8ea9d052c81"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00768-of-01024.json.gz": {"num_bytes": 398085225, "checksum": "3579e0756bb6cbf1eddfca27de5cf067a212d683134bc6f8c26a79b7d802bfce"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00769-of-01024.json.gz": {"num_bytes": 396879117, "checksum": "0913c93203a084521212e473d08c1d11e8136a8e37f1891330fbce0397bd431b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00770-of-01024.json.gz": {"num_bytes": 396386647, "checksum": "6c12ab51c92b9c92336a6142a1a4e2f7c3725beb7e61dcb004551d13e8d5488e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00771-of-01024.json.gz": {"num_bytes": 396279989, "checksum": "752deaefbf22dd1b1adb36561e8524c1dc555fd105bf3acb78611be9bce72318"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00772-of-01024.json.gz": {"num_bytes": 397850815, "checksum": "4f1969284d1f448caf0bff5d05eeb995cf2339801f6a71e01286f4f7f387c564"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00773-of-01024.json.gz": {"num_bytes": 399466666, "checksum": "20ba552cd30349bc8a2c0b6a8701d4587a005e7ebdf6e3f2a3bf95462c304447"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00774-of-01024.json.gz": {"num_bytes": 398051538, "checksum": "1f66196e8fbf0ebef977f235d2aacb7245f4033b53ecf75ada2f8007465a629d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00775-of-01024.json.gz": {"num_bytes": 399284061, "checksum": "97df92baa605c34ce857d380f1ca42f9e2a0de499ccaa9bab26a5c449451d1ef"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00776-of-01024.json.gz": {"num_bytes": 396710162, "checksum": "4b1ec54b82c8e5d969d3000ce547f4c20df16d9cc0b889b2b58c8839e9d8e27f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00777-of-01024.json.gz": {"num_bytes": 397265441, "checksum": "03827ccc3c5bebbd12a04019e9797945c55becabf7f9c1f3fe5353513f5c5a38"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00778-of-01024.json.gz": {"num_bytes": 396050013, "checksum": "54aeadf4fe16949b2ee9438feabe979570e7587bb07b3c57e47422f662191936"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00779-of-01024.json.gz": {"num_bytes": 397124991, "checksum": "913e268b5474a8b4cf1426f5a0a06c7f437eeabbc35f0126481328b419f85bf6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00780-of-01024.json.gz": {"num_bytes": 395196367, "checksum": "4c1a4f296916c30103a5dacacf8a167e43bb424d085ed3491b19f0ec1985d9f9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00781-of-01024.json.gz": {"num_bytes": 396578403, "checksum": "a54f26c233662299ec8f0ae1bd266879e93cf4676707b0955114a1a80e2fcf61"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00782-of-01024.json.gz": {"num_bytes": 396142106, "checksum": "3713c6b725afd833063402e6577bc0ed003a87720f700f9272864c2360bfd260"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00783-of-01024.json.gz": {"num_bytes": 396470511, "checksum": "fe9d904a07ffb2581b6734c8dd847435b867d3043ce4b4840b1c54374919d757"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00784-of-01024.json.gz": {"num_bytes": 398156228, "checksum": "af762a9ff3eeb7ed4a56f54702911f0c190b97f8efaa02cb89b1626a1c44c9f4"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00785-of-01024.json.gz": {"num_bytes": 397185035, "checksum": "6629e1827aab88f55d53de24625f8362daccf910663db8584d959aa44f8043a8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00786-of-01024.json.gz": {"num_bytes": 396556703, "checksum": "ce51603900ea0aad8981fbfa8d05d684bfef5360413dadc6933246c2dc81c413"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00787-of-01024.json.gz": {"num_bytes": 396214799, "checksum": "6eed5802b89d63eea115cbfd9e00f6d1b4970bb3600a887b904b548181a4acef"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00788-of-01024.json.gz": {"num_bytes": 397965162, "checksum": "eaa948fdaa744576f006bd70d54f129968772a479fb0bd8e946d7605857545d2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00789-of-01024.json.gz": {"num_bytes": 396280999, "checksum": "e0b80ec73507f96310abf070e5cd17d5a67ffb4a337820a8b79a02afe81a0b99"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00790-of-01024.json.gz": {"num_bytes": 396224660, "checksum": "2b4a06fb6f68c773da34f8d4c33d7746b6a3206bb242042841e5e007fe3cb6ea"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00791-of-01024.json.gz": {"num_bytes": 397681975, "checksum": "1b167c20d0414d970cda74cd357cf07d69abd1d3fb0f57222028b369551d513b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00792-of-01024.json.gz": {"num_bytes": 396210611, "checksum": "ab55128753a1e58d1032b8fd747c48158a721b12e85990627478f22b78e156ff"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00793-of-01024.json.gz": {"num_bytes": 397534599, "checksum": "e7476bde08e0065c523d09932cf2cf6ffe8ba023ae0ee435238efb5dd6f93d7c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00794-of-01024.json.gz": {"num_bytes": 396536137, "checksum": "6228922504b2d3ebeef4735abdff06cc786d6533a6c150d50f34042aeeae1544"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00795-of-01024.json.gz": {"num_bytes": 395235406, "checksum": "9dae151c15898d7991417596a364e30f00e0ff6280f1505953e6de40c2e228e2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00796-of-01024.json.gz": {"num_bytes": 396226178, "checksum": "1dc8decde490324087fcd06e4b1e17117606f2d61a80d506d89a12cce11ba291"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00797-of-01024.json.gz": {"num_bytes": 398556774, "checksum": "a454758e8cffccc88f83517a241f2457e683647949cde6aaf1e217de42f6a52b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00798-of-01024.json.gz": {"num_bytes": 396109677, "checksum": "3daa6b8602517b9873db96522a2852d940d52cdf0fa86f259ac41a9cd688751f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00799-of-01024.json.gz": {"num_bytes": 397930210, "checksum": "09dec669699a437d6fb78b3f2705028fb380b2eaa20ee73b77270216a48b8a95"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00800-of-01024.json.gz": {"num_bytes": 394545441, "checksum": "726f99301047519de253e3edbaef5f4a4f95e3850b1b98e01c7864499dad7833"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00801-of-01024.json.gz": {"num_bytes": 395867151, "checksum": "a97ef657bd8ea718427ffc686f55fc1786f0834755fce3ea3ae8402d9f75c11b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00802-of-01024.json.gz": {"num_bytes": 398573429, "checksum": "20ee1f30272a0d5db74e8589be12c17173580cc9f14b039b3d33f3197816ef95"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00803-of-01024.json.gz": {"num_bytes": 398084513, "checksum": "31d1a8f6965d3a8cb7e28fa8bf2cb9a5609d4a129dbc630a8e2a939f475b2003"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00804-of-01024.json.gz": {"num_bytes": 397815811, "checksum": "edb758146d462848bdb113df90fa4b9f451eca6658cbd2cab147c8b0eaf88a70"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00805-of-01024.json.gz": {"num_bytes": 398641802, "checksum": "b916bafa7269ad4ed09c58c74dc3f098b529444609dafc57e6e4056aa6496ee9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00806-of-01024.json.gz": {"num_bytes": 397993720, "checksum": "92fcc5881ca81b808c14f8c9960d873be70f857f95fd1e777b1ae1d4c62bbbaa"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00807-of-01024.json.gz": {"num_bytes": 397743279, "checksum": "79aca62194176964b66a90dda7631d01acc2a6abea1ba19a90076139e390170a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00808-of-01024.json.gz": {"num_bytes": 397076817, "checksum": "a469391e432dac6967e841d46eaeabe9429849492a3df5e91431777fe9b9f164"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00809-of-01024.json.gz": {"num_bytes": 395533122, "checksum": "1278d928e105ea7d9c397ef1da79dcc8791dfad9177727aba098bd451734ce45"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00810-of-01024.json.gz": {"num_bytes": 397468683, "checksum": "5c6f3e7550827de9d7028decd82320a55722785394ea4951ee78f3ffadb2d4e0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00811-of-01024.json.gz": {"num_bytes": 397348260, "checksum": "8c1ece72814dd82bf1bb663b76a40c58129c08540195f9b2134eff5837faa366"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00812-of-01024.json.gz": {"num_bytes": 396753479, "checksum": "b3770924d0576f7cd1706771c411f0f288277c6c6c922dc7af4017b665109a88"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00813-of-01024.json.gz": {"num_bytes": 397977743, "checksum": "864040da6f03f4d2ed2a9eae4daedf304e0d27196f0b522cee4e8fee55f9ea71"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00814-of-01024.json.gz": {"num_bytes": 396168620, "checksum": "542986bb3b75ffcfc853af11a80edb6a31e12527d2588f1c5b2119fe35d3f150"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00815-of-01024.json.gz": {"num_bytes": 397639162, "checksum": "a617c2f27306ce5de74ab756cbf74707fddeb0aa92277b66d0cd65be230f386a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00816-of-01024.json.gz": {"num_bytes": 398296204, "checksum": "174a2e77e6562384cc4e7459ebf536db5cf4b530e4f1d7714e60d082ac7a19c6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00817-of-01024.json.gz": {"num_bytes": 396112543, "checksum": "95af2c4f32efb4ed2a41cfa38dd2be09d51d4b0dc53ca8763309503f0276d56b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00818-of-01024.json.gz": {"num_bytes": 398371592, "checksum": "67789e3525f2daf6af2551df12a50341c3ef51c89a9c714a8def76209b5b7460"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00819-of-01024.json.gz": {"num_bytes": 396751420, "checksum": "07431a263e2bb92c048fadbab74ce1399f76fc57a04d7f9e90cb33aa60a4c5e9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00820-of-01024.json.gz": {"num_bytes": 399213859, "checksum": "83c03df95869973c2ed46c909c0e92e7ecd75317c06b09e447a62b592421d1c7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00821-of-01024.json.gz": {"num_bytes": 398408628, "checksum": "b5cb8c52a8713c5291ccf29c171e9bd9b57a54211392a19e8f31182d1053a032"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00822-of-01024.json.gz": {"num_bytes": 395429180, "checksum": "8c47bf7a0d2b9c84d255df0e7da058fba2b4ca6da3c20cbdfe5a686e01cf5c45"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00823-of-01024.json.gz": {"num_bytes": 395437149, "checksum": "62818e45f34e70728494c74daa583e30c70aebf91c2f057470039f6d35059691"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00824-of-01024.json.gz": {"num_bytes": 394503147, "checksum": "e9fd88994b23531ba26e6859ec1985798a2ab9b300c2fdb1e202ac553ab305b0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00825-of-01024.json.gz": {"num_bytes": 398841091, "checksum": "77ad5a9ac5e3c1d1180981bffbbdbf8a429854001d990258c615e0e16c8a9f6a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00826-of-01024.json.gz": {"num_bytes": 397404278, "checksum": "06a39374c1cda19cc4b034c4877e1fd3bdc84290fdb621fdcdc77f3c5eea9a47"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00827-of-01024.json.gz": {"num_bytes": 399316947, "checksum": "fd27a73b130c1cf8256f22212e23799d0dd31281cd29bcf9bb658bcda457b66e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00828-of-01024.json.gz": {"num_bytes": 397514415, "checksum": "3e7d199d05f885e8bba769d21a55a3f2ef2114b66ed738428ceb506fdf272ff2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00829-of-01024.json.gz": {"num_bytes": 397251538, "checksum": "91650563e9520b2d1ec2cd726304b781b4156ffb68bc172635a53f425fa6bb0a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00830-of-01024.json.gz": {"num_bytes": 397653118, "checksum": "893ef017cbf7d46c99d9c69ba74344cfc2800bb23faf93e7400c0c282422945f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00831-of-01024.json.gz": {"num_bytes": 397299276, "checksum": "4eb3c91e52547f3b4af586f5bbdb0cdaf6a345b202a09c6aabff5c5f628b2948"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00832-of-01024.json.gz": {"num_bytes": 396915924, "checksum": "9fffd46fc1f1bce010484f2850102e2e153c5695c277efb67f65811630c2493d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00833-of-01024.json.gz": {"num_bytes": 397652261, "checksum": "3b89df9375a906c96eb1e21a6572a07de2f5d875996c01c744933984edb1af1a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00834-of-01024.json.gz": {"num_bytes": 396070735, "checksum": "b758b4cbfdfb799a8615ec9c3678b27dcd9b1d63af4f272879e0dae84cac9d63"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00835-of-01024.json.gz": {"num_bytes": 398028152, "checksum": "6e07f1e6a099aa496fef3015514fe5f3cc665c742f8a783389c7da4ce0e0e72d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00836-of-01024.json.gz": {"num_bytes": 395941604, "checksum": "6bef1291a741ea5976749456185a3e3a03c3fcc9ac00370f28672ab39c552db8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00837-of-01024.json.gz": {"num_bytes": 398655070, "checksum": "b0b7e1c826302417630c3e1b1877bf106beefb5a7a11feb9bbf1ac3712714fed"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00838-of-01024.json.gz": {"num_bytes": 396374435, "checksum": "3e9bdde8b73397a5fce143e91c92f9e66f46b45edfb30da1cac400b9aa7b2ecc"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00839-of-01024.json.gz": {"num_bytes": 396388725, "checksum": "4154322b97c600742660125e6458787e603cf1a44b49267f4d1c569387fd132e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00840-of-01024.json.gz": {"num_bytes": 397564603, "checksum": "f9560028196fc934378389e355101e5e7f8fde9e5c921722704a18b24ebc5804"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00841-of-01024.json.gz": {"num_bytes": 397001678, "checksum": "0dad99ac959765280e6bf6d9d1a1468ef9dc9cc781e8f5bb832f7295e4e79f69"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00842-of-01024.json.gz": {"num_bytes": 397139167, "checksum": "e81fd683da081349629a0a7ae8ff7813351ed23caf4ef87041b64524034abc83"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00843-of-01024.json.gz": {"num_bytes": 396044889, "checksum": "d8e3a5b4148c7e86dea50ee5ba89ef55629d3550fd926c41754e5a26e7e52c36"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00844-of-01024.json.gz": {"num_bytes": 397365441, "checksum": "c4d2ffe853b55464961b707b6d0264d6852817077204a0380c906184c077012c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00845-of-01024.json.gz": {"num_bytes": 396477802, "checksum": "7b3c4d435eca57a0fad05c106ec5928750aa01d95047618a3bc84e5342e912c4"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00846-of-01024.json.gz": {"num_bytes": 395983616, "checksum": "bdad2ba411291435ac0cdd083e46aa8369499f014a788fa85ed8c419fe9cb2de"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00847-of-01024.json.gz": {"num_bytes": 397646062, "checksum": "3f6bddcefcceaa4184161432e4f0b9292ae4fe7dac3079d4191a31a38f48c7bf"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00848-of-01024.json.gz": {"num_bytes": 395958111, "checksum": "5ed10d926e5fd1dcbc777df82391eb3ba57276c7303d488d6f3591022d20cc4a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00849-of-01024.json.gz": {"num_bytes": 396960036, "checksum": "ab82adc6f66ab0403cbbb38859009a460e6c8c38c789bc2b2420da8b87096a9d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00850-of-01024.json.gz": {"num_bytes": 396603592, "checksum": "5a6aa59a01504f5655d429dd5cb3ebc39e3994b22cbaeb5b09ceb29a26b94031"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00851-of-01024.json.gz": {"num_bytes": 396511886, "checksum": "f1954da7e217d893a0237a0f431dd2a9071723e543bf0f4943ce38fab048a44e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00852-of-01024.json.gz": {"num_bytes": 397626831, "checksum": "f5cdcd7ec4f3c855a1006f9278ed4df50574a3fa7aa1c5a2e255ea5fa1a770cd"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00853-of-01024.json.gz": {"num_bytes": 395811873, "checksum": "24b1033da877ebddc09cfe2d3325868448dab9083b5147d6cfc4fa63ab402a94"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00854-of-01024.json.gz": {"num_bytes": 396513614, "checksum": "419952e0bc38cce474190c0b9ea581ccbce77da5e045dd60f5ff1fa1d2833d19"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00855-of-01024.json.gz": {"num_bytes": 396493352, "checksum": "3d2b529871c625fc9c1c59b9d5cede2a77e609041f1ea044d68ac16e9fa6a30c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00856-of-01024.json.gz": {"num_bytes": 396852729, "checksum": "a3b56e6171fc2b14ebe67f6a71af688ea6135597bb8f8cf83e2fb460727aa5eb"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00857-of-01024.json.gz": {"num_bytes": 396428653, "checksum": "de550a5d608bffde45c149bc0d4c1165cbd3b5baab3d3529f006a02aba6d53e7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00858-of-01024.json.gz": {"num_bytes": 397039613, "checksum": "11374c2685676ac2eb3dd0d281b44b512ff1d2968ab320d9c857b44304eb8ab8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00859-of-01024.json.gz": {"num_bytes": 396515194, "checksum": "64879e565e5c467e630566ab75524bb300d58798c814637ffebd15646544cd5e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00860-of-01024.json.gz": {"num_bytes": 397764125, "checksum": "7e22be61b3413c8fca2414087655b7ef7bef2ab5ee373fee74d13c8fb991675b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00861-of-01024.json.gz": {"num_bytes": 395314420, "checksum": "29c451c69c8c05f6eee2741b9ef6c241f551257a45da8342a1d6bb341f80314a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00862-of-01024.json.gz": {"num_bytes": 397763845, "checksum": "679668616899f548fb35da32c3e5f121002670cc3296c0c90f5bf45eb3ea1d79"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00863-of-01024.json.gz": {"num_bytes": 397356206, "checksum": "43c5b3af2173d4293396f336ec363aa2f31580b65128f44ca8bb891f2022859c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00864-of-01024.json.gz": {"num_bytes": 395463092, "checksum": "77b7b6299955f4869e5db994fa6b20fe3007cf8cf2b6609442fb1ed49284cee6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00865-of-01024.json.gz": {"num_bytes": 396909291, "checksum": "7eca0e82842b52f99640ab574e4b2446309aba6ac262f980fc6d249a337d06a4"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00866-of-01024.json.gz": {"num_bytes": 397587651, "checksum": "931014d99ab2a765ebf90e876694647c265ca5e6bf2b459eb027d6b06643a8ac"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00867-of-01024.json.gz": {"num_bytes": 395992645, "checksum": "0976a5389aed40e4bca89cf22382cf121390c75bd755437be474c097c8fee0ed"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00868-of-01024.json.gz": {"num_bytes": 397789857, "checksum": "6ffd848d165290a746a21767e79a9f046b70534aaf7b14fc01f9365e4e3f7d93"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00869-of-01024.json.gz": {"num_bytes": 398124116, "checksum": "5fb85058bdf40c0ee6cf748cda7483b1b3cfad18c26a90c2150c2a3f30ceeeca"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00870-of-01024.json.gz": {"num_bytes": 396432487, "checksum": "89d50aaa3620eac4ad593a403ea637b2ff090361ead05c3aa8c7a3351c66ad65"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00871-of-01024.json.gz": {"num_bytes": 397484772, "checksum": "490f4104981a9ab3ef04600a4865b9a2a18239e335d7fb7fff79ec1b7a225318"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00872-of-01024.json.gz": {"num_bytes": 397240896, "checksum": "d344994866bc49475f66e9937636afa787e1ff560e3f62dc1a0e4d0220d6ed39"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00873-of-01024.json.gz": {"num_bytes": 395450398, "checksum": "5d3b320aab1f7f09450531649666ded1aba8a9bbcf0f47992c43cb40a6d7a929"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00874-of-01024.json.gz": {"num_bytes": 396365056, "checksum": "346aae20204537ba2f4a865ca80b5d1c6da1e3a3b78d306d7570a69f185cc4fb"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00875-of-01024.json.gz": {"num_bytes": 396679348, "checksum": "ba81f9c1650d30853edbb9886dde84658c254dee5a3ac1062484f7194cd413f6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00876-of-01024.json.gz": {"num_bytes": 398278881, "checksum": "88fb38aad7cadd76c818dbe7a372144dfe17d110f7d2123a80d14686fb43a6dd"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00877-of-01024.json.gz": {"num_bytes": 397051868, "checksum": "049e4a62056c98284b35d10a74ad5ef7014265a6dccb99a71f93a409933a685f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00878-of-01024.json.gz": {"num_bytes": 396132123, "checksum": "bb7b97a82bd6d31612de66a03af35d404b15808b925e7fd94bd0a8e9e928b927"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00879-of-01024.json.gz": {"num_bytes": 396520374, "checksum": "2a56fed53aa022e6a7956f604d54d99af89a15b6c7fc6b037f94d347f1d15f51"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00880-of-01024.json.gz": {"num_bytes": 397004524, "checksum": "1cadef434909d4508a9a6bf40d6a9323256f3089615a5d2963c83040d5f549f8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00881-of-01024.json.gz": {"num_bytes": 397336334, "checksum": "0e36dcd0eb1773eec15ffd0fbbe8951343bb6961dd1838b51e74da2e055db176"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00882-of-01024.json.gz": {"num_bytes": 394949798, "checksum": "78c99406cb921c2b8f5b86e4e7eeed24c799678732e5a5450db6b12b7ceeef61"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00883-of-01024.json.gz": {"num_bytes": 398647721, "checksum": "f0e7a0a9970c7fdb5f629771e76bb06bf62b79e9cbf5008e866f954dd436401b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00884-of-01024.json.gz": {"num_bytes": 396040500, "checksum": "05272a55eb2840f94a7dcc30a8d09b957511b983b0fc3fa618a8995bc594d055"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00885-of-01024.json.gz": {"num_bytes": 396460591, "checksum": "27511aa50410260d261866dc970b897b10a95dd4dfd92b0bc3a5fc41e6c75335"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00886-of-01024.json.gz": {"num_bytes": 396149133, "checksum": "e66ba9c7ceca631a4b43ecff1e151524a209368f298ca83624476ee9144cc3cd"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00887-of-01024.json.gz": {"num_bytes": 397164216, "checksum": "95e341054bd8a21e7f49e4a5aaa5fbe51517ff631e66e67ff1cdaea6e3178002"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00888-of-01024.json.gz": {"num_bytes": 398216402, "checksum": "6fef57de31fa1692d8a4021b317554688657fad3f55dc144e2971d63083e7879"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00889-of-01024.json.gz": {"num_bytes": 396976936, "checksum": "36da1bd0eaa27ca6e8510a3c005695fbbd7b0fedf63f077e3787590d4b1af625"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00890-of-01024.json.gz": {"num_bytes": 396903125, "checksum": "6bbbe5db2c0938efe5f8afe7b30765f45cedc9fd4209bb7826c489381175bc5e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00891-of-01024.json.gz": {"num_bytes": 396404354, "checksum": "47601b1b1a0a725c32ae0c32364f7ac188b7e8c68d29a2dffbe1a4dbe39393f4"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00892-of-01024.json.gz": {"num_bytes": 398144052, "checksum": "a7b6bdafa5a226c22ccdf97c873e4915ed8dd8b59e2820a4dc62f600b4710175"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00893-of-01024.json.gz": {"num_bytes": 397990484, "checksum": "12f08cfa1fb4f94a3d7d9584cc3f5ae9fa518cc095e4cb07939d02ecfb7ffd9b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00894-of-01024.json.gz": {"num_bytes": 398271782, "checksum": "004bf46ac7c8d7770b458ec341322f5cef643926aff9255954f08faa1dd43d53"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00895-of-01024.json.gz": {"num_bytes": 395489909, "checksum": "3ea14b3dbd7a4c9cb7aad83d1311d335714aaea5b2dd0374debd63c56d02dcbb"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00896-of-01024.json.gz": {"num_bytes": 397589097, "checksum": "c0f1c7e54bf7a808f66d2acc9aec79f1ce936ba480f5d1e379c6853714413175"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00897-of-01024.json.gz": {"num_bytes": 399215096, "checksum": "20958123acf2d578448a5166f1209b0452db33ed395cfe512015106bf99ad31d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00898-of-01024.json.gz": {"num_bytes": 397044516, "checksum": "46c5145069d861c04b2ac1afe80c4c4453f91869f6cb6a1d9f7b648f1b08942e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00899-of-01024.json.gz": {"num_bytes": 397687759, "checksum": "2a3923d8ff2ce0eab5978a8e0198bc2d1512cfa19c69e673e048b8eaa72f82b6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00900-of-01024.json.gz": {"num_bytes": 395192267, "checksum": "9cc72deeea7fbc0fa3782c41938d66315923dd9f53d89f47c00f85f93e454ce5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00901-of-01024.json.gz": {"num_bytes": 397806320, "checksum": "8cfff74f280636416f523c271f75e5704a570db4cddb8a70d033158868c21347"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00902-of-01024.json.gz": {"num_bytes": 398450537, "checksum": "7df8804eb5ecb79177001f9ce3c66f0ad20cccd8151e817816e9342d07c392be"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00903-of-01024.json.gz": {"num_bytes": 396733151, "checksum": "89551a52d1e97b4ec3007f8c43191c1ae1475d0ba5b48d20818a12c85b0add74"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00904-of-01024.json.gz": {"num_bytes": 397497719, "checksum": "2bcde59dfaa642722969d1401a4ce43a35c57930bb1d664371efece1e2e91c32"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00905-of-01024.json.gz": {"num_bytes": 395760696, "checksum": "ec844272b0666a455dfe0cab065e00df44e8da2156a03797100418307c96830c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00906-of-01024.json.gz": {"num_bytes": 398496346, "checksum": "ff68909d470edef08929a91068e1de02841c16a000fbbd17ef042cb76f1fff37"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00907-of-01024.json.gz": {"num_bytes": 397085405, "checksum": "a9b26676af61a6a1355225bce5bbcd67aeaf0fb7dc2209f30235b275536baa85"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00908-of-01024.json.gz": {"num_bytes": 397037103, "checksum": "e86688677a46103b0b224333faf1b4f89da062e4ec0ee35752c91ff9772697c7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00909-of-01024.json.gz": {"num_bytes": 397394775, "checksum": "93082177607900bfce7fc53f1665a831093bb50caea33e014f327181579c0012"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00910-of-01024.json.gz": {"num_bytes": 396668466, "checksum": "dcfe639607c18a309e2c91864a6912dce3851abd62bbed3ba16390899e637327"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00911-of-01024.json.gz": {"num_bytes": 397926997, "checksum": "aa995c38d953237b1d6d53be7237958a00ca2dbab4a753c7c4404849fb416d5d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00912-of-01024.json.gz": {"num_bytes": 397810240, "checksum": "e3f17ac285e8c9b04713713a957602a63e176f476d4a67018012e9cf2a3e5a84"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00913-of-01024.json.gz": {"num_bytes": 397143597, "checksum": "4082ab833be47cf881693ea4442e3940625e0d2c1117e15234886fdfa779bce3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00914-of-01024.json.gz": {"num_bytes": 396398347, "checksum": "7c62dfd17b21ff64af640e4aca8fea0240998596d11ca551a3ab045d5041fcac"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00915-of-01024.json.gz": {"num_bytes": 398622100, "checksum": "69abe67cda4b1613d5f741804ccdb294cd5f457027818d9366db8cf2f5f40871"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00916-of-01024.json.gz": {"num_bytes": 397387266, "checksum": "6effa83cbf3345fd7e41e432ef82156bb1334f2cf17589bce313aebee9727131"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00917-of-01024.json.gz": {"num_bytes": 399730979, "checksum": "f0d0ff1ae76a84c07647fa1517410533862f1927fa85dbf38017dabf4607bc1f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00918-of-01024.json.gz": {"num_bytes": 396895902, "checksum": "84cc56e725be31047d0b6a025cfacefc462f4a1a546feaa34af95a6f25a4e1a7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00919-of-01024.json.gz": {"num_bytes": 395247578, "checksum": "daa3156989ddaa9a7eba228848697ccf6a385679359ab765881d2293bef107aa"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00920-of-01024.json.gz": {"num_bytes": 398305242, "checksum": "2a9e02ef643962f6009e42304b983c87bae7b74c1edcbf8e6808b320ea7ea776"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00921-of-01024.json.gz": {"num_bytes": 396446011, "checksum": "f83526ad11d81820fce4231e3303d613dbbe56a8fae878d9442c8d7e98023437"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00922-of-01024.json.gz": {"num_bytes": 398010331, "checksum": "e47cb9d7550644ef807c3ea9e19ca4aa1df54eb908b54651bf0e17f0ded9157d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00923-of-01024.json.gz": {"num_bytes": 399160018, "checksum": "470401e5b0777096806113a36dcb92b8d453d6e8f5f4f0b15df2788e382ca03f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00924-of-01024.json.gz": {"num_bytes": 396880756, "checksum": "c86e546c68bf8458951fa723c086d6efa5b210f53cd4fcb2de4b9efc7a71a275"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00925-of-01024.json.gz": {"num_bytes": 396806561, "checksum": "5d9b1105c0053dc9530c911046f4da458f41d92c771282d0df8a3a22838feaec"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00926-of-01024.json.gz": {"num_bytes": 397479994, "checksum": "c3253305ac4ef226501e4fd4a6acfc6067a76c084ad852eb2a9f5916aa3d51a2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00927-of-01024.json.gz": {"num_bytes": 397083225, "checksum": "8931df0ee597f72ea3592d0a4d236ce655a92cf4e7eb9298145f496246c18c21"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00928-of-01024.json.gz": {"num_bytes": 398000839, "checksum": "5e29e75231bdb413dedd1211bd87e9fc3f4ab8bba41999afc1ddcddc16f4599a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00929-of-01024.json.gz": {"num_bytes": 397731309, "checksum": "03f7a9199b7927a6d78a8aa4eed32c250d32dc409e3bb2847d7db948ee63d46c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00930-of-01024.json.gz": {"num_bytes": 398133003, "checksum": "b22a79dc228697394d0ce25b7d31112f9e1a6508cdc4b57af35e84e65167bfeb"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00931-of-01024.json.gz": {"num_bytes": 396694508, "checksum": "dbbc65db3d442f9ace85498a3b27bb598c20cea171b3de17d409f9b989c262d5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00932-of-01024.json.gz": {"num_bytes": 396255463, "checksum": "02af4162b084004e99dc6862c88749545593e342a83523597cada140e57a0ab7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00933-of-01024.json.gz": {"num_bytes": 399013035, "checksum": "dc4d3b4f03c36a8f1393ba15195c3f64b128862b812839689fa387e708ffabaa"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00934-of-01024.json.gz": {"num_bytes": 396593138, "checksum": "02a5a8e02b2636c9e912a9ef8a79ececde4f4fc92bea74e59791d181bec104cd"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00935-of-01024.json.gz": {"num_bytes": 396748502, "checksum": "05d1d6290580d5c74b906ab03fe6773ecaaa1ff3be84dfdef48d1a2e7f5e1120"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00936-of-01024.json.gz": {"num_bytes": 397737673, "checksum": "351d3543b1457da9719061948a1b4bdd79be8a0b786ecd6a9a8cc0db49cd2181"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00937-of-01024.json.gz": {"num_bytes": 395377872, "checksum": "d431b01bddcf911d7da5bad74a78d0d1527d60d9720f77868ef08e1a65850986"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00938-of-01024.json.gz": {"num_bytes": 397193715, "checksum": "bff5e755b174e3608ba72b39898a2bb5e9ca6d3362b70bd66143566aeff52690"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00939-of-01024.json.gz": {"num_bytes": 398044482, "checksum": "03facf22c376f03a8078e99d1dcc1c22ed5d7e179de472019cae894f40c7a4ad"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00940-of-01024.json.gz": {"num_bytes": 398894204, "checksum": "3d3a2125262ee8ca498cd54db52fe626d010a2a93c000ea2b45f931e491ea9e5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00941-of-01024.json.gz": {"num_bytes": 396758197, "checksum": "b3957de08e7779d8ec23af02a6d709189796314c70a99f46c90d0bfbd14ad561"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00942-of-01024.json.gz": {"num_bytes": 398181993, "checksum": "74aec8dec794c79683dfe43d8aece4c1c47c5389aa6d4bea847ac461cb5ba21f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00943-of-01024.json.gz": {"num_bytes": 396271547, "checksum": "231f63d05f81d249f618768c9f712cc31314dacf55a6004902a0e7d0bfb13724"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00944-of-01024.json.gz": {"num_bytes": 396603419, "checksum": "d5661730f3ed6cc5bbc5d935a6f1ac7d241b40c52dc83775a421e7a1a672f518"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00945-of-01024.json.gz": {"num_bytes": 396596660, "checksum": "3b5aeb0786dddf0b9cabe2ca071283b276822e2861d8688e38f927595c159b02"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00946-of-01024.json.gz": {"num_bytes": 399900563, "checksum": "6d5549970af2c6987583477991552e1944b411642782c07d17eb52f91e714a1b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00947-of-01024.json.gz": {"num_bytes": 395391489, "checksum": "f5544ecb42c385cd5d5120c82140e4a36051f6a401d89ce30c8f2fc08cd69804"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00948-of-01024.json.gz": {"num_bytes": 399257562, "checksum": "1448cca7f1b9824adcf8437a33d14a7e95b705396611f82e7aba9a69e0a25118"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00949-of-01024.json.gz": {"num_bytes": 396371965, "checksum": "a7eb228f1d1ff2744af3d1a1358a94611cd92c25d81edac0e209b9f81c8a0a60"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00950-of-01024.json.gz": {"num_bytes": 398022110, "checksum": "8651693d2180e518039da487f638c532c53f6d79a33356922b2d8706aa6a83cc"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00951-of-01024.json.gz": {"num_bytes": 396224338, "checksum": "c46bc8aa1621153fbd913b5d0b23a82352a28b36ec997c4df4b92dcc6ef26895"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00952-of-01024.json.gz": {"num_bytes": 397581207, "checksum": "02775930e3c420978a9d2785ee0137c3963dba7bc34538b2155eb38dd6ee89a0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00953-of-01024.json.gz": {"num_bytes": 397045599, "checksum": "9d54940cb594de6e0f8593f64293e96375f0a5c56f3569c72720476bcef1f1a5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00954-of-01024.json.gz": {"num_bytes": 395457873, "checksum": "3c12a1c3061164f345d9e402bed28be9af84ef56d5df1b22a3cf9f818ed47ae8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00955-of-01024.json.gz": {"num_bytes": 396450938, "checksum": "45db78bea4fae6cd69d900c581fccda873d2aa9f24ac5e9dfc18b486c15c3788"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00956-of-01024.json.gz": {"num_bytes": 397120474, "checksum": "7db7ea23446bd8a66737546c5daa0c2dec7bd5c4743f52eb53685ccbf54d9b17"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00957-of-01024.json.gz": {"num_bytes": 397403279, "checksum": "89de2950bc3f7dd4f95d8a0b7cba19e9678bfbc23175bc22d9f9599ec1ad9cd0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00958-of-01024.json.gz": {"num_bytes": 396861933, "checksum": "f325478647cbec9d79bff2266672144147276a82f665d3014c5d2fa9c112c387"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00959-of-01024.json.gz": {"num_bytes": 398439950, "checksum": "70d786bb337c012269caf6aeea3bf9604d279d3e4335294c72ca6cb5a9fbd951"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00960-of-01024.json.gz": {"num_bytes": 395684257, "checksum": "e1d170b0a4d6954a920ef3923688a7dbf40398609ed2ae04b2635df9ceb07821"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00961-of-01024.json.gz": {"num_bytes": 397526287, "checksum": "47b90e3747f35bf67c872d65d843f6dd9bfca15dcb769b31bf3586c6645858bd"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00962-of-01024.json.gz": {"num_bytes": 397473683, "checksum": "d0ddb2c104f515144265bd3eed526a65ada46f848183688b420694751b113272"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00963-of-01024.json.gz": {"num_bytes": 397964876, "checksum": "74725b631c1699b1166589eaebb66374c031b170eab3ab359230cd4a23a8ae79"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00964-of-01024.json.gz": {"num_bytes": 396523661, "checksum": "fa0d49a2cc726628d9a1b5ae2ace52ee90401af8ae15add27c3f4566dd99a79b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00965-of-01024.json.gz": {"num_bytes": 399289514, "checksum": "11fb1878a8b204181f7f776a764f5e9e577d0fe62d4b2e4ce2164ce9fcc30b8f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00966-of-01024.json.gz": {"num_bytes": 397411408, "checksum": "5646014ca3c99f53bd13183187b1e6e8f84cb6c846d6f1f3a3c82edb4accc47e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00967-of-01024.json.gz": {"num_bytes": 395095282, "checksum": "b799b17f36d85235eaf1bed9f4f760a22b75fca736744218e44fae5917a2286c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00968-of-01024.json.gz": {"num_bytes": 397189410, "checksum": "8d9748f5a92a9e0b836fe74b962bd2da04b62a0a2943ea5e440cef19166a5479"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00969-of-01024.json.gz": {"num_bytes": 395651742, "checksum": "f42c71219641fa302692698b4944864f27b7f87d4477a86babe23745dad72715"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00970-of-01024.json.gz": {"num_bytes": 396180197, "checksum": "383d9586f27579b4a97c5901013b3e025f10dc813047d65158d6621430803aec"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00971-of-01024.json.gz": {"num_bytes": 396574555, "checksum": "d2c9700fbac454d3b3a42b2a3c4eb0111eb7cca7cab3d545b0912aba60415c91"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00972-of-01024.json.gz": {"num_bytes": 399639122, "checksum": "5d59e643bf20156a28e5e9dfcd811c5a6c3779e1875f375db09a0fa1871dcc90"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00973-of-01024.json.gz": {"num_bytes": 395456709, "checksum": "8b22e82588e30f30f664895b9716cbb0cf38d5ff4331d3be31ab25663c634a00"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00974-of-01024.json.gz": {"num_bytes": 396693438, "checksum": "5fba4f9d634d968f15d5d4fb29d253646494e3e125aaf1c2f8fab38a7e60180b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00975-of-01024.json.gz": {"num_bytes": 395697641, "checksum": "b4c5fceb9fa2397a9b7c75249bd3386b8dbf999d5b52521051a86e067d698448"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00976-of-01024.json.gz": {"num_bytes": 397172005, "checksum": "093aa01a944a222828656d31dacd8ecd57a24a51d361a8742514bb6af009dce9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00977-of-01024.json.gz": {"num_bytes": 396182407, "checksum": "1beef6e248c00abee5f8952641b12d3f5b12d58adc05c8d461c0a073a6ca9b39"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00978-of-01024.json.gz": {"num_bytes": 396180428, "checksum": "0f2bb125af300de2c9fe347899673a4bd2842ba8298146bfe94c9eddc41893cf"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00979-of-01024.json.gz": {"num_bytes": 396479117, "checksum": "1fe9d0e54b9be79722e6483e386801263ca51d6e9ad925dabbb58a38c4df877e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00980-of-01024.json.gz": {"num_bytes": 395119279, "checksum": "0f262ff2d4701497f6fd6d4f9d3cb1aa3a730ad6bef1961d890a3b0cb4747ee8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00981-of-01024.json.gz": {"num_bytes": 398285798, "checksum": "a295b85e63c176cecd9f5222ba417eeda307e41847eb38c61dec9b83101a8256"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00982-of-01024.json.gz": {"num_bytes": 397811687, "checksum": "2a3a0e0f454dd72a68ed1dd71c508a9b24fb2349ffdfc588cbfcef728cbaff05"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00983-of-01024.json.gz": {"num_bytes": 397069906, "checksum": "5b4256392755c4dd79cd37cd6ede645a9a549c4436acd27495e974ebe1d80bc7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00984-of-01024.json.gz": {"num_bytes": 397670152, "checksum": "68d4f5dbb3fa349a6811edce8056eb297e771cb9c9939c3a84d30c6ba3ad9dc2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00985-of-01024.json.gz": {"num_bytes": 397949975, "checksum": "6ba478b8a1ebf3b1dd67ed7b4a055cc9cc3c01bc90c1852aea8f5a99f6c07e69"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00986-of-01024.json.gz": {"num_bytes": 397730984, "checksum": "a39a23589cc434e573613e3ead44f33adb005c2c13cea8b33601647c97300fce"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00987-of-01024.json.gz": {"num_bytes": 399173506, "checksum": "eab46d9d0a0cf05dc5ba475017d98f02f1cfd756c8e707d9823a0463713ebf23"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00988-of-01024.json.gz": {"num_bytes": 398674037, "checksum": "88749d380aac85314df66448542b696e9ae6f61f1b27dc395556737f59ad9024"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00989-of-01024.json.gz": {"num_bytes": 395313344, "checksum": "bc565b662396e3ab4e108635e01873014515663bd5216926a59ae80f6cd4273b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00990-of-01024.json.gz": {"num_bytes": 398567254, "checksum": "e9b9bd97a30ccac353a2386babbd01c3a3bbede8c07bc28d17aecc7ef5af6330"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00991-of-01024.json.gz": {"num_bytes": 396958611, "checksum": "505ab5458d5e52d656048284fd22cc0fcd16e49ba19331669239be37645cb04e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00992-of-01024.json.gz": {"num_bytes": 396102263, "checksum": "59ac5b2b04f224be04a4ceac6a16e29a33681f19cd40cbce3d3e8eb961b9f33f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00993-of-01024.json.gz": {"num_bytes": 396935362, "checksum": "c804f2311de9f7ae5691280e16261b9f8385ef9a71929b2111dfade532b6bdd7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00994-of-01024.json.gz": {"num_bytes": 398832432, "checksum": "594727bdc3756e678bd4d156216712ed6c8fc98d3f8e9594cfbed10b2e414554"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00995-of-01024.json.gz": {"num_bytes": 396699737, "checksum": "bb3c73c6d48aebf9c60cde56944faa5bb6727db4cc48ae23d67650742462c42d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00996-of-01024.json.gz": {"num_bytes": 398059244, "checksum": "ac1a7e6e2c2a5468c704f5a2318b5617dd4ce140b98271e2034e00015db6cd76"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00997-of-01024.json.gz": {"num_bytes": 397439167, "checksum": "ce9664b29c86c05d3541aee377acdca7a32ef8f0220e0b4b6bf18276b692529f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00998-of-01024.json.gz": {"num_bytes": 397383159, "checksum": "1b4db1b59255f106dd2af7510112eef6d6b611d9f9e000a0e585b623fdb8ae98"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00999-of-01024.json.gz": {"num_bytes": 396339114, "checksum": "ee5e1508704b03f0a9cb3c4bfb578c08fb83a4d20760e3b40f101c58cbbb3ec7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.01000-of-01024.json.gz": {"num_bytes": 395172166, "checksum": "f8cbf0bd9c2b90e588942048848fbfa1a20cf775364cb9c84b4d5dd7cf19e603"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.01001-of-01024.json.gz": {"num_bytes": 396629363, "checksum": "7cad3f9a28e5988ef91073c48e9d85ea7030289690f817545cfa9f1165dd33d9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.01002-of-01024.json.gz": {"num_bytes": 396507390, "checksum": "b4ae1017913509855d6d8d4413ff3de4a8d519d91f354b6e5b5267219d20658b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.01003-of-01024.json.gz": {"num_bytes": 397652598, "checksum": "0c115446c159d27e6e1354173ebec29e6dff5f38c4d2ddb46c07c450523309c9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.01004-of-01024.json.gz": {"num_bytes": 397408971, "checksum": "f0b559a832a9ee50225fe1417d936d6b898026d80a105b976deaeae75f9e30a0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.01005-of-01024.json.gz": {"num_bytes": 397753911, "checksum": "e001c9285ade7de6ac23716b596ddcc733f05bd6abd7e1a67874894c93fbd43a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.01006-of-01024.json.gz": {"num_bytes": 397962701, "checksum": "acf13433824104e4bfc3a8aaf8805eb16712cd97b2dc1d48e7d771bee4bd41c0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.01007-of-01024.json.gz": {"num_bytes": 395966285, "checksum": "4c6069f6a95d036fd3e05a4246db932ad5ab89b9470274f23a17df0b77b9b717"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.01008-of-01024.json.gz": {"num_bytes": 397075505, "checksum": "9b3b9c0cd4ee02e18a5d22142183874586da8fd23b4f97033e354f9681d150a2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.01009-of-01024.json.gz": {"num_bytes": 396881470, "checksum": "14d2d7cf2ebf3b2c73bad4a6099fa1d2b1cb341b100976b03232fb664a7d020e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.01010-of-01024.json.gz": {"num_bytes": 397471393, "checksum": "01e6f56bebe0c874d82135f551a6b917759c41af48d127df181267dc9b8f6486"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.01011-of-01024.json.gz": {"num_bytes": 398092801, "checksum": "ead5b6b13bd09136fccd9548c224398401bda0ca7ff62ca4db852760760f13d3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.01012-of-01024.json.gz": {"num_bytes": 397831436, "checksum": "daa2d1507f9b56de0c4aa9d86d93259c1e6f73f0cdfd553ce075a16807dbcb56"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.01013-of-01024.json.gz": {"num_bytes": 395098326, "checksum": "c2b21a1a56e9879335c72008919e8f7998dcc1e8df2258fdf2196ea86194e3cc"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.01014-of-01024.json.gz": {"num_bytes": 396164077, "checksum": "0df125946c83c66c6961eae2aa45ad7eea7038d808281d633ce30686a8245e01"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.01015-of-01024.json.gz": {"num_bytes": 397895284, "checksum": "f6f6eee8fc113b7e717654b9305cc5129c3ee1ce9f263b91f0202762f078a526"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.01016-of-01024.json.gz": {"num_bytes": 397723033, "checksum": "48426df1f4665d3179251904c96a0e73c041ed5b57885b4dd852809e632685b6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.01017-of-01024.json.gz": {"num_bytes": 396761053, "checksum": "f33cf2d744585e0338b29a5a5638752123b7b59f9ae3b723cf7e7b536f9f80ed"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.01018-of-01024.json.gz": {"num_bytes": 396562520, "checksum": "72adb0869cac573282c4bd938cdff556f659540dd4a0a6663711974cb2dc147a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.01019-of-01024.json.gz": {"num_bytes": 397564701, "checksum": "3b64235effaf41ad61698b2c28f4d73ced1b6ec6b6d79e0f52314176fa0feb12"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.01020-of-01024.json.gz": {"num_bytes": 396053080, "checksum": "b16b9f815823d176f94388d4c482652ac656aa763ec738ccd8c8a2a3bdefc1e9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.01021-of-01024.json.gz": {"num_bytes": 394731398, "checksum": "f4c0044abadd339055bf13843938eef4c066856757250fc15f77060fc0881ba6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.01022-of-01024.json.gz": {"num_bytes": 396548645, "checksum": "5ecd8432526eda57065e6161f0618a19cd5993c7dfe86575775f1bf01836f750"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.01023-of-01024.json.gz": {"num_bytes": 396863581, "checksum": "c6cd29b8f6067152ccd584ded81df1f9cb905515d48815b8a546d104ec7a3565"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-validation.00000-of-00008.json.gz": {"num_bytes": 50774357, "checksum": "7cd6c8b1072af3f3ca3fa160d9411960908142743b101f7229223e6658acb42c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-validation.00001-of-00008.json.gz": {"num_bytes": 51252663, "checksum": "d36ef5fc04b24117a19d992de06400e5f290f11786be99be9de68818f7495694"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-validation.00002-of-00008.json.gz": {"num_bytes": 50860289, "checksum": "ab8b3dee7c0698c3cc3a74f159d85495b6bb9529600ef9246bec218ae6775e28"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-validation.00003-of-00008.json.gz": {"num_bytes": 50141661, "checksum": "54d62c9359000b99713a8a0a0fdfa415f1c09824555526f01dc7217b068542ad"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-validation.00004-of-00008.json.gz": {"num_bytes": 51141505, "checksum": "c11e31de558613237533b41354ca29f0635b599a1c9232517dbf4c2cb1197319"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-validation.00005-of-00008.json.gz": {"num_bytes": 50797157, "checksum": "20d39c0f52c34a3148c0a235238ed3849576ed895c3a43cb47b0159bf233c7d5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-validation.00006-of-00008.json.gz": {"num_bytes": 50158887, "checksum": "754a2b7f134bf45f17db7450d5c0eaf2b8824e4a6072be7b20db434f9cb7968f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-validation.00007-of-00008.json.gz": {"num_bytes": 50232244, "checksum": "f90c1d79c51ee1a009dc05930fc40e9ee4c3840ca2412cc129855156aaddc279"}}, "download_size": 407016751197, "post_processing_size": null, "dataset_size": 2060282008734, "size_in_bytes": 2467298759931}, "realnewslike": {"description": "A colossal, cleaned version of Common Crawl's web crawl corpus.\n\nBased on Common Crawl dataset: \"https://commoncrawl.org\".\n\nThis is the processed version of Google's C4 dataset by AllenAI.\n\n", "citation": "\n@article{2019t5,\n author = {Colin Raffel and Noam Shazeer and Adam Roberts and Katherine Lee and Sharan Narang and Michael Matena and Yanqi Zhou and Wei Li and Peter J. Liu},\n title = {Exploring the Limits of Transfer Learning with a Unified Text-to-Text Transformer},\n journal = {arXiv e-prints},\n year = {2019},\n archivePrefix = {arXiv},\n eprint = {1910.10683},\n}\n", "homepage": "https://github.com/allenai/allennlp/discussions/5056", "license": "", "features": {"text": {"dtype": "string", "id": null, "_type": "Value"}, "timestamp": {"dtype": "string", "id": null, "_type": "Value"}, "url": {"dtype": "string", "id": null, "_type": "Value"}}, "post_processed": null, "supervised_keys": null, "task_templates": null, "builder_name": "c4", "config_name": "realnewslike", "version": "0.0.0", "splits": {"train": {"name": "train", "num_bytes": 38165657946, "num_examples": 13799838, "dataset_name": "c4"}, "validation": {"name": "validation", "num_bytes": 37875873, "num_examples": 13863, "dataset_name": "c4"}}, "download_checksums": {"https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00000-of-00512.json.gz": {"num_bytes": 30085821, "checksum": "6666a680b0a34eb8756dcb5fd2b12f0078237f3502e8a513bd3e5b71bb92be00"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00001-of-00512.json.gz": {"num_bytes": 30065900, "checksum": "61c3f9ab763067f76d9bea349d86efb97af7539d481b5d2807f362204971c327"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00002-of-00512.json.gz": {"num_bytes": 30028880, "checksum": "3aa4405d957ed42d10d643efe7c0f51b05e8f29cf4ad8783448083c1cd3f2a24"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00003-of-00512.json.gz": {"num_bytes": 30136880, "checksum": "f6eb49e4c0d691e67fe96ddeb3f8370c5e63a7297a31a8da0c58f5cb3a9f6061"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00004-of-00512.json.gz": {"num_bytes": 30110499, "checksum": "6e0908780f555f4b74c6a5055e2c9708333a8466f0b8723a8ea38cc04828ce44"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00005-of-00512.json.gz": {"num_bytes": 30097927, "checksum": "a333562df3fcd4c5ccf51b4c00e11f6619ac4a28a878383aefad277bd30131a6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00006-of-00512.json.gz": {"num_bytes": 30013820, "checksum": "7c436cd0993077187988239cf74c3e64de440dacad62ba4b02bd4ac0a8d219b6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00007-of-00512.json.gz": {"num_bytes": 30557005, "checksum": "dc9e43681c404fef1741e9608295b8dfae0953473993f3fc44fb83af07a6b82b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00008-of-00512.json.gz": {"num_bytes": 30369535, "checksum": "8de7a4005acdb60436b4e5d7274084e28df3aee31a5457c6837452094544c541"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00009-of-00512.json.gz": {"num_bytes": 30033048, "checksum": "32310a6c74cbee1dbb8b196e0cfad41f79e88e48d8f04c88692d42506113b903"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00010-of-00512.json.gz": {"num_bytes": 29948345, "checksum": "b7df217de849e26ecce5ed7a35b6e6238fcc1c08e969023f209307842dd496c0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00011-of-00512.json.gz": {"num_bytes": 30558885, "checksum": "82e5428aaeecf27141a7105e48b78dc02516ae6ebc3d6cd4ef13963316279e1f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00012-of-00512.json.gz": {"num_bytes": 29888513, "checksum": "f3d7e496b7c85ed7d020c8f8a24a0b27f9b2535abdb22b45c08441a29398c44c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00013-of-00512.json.gz": {"num_bytes": 29936292, "checksum": "bf04d82f0cdddc09ce4aecd9f71910b9858badaf6456253d43d89e6a8c56cba7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00014-of-00512.json.gz": {"num_bytes": 30169338, "checksum": "15b4611513154de0dfc1c9d470326fd053adf70de814ecfe8ba7ccee66de947e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00015-of-00512.json.gz": {"num_bytes": 30071363, "checksum": "887bdea83bdefc50786c93e8014d1d49999f8090ff15168598c884cd0724fec2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00016-of-00512.json.gz": {"num_bytes": 30451660, "checksum": "288ad0d553d54052354be506f87878fa7c54b0fa65811c6e456b3262e1d117e1"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00017-of-00512.json.gz": {"num_bytes": 29940254, "checksum": "b13ad58ae9f38598cb9d560e3ab34c1d0200db73fe86da12230e50086b532463"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00018-of-00512.json.gz": {"num_bytes": 30282186, "checksum": "5a67e71955ab2d8f6531bd3949cd8ab71f4ff91863ea5a6ec3e7b33c31a05dd6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00019-of-00512.json.gz": {"num_bytes": 30373907, "checksum": "a70682315a0cfe0af815c7b2abbcd63310fabbc33ad6e19daad19f1f51506955"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00020-of-00512.json.gz": {"num_bytes": 30104199, "checksum": "980e544ce130a06e9e99ec906342eb0ab8aeaa96ac26eca01c56ebb463f5d688"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00021-of-00512.json.gz": {"num_bytes": 29733696, "checksum": "a69729b8f3ccb9db12476a31917783c1c6e036e7bbbb4089f430362aef71f467"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00022-of-00512.json.gz": {"num_bytes": 30012894, "checksum": "589e698fe450e22cba47813a5a28da5393e79702a528f6a8469f72f6d630caad"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00023-of-00512.json.gz": {"num_bytes": 30024851, "checksum": "2a7b036c38fb4d2df6535631018c23d001931e5bf8d8a815fd5b2f9343ec4529"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00024-of-00512.json.gz": {"num_bytes": 29906809, "checksum": "7e512306cb6ebb0b0c3e96ceb16dade9e1e1f484e754bebd0078e7f545fc5b6a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00025-of-00512.json.gz": {"num_bytes": 30332268, "checksum": "b636b91fcd9a91ce05b8cbeea6f591a0e916175ab23b0cfaf688171c8a98ae8c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00026-of-00512.json.gz": {"num_bytes": 30288490, "checksum": "9e2f8e2a37dcfe66873cc5355740448ef75a1de2deeb2d8c047c3c3a7ee485c0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00027-of-00512.json.gz": {"num_bytes": 29897688, "checksum": "882616d1e8ca66c0b6e7aa2ccb18d9239021603ab1b9486638a9a3447ddebe0b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00028-of-00512.json.gz": {"num_bytes": 30201690, "checksum": "0312b12f50c64fbe7b894a28e0940089ad57af95df8116cd7d43c0435ec2e79b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00029-of-00512.json.gz": {"num_bytes": 30237920, "checksum": "1e8677140186b219d32e764889dcc344ccac9db51685363324d1bc13ddef2bb7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00030-of-00512.json.gz": {"num_bytes": 30048903, "checksum": "43558e81c291cbf53a5b6a016aecb0e07e26a98b8fb32f4a000037b281afa363"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00031-of-00512.json.gz": {"num_bytes": 30294528, "checksum": "c33ae8a2fad7e5264d093fbe89ed1611357110a4f0f26dd5a93a4dc15560f205"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00032-of-00512.json.gz": {"num_bytes": 29868168, "checksum": "5dc2a8f96db8da87607efc0b708e6a2172530f0c9b43665dc01286109b5c55bc"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00033-of-00512.json.gz": {"num_bytes": 30105916, "checksum": "c4cdc2b39a86eff251f903d7f3d39605b721615aeffa6a2753f3588b7dbef6c4"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00034-of-00512.json.gz": {"num_bytes": 30126174, "checksum": "6d874182112b0881dc929c0182a30ec4f9f1633372a2b822200a7b1faaf4f1bf"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00035-of-00512.json.gz": {"num_bytes": 30084101, "checksum": "5bea17f0cd4dd888f5d8a2d4092138e4777d80493a1f410d618d4cedf353b914"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00036-of-00512.json.gz": {"num_bytes": 30095974, "checksum": "6e7f42f3012d8ca7500c7e2ec82d27c26b3cd8bb5b8b66a7fc8355d77284f433"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00037-of-00512.json.gz": {"num_bytes": 30239345, "checksum": "54ee45bf25152060679bab3e5fc6f5cb5a3add6acd2664cb152f88c223f83239"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00038-of-00512.json.gz": {"num_bytes": 30247683, "checksum": "f738a2f0f156f7bd897d9d822748d4192a5fe46b566c7288ed5b840c4ffeda64"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00039-of-00512.json.gz": {"num_bytes": 30057005, "checksum": "60235900d69579334660c153c4fe384c08f14f4e729a06a1e8247e8b4ab8a213"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00040-of-00512.json.gz": {"num_bytes": 30185136, "checksum": "5a059d64fd6a1b42a2faeb4088db327c47f9e8328737ab74a0e0457f84433374"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00041-of-00512.json.gz": {"num_bytes": 30314653, "checksum": "2cfdc460c8dd0fb4766191ef2aec0af856af7c95d11eb3f1d731f63b71db4daa"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00042-of-00512.json.gz": {"num_bytes": 30123256, "checksum": "64e59b8ebde3c12b0a1d218a302252b96aeb5bb4976927463101a9509579ec22"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00043-of-00512.json.gz": {"num_bytes": 30057043, "checksum": "edd200b97394f15f9cf0a6289406a83b42c3d6f961456f031f5814db4f6d482a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00044-of-00512.json.gz": {"num_bytes": 30029900, "checksum": "1b2980f21ee5cffb271591adc8eaa414438841426442f194b5f4b703356f4e5e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00045-of-00512.json.gz": {"num_bytes": 30367170, "checksum": "83967210891345b831956722e8dcd29cf55fb17b786c85c2dd2778528ab4d1c2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00046-of-00512.json.gz": {"num_bytes": 30105866, "checksum": "6921ac4854e2eacaeb4be07669faab85f2bab33f744c7efae1ce17be25176bb5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00047-of-00512.json.gz": {"num_bytes": 29957618, "checksum": "e8eba2ba9f51e76a06a2df43b6b120c47b6e41f61e46a2e3331518ebb2d0c84b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00048-of-00512.json.gz": {"num_bytes": 30329887, "checksum": "6af9c44a53d7eb9df9d86ee4d895fb9f7f2b9b3863fd30aae325e79fb792a10c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00049-of-00512.json.gz": {"num_bytes": 30116207, "checksum": "57dc1e94f73b55e0be5690b01d61188a62186ea9f5f85b556ecef3bcaa36fb92"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00050-of-00512.json.gz": {"num_bytes": 30236341, "checksum": "eb75bdf0e63e798838b3d7abfc6a3bfab5de2ba39af833c38048dfe39c1175b1"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00051-of-00512.json.gz": {"num_bytes": 30357091, "checksum": "f48b1f5e07311ca9d69787019a56ad849932e6868d1f7778681cf7e4cc9fc562"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00052-of-00512.json.gz": {"num_bytes": 29944959, "checksum": "debf9490c057f11e404898b4a57cb424c1eb523fa90bb7899b1317f970481638"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00053-of-00512.json.gz": {"num_bytes": 30240416, "checksum": "9e847a5c6eb80e5c045fbb405729c695911674bd8d29b1d0be0791303d02f41d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00054-of-00512.json.gz": {"num_bytes": 30174556, "checksum": "65a80db1cdde9153e08277ad2d9074dfba1682c0f771fbb9f4aa8f88ca557f43"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00055-of-00512.json.gz": {"num_bytes": 30134394, "checksum": "beb8d280d322520ded21aec92ae087867d0bce64aac4e243a127a88f143ff578"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00056-of-00512.json.gz": {"num_bytes": 29891026, "checksum": "82fceaec35a2456487a59ae652d72f41a940d2d6bafdc4f05a6e02bcd7ed4dc9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00057-of-00512.json.gz": {"num_bytes": 29920525, "checksum": "e4fd55ba5fb2825ef4209aec87706ecdd3db040242c6aacfc82f350765fbeff8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00058-of-00512.json.gz": {"num_bytes": 30060421, "checksum": "3cfc894a1853e3d1f2daa314873b7919fa52b7208b590637f8face6536305770"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00059-of-00512.json.gz": {"num_bytes": 30038488, "checksum": "4f06ab7b5ce8e8c696445db4a3e32896b6396e3f67d7414a593e7398d752e564"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00060-of-00512.json.gz": {"num_bytes": 30129718, "checksum": "7923385ee0c6801073feb10437ee3c59e5f5dfe82c2311ad8c4ec670dcc0ec87"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00061-of-00512.json.gz": {"num_bytes": 30130505, "checksum": "5cd682e148b8488775622098214fc2009ef9c95355f46341bd78434f1b560fa2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00062-of-00512.json.gz": {"num_bytes": 29968130, "checksum": "53562fc23501f3a1d11c8ae6a59e719d6f4e67db8b8ea1d55e2b1b80849afd08"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00063-of-00512.json.gz": {"num_bytes": 30116532, "checksum": "008cc5c0cb7d60e84ffdfe2132f6bb49aafbb31083fd026067b3859326ca64fb"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00064-of-00512.json.gz": {"num_bytes": 30236194, "checksum": "8f9eee169071e80c94c248f1c37b7fa631bd75a7f6e401f6a963aecd8815910b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00065-of-00512.json.gz": {"num_bytes": 30077312, "checksum": "8c5e18ea3575cd350e98d062ef88d3fd1df068e4bd410be8732723bda03656c0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00066-of-00512.json.gz": {"num_bytes": 29920862, "checksum": "e377b8112dc6ff6834607c27b927636429e887f4ab8edc0824363941b7bb311d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00067-of-00512.json.gz": {"num_bytes": 30278223, "checksum": "ec2c2ac74cc3f4f814d645410cccda266151949dd36aae518b8082b948b47edb"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00068-of-00512.json.gz": {"num_bytes": 29940464, "checksum": "ddfc16a17cabf48a2c59fa8ef25ccd12d899d3462d08b45f2a301567ccc105c4"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00069-of-00512.json.gz": {"num_bytes": 29903118, "checksum": "66d9d1791cda56607b2561199503cef216df86b28d4519d5862905671a4ec4c5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00070-of-00512.json.gz": {"num_bytes": 30082323, "checksum": "8072d3bd5e19c005493c0332b73ca5be253397f54be90be1bb7b2ef8df7ad117"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00071-of-00512.json.gz": {"num_bytes": 30128276, "checksum": "b7c68af5a6dcac3fbb3dcbe12123d1045a79baf657a8b3bdada60c1a97404c48"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00072-of-00512.json.gz": {"num_bytes": 30458419, "checksum": "cfe5c6ae2ad1531271b0039042e033bdd7caf9604bfa219980ca27513cea755f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00073-of-00512.json.gz": {"num_bytes": 30366974, "checksum": "a132f5e85376b0d0a06c6ae6af9c226dcbc98394461578c4fbc6cd439ba6e721"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00074-of-00512.json.gz": {"num_bytes": 29987779, "checksum": "f905e808b50908a7d2a7f0944e7e6c01ffd97ec16e5f0b6ed7169a60d66b0100"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00075-of-00512.json.gz": {"num_bytes": 30070204, "checksum": "b57458683803936f6bc03b06fc26be9d1a09ba09517b5c1518676f468e404595"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00076-of-00512.json.gz": {"num_bytes": 30129238, "checksum": "81e88ec53e39d6191e40e5852564f592b745abf99c71ff78302292632f636792"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00077-of-00512.json.gz": {"num_bytes": 30051399, "checksum": "218b0f6e219e42113e35d99458861f8511266dee6c17d9e2780a17af8877f822"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00078-of-00512.json.gz": {"num_bytes": 30144230, "checksum": "c0a337619559362e0e1cd0fe87c9ced5c987313a7f3cb65eb44f8b861c41c616"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00079-of-00512.json.gz": {"num_bytes": 30544297, "checksum": "27e257efda6adbce01585b3b6cdeefa95d31f607012fed5dd4310bfb5a790ba7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00080-of-00512.json.gz": {"num_bytes": 30188866, "checksum": "26411f1a0a7b299d0bf6cf78db04b0bcc617894cd87d59e54614f3258dd393ee"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00081-of-00512.json.gz": {"num_bytes": 30418881, "checksum": "87a659f6b24560a754ccbfb6aee019484e48e3ddc7955a6c7a18aa9098952cfe"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00082-of-00512.json.gz": {"num_bytes": 30086460, "checksum": "708fe5108042b957688817625c84059c11700b18ddcea3814b86b6c8c66af8a5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00083-of-00512.json.gz": {"num_bytes": 30138639, "checksum": "8d8681519538afdb7622b677ca5d3ae2a643382bae9639e3ad90c82d36477653"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00084-of-00512.json.gz": {"num_bytes": 30228150, "checksum": "db708760b9d45e0b20c8dde9b0008f01761d9bb0f37a194845b4d097a60e477c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00085-of-00512.json.gz": {"num_bytes": 30004564, "checksum": "19ba55c7cbc44ae30a6497373fc15b548e5c45667f790c392857f6fdaa7e2bf6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00086-of-00512.json.gz": {"num_bytes": 29696360, "checksum": "4cb07dd259a084818f9a79a4fe4fb7b24ea1adda0cd4fd405ba003e7bd481f12"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00087-of-00512.json.gz": {"num_bytes": 29927300, "checksum": "7c3c07dbc9c57881a3c1abab85a927f1ba609c58da9dcec22d7415079cd336b6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00088-of-00512.json.gz": {"num_bytes": 30038333, "checksum": "59158c87d7e9e5011516f98dec1313758072ca6685c7ad9df5ee4a075d9ff8a2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00089-of-00512.json.gz": {"num_bytes": 30223506, "checksum": "d3f39f7e90b4a82257779290a3f2de5619049d69b2169577f1e3c81791d85419"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00090-of-00512.json.gz": {"num_bytes": 30266969, "checksum": "88ed3237aadff809cec186fa378e176774d3f32aef1a6d8bfdbc530f64e8aed4"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00091-of-00512.json.gz": {"num_bytes": 29885840, "checksum": "b9a247993a8eec31b3f853d1329ae79da29397dd27eb4acdc196b71c091335e3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00092-of-00512.json.gz": {"num_bytes": 29942337, "checksum": "3d83cc54c06cad8effdb7a38ed6666b5d912e6fffcf4c82471af064b0aabe05e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00093-of-00512.json.gz": {"num_bytes": 30129376, "checksum": "d72ed9855fa86ceb4089435da3d78e8d4151b92185f828329b534d1adf3821db"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00094-of-00512.json.gz": {"num_bytes": 29613450, "checksum": "f61f74aa65a81616b97cbc34a8be1b563f83f69709642b8156eb76cdda02103f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00095-of-00512.json.gz": {"num_bytes": 30469526, "checksum": "926d1ba2e4b191e75b0bce0cbe4c15f95f244445ec03a6095c009c34e36f897e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00096-of-00512.json.gz": {"num_bytes": 30126036, "checksum": "e74818ad94e408498644dc71f1ed967f356f539418222f1dfea467a21c99badc"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00097-of-00512.json.gz": {"num_bytes": 30374980, "checksum": "d9cc8827ee38bddd1a31e48b2b0064a567520e3c0f2e1be745acef57d267e4d5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00098-of-00512.json.gz": {"num_bytes": 29928579, "checksum": "090ad37fd9eaeb53308599f2da1053b19b1c6478adaea5a8a1c35d6c35340111"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00099-of-00512.json.gz": {"num_bytes": 29901456, "checksum": "c0e7d9a7cbc3b9b940077508441e471a1eb70e822479fcad726b900e6c196382"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00100-of-00512.json.gz": {"num_bytes": 30033459, "checksum": "b62033de618191de3200205e6e40725baf045e403060d10417211d47854d6bb0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00101-of-00512.json.gz": {"num_bytes": 30280468, "checksum": "8726d092785856ec690dcd8a9edcd968cd04af1cfafe8a83192e3c0782f02b4a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00102-of-00512.json.gz": {"num_bytes": 29805195, "checksum": "248edf4dd6c9a1137c7b45ab0b5a05a5fc93fd14cec17a5da4d758b9f7b359df"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00103-of-00512.json.gz": {"num_bytes": 29995494, "checksum": "d66b75c3f08a0db141d2c0162eb3dbc351e656ba1ba480e77eda051435d1390f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00104-of-00512.json.gz": {"num_bytes": 30318447, "checksum": "09bd2068c20d33783f39322c95756fd3dbd0da91f4380fae3822cb33b7d06779"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00105-of-00512.json.gz": {"num_bytes": 30209523, "checksum": "0a399ecb1116890e1a0189cd2842d64d8ed53213b1623ae38229a6ac4f5c1c76"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00106-of-00512.json.gz": {"num_bytes": 30476739, "checksum": "540f682a7c977d20f920b5af1ec7e40c14a0d54f1718b43271e22dece9cdce16"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00107-of-00512.json.gz": {"num_bytes": 30203291, "checksum": "0dd51deb74ab391c54b20862f7df561f74d00be2ee4fc13987f91771870c099b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00108-of-00512.json.gz": {"num_bytes": 30265100, "checksum": "172b09a108b154014077a415f644cd16db6a66f178bf780c120a6c4fecc3c0a8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00109-of-00512.json.gz": {"num_bytes": 30342649, "checksum": "214a8f147f2d77ec0f3889b0a2d782e5d44230878359e695e9523561e6723a1d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00110-of-00512.json.gz": {"num_bytes": 30152418, "checksum": "dc0d34ce7918b80ecef3528ec2b063edf7b12223c453ac7fb9d39232fecd81d7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00111-of-00512.json.gz": {"num_bytes": 30160329, "checksum": "d0594cb69d26f0e853575d86f92b1aa233b5bb236804a2f496a792fa031014ee"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00112-of-00512.json.gz": {"num_bytes": 30428351, "checksum": "2b0542d973bab88e696fb9efbe042167600da397d776ef65344dce868bbcb0b9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00113-of-00512.json.gz": {"num_bytes": 30200133, "checksum": "10dcb929692795fefcf4623040191d9cb6199fbb3b164648b62b9867e8392379"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00114-of-00512.json.gz": {"num_bytes": 30205273, "checksum": "f16631d5bcbbe133a01675286ca7667400ecc7e6df13d728015381d21ec71cfc"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00115-of-00512.json.gz": {"num_bytes": 30164849, "checksum": "bed27819db4bb7e02cb42cdda18acd232659a2eaa43eed910ba26d686cb3f837"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00116-of-00512.json.gz": {"num_bytes": 30117752, "checksum": "4eb4bec7adac3c2f431d356212f8a9d47136f0011f5f9e71dd29d82b1b823e2a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00117-of-00512.json.gz": {"num_bytes": 30062588, "checksum": "79639624734885b3051b10f052f5486d7124bbc4bcd18d99348f3683ee2fc54f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00118-of-00512.json.gz": {"num_bytes": 30125828, "checksum": "e922a4a5332a4182ddcf6ac8ba910024fe4fa878b524f7368b27373f75bbfe44"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00119-of-00512.json.gz": {"num_bytes": 30156741, "checksum": "a44aba8779b99ace2f212789389af058d12dfb0706221b296676d5e10528dd78"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00120-of-00512.json.gz": {"num_bytes": 30489925, "checksum": "82bec41bbea7bc5ddb67b3bccea51122da7d0922768f8bda7a0c9d489bd20cdb"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00121-of-00512.json.gz": {"num_bytes": 29606989, "checksum": "b49238f5b75aaf876657826cfbd4346d250f564a86bdb010aa1e85b44a969229"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00122-of-00512.json.gz": {"num_bytes": 29770557, "checksum": "0803ccbd505db47cd09b20d86cc6ad459c7a8d1c583a5ee756b0397369d8b6fc"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00123-of-00512.json.gz": {"num_bytes": 30248121, "checksum": "d73a1bf285a0355bd61a25891cd8c5fd9da66535ec515dc7e1602a769b994727"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00124-of-00512.json.gz": {"num_bytes": 30131013, "checksum": "65d2dcc7e63a28e1911717d149b907d0c74fda6e36db2840353a0290f7880324"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00125-of-00512.json.gz": {"num_bytes": 30348971, "checksum": "5dee3c7afe0364ccb8e36647d01e78ffe61690f29f29aa033efac9a0413c2a47"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00126-of-00512.json.gz": {"num_bytes": 30370074, "checksum": "1dc04b3755291842711623d1d6cf042e2d66987103a0c708f01c9136a8c42db6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00127-of-00512.json.gz": {"num_bytes": 30320846, "checksum": "e31a27ba25bdf13e6f929fd38d53409dd3f50be78ad955b69b1956709de5aedb"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00128-of-00512.json.gz": {"num_bytes": 30076235, "checksum": "122ee9d293428a7a823c17b3a432b5b2198fa2a68bbb246b97e981bd09f78f0c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00129-of-00512.json.gz": {"num_bytes": 30569486, "checksum": "918bf43ce3ab54d535dd02cbcd09f1081890be3287e23fd81bfa032beec61ebc"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00130-of-00512.json.gz": {"num_bytes": 30280169, "checksum": "ab0a53e8c10dfdd139281175b5fcfe3090fa238fcb383e27b1dcdfdbbe8a879c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00131-of-00512.json.gz": {"num_bytes": 30338899, "checksum": "e54771e12a6f3583c3accf9bcc01b598819231f367e7f80cbd44cf6683c5c852"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00132-of-00512.json.gz": {"num_bytes": 29969011, "checksum": "f69d7052ca7657fdebe547a6e196b109285d5d4e4f1a68f3900a37ba6fecc22f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00133-of-00512.json.gz": {"num_bytes": 30179558, "checksum": "cf2130dedafd8f47e97661a5b1555813433e3f7293b5c5cb222cf551d90a0604"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00134-of-00512.json.gz": {"num_bytes": 30080257, "checksum": "1a32902fc21633ae8d41e4e5518804f4c719dc8729b866ebc32d3c36fdadbc10"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00135-of-00512.json.gz": {"num_bytes": 30284972, "checksum": "6e3a78e7a530d91ee4578caf462a4c685a5f221f0cd8eb9639c9067e2b655a7f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00136-of-00512.json.gz": {"num_bytes": 30130265, "checksum": "defc57340cbaa5f325994a91b5134789c84a76a4ca7b9fdbf993b0e634735f05"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00137-of-00512.json.gz": {"num_bytes": 30146793, "checksum": "7ce5035f452eb2e1adeff36d0c6d6d65c245d139a86ef48bbe10c5275975183b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00138-of-00512.json.gz": {"num_bytes": 30180265, "checksum": "298849a53a8ea0e68d01cc137195bc36d686077bed722e1198337a1dee3c51cf"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00139-of-00512.json.gz": {"num_bytes": 30398387, "checksum": "ef2ac4b8f195141a79a357d934d5d97bd4d2c64027ec7509b5873a4ae32fcb9d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00140-of-00512.json.gz": {"num_bytes": 29652990, "checksum": "290f1c99b696e345aaa6ac6d5a882a87dcf5d3939b08ba859a359d2459498785"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00141-of-00512.json.gz": {"num_bytes": 30083642, "checksum": "fb6a38388a25261d86fbd8ffea63e06bcbcbd6846a4eb6f13fd09d7fe5a1fbc3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00142-of-00512.json.gz": {"num_bytes": 30131064, "checksum": "b61ccf6166ea4b777629bdc07d543f299bf7569deab18228ec5bb9edc8cd3eb5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00143-of-00512.json.gz": {"num_bytes": 30244435, "checksum": "22812c50efdfcf2c0fdcf593639dfea09ffee8068321c30effc669c8234d4f3b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00144-of-00512.json.gz": {"num_bytes": 29725094, "checksum": "79cfa65a3115193629d16606643d90dcf27d3108c320cc9e364ba19fdb9fb1d6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00145-of-00512.json.gz": {"num_bytes": 30335033, "checksum": "e836f0bc9acba85fd1721d19cc24054e97defb0d12678bdc0d086f40deb9b1a6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00146-of-00512.json.gz": {"num_bytes": 29905680, "checksum": "bf684871a235078390d6c6bb03fc2d5bbffec2b095806df652a19baf5e67135d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00147-of-00512.json.gz": {"num_bytes": 29852459, "checksum": "0e716de5b3b09ec287b039be0f0dd6edd7d541aa6d3f9d2be18768e1cd5f4cd8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00148-of-00512.json.gz": {"num_bytes": 30364788, "checksum": "4cef624e6b7c2b73dbfb47227e31681223a5a9369c4b7daef8606b796f010dd1"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00149-of-00512.json.gz": {"num_bytes": 30096278, "checksum": "fb448ccc7412f5ca8667004a70f3dd6e1b5e6cb7f6facc06564bd22b1d815593"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00150-of-00512.json.gz": {"num_bytes": 29776995, "checksum": "1e14268cf723bc7336b33896537643d21dbefc1f05ffd5201feb5fb1130f9683"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00151-of-00512.json.gz": {"num_bytes": 30205172, "checksum": "797224cf74063fbcaec741535278ccce141e6dbbdd69a2191d07f89816ab14fa"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00152-of-00512.json.gz": {"num_bytes": 29845034, "checksum": "77eeb2353f544c714deea68d4a781b498c40d7c1e27db3aade4987b381ca29c0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00153-of-00512.json.gz": {"num_bytes": 30258796, "checksum": "0fc581e92e70dda031d72a4aa0bbd65b1e9b28884f0ef5dd5e895cbecb270609"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00154-of-00512.json.gz": {"num_bytes": 30249734, "checksum": "ba10dd0a24bded170541e23078264b82b35bc99e402db594e2335e31905ededf"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00155-of-00512.json.gz": {"num_bytes": 30198742, "checksum": "fe285ac893126062bcbc20df75a9f65c57d3a7391354fa7e62b7f6a7122d6e77"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00156-of-00512.json.gz": {"num_bytes": 30168323, "checksum": "d21826b71bc85dbc496dd947ae9ee79d62885cffb3fa7c47409feee6ab247f17"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00157-of-00512.json.gz": {"num_bytes": 30241978, "checksum": "fc41765301b62849eda0b7b08f792e45f03db458fb92063af70c43d7cd0d0bb6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00158-of-00512.json.gz": {"num_bytes": 29959715, "checksum": "1eded3ce0bc099c7e198e9277719d578c3fb6c425bb2110cb0ca6ce469d1d19f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00159-of-00512.json.gz": {"num_bytes": 30109595, "checksum": "eccaab5b694c2f0017fe1d423637872d5587f6deb316796f7c0ff5517fa28178"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00160-of-00512.json.gz": {"num_bytes": 30201741, "checksum": "4ceee71372da6112101665f5bbf942a85f065feaab924c6e3f83498169bbe255"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00161-of-00512.json.gz": {"num_bytes": 30176266, "checksum": "6ed829daaad190b2d50b626d840edb750a063afad95315ffe7604a193183a489"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00162-of-00512.json.gz": {"num_bytes": 30018118, "checksum": "dcf8509a55213425a41706e5209ad411afb715fb9cd8c1a8b8edca23fab7d6cd"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00163-of-00512.json.gz": {"num_bytes": 30236016, "checksum": "d93cfaabcc7197637f233896b5799527f27d5b2dc60f0f0411ee51f05f09c500"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00164-of-00512.json.gz": {"num_bytes": 30150055, "checksum": "cc7de5ed3c774ff1dc350fbb5167dc1610c4f9a0dbc7c5d60ed4cf08aaf23ce3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00165-of-00512.json.gz": {"num_bytes": 30348056, "checksum": "b41c4a3b7b4e96262fe5c87d06fbeb000dc48cc1d304a475bb4f4e1af84a9afb"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00166-of-00512.json.gz": {"num_bytes": 30015834, "checksum": "0a0821b7628b9b019995a9f34223e2960ded84331ce1bb55089838becb8a170a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00167-of-00512.json.gz": {"num_bytes": 30282254, "checksum": "1285af56d024efe2166fa892878d471948e1d4c996922c7673e3c0f7f0f76bef"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00168-of-00512.json.gz": {"num_bytes": 29815124, "checksum": "29ec54ed647725ca3b9aec3bae341151a8e2b708cf21cd87b4389329298442b8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00169-of-00512.json.gz": {"num_bytes": 30346843, "checksum": "1791e3f8371a63f9f849b7bf430e70d3f4011dbdef572c166cc5d49d06162fd7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00170-of-00512.json.gz": {"num_bytes": 30175685, "checksum": "de8f82986addfc64b88fd3041d7ee6fdb64e6f770758146dc4c9309df348e965"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00171-of-00512.json.gz": {"num_bytes": 30145505, "checksum": "0dda47f679666862de6343e1109ed92866a42e8fa129ee69e9f0b73f18b6aecb"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00172-of-00512.json.gz": {"num_bytes": 30009998, "checksum": "2990dae6c16b7d60652439bed8b80ee4cf93972f33d8511d3d6aabaddfeca5cd"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00173-of-00512.json.gz": {"num_bytes": 30062185, "checksum": "e154a969bba2bf9430e0c8307561de78599fd2bd527cb1f15bbaf8f8e88cdf23"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00174-of-00512.json.gz": {"num_bytes": 30055129, "checksum": "e714ae153e8a927c88fe577d4c27017985d3ed7f3d0f5470f9a5f25c2e901a9c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00175-of-00512.json.gz": {"num_bytes": 30091082, "checksum": "5f47c663d1e15d94fb0057d303048be990c713f3285ada2c6233137b1d84d60f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00176-of-00512.json.gz": {"num_bytes": 30235767, "checksum": "20b05e4e99e5a05f6a4c29b304803b895bb8816caea6203643723ca587d66128"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00177-of-00512.json.gz": {"num_bytes": 30071950, "checksum": "29294e4b224df4695c9342c6f23d5495de9a0ca6a1be7217aa2211506e8ac7bc"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00178-of-00512.json.gz": {"num_bytes": 29932121, "checksum": "6022ed3b2ceef02324e40d3c7407622c95ead2cd3d3c41ab15ff9dd218265673"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00179-of-00512.json.gz": {"num_bytes": 30119251, "checksum": "42fa0aa883d9db4303a4981e4e308b2432b031fbccc98c3e1994ec775ba8023e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00180-of-00512.json.gz": {"num_bytes": 30175456, "checksum": "6fb2ebd61524846f6b1f746f9c6356045623beb4b685fe265a23446037c9cd9f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00181-of-00512.json.gz": {"num_bytes": 30029564, "checksum": "b779d721bb135fceaeddebb0dad1bdb43c9067a5e8595b3d544dfa7a084eb9f4"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00182-of-00512.json.gz": {"num_bytes": 30437016, "checksum": "b388fc0e862d7f6bb5b879ff7c69c301038faf5b542f6b40cbea4e2096a41e6a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00183-of-00512.json.gz": {"num_bytes": 29994048, "checksum": "8208eeca7bc76f8b1786c95939d321ca0c7ae190b1f12dae86738810e412aa8b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00184-of-00512.json.gz": {"num_bytes": 30338616, "checksum": "49859e75d999f65de99f9236e649a81989360f0328ba684671057b0dd7cf5e79"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00185-of-00512.json.gz": {"num_bytes": 30088874, "checksum": "ff6d32fdd471d3076a9367c175baab84a5d699ccd6dcfe00c755f0b714ca6074"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00186-of-00512.json.gz": {"num_bytes": 30193681, "checksum": "82508ed104fc57de3062258eaea57854ab9e1934437a88dc0d8a9921f3641bbc"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00187-of-00512.json.gz": {"num_bytes": 30171163, "checksum": "409d6576b25ad27455c755e5484e3f51d5d9788962efabe1c32e06bb3febacab"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00188-of-00512.json.gz": {"num_bytes": 30060432, "checksum": "fae94de96fa2962ef51e2ea90a5f760a5cee5de249bfd9f56d7c7b4e5c20f6de"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00189-of-00512.json.gz": {"num_bytes": 30180741, "checksum": "25293d5cba09980086f380d9e9ab44543adbbdcd05ed08601248b3a2b16d118c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00190-of-00512.json.gz": {"num_bytes": 30207152, "checksum": "ccfee160de15df5d88f0ff5a898a0c5b2d0ef4ebd6e6832715a9ef8a9904f88f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00191-of-00512.json.gz": {"num_bytes": 30143987, "checksum": "4c579619e465d9d97451801147202826a3855e772ea6dc4e9968e43ce2b8c05d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00192-of-00512.json.gz": {"num_bytes": 30072097, "checksum": "9c32ecb6d4ec9feb27c5b642879b464e68ca8804db161219503f624e7ca1166f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00193-of-00512.json.gz": {"num_bytes": 30172886, "checksum": "8442ddc3843c72aa169ca67801ff865ff85e4183beb38faa664f4f1d1c22a5d8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00194-of-00512.json.gz": {"num_bytes": 30037105, "checksum": "2942ecacb22cb9a2953c68f21ddf3368cd47ab1f2b2d8e1f5c76b1c849b28d91"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00195-of-00512.json.gz": {"num_bytes": 30014854, "checksum": "9e5c6815a5734403a7062bb27b2565d433a3520a401c836ac3f16e743a1dd949"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00196-of-00512.json.gz": {"num_bytes": 30020510, "checksum": "792712f0073c158b5f96f7a99d97970fca3819b69739d34d7d2b7f4b8b407b7f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00197-of-00512.json.gz": {"num_bytes": 30072566, "checksum": "3ece37e2d0d0b26fbd839b5d3facdfd70844945a06867fb68b141f6b1378462b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00198-of-00512.json.gz": {"num_bytes": 30036679, "checksum": "c3f37a9b89987dde4578b394b5c3916c2d4fd87e0902309b4c81af19b1d2d5ea"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00199-of-00512.json.gz": {"num_bytes": 30195178, "checksum": "ae01bb5515097a083afd498d8530e788d99671e7cf802c4402957d6252b2ec77"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00200-of-00512.json.gz": {"num_bytes": 30064374, "checksum": "2399d4869f3a8bb4a9adced5ec548a9a3fde1d4fbc4e3abd9a0a3b495fb9a8ef"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00201-of-00512.json.gz": {"num_bytes": 30136711, "checksum": "5c922040697bad8d7807d79f34f2b667eea63ceefba89b2d413fcd4d66497607"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00202-of-00512.json.gz": {"num_bytes": 29962983, "checksum": "e4df518d612a8614de73d5944a31d22ad06ec9ecd26fb52e500df71fe363c1be"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00203-of-00512.json.gz": {"num_bytes": 30178998, "checksum": "e84a98a176451fc82d940a64cdec821e320a648780edba6466b74a1966eca47e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00204-of-00512.json.gz": {"num_bytes": 29988832, "checksum": "c6dc56388bc7c57cbdee8280895ab80da7b4d49c9a0101a685229c50cad2e2e1"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00205-of-00512.json.gz": {"num_bytes": 30229414, "checksum": "e7e5175b6a7372377ba3a0db439911e189db459787d48588183ac1a0198c5fa7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00206-of-00512.json.gz": {"num_bytes": 29914929, "checksum": "eb263433133660ebe219cd5817dea3b546ef2fba0e15396b2768d7091117cdea"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00207-of-00512.json.gz": {"num_bytes": 29912800, "checksum": "7f8a5f62ba5912b64af5b02bd987b4d81727223ef8eff110022e89d01961366f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00208-of-00512.json.gz": {"num_bytes": 29900590, "checksum": "bc2af142244601bb7a96859dfd9885196940e675ca217cfc7c73ac9c614ea938"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00209-of-00512.json.gz": {"num_bytes": 30242768, "checksum": "fa51a4337faecfc790ca925802f87f10761552e16578b880ced80497f62bba60"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00210-of-00512.json.gz": {"num_bytes": 30039857, "checksum": "3adf7482ec6a3ad106c8edca3645a94032c33f84fcd26bd9876f2b8a1f6b5722"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00211-of-00512.json.gz": {"num_bytes": 29846856, "checksum": "8e931aaa9c1f069c0eca0b4605277610df9d2d0c07a0dbe6191fb7081b0e642a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00212-of-00512.json.gz": {"num_bytes": 30022172, "checksum": "21c8bba1c83544c27977b22b077fd77f8df9cd06bc4eb5e9e9a532c511498d36"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00213-of-00512.json.gz": {"num_bytes": 29877918, "checksum": "b64ebaa088df5c6230e69f207267a038705c38f4d327970e9117979e1c13d1ed"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00214-of-00512.json.gz": {"num_bytes": 29906552, "checksum": "55d833a2b78ad564e6532d1acd14511e8b48d703030e3bbc92d7c835c1ed38c7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00215-of-00512.json.gz": {"num_bytes": 30075441, "checksum": "999c77c136d3df83601e33c823f389b133f33c4c0b03736ceace617b526cb293"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00216-of-00512.json.gz": {"num_bytes": 30507152, "checksum": "0b23d4e57eaa101c78bab46151add537668d2722bf0c50470c1b434ec3389ae1"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00217-of-00512.json.gz": {"num_bytes": 30044236, "checksum": "6abacfd53e231a38c714d436018cef9a58f53320026c2ebb27d6caf08f02d7ac"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00218-of-00512.json.gz": {"num_bytes": 30047926, "checksum": "01120ef69493d84c44d112a41c69a851edaf89232679366e812f240fd26a0e47"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00219-of-00512.json.gz": {"num_bytes": 30349211, "checksum": "c4fc219559f0f076f634fc6812d4b13c229908c1ae45c3b74c059fb3b8124f63"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00220-of-00512.json.gz": {"num_bytes": 30063445, "checksum": "11f712439d54ef062cfa1225328fc4faaef5f6c9c0b0d87a0a81d25a71350e28"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00221-of-00512.json.gz": {"num_bytes": 30115660, "checksum": "9a344857ef4f9d141b57df38e25f717153b773436d72c23e10289ffe67c315eb"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00222-of-00512.json.gz": {"num_bytes": 30134562, "checksum": "227cd1847a948e388b404b5cda9289f05510d4e22f0ae5ec4d5a87a8f7f98a45"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00223-of-00512.json.gz": {"num_bytes": 30120819, "checksum": "e0029aa6b612a98f76e37d82107fcb90f2b57ae8d52beea172b5153b76334f20"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00224-of-00512.json.gz": {"num_bytes": 30371365, "checksum": "1ce5242d163ca12dbb22655eb841bf80750b552353af4f84973285d823d0add5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00225-of-00512.json.gz": {"num_bytes": 30319212, "checksum": "71cb82bb95107a7e0b7777a5fcaa0f76b465ba828ac47401babcf7289eeb2335"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00226-of-00512.json.gz": {"num_bytes": 30020940, "checksum": "b7b8d98ade41f52ece23e896bdc4c19ad034a92ba18adb5fac85c7271afbfa65"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00227-of-00512.json.gz": {"num_bytes": 30109958, "checksum": "b2ec382f44caf4e8e46fef2faf6bd2e4000420e6da2eb12a5d9f6e7efb4e1564"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00228-of-00512.json.gz": {"num_bytes": 29940895, "checksum": "ff86264683d0fdf9d689aa30e7889c4ceed21098b7c60a220db92d396614cb1d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00229-of-00512.json.gz": {"num_bytes": 30080588, "checksum": "3a5502cedd61501055eb16adb6ef861c75880524c5468a69cd346bc03e98e219"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00230-of-00512.json.gz": {"num_bytes": 30376399, "checksum": "6d3a4171a1febe9149f6900e3cca5a38046ca9d59214b548a4ef9de7de754bbd"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00231-of-00512.json.gz": {"num_bytes": 30031670, "checksum": "a2c8d9bb3eb260d5d8a7dcafc4703540332e2896e5127372d380d7efbd567a3a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00232-of-00512.json.gz": {"num_bytes": 30132612, "checksum": "c9dec917eff4d72c684d6f8373ca66839061e29d25f0aa5fd6fb7de5c30df469"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00233-of-00512.json.gz": {"num_bytes": 30178285, "checksum": "1eb83b8eb7e72b2b3e55420436bb17521b989d0627da46f8cc61fe9f420fd464"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00234-of-00512.json.gz": {"num_bytes": 29991258, "checksum": "5e14e2a9e8c0aba73feb9134c694e99baf57357bb524877322ff5181eedef1f2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00235-of-00512.json.gz": {"num_bytes": 30045172, "checksum": "50a118a072498b5338802cceacb97a9aa9242252e8d76d305cf5f0d928fd4af6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00236-of-00512.json.gz": {"num_bytes": 30403542, "checksum": "7d7605576975232579e422a1b72625ad6f9d714d27770725dc7b99ba258e1985"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00237-of-00512.json.gz": {"num_bytes": 30242989, "checksum": "22d152fa02c5a959e978ea4887dd873dfef7267af0a577b4d796ff0cb52d5c56"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00238-of-00512.json.gz": {"num_bytes": 30214634, "checksum": "6d0af6f396fa21867e899a7678c633e47bfe79bcbda29b8072c5d32ab20a9aa3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00239-of-00512.json.gz": {"num_bytes": 30255546, "checksum": "d35a93632638b6283053b121f0f30d47ea20b2747d871c3dd0beb13f4ffbcad9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00240-of-00512.json.gz": {"num_bytes": 30347604, "checksum": "fd052d532fcfe811d96f8433f79a684f68f76ec42bd959c76ae3b63aec0b2c3e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00241-of-00512.json.gz": {"num_bytes": 30135691, "checksum": "12c80c41dc4d6313bce4a171999ecda93ffc59f2c70cca363bce214cd12dc9f7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00242-of-00512.json.gz": {"num_bytes": 30229834, "checksum": "fca5b81914ac0c5fe0b0c1a554a1e62c64af5c98740df1f8ce8f48f2a62b6a48"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00243-of-00512.json.gz": {"num_bytes": 30053753, "checksum": "ba41c505579524e9d244354a70060c9a0131007e0b129f03e628bb7b7b512ca9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00244-of-00512.json.gz": {"num_bytes": 30216889, "checksum": "54a391c1d2de7627e739f3cd94eeccd50a80d56a40606f7c5392f6098df456cf"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00245-of-00512.json.gz": {"num_bytes": 29887569, "checksum": "c3263ea7e16e0036961dad28fef57ce4f0495219e59b4e800af82b67b3c6c506"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00246-of-00512.json.gz": {"num_bytes": 29906815, "checksum": "a3dcc92aed81708434edee84397010eae4ffeaa38b39aaf3919256f72deee625"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00247-of-00512.json.gz": {"num_bytes": 30074896, "checksum": "019e983a95908651bfae83e37bda5200b3888b03ab235fc8db2d5b16742f028f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00248-of-00512.json.gz": {"num_bytes": 30108081, "checksum": "6f68835ec02cf899f8f44a795b1e3117956ff5bb6c8946435d9861ae7a112df3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00249-of-00512.json.gz": {"num_bytes": 29957882, "checksum": "9bed6b7f56d93fa3973d4f177dde0973fa0eb6fe17d8d85279d865531613f963"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00250-of-00512.json.gz": {"num_bytes": 29822284, "checksum": "1848bef8d11360df55a576c64147e519327b1178f77d3ec14ab9522b33b1c423"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00251-of-00512.json.gz": {"num_bytes": 29956462, "checksum": "425f69c361a8671cf571df577ac0cfafb4894de494360084b7cbe9cb8869bc3f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00252-of-00512.json.gz": {"num_bytes": 29733712, "checksum": "7198e831e75eff1e116513f9cbe098c071f051c545b41d1943211a1d996a3c67"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00253-of-00512.json.gz": {"num_bytes": 30450662, "checksum": "0452804e723c919bd3c84217bb1dfc8764112fd70c5581f84520df7592f28ae9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00254-of-00512.json.gz": {"num_bytes": 29944765, "checksum": "dbbff2253d70094537de481344e5706315271fdfce7ebaddc8d277ed05ddfe24"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00255-of-00512.json.gz": {"num_bytes": 30321363, "checksum": "79173dd85d535cee71afb52f7775bbf7289509bc555efe21a8700d36f7e5da25"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00256-of-00512.json.gz": {"num_bytes": 29982818, "checksum": "bacd191568e72da06c564fc7476225ce83440de6aea6c85ebe7f5279f1c15846"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00257-of-00512.json.gz": {"num_bytes": 30338592, "checksum": "998287203665559c27a66e889611ed716b7a389e403b2e857086f548b2c47b39"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00258-of-00512.json.gz": {"num_bytes": 29911193, "checksum": "ed9829f41a71cc187d0ddfeafc9cbde8e362b52914c988708a1a5ffbd3c152af"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00259-of-00512.json.gz": {"num_bytes": 30227794, "checksum": "2fe86814499a3379601a179acca1d440b3c79467827ce9ef9787e1ab311904e0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00260-of-00512.json.gz": {"num_bytes": 30206902, "checksum": "c4efdad05d3f5e9f27884399ab0ec82081c26486e87f0ed5408a9eb80b223daf"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00261-of-00512.json.gz": {"num_bytes": 30035514, "checksum": "e47675a956a626a32b1870c61e6f98c3cfe9cc571901cf477abae982b4e63c96"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00262-of-00512.json.gz": {"num_bytes": 30406718, "checksum": "ae19c1389e26562322f745bafbd7839e7a95b3169743d48baa7ae7f2db2a0b5e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00263-of-00512.json.gz": {"num_bytes": 30266531, "checksum": "289c9fee87f12ea22ad5329f80cb379e5e9c22c5cb6639077748958228c62bf7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00264-of-00512.json.gz": {"num_bytes": 30100823, "checksum": "7c65dd5d90c6df49ca2dcbfdbf1b9fbb0789cb32043795942d88c5f2d7a99869"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00265-of-00512.json.gz": {"num_bytes": 29957109, "checksum": "e3a1b501b2cc3f5f2667ef179d7876db602daedefd0cd741c0898679b24984e6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00266-of-00512.json.gz": {"num_bytes": 30196603, "checksum": "9337dd8240f168da5f6a8b57c5c169a2a400a9a160eccc8a6e44e7b32004ff19"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00267-of-00512.json.gz": {"num_bytes": 30304605, "checksum": "513eea4e78c399cc045e25f13bb5f77ddb6c9b606522bed8216945c529894e8a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00268-of-00512.json.gz": {"num_bytes": 30312562, "checksum": "0503c5bf6848213c5fcb81a5c94307fc010d910a8989e104ad5fedca58c76f7e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00269-of-00512.json.gz": {"num_bytes": 30045257, "checksum": "59bd3011d12d7d70b5fd64bc2dd2016b1a9ca6f0d210dbb3e6c202bbbf74ced5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00270-of-00512.json.gz": {"num_bytes": 30027628, "checksum": "8d3ecf4c61acafc49b624d08b6aa31340643e030f6c2248f689e8a17d355359e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00271-of-00512.json.gz": {"num_bytes": 30014730, "checksum": "b2e4820a0a7287786f802b3b40602c8ca77c7813b5f50db8a336b89b89bbdf37"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00272-of-00512.json.gz": {"num_bytes": 30145705, "checksum": "20c73e4a9056a5201621a4799b86c323c5136af43caa63a74298a5c3bee890a6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00273-of-00512.json.gz": {"num_bytes": 30165945, "checksum": "8f07a91b6b40444635d869b94558fa68e3593626808bc6122d4e17403cf76101"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00274-of-00512.json.gz": {"num_bytes": 30097947, "checksum": "9530522c841d8f09ccb89f4f0238f7b9048c211e85b27449fb3c09d3bd2bab7b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00275-of-00512.json.gz": {"num_bytes": 30296359, "checksum": "51a358db81805a20df4f920baacf3adea05209282f800fbedfc7fa49638a072e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00276-of-00512.json.gz": {"num_bytes": 30311407, "checksum": "a51253cf73fb200053eb5fd5eca398a7a070fcaa27fc99b23389d09eef7fe5ba"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00277-of-00512.json.gz": {"num_bytes": 30372345, "checksum": "cc4f6d9040d8c4909d4ea5b661a7e54ba4775ff1c7c55db1ff686a56d428e2a5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00278-of-00512.json.gz": {"num_bytes": 30379507, "checksum": "1052defa657524e1211e67d775a32243b164eda431c4c6ed351f0c6727f21b16"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00279-of-00512.json.gz": {"num_bytes": 30195406, "checksum": "6f4fdc92c516ad779fd521afba7d8d5bcd40672e63028f43f70fff4d7605f5ba"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00280-of-00512.json.gz": {"num_bytes": 29902057, "checksum": "c26f89efd0977465f45fe321036d88e2d6ca3ee1edc4bafe4b40ad1895cfc0e3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00281-of-00512.json.gz": {"num_bytes": 29779702, "checksum": "094139d741b7a47faaaaf50093ab4edbef6ad1943985c6f453ce45a67a95b190"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00282-of-00512.json.gz": {"num_bytes": 30063500, "checksum": "280d69bfc795f1502a9e744d53d1a189051a1e771042721f8e6f74f6559e25a7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00283-of-00512.json.gz": {"num_bytes": 29956350, "checksum": "505e49b7eeab46c77a324959eeff103f8899da1efc4d0fef5c0e6c6f8879a721"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00284-of-00512.json.gz": {"num_bytes": 30146285, "checksum": "9b075f2cfdb9a90fcdc7f779a52b0c5dad36385214844d4fd9df1e528ae78b6a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00285-of-00512.json.gz": {"num_bytes": 30160056, "checksum": "d9b9f3cbb9ce2a0a0a1a2f7ce91e98621d48a7a900c278aeef437dc6c0a7cdf0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00286-of-00512.json.gz": {"num_bytes": 29844025, "checksum": "6de9ff1013484662305e414725be2d0a4a1873a941250b95b80b5dea8919cf95"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00287-of-00512.json.gz": {"num_bytes": 30089218, "checksum": "444ff132c4a5330653b7319d34b2c7f4ae3b960d8b510cbd7389e3881f65ac5d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00288-of-00512.json.gz": {"num_bytes": 30092170, "checksum": "46dc5b3b84e4387ad718fdf96b751354d7048e898ec664e0d3bdfc21ee841ec2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00289-of-00512.json.gz": {"num_bytes": 30365397, "checksum": "b42e35746112198143ac18509e4f0148772db75e19f5eea9ed0d7e2849dbba48"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00290-of-00512.json.gz": {"num_bytes": 30275920, "checksum": "25d99877235c4b9dacd5d1dd7e9d16bba76cdf6cb1725fa617209142873dca0f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00291-of-00512.json.gz": {"num_bytes": 30125784, "checksum": "51da68b6f2751a83e2534c342b6e9d69c419fb606b44c42b872d69f5f726df3c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00292-of-00512.json.gz": {"num_bytes": 30201021, "checksum": "1e0a42b5e7ea7049c3c86b96d37c5d1c36f3ba2e2dab02145a897ef056fa6a87"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00293-of-00512.json.gz": {"num_bytes": 30124224, "checksum": "8c744f5c6eb92c0de70649cd773c0ad147bc7a1487b2ae7f1107bce9d19da601"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00294-of-00512.json.gz": {"num_bytes": 30074708, "checksum": "b3cfa4c4408c1a9f39b48e18a62e112ec3c132b226efe0850f9e58e2a517aa97"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00295-of-00512.json.gz": {"num_bytes": 29990007, "checksum": "012f63e147d22e34249e930975a2d8958a8d0b17350a9f6e368d702189b40d5b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00296-of-00512.json.gz": {"num_bytes": 30093755, "checksum": "5573859cc485ae4535b83fd408dcc6a82f644832c93e6125db9a16dd6ded338f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00297-of-00512.json.gz": {"num_bytes": 30078472, "checksum": "25e694485171ba1347ccbd7916c1b87a0d46acfd13795a8aabb1cb57b5eb1221"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00298-of-00512.json.gz": {"num_bytes": 30327122, "checksum": "6d6832cb3b1c86b6392bc9ca52f69a0bb16bf71c3c7664d9fe668ee259a40a30"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00299-of-00512.json.gz": {"num_bytes": 30214180, "checksum": "9f3c3d87a525874ea117e36e0b30d7f5cc6c64564506808058a0788d74943634"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00300-of-00512.json.gz": {"num_bytes": 29895171, "checksum": "e99d296965da2f731ea660889ce834cd1d21edf427298bab3a059ff3ebc64a2d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00301-of-00512.json.gz": {"num_bytes": 30131063, "checksum": "e5eeb0f237cf986134c946bb3c2a4b5483fb9c88b3c2b16b9db26135043036d6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00302-of-00512.json.gz": {"num_bytes": 30184609, "checksum": "4ac9bf5ca6fac7f7293238852424340326347ceaa6f5dfa6fddef8003421bebd"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00303-of-00512.json.gz": {"num_bytes": 29956412, "checksum": "559019fe1ef1f7e77ac53ad98b3556965ebc524ecb80bbc3f26255d5ae6e3609"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00304-of-00512.json.gz": {"num_bytes": 29974071, "checksum": "3c54edc4b6a7e34048cbbadb55cb3b16496a4e6e7334b4ede4e1368daf4c5301"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00305-of-00512.json.gz": {"num_bytes": 30338106, "checksum": "1c91c0c5bcc2bec0a698318ad6f576a06db7885c20ed7f36782427b80580a75a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00306-of-00512.json.gz": {"num_bytes": 30178986, "checksum": "fff99f2758c2de57ccbfbfc6388f67e624d00d4a6cccb5820a7a8f5fcf02d386"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00307-of-00512.json.gz": {"num_bytes": 29493455, "checksum": "5d08c6e3909e21bed456ff9d06c983f14d3a277cb399a91047a692184f87c4c3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00308-of-00512.json.gz": {"num_bytes": 30228844, "checksum": "04bffac195e24383d06b0ab9ebf019959a4e7abe8e8e6a0cdfbf0a8e7c23c899"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00309-of-00512.json.gz": {"num_bytes": 30351688, "checksum": "3ce14d5104d1318c6a16d042735f0a71f4452897de60d17408181ec5b135bbb2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00310-of-00512.json.gz": {"num_bytes": 29993012, "checksum": "afad2f39bf4cb932e50d9a0be93940b423e7abcc3d67dac15b1939e4e40f4ce4"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00311-of-00512.json.gz": {"num_bytes": 30448951, "checksum": "a049c31ef6304084d33cb7bdd2e21ada0c60b40b1002b2369e60d36a5098c4b0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00312-of-00512.json.gz": {"num_bytes": 30034189, "checksum": "557d1e88400a6d1d8ee4d717a959239edacbdd3e18d8cd20c5c85b77174dc302"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00313-of-00512.json.gz": {"num_bytes": 30066486, "checksum": "e4823ea1e9a59d5db84564a5b90c28fd8058450f238c60ad689ffd6b673d65f8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00314-of-00512.json.gz": {"num_bytes": 30397706, "checksum": "1b4c0653e7ccf7fda0a53d8cbd5ddd57322ac83822e9d05bbdb9eb8ac979cf50"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00315-of-00512.json.gz": {"num_bytes": 30219107, "checksum": "9c364c9cab4ff7acdd1818b13de2f36713df8fa6c504ba15cdf47fe8e3c30206"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00316-of-00512.json.gz": {"num_bytes": 30098661, "checksum": "84dd8a8739b5abc39d8180f0894b1fbf2930d6d333d7c86b646f40763327397c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00317-of-00512.json.gz": {"num_bytes": 30178992, "checksum": "16e4791b4e5ab3719dacf79fedb0b88ed54346372874c37ccb71d86bc419edc3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00318-of-00512.json.gz": {"num_bytes": 30022982, "checksum": "98345a826aab12bdaf5e639205d5dcdc1da8fecd7cafc1982df89ac8d4df7ebf"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00319-of-00512.json.gz": {"num_bytes": 30360409, "checksum": "d53a39019a1627b42ae6bff68e283d37d0bb5f48b328c2c5cdcc1a3897f4e992"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00320-of-00512.json.gz": {"num_bytes": 30347267, "checksum": "c343a0eedf58484055e58762802ae8cc05f2cdb0b923785c493d056a2cbdb015"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00321-of-00512.json.gz": {"num_bytes": 29967877, "checksum": "cc5795d254ad749ccfe613034927bdf95529545ae1f277b694dd24a5996aca83"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00322-of-00512.json.gz": {"num_bytes": 29885538, "checksum": "d5eaaa1eea983bd37ed34651e6c16b746ff7c92e48038b234149fa6d04d3d866"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00323-of-00512.json.gz": {"num_bytes": 30308848, "checksum": "a42cfaef5e088fd6b24dfc121084a6cd038f5b0bfaecb9f33997ab22a97fb155"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00324-of-00512.json.gz": {"num_bytes": 30351634, "checksum": "0e2e6933f93466e9c8fe966f7770fe4c34caf182c713dad3206f4132eed1d41d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00325-of-00512.json.gz": {"num_bytes": 30077168, "checksum": "77cdbf7040ce7f38d735fef41813ce63aaa16fcd87fce80e6ca6bd56d350c369"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00326-of-00512.json.gz": {"num_bytes": 30031750, "checksum": "8d994c2dc1b766e3270dce3f0b8f6f8fe22d5c1e0e9780e1bfed52c1292b8641"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00327-of-00512.json.gz": {"num_bytes": 29845765, "checksum": "f6279e351d016769d6fb5482d01a15ba054d5fe6f9f1c4e92c0663cef0083002"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00328-of-00512.json.gz": {"num_bytes": 30253188, "checksum": "2ea84aafd94d1843a2cc4428279dbb079c6ae0aae6c00f90ee4b5ace3c827afd"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00329-of-00512.json.gz": {"num_bytes": 30124922, "checksum": "49e3d91126d53eada7bbd87bfe9eaae74f059c69cd70a3a3b8101f49c1aca154"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00330-of-00512.json.gz": {"num_bytes": 30026414, "checksum": "07442fc4f7fb1732362293bc15a6754d70ecf4743392cf89c4497b3cd96269fd"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00331-of-00512.json.gz": {"num_bytes": 29961847, "checksum": "f437c6f5f758a5d32c8fc949037060259162864c29aeaabf37032e79f5a1cf0b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00332-of-00512.json.gz": {"num_bytes": 30167166, "checksum": "96018497eb6dec020436c1333ff81980a64fb615997855fdd8cf35fe3f658db6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00333-of-00512.json.gz": {"num_bytes": 30192963, "checksum": "1c12ea6b9031049dbc84e4da6b5fdedf480e989385d758c88322c415a1cabbb0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00334-of-00512.json.gz": {"num_bytes": 29847008, "checksum": "c269285f15f626b4b15a7d1705ffa08e3f4d49ce13de8174b72f9f6276a1c6af"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00335-of-00512.json.gz": {"num_bytes": 30262244, "checksum": "179ee564e6fc644d9ee139bdb02d470a1172221b0f6e510ee5935683500f8257"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00336-of-00512.json.gz": {"num_bytes": 30262910, "checksum": "317933afdd8dc8a3a355e44ee3d84bbab12a2f30c98ea1172dde7074ed4c0557"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00337-of-00512.json.gz": {"num_bytes": 30155329, "checksum": "c5b850399252ec41b0fd9cb2da87ce25e5a44df9f44c6ed9d8c559a5729e5a0f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00338-of-00512.json.gz": {"num_bytes": 29952961, "checksum": "48083123ba97a6212e0501799bd01936f0795bdd4d9c2710b9aa67d54b29037e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00339-of-00512.json.gz": {"num_bytes": 30403399, "checksum": "313b60f985dcf591f34d351b758eedace655b6c6d3946dd2ddc55f34a9a97ae9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00340-of-00512.json.gz": {"num_bytes": 29917484, "checksum": "2c72290f3bd51dea2a2877d68a968dc2b75dadf99ab3cc2230e41be45f3515d3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00341-of-00512.json.gz": {"num_bytes": 29905522, "checksum": "1acd83a0da4a7a4912b589dbeb68b37396d0454371b2b71af4ae18b854d482ce"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00342-of-00512.json.gz": {"num_bytes": 30022369, "checksum": "8756be42335bba12d06de63e247659f8d603a092ff342360dfed645aec135c47"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00343-of-00512.json.gz": {"num_bytes": 30229313, "checksum": "863e29987a3ccfa08e14ae987c81367a53b9fe08795184db086117a9555e058b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00344-of-00512.json.gz": {"num_bytes": 29924335, "checksum": "aa9003a7cc3527fb658fd807c78890587a8b35634a1f0838bc221a6374205d20"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00345-of-00512.json.gz": {"num_bytes": 30229482, "checksum": "a7e88b015bcf7761217e9b3ffd413f13cac48f6afe083353436de6cbd0d0018d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00346-of-00512.json.gz": {"num_bytes": 30029147, "checksum": "b862ea62ac032c203c0038c061a44edabe4644be03b876ec7322e96762374940"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00347-of-00512.json.gz": {"num_bytes": 29808182, "checksum": "62915b86cbbf61a76f73d05509a8e839aae0b965134ef79022377625df7ef741"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00348-of-00512.json.gz": {"num_bytes": 30091116, "checksum": "6c384c2c6bc8340b88e085f8bbc2616be68c96fa7b8b88306b4500367d053a49"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00349-of-00512.json.gz": {"num_bytes": 29867618, "checksum": "bfb19508ecf8bd4d9a8847f0edab5acde6896182c27da706a6f2863bec43c152"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00350-of-00512.json.gz": {"num_bytes": 29723106, "checksum": "a645c62c94de9018175f15a0b38aa8bd2484601ee189b7c27d589288eb5af97e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00351-of-00512.json.gz": {"num_bytes": 30047620, "checksum": "991061a23834e6bb3dc0595cf0e8328e07746d10fbf7a7ba397c1410cb66175a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00352-of-00512.json.gz": {"num_bytes": 29808328, "checksum": "6c8e377a6cc82e81d66e2be3d23c1cdd42480015a68a1db458d542b7ff64ab7d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00353-of-00512.json.gz": {"num_bytes": 30040117, "checksum": "ead6f32d98a91c47fb9c21334143f02181efb0b831705baeebb9820d069598fe"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00354-of-00512.json.gz": {"num_bytes": 29953984, "checksum": "ba349e503d017abbc1c83da2314c0a4892a9f3e5e480173812578f44d9b5904c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00355-of-00512.json.gz": {"num_bytes": 30179912, "checksum": "2bfeab794bbe0432db52cc595d25864b17fdb0744a80d6d907f6f2ffc5c56b81"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00356-of-00512.json.gz": {"num_bytes": 30312163, "checksum": "d0dec696d28c601d3a1f75b0b6e6e711e00809f0d5ea915f63cb6d9b7adcc597"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00357-of-00512.json.gz": {"num_bytes": 29931515, "checksum": "d43c75371e32d0c1e65f43acc00aac3ca43762d4c6eb6bb61759ac5fca593a99"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00358-of-00512.json.gz": {"num_bytes": 29739788, "checksum": "96fef1b4a5d6a080ff5d4a10bc90911dcb2ddecb4be91d0c9620e6d2484e3ee3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00359-of-00512.json.gz": {"num_bytes": 29913841, "checksum": "05b065d2d13b787ddee4707be7e2be46173c23794b9e8c773d0da743f435db17"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00360-of-00512.json.gz": {"num_bytes": 29805295, "checksum": "826104b9f4c2634d128f15564bd4990057dfbbb4066f2a082039d243bab56935"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00361-of-00512.json.gz": {"num_bytes": 29839676, "checksum": "ee5ba4cb14ecee0c857828a866615c6bfe45f67b158173dcac44146a02d97738"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00362-of-00512.json.gz": {"num_bytes": 30154783, "checksum": "d67b49e6fa5dc293fbd3057b7ca0beb7e0bd1ff692cdad7f2dfb7abadc1f4599"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00363-of-00512.json.gz": {"num_bytes": 30126118, "checksum": "6940704da6cde5822d48dc806280b8d57e0593ba299731e68ca9c2a4f7cf65bd"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00364-of-00512.json.gz": {"num_bytes": 30184894, "checksum": "e740b4a0240e691f16a423fd658aa3c7539986695418af3b5a171a48524db74f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00365-of-00512.json.gz": {"num_bytes": 30386766, "checksum": "5a6a9461ef9ca579a849f6bef4d6225504a885aa797d3b2236ed8df6f5ea72ee"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00366-of-00512.json.gz": {"num_bytes": 30208411, "checksum": "8e0ce2447dfadaa4d41b991a2ce1be63b409e58e88944594dc8591bf9ab41403"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00367-of-00512.json.gz": {"num_bytes": 30266003, "checksum": "04ea00b46a583edea7740d74d719ef7f303b7f3873365b9ff4e94f08ef80832a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00368-of-00512.json.gz": {"num_bytes": 29993752, "checksum": "38b1a55dd4ff1b504d2dbc0b2ad54fe43ab16c8bdba55bd97f4a55dafa8c83dd"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00369-of-00512.json.gz": {"num_bytes": 29833222, "checksum": "a25c405918920ed00edf5f3007cb8895b59fb67618dfea266b048273303b9592"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00370-of-00512.json.gz": {"num_bytes": 29988999, "checksum": "2812e6d9865d77ca8ac2d1499ba86be1ceed868a1da2bd13fbd0967058a3516c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00371-of-00512.json.gz": {"num_bytes": 29866636, "checksum": "ecd1d3bdc41c3f41f8c9d3a63c75766c173f70ff117af748a08c221ca4273b18"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00372-of-00512.json.gz": {"num_bytes": 30296883, "checksum": "723d2c5ebbdd95ab84c53e458d81944b6907d08c7aec67300f012880624d0010"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00373-of-00512.json.gz": {"num_bytes": 30310322, "checksum": "ae45d088521f2faf9852cb169962176e84bbb81d5ba157d4228d348f7fcf60f4"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00374-of-00512.json.gz": {"num_bytes": 30340527, "checksum": "9b09c9e1b424fd05540b720c5a85f71eea43d743dc4ebb318e839125ccac9383"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00375-of-00512.json.gz": {"num_bytes": 30193692, "checksum": "c3ca4bb179cadf872f25f1cdb5c3667933bb8dfb7af21068a24b1b09c961dfa8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00376-of-00512.json.gz": {"num_bytes": 30184130, "checksum": "5d801f4bc20c4c6d8821ccfff06cb5dfe4214e571734feacbea3325462afa280"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00377-of-00512.json.gz": {"num_bytes": 30259301, "checksum": "ebf08508c24e29a8a14b72248f090d765b02ee7a31296811d0391f2a2e73c046"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00378-of-00512.json.gz": {"num_bytes": 29650049, "checksum": "c13e994e68b938ca069d2d412e7891cbaf2ee205d65b1c17c6acfea01adce157"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00379-of-00512.json.gz": {"num_bytes": 30265211, "checksum": "667da6f0650dd684aa50bc691b5783968ae8cab847dea14fc8d8bfe203e351f4"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00380-of-00512.json.gz": {"num_bytes": 30429631, "checksum": "7cf0e9ae00bec72f571d152730107efdd944176818600517fb2d0412a859d366"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00381-of-00512.json.gz": {"num_bytes": 29889471, "checksum": "f781b3128e92c54365be7771695555378067a65fb922e04062ab6f3f092ec827"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00382-of-00512.json.gz": {"num_bytes": 30029894, "checksum": "2d133def2bc4b840312ebe5c466c9f22729b67aa4c2a41dda2e6a9a55ddcddbb"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00383-of-00512.json.gz": {"num_bytes": 30249255, "checksum": "e8610abf7e2bd70b1067a1b2dbf392ac32be156945502629228969974d3899b2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00384-of-00512.json.gz": {"num_bytes": 30362665, "checksum": "f217071bd0c1b1bddb3342c85064d7ebb54bcde2512997636f0638a0b3641588"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00385-of-00512.json.gz": {"num_bytes": 30080234, "checksum": "2db4b15c7391b6e6d3791721ee574d09101df597110feebc59e4f0aff4df6c26"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00386-of-00512.json.gz": {"num_bytes": 29897704, "checksum": "035daed74487c5262b8cfbefdfaefd17f2834c7b4a1d293934d755e059b58f5b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00387-of-00512.json.gz": {"num_bytes": 30072139, "checksum": "73013fbd06eaf94a7c8a0f0de420f83bed56655fb2d4e5d93972e8ca1847d130"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00388-of-00512.json.gz": {"num_bytes": 30123843, "checksum": "5db846c3d0b36774ce771ddfa8c53a915767926a2ad48222256d839326336f19"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00389-of-00512.json.gz": {"num_bytes": 30278955, "checksum": "9e4c590e67b2fbd357af955e39864ffe73dda201d76759935fda80b10b463500"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00390-of-00512.json.gz": {"num_bytes": 30013591, "checksum": "90974ba6eff489e0f4f52187b6241120740c782945e86525cb5d1e551a54e322"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00391-of-00512.json.gz": {"num_bytes": 29925212, "checksum": "10fcd62813434e2557b5861fd8604f534952561065bee9dc525b1cd3f5b2730f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00392-of-00512.json.gz": {"num_bytes": 30016498, "checksum": "da88b36bd3f15551d8fad115a86f111cc5c3d9a3c6fa9497214aabec7bcd6aad"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00393-of-00512.json.gz": {"num_bytes": 30061083, "checksum": "1ed9881020f240e1277e6513bc2abf24ea48e9cb0046d7e87a6d3669c8b42a0f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00394-of-00512.json.gz": {"num_bytes": 30043459, "checksum": "a35c3de1b0c982df8471705574e6eb7cc730fff122ff17d1381f2c7b9f20d6bd"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00395-of-00512.json.gz": {"num_bytes": 29921106, "checksum": "f4cf52f8d6a1288773cc366469df140f885b233fb6aa1cb75387a450d88ec94f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00396-of-00512.json.gz": {"num_bytes": 30024980, "checksum": "5ebe04e54e4242d52aacb4c2e107dd10e609d5a7a6ff0425d9952bed98ef4921"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00397-of-00512.json.gz": {"num_bytes": 30096825, "checksum": "3ac381004d8257aa50fb28f0fd2171abbb93ad825c3f43422b9dbec6e1c6f31b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00398-of-00512.json.gz": {"num_bytes": 30059739, "checksum": "40c38af325f4d01ae7c74aa9cd8f8d1c96c6af851175f80d3c50d85c5f5d3585"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00399-of-00512.json.gz": {"num_bytes": 30049826, "checksum": "2ba0109b2d5b88422250bcbd2494cc6e11528710f38fa6e83a1f699b840b68a7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00400-of-00512.json.gz": {"num_bytes": 29953506, "checksum": "010610ba3af3dbfbcf2fac93136b7066fc58eb914dce9ae999722d0cfec4d331"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00401-of-00512.json.gz": {"num_bytes": 30271141, "checksum": "29587bb4be2c367f6479705b5c3c28716affeefc857ac1f77e4c33e55264def0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00402-of-00512.json.gz": {"num_bytes": 29861236, "checksum": "8e399149c335ec599f881fada448c9b4be22326357153c74b0de627078f1d43c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00403-of-00512.json.gz": {"num_bytes": 30175831, "checksum": "0d2800836914a1e2ef4a1aaea6e70d19699fc2555582ec670223177cac05a4fa"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00404-of-00512.json.gz": {"num_bytes": 30097682, "checksum": "f9665e9199978b123feb962ce347b30cc1520626c32dfef0ca3cd8895a45e445"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00405-of-00512.json.gz": {"num_bytes": 29810961, "checksum": "8ea29cf9f7774a16a4c2aaeff1b6353de2951073676a9c411f19b0a5fb755b07"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00406-of-00512.json.gz": {"num_bytes": 29963498, "checksum": "90b10c91f6e0006576ec9b426c424e50fc1726c25ae8eb91bf91bb9001ade2e8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00407-of-00512.json.gz": {"num_bytes": 30089554, "checksum": "cfa905514e4f19c4eb82e438f5eb987731004476f026f4bebbeeafbe519ec85f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00408-of-00512.json.gz": {"num_bytes": 30148002, "checksum": "dddada59e2ef306cdf83b7c9ce3c912792237852053a4ea683224438a242c5ff"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00409-of-00512.json.gz": {"num_bytes": 29989174, "checksum": "907667ac304b6cca7100a9606e915c003fee43f1640d5b01405beb16eac4c379"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00410-of-00512.json.gz": {"num_bytes": 30519580, "checksum": "acd5cd2ecc46927046c81c9bb3459dd72a98e346ebb59c13c0db08fbb60961a0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00411-of-00512.json.gz": {"num_bytes": 30408107, "checksum": "6a9c2d42717f853cd4a76fc5275e95e2a584b7465c6059f586f6a06417048a42"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00412-of-00512.json.gz": {"num_bytes": 29699198, "checksum": "29e76bdab47496ed61a102edd3c61c20e60ab52abeb8e6068f7aa4ad1868f4fc"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00413-of-00512.json.gz": {"num_bytes": 30065457, "checksum": "b4a33941d0b994b82e3be351542cb4a832742e050ebbd71481e7ba34c8dcbc3b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00414-of-00512.json.gz": {"num_bytes": 30342960, "checksum": "4ba7edb3c77a45f0e4cb7e969053db6f44ce8c0a8ef262582512814b1161d9ad"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00415-of-00512.json.gz": {"num_bytes": 30201576, "checksum": "25cb4eb4bdf3cd1b29289a23696be8bd41c5f577294e94607bea7b91252a04fd"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00416-of-00512.json.gz": {"num_bytes": 30021170, "checksum": "60472bd2a2896bfb57baabb583fc6cdd402a1d776f6a4c9bb58ed556e67cd76f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00417-of-00512.json.gz": {"num_bytes": 30237505, "checksum": "aea8fd33c2acf1cef890549b1f88b18a2eeb37f6d4dd22b552f735811ad0b8a1"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00418-of-00512.json.gz": {"num_bytes": 29999334, "checksum": "93583d771ce7f0e1d044de2919a3ffdd48b7b7dab0cd3b6dc459200dd53d8762"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00419-of-00512.json.gz": {"num_bytes": 30194801, "checksum": "cd36e129487272742f3e60ab6512dd79b3d1ce3c22490d2e47c00c2ae595cfc6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00420-of-00512.json.gz": {"num_bytes": 29903898, "checksum": "6f18a5ffc7efe5f555b02d3a31ed43714e09e73f7462206220d70450f47cd6f6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00421-of-00512.json.gz": {"num_bytes": 30015573, "checksum": "cfacef2cffd953425eaf4d7b2b6cf5d2637bf5d58c6ed2bd0002442795c7d36c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00422-of-00512.json.gz": {"num_bytes": 29966521, "checksum": "14f646b15948cf586ec1abd4bf4bf45bf180913e4d09049fa779bc7a196e455e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00423-of-00512.json.gz": {"num_bytes": 29972805, "checksum": "ad7d4ab443c7a8122976570891a225a44ff86d2299d70706066633a6204eb0de"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00424-of-00512.json.gz": {"num_bytes": 30317886, "checksum": "37c8bf3b535ea4053aa2424c846e3449f9eb27d5ff999e1e93b6cee0aa975333"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00425-of-00512.json.gz": {"num_bytes": 30059310, "checksum": "674ca5eaf6a88f76881c8a1c48e1e0f93794785ee5ea17fb70f49228d7f39614"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00426-of-00512.json.gz": {"num_bytes": 30182498, "checksum": "988d08cd18162d9a309155d2e75cd4980f76ab4c73ef8286edae94ca4628ebcf"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00427-of-00512.json.gz": {"num_bytes": 30253874, "checksum": "aa8c08a684ea0bbfda9297aea07429172a2fa4a161268b964421796173275b35"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00428-of-00512.json.gz": {"num_bytes": 30055421, "checksum": "b1ed26e826bee7fcbc31cf1c368c9a63eeedbea1c2fd0fb07370b461a03d1a7f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00429-of-00512.json.gz": {"num_bytes": 29830674, "checksum": "3efdc67ad7a108416dae47886e542da5c2ab1cd7e1aedd25c1c5d4e0607572f6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00430-of-00512.json.gz": {"num_bytes": 29938000, "checksum": "3221ef5e4c28d44c1da4fa04689f318217991c07aff4fdee5e1091fe8e1162ac"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00431-of-00512.json.gz": {"num_bytes": 29829687, "checksum": "225f4e22df1b45a7dc9fef2f5a44da8f8ee25608cbe34195e21b49c8cd10f3ed"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00432-of-00512.json.gz": {"num_bytes": 30006209, "checksum": "9fc53637db7b16c8cf6f824adf21d4602efab715ad78eab62c4be7981a8bbc1d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00433-of-00512.json.gz": {"num_bytes": 30656456, "checksum": "6bf7b701dc18f68d0facd7cdea49a26cdcfdd7829d5346eefe555485cfa7f336"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00434-of-00512.json.gz": {"num_bytes": 30138891, "checksum": "793532f72aa41c1dd7c549e9597fe8e73796c53eb5fe410a73de418ec446d686"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00435-of-00512.json.gz": {"num_bytes": 30430276, "checksum": "0d13d345ad12999fb4e7a9675e08bb1c90980fd193ed8530e4258e07bd6ea754"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00436-of-00512.json.gz": {"num_bytes": 30173309, "checksum": "fbce5fadb4b49bf833f77337929d873b2b25c3b564f7622f3672dde7a044e5d0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00437-of-00512.json.gz": {"num_bytes": 30142240, "checksum": "76c34800a3223f5fe0f1960f3d3c9dd9ecdc2e652493d71ef245415b5027c902"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00438-of-00512.json.gz": {"num_bytes": 29979673, "checksum": "4784c3787d24b9d46ad7c835683c6506c2e55c84835391e2aca0355f032a1888"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00439-of-00512.json.gz": {"num_bytes": 30169105, "checksum": "5012d03e637769d7494bd3cef0a8dfc8b38c995e0d5780089c15d6b1495b3a8e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00440-of-00512.json.gz": {"num_bytes": 30107004, "checksum": "529beaf4ad0251e35be574b1f623571526ec91a588ebd7df43e9d1cb99445f53"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00441-of-00512.json.gz": {"num_bytes": 30324563, "checksum": "f5e5fbf5e329f5bb0e83f758b8fc76516d65c3f91ad97e328187eaea83e4b667"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00442-of-00512.json.gz": {"num_bytes": 30335681, "checksum": "b8a26ed60f87a87347886b4467aa576ec5e8c106931589a1aa821b99fdabdb54"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00443-of-00512.json.gz": {"num_bytes": 30155655, "checksum": "e27bfb813fd6aba96ada81b095a559f0b7847cd25f7f8973663b19cdc5b8985a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00444-of-00512.json.gz": {"num_bytes": 30340540, "checksum": "705dec13ba2824d45e801bc2cf3e709d6492b1ff6de2f9ddefb5a57dbdada4ca"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00445-of-00512.json.gz": {"num_bytes": 30248960, "checksum": "09a6b83910369cf269c4f095607fb2f0ac0ec7e25b501f577fe13920a8573ee0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00446-of-00512.json.gz": {"num_bytes": 30316703, "checksum": "8f88b794c08bb492f50073337a30aafac0d05819505b507ab283dba0cf17d125"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00447-of-00512.json.gz": {"num_bytes": 30184407, "checksum": "38c819df823197bea6d647c3f78bcc15024aabba814cae322c1663c45fa8382e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00448-of-00512.json.gz": {"num_bytes": 30238484, "checksum": "8c0abfb8dca37a179b01dadd2227206cbe6e5b916d0111c0b00d2edc3951c7f6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00449-of-00512.json.gz": {"num_bytes": 30143151, "checksum": "9731e9644e5615d5d5ebdbacc6efa6382df856c8763b7485c9a5838864c1332f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00450-of-00512.json.gz": {"num_bytes": 30122606, "checksum": "3b746f616f21c91277cde8e6d0d7f792ead7874de7ecdf11830a4a56db3dc799"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00451-of-00512.json.gz": {"num_bytes": 30128179, "checksum": "d6cadfc64ee39c9beb93f0bf8c169ca9d9053e0f76e1c9697841438e20dddef3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00452-of-00512.json.gz": {"num_bytes": 29979326, "checksum": "42de19ffc3ec821fbf5ff686d1b36d189ad9ee5c4553a2ff0d003ee1a754c9c8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00453-of-00512.json.gz": {"num_bytes": 30118272, "checksum": "22f9b2d3a9f089f1015f74d1ca0aca8f2a4970595326d964817177cbe6859271"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00454-of-00512.json.gz": {"num_bytes": 30018294, "checksum": "17c16895edccbb8b40fcc52cbafc0c15957020eb530e071dcce34544d5958bd1"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00455-of-00512.json.gz": {"num_bytes": 30155903, "checksum": "8b9d49837b309c3389d03dd3bbae92395bf7086134fbc69d28d9fff60a90d4a3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00456-of-00512.json.gz": {"num_bytes": 30282104, "checksum": "ab63fd2efb0cc883d303241b3488a8135a196db7edc844458cfc1483898ceb3b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00457-of-00512.json.gz": {"num_bytes": 29920723, "checksum": "dbde2eeef90144b209ef5afa6d5165ad638ae57d919926a379a10fccf6850a61"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00458-of-00512.json.gz": {"num_bytes": 30163167, "checksum": "800307106f5861e0bc246bcaae214e6dadeee849905cac184ecfe6d0b560fa68"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00459-of-00512.json.gz": {"num_bytes": 30248893, "checksum": "3e78d327a9463929f33311e18116f5d1d2ae4926f7a600378875ba854cf5ee47"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00460-of-00512.json.gz": {"num_bytes": 29840067, "checksum": "047568a5dad00b04ca1ea4aa262c7a4af9b61e87bc4ea02ffd5c6c8c049bf8a5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00461-of-00512.json.gz": {"num_bytes": 30179062, "checksum": "ed8abe7b465bc19150b831632cb7afa298d6cb4beb9b6043a35a0f8afb5f730d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00462-of-00512.json.gz": {"num_bytes": 30266398, "checksum": "d7b74f5c1c1f7bb489700adcfb7e48400c4fcca7669e2d56396d9fabb5a63b91"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00463-of-00512.json.gz": {"num_bytes": 30158800, "checksum": "224815aee29f6d04ddbc7457c84338eef9b127a767e7b50ed77283ff166d4f93"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00464-of-00512.json.gz": {"num_bytes": 30393915, "checksum": "0dd019fd2c19936ce2e6410b65872f630131c5da7543c8e66fa87547fd1a2209"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00465-of-00512.json.gz": {"num_bytes": 30148939, "checksum": "6d74dc9d74d28c2b8ba8d43ba3d594af0cb176cfa7bf738f3933be2a9c37bb85"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00466-of-00512.json.gz": {"num_bytes": 30268228, "checksum": "0e201327066f28c19b082fe35e4fb3bd76c8fd2d32236d1d6e2309489152aa66"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00467-of-00512.json.gz": {"num_bytes": 30121937, "checksum": "7352e5a9ee66dcbeed2c9e1fbe6c9355f0e5dd1b30b592a9fd5690958945e5a9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00468-of-00512.json.gz": {"num_bytes": 30004669, "checksum": "53876848336ac57c082c9d5735bc1717f69ef38688b221d5e5ab9cd9cb4ec620"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00469-of-00512.json.gz": {"num_bytes": 30049860, "checksum": "a5a720b38f106dd5d2a2b7647748b52b4531ac12294e3b0d8dbc92062639c0c3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00470-of-00512.json.gz": {"num_bytes": 29961380, "checksum": "9611764fc4f84b92e86fa6f9ea41464f6c26b07d1c51241b627a3d155e99d163"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00471-of-00512.json.gz": {"num_bytes": 30449164, "checksum": "db508df549d518c3e8b99b2f0098ea93fead1e632f53d8ae2cebff1d3476577c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00472-of-00512.json.gz": {"num_bytes": 30312620, "checksum": "1993b5e292c6c60a3373aabe896f1a57afaad73fdce0ec60e30696368f7c0afa"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00473-of-00512.json.gz": {"num_bytes": 30406764, "checksum": "913045c61fb5a145379d9fe08c91ea63092b197400c0c87bfa65af91720b563c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00474-of-00512.json.gz": {"num_bytes": 30078563, "checksum": "c495119e150b083d709ca915abd760683793361ebf3e079b04efc9b7e1900379"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00475-of-00512.json.gz": {"num_bytes": 29860761, "checksum": "50bb5f40d2e91ab136aa63063fff860529c8961f2a38500a645b10339751589e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00476-of-00512.json.gz": {"num_bytes": 30199778, "checksum": "c969cfbb7ed7716f665b336b2ed9f7b10b532c7adc6d8a347964831a39cfef0e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00477-of-00512.json.gz": {"num_bytes": 30130742, "checksum": "54c8b89102cf882eda5208544a6c5d317c1defa8d997f9450ebd576e58f91830"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00478-of-00512.json.gz": {"num_bytes": 29901444, "checksum": "f669299d794ecc0523c64ad31af8fcce5cf3f880e87fd73f4c3f434425e9b238"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00479-of-00512.json.gz": {"num_bytes": 30587214, "checksum": "25d0fbd9027deaf140650f0b82a2316c37939f199fe7633b9f643684404f2029"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00480-of-00512.json.gz": {"num_bytes": 30145237, "checksum": "68a29728290e1199ce8d1ac060365bc443ea67c24292b2b04f1b4ca44ca7238d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00481-of-00512.json.gz": {"num_bytes": 30204159, "checksum": "1605034b89e33f6794c901adac1eb200bb489f76b9bae6bc56b01e9f6ab4c254"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00482-of-00512.json.gz": {"num_bytes": 30430794, "checksum": "2dce9df095e89ea6645fb599f518612511a62b6c475808ad004c32968b19bae8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00483-of-00512.json.gz": {"num_bytes": 30102412, "checksum": "c7c626977521b0d1f5bcc02c484b3eb4f517ba71006a4802df08a0f4cfb8ea9e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00484-of-00512.json.gz": {"num_bytes": 30171871, "checksum": "519ed997f1f1f1de7864b0bddf202b25e25bed349f63593a88337262d7705968"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00485-of-00512.json.gz": {"num_bytes": 30049539, "checksum": "8d2314fd3239ba3dfa99962c1d0a38e05edf9194e1faebae88f6b19ecab8fbf7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00486-of-00512.json.gz": {"num_bytes": 29949995, "checksum": "a7521e09cbe77098c23172427bfb931dd50f0c9d58b034fd1621687849a8d379"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00487-of-00512.json.gz": {"num_bytes": 30345072, "checksum": "ebc6254a4d241afb886b8df20819301121fcb234a32a1dd4ee8ae49571081f92"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00488-of-00512.json.gz": {"num_bytes": 30300622, "checksum": "509bba28ddf770d38554a2e846f2ce0d2af59e3662a6d6ec4dddb75fb509f8d5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00489-of-00512.json.gz": {"num_bytes": 29949909, "checksum": "996e61f8e674b0a016a568630ee13a7473f99a919437c225a4198d232861e628"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00490-of-00512.json.gz": {"num_bytes": 29995429, "checksum": "9730024ad352eb12f74ac446ed32b9c57898658954be5dd639184fc5264527cb"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00491-of-00512.json.gz": {"num_bytes": 30293919, "checksum": "65b2a7de3284e892441b0fe8e850d89de842355d78fa9944358b1ee5912a948f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00492-of-00512.json.gz": {"num_bytes": 30115831, "checksum": "26b535c3175bb86ef721593f81d9cf006d4c3749f156c63ccd2a2c04e1201236"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00493-of-00512.json.gz": {"num_bytes": 30187809, "checksum": "a0918223c5523da20bd8230de1985b0a3cbb1e239af3d62a83d720a3a528c567"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00494-of-00512.json.gz": {"num_bytes": 30149878, "checksum": "6e9a5e329f834e41b4a8a9a6809df3243e5bffc580327912288ad7f790b43ab7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00495-of-00512.json.gz": {"num_bytes": 29711944, "checksum": "3b9ba9d667e1241692ff9a654a68e98e8e94e32244a9419b2542137b63fb4705"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00496-of-00512.json.gz": {"num_bytes": 30114815, "checksum": "24b78cc36bb0abc67c998320e7029b6e7bbbee267a367eb538f23956c13f27a9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00497-of-00512.json.gz": {"num_bytes": 30048480, "checksum": "29c3606acf298498fc3498bd769544e2879afbd0d5c46cee298cb25058694aac"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00498-of-00512.json.gz": {"num_bytes": 29934973, "checksum": "8afaffea92dfad745be8aa8cd3de0ee97cbcc26fbad6c71d56683aef6a27055f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00499-of-00512.json.gz": {"num_bytes": 29796509, "checksum": "9cbbd8f6d8fe92207c4cb2f0422284726deca1bde7f30cb01cce7fcd4665b380"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00500-of-00512.json.gz": {"num_bytes": 30221736, "checksum": "902904aa9fadaecbe698402a27b4e68b00813e67b79f84d4c696cd9c72f08f55"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00501-of-00512.json.gz": {"num_bytes": 30108320, "checksum": "76e848f8dbc082158fc5d3a2f7c10cd6e03585667c00efc639f2c6f47d44aeb2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00502-of-00512.json.gz": {"num_bytes": 30381907, "checksum": "885bbc9788235abf33728737f72f267e60d1f5d4a77493cae76f161651d89579"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00503-of-00512.json.gz": {"num_bytes": 29983805, "checksum": "5134934392b13e3f84dd32dcb1c59f4d5416d6dfd925bf896f3eb61881d82136"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00504-of-00512.json.gz": {"num_bytes": 30041413, "checksum": "4978245a7f545d676bad6edfdfe60ffdad94de47af0fb10649fa39e9b068939e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00505-of-00512.json.gz": {"num_bytes": 30021620, "checksum": "64933c28ea3f608326f1c6ef56170886767f1ab4f9ecbc4bf3263c7043901fce"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00506-of-00512.json.gz": {"num_bytes": 30260343, "checksum": "84667dbe68ecf1f9bbdaba0e73eca6fe0444f6594a1e9a4b46e9812ae7bce7d0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00507-of-00512.json.gz": {"num_bytes": 30173739, "checksum": "dd6d44e4f344f3ab1cd61bacced7b5f1429cf6823fc9282452a539012bda028a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00508-of-00512.json.gz": {"num_bytes": 29903443, "checksum": "4afc46096ac2697867c3a75896c5ceb36617c4c21a749dded58a1ea4565e41df"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00509-of-00512.json.gz": {"num_bytes": 29862664, "checksum": "74a720dc16b389e8122d61aa94bc12a5bc4253ca6f39679781c938e2eb556878"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00510-of-00512.json.gz": {"num_bytes": 29744368, "checksum": "6a302049e7a1668c5fb2e4b5afca518fa53ba1a9dc717015ecb5768e85ec4139"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00511-of-00512.json.gz": {"num_bytes": 29896714, "checksum": "48b89e909c0e33fd59c9623f8517cdfa90fa35a4641f999c6f68e1cc9f2a309f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-validation.00000-of-00001.json.gz": {"num_bytes": 15284943, "checksum": "42ac859dc1c4d48d165ec602909403e2066ce1d4854149ed70b9ec9cc96dc65f"}}, "download_size": 15435025687, "post_processing_size": null, "dataset_size": 76369191765, "size_in_bytes": 91804217452}} \ No newline at end of file From 44a64877e5345f1c46e5b43b4a3ad258abd306cc Mon Sep 17 00:00:00 2001 From: Quentin Lhoest Date: Thu, 1 Jul 2021 15:02:29 +0200 Subject: [PATCH 10/19] typo --- datasets/c4/README.md | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/datasets/c4/README.md b/datasets/c4/README.md index e389e86c5f6..1963d694a46 100644 --- a/datasets/c4/README.md +++ b/datasets/c4/README.md @@ -16,7 +16,7 @@ size_categories: en.noblocklist: - 100M Date: Thu, 1 Jul 2021 15:05:03 +0200 Subject: [PATCH 11/19] config sizes --- datasets/c4/README.md | 6 +++--- 1 file changed, 3 insertions(+), 3 deletions(-) diff --git a/datasets/c4/README.md b/datasets/c4/README.md index 1963d694a46..226d943e0ff 100644 --- a/datasets/c4/README.md +++ b/datasets/c4/README.md @@ -117,10 +117,10 @@ The data have several fields: | name | train |validation| |----------------|--------:|---------:| -| en |364868892| ?| -| en.noclocklist |393391519| ?| +| en |364868892| 364608| +| en.noclocklist |393391519| 393226| | en.noclean | ?| ?| -| realnewslike | 13799838| ?| +| realnewslike | 13799838| 13863| ## Dataset Creation From 97ee3cd9fa3edf6a700647d6ef516acaff73df4c Mon Sep 17 00:00:00 2001 From: Quentin Lhoest Date: Thu, 1 Jul 2021 15:11:31 +0200 Subject: [PATCH 12/19] minor changes to c4 readme --- datasets/c4/README.md | 8 +++----- 1 file changed, 3 insertions(+), 5 deletions(-) diff --git a/datasets/c4/README.md b/datasets/c4/README.md index 226d943e0ff..8b7255cfa09 100644 --- a/datasets/c4/README.md +++ b/datasets/c4/README.md @@ -32,7 +32,7 @@ paperswithcode_id: c4 ## Table of Contents -- [Dataset Card for [Dataset Name]](#dataset-card-for-dataset-name) +- [Dataset Card for C4](#dataset-card-for-c4) - [Table of Contents](#table-of-contents) - [Dataset Description](#dataset-description) - [Dataset Summary](#dataset-summary) @@ -70,7 +70,7 @@ paperswithcode_id: c4 A colossal, cleaned version of Common Crawl's web crawl corpus. Based on Common Crawl dataset: "https://commoncrawl.org". -This is the version prepared by allenai, hosted at this page: https://huggingface.co/datasets/allenai/c4 +This is the version prepared by AllenAI, hosted at this address: https://huggingface.co/datasets/allenai/c4 It comes in three variants: @@ -79,9 +79,7 @@ It comes in three variants: - `en.noclean`: 2.3TB in JSON format - `realnewslike`: 15GB in JSON format -The en.noblocklist variant is exactly the same as the en variant, except we turned off the so-called "badwords filter", which removes all documents that contain words from the lists at https://github.com/LDNOOBW/List-of-Dirty-Naughty-Obscene-and-Otherwise-Bad-Words. - -The en.noblocklist variant is exactly the same as the en variant, except we turned off the so-called "badwords filter", which removes all documents that contain words from the lists at https://github.com/LDNOOBW/List-of-Dirty-Naughty-Obscene-and-Otherwise-Bad-Words. +The `en.noblocklist` variant is exactly the same as the `en` variant, except we turned off the so-called "badwords filter", which removes all documents that contain words from the lists at https://github.com/LDNOOBW/List-of-Dirty-Naughty-Obscene-and-Otherwise-Bad-Words. ### Supported Tasks and Leaderboards From 7fe3869dc33ce7a4ef355f860fc7d5517cfa53ed Mon Sep 17 00:00:00 2001 From: Quentin Lhoest Date: Thu, 1 Jul 2021 15:51:26 +0200 Subject: [PATCH 13/19] typo --- datasets/c4/README.md | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/datasets/c4/README.md b/datasets/c4/README.md index 8b7255cfa09..35621129014 100644 --- a/datasets/c4/README.md +++ b/datasets/c4/README.md @@ -72,7 +72,7 @@ A colossal, cleaned version of Common Crawl's web crawl corpus. Based on Common This is the version prepared by AllenAI, hosted at this address: https://huggingface.co/datasets/allenai/c4 -It comes in three variants: +It comes in four variants: - `en`: 305GB in JSON format - `en.noblocklist`: 380GB in JSON format From 5310653c25834415f52ec0a24c419b232ee0e9d8 Mon Sep 17 00:00:00 2001 From: Quentin Lhoest Date: Thu, 1 Jul 2021 17:05:33 +0200 Subject: [PATCH 14/19] pin data revision --- datasets/c4/c4.py | 2 +- datasets/c4/dataset_infos.json | 2 +- 2 files changed, 2 insertions(+), 2 deletions(-) diff --git a/datasets/c4/c4.py b/datasets/c4/c4.py index 01838eb53e8..b60abe87f13 100644 --- a/datasets/c4/c4.py +++ b/datasets/c4/c4.py @@ -41,7 +41,7 @@ } _DATA_URL = ( - "https://huggingface.co/datasets/allenai/c4/resolve/main/{name}/c4-{split}.{index:05d}-of-{n_shards:05d}.json.gz" + "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/{name}/c4-{split}.{index:05d}-of-{n_shards:05d}.json.gz" ) diff --git a/datasets/c4/dataset_infos.json b/datasets/c4/dataset_infos.json index 60e8bdac218..5cc0f19ac89 100644 --- a/datasets/c4/dataset_infos.json +++ b/datasets/c4/dataset_infos.json @@ -1 +1 @@ -{"en": {"description": "A colossal, cleaned version of Common Crawl's web crawl corpus.\n\nBased on Common Crawl dataset: \"https://commoncrawl.org\".\n\nThis is the processed version of Google's C4 dataset by AllenAI.\n\n", "citation": "\n@article{2019t5,\n author = {Colin Raffel and Noam Shazeer and Adam Roberts and Katherine Lee and Sharan Narang and Michael Matena and Yanqi Zhou and Wei Li and Peter J. Liu},\n title = {Exploring the Limits of Transfer Learning with a Unified Text-to-Text Transformer},\n journal = {arXiv e-prints},\n year = {2019},\n archivePrefix = {arXiv},\n eprint = {1910.10683},\n}\n", "homepage": "https://github.com/allenai/allennlp/discussions/5056", "license": "", "features": {"text": {"dtype": "string", "id": null, "_type": "Value"}, "timestamp": {"dtype": "string", "id": null, "_type": "Value"}, "url": {"dtype": "string", "id": null, "_type": "Value"}}, "post_processed": null, "supervised_keys": null, "task_templates": null, "builder_name": "c4", "config_name": "en", "version": {"version_str": "0.0.0", "description": null, "major": 0, "minor": 0, "patch": 0}, "splits": {"train": {"name": "train", "num_bytes": 828589180707, "num_examples": 364868892, "dataset_name": "c4"}, "validation": {"name": "validation", "num_bytes": 825767266, "num_examples": 364608, "dataset_name": "c4"}}, "download_checksums": {"https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00000-of-01024.json.gz": {"num_bytes": 319308785, "checksum": "8ef8d75b0e045dec4aa5123a671b4564466b0707086a7ed1ba8721626dfffbc9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00001-of-01024.json.gz": {"num_bytes": 318039285, "checksum": "b945059cd1a343cabe311881b7840a6f0363f570e745a0eff0e687e266f6b55d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00002-of-01024.json.gz": {"num_bytes": 319748667, "checksum": "2967dc7e587ced6ecb9ba617ad2d4c44901467969de5bf5b0f5a9e5b70555d75"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00003-of-01024.json.gz": {"num_bytes": 318564193, "checksum": "b79d9abef5741578929be0d59db9ca652a8276207ef18a944b7a5f11fef5beb6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00004-of-01024.json.gz": {"num_bytes": 318579884, "checksum": "cd9f98eac2bc6062f55d9a36bd744cc924a78ea2fd998830e0034e4456f5d014"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00005-of-01024.json.gz": {"num_bytes": 318003681, "checksum": "8ac5907a54dbc7ab9c14624448c7c3f6afed33af9d0a855f1eae955e62e255b9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00006-of-01024.json.gz": {"num_bytes": 318495137, "checksum": "8fd9b9a4b74c9414466b245ebda7db041e7bd8603971de51b5db782bd758aac7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00007-of-01024.json.gz": {"num_bytes": 318417273, "checksum": "41dd377a1ba6b72eab0260c39c626fe45ab6b649d42d57b311d3ba21a0337cd0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00008-of-01024.json.gz": {"num_bytes": 318131845, "checksum": "64da652c235f089a0b52f6db5883ef5f1e9c31edc4c950332b34dd12439c99a5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00009-of-01024.json.gz": {"num_bytes": 318185592, "checksum": "807a548efbb10153c9eff0df5733a97a1b51ab1743242530de1b02a8ea17ace7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00010-of-01024.json.gz": {"num_bytes": 319045292, "checksum": "3bd0f6f664069c3bd964ce48ceae60ba47b55b54745a4b00c207bdb3a1926b17"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00011-of-01024.json.gz": {"num_bytes": 319686980, "checksum": "5baa0c010083459ba58e34b4e93bb758caa878f7db6fba0528921329fa1a6cc5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00012-of-01024.json.gz": {"num_bytes": 320119088, "checksum": "fdee7442c06856e2c4b7665cc51978e9011b5e0a2112c30dd15bc9e53818842d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00013-of-01024.json.gz": {"num_bytes": 319474856, "checksum": "a4ab3b24087781c3577945492525696e182ffd7ca5265b958f49803a02867ecf"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00014-of-01024.json.gz": {"num_bytes": 319693210, "checksum": "62215b2451e71b117018ef73570c944aff890624b384c538950b64c37f184c49"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00015-of-01024.json.gz": {"num_bytes": 318427305, "checksum": "9893c9f413a1223e7b535527829bcd6df3219929fb1abf8f2a114dd8f6ea0919"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00016-of-01024.json.gz": {"num_bytes": 318785714, "checksum": "bd0ade8b8a57348952ca31c39efdab538f54c852941a225ccd13d0a7170724e3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00017-of-01024.json.gz": {"num_bytes": 320134331, "checksum": "4132cfff3f5126d9e783191a5ccc34e5d85938bebf0b8489657805277a227202"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00018-of-01024.json.gz": {"num_bytes": 318653930, "checksum": "4675ab1d77da3d676d9743dca15bfce8478498f7738f79816a25ed790d28fa46"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00019-of-01024.json.gz": {"num_bytes": 319468974, "checksum": "1d2f3a6aeb0f6c159295f283d302794cd3eb944cff3fe68691997bb2dc4c7780"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00020-of-01024.json.gz": {"num_bytes": 319109754, "checksum": "b5f26d832a0ec9b0489a27169d94496f5ea33c7fb046868c565c7b5a2407221b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00021-of-01024.json.gz": {"num_bytes": 318514423, "checksum": "428da5a8d4585de16f6b3f30865a5ca7a8d1ddcd3b6002dcc1283368b0c3d60a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00022-of-01024.json.gz": {"num_bytes": 318715623, "checksum": "9bc4812ba5e08c0b2d83cd3804129ba3d77cf84ba3d8828159788ee02e155a51"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00023-of-01024.json.gz": {"num_bytes": 319874293, "checksum": "38843ab4f5c60ed2b9ec0cdc65074eaca454014d5702edd809a266190689d2c3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00024-of-01024.json.gz": {"num_bytes": 318105764, "checksum": "4fa0c7ec94445ea57dcecda7864b1346275e711c9820c2c39dbb9fdb95c97674"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00025-of-01024.json.gz": {"num_bytes": 319122521, "checksum": "0758514fa2e2c133c995c00d5f4abfc14b66582a4eedd0e721bdd95c4632a755"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00026-of-01024.json.gz": {"num_bytes": 318116783, "checksum": "56a73b9a556d6794d9c706e1b1c7e729fa13b711ddc25dd403b110eb5ed857f1"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00027-of-01024.json.gz": {"num_bytes": 320171191, "checksum": "fea1eabb734cda33d72f3d959234a240080b4fd42cc70494814a8429b087f9e1"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00028-of-01024.json.gz": {"num_bytes": 319047090, "checksum": "47d1c385952d6c18c431a7294339a030c213b8832f970ac987965b621c8181a1"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00029-of-01024.json.gz": {"num_bytes": 318705639, "checksum": "3c744d3dd915ceef3a93fd18c3ff5b117fb5118d1ced2089979b6cafc81c4525"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00030-of-01024.json.gz": {"num_bytes": 318327902, "checksum": "7f6959020242fdc841adfc10c102bbe79e2ef8502a09dac8451e0cec6f2add16"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00031-of-01024.json.gz": {"num_bytes": 318990600, "checksum": "e56f29011594c765192c34298558e7227a829313196748f9a16ec34ecdb76d23"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00032-of-01024.json.gz": {"num_bytes": 320451482, "checksum": "9ea843dfd85e449439f3106d657762daff8f326730fefb342455c43cb48144e3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00033-of-01024.json.gz": {"num_bytes": 319878207, "checksum": "2633cdb7b058f126173608897f69add614659b0b21cf54ecc8a2f4a79bc16073"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00034-of-01024.json.gz": {"num_bytes": 318701510, "checksum": "853c4b9ff2d79621ed27a6be826dae198af609d9f9dbd1c2773b778241cf6137"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00035-of-01024.json.gz": {"num_bytes": 318529104, "checksum": "fb50dac3f35cb71472464f511e6b8aee72ded10b3b6896d0d1f74a18ded2b8d3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00036-of-01024.json.gz": {"num_bytes": 318849657, "checksum": "5cef5cfd50cfafd58feb452b85324a3d8198fca48789f0ce69227755e72d8e53"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00037-of-01024.json.gz": {"num_bytes": 319621215, "checksum": "f0b67abf30e2d58d291aa9bcc9c8a03668afe819549802e4e591a261c171d970"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00038-of-01024.json.gz": {"num_bytes": 318135467, "checksum": "991bad578a83294d34a1b11649af07339aa8cb26d49330afa9fcbca0b87942c6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00039-of-01024.json.gz": {"num_bytes": 320131759, "checksum": "abbbc21f81555e94484e6afe1975e13f67af19a820cd6f8d090c987a250bd4fd"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00040-of-01024.json.gz": {"num_bytes": 320214476, "checksum": "48020d2656709899abd2572b3424c0455df3c1089a69fe26b776aeb24f0da0ec"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00041-of-01024.json.gz": {"num_bytes": 319581259, "checksum": "db6fb8db7162ac87ea002c153ef0c54322f24c8f7ec263cfa290ac8c3683b194"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00042-of-01024.json.gz": {"num_bytes": 318100985, "checksum": "d499cba2383b16bb0f26b98416211eabf2599641ecd6708a5ef487692ca9e791"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00043-of-01024.json.gz": {"num_bytes": 317803029, "checksum": "dc6f1ccc3fcce79b16c5157f7125942e351d74744efc593f8372f8a408720340"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00044-of-01024.json.gz": {"num_bytes": 318837063, "checksum": "6170fced793461bd687640a658a085d02f971c2e609f6ff33b90df944fb56409"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00045-of-01024.json.gz": {"num_bytes": 319659188, "checksum": "b2f79e8600815578ec326cfc6c5242c2827cedbfac51772fdcf15ef5d027aa38"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00046-of-01024.json.gz": {"num_bytes": 318771753, "checksum": "e4b4a3e53ee66c280a5e7ee33602ea0e910903748db8c2adbbec4b48bab1580e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00047-of-01024.json.gz": {"num_bytes": 318088661, "checksum": "bf8597fc359d8e9c721fd1d98b8ff3db5c011afd0fec9640670f31c7a7dddb79"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00048-of-01024.json.gz": {"num_bytes": 317777133, "checksum": "369db8e9646b8229a23044a7257c2face97b8e05738f0413b581892876f268e1"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00049-of-01024.json.gz": {"num_bytes": 319329891, "checksum": "5cb2aa0432984b355b0ec6aad92f926b2fb75aea2a0e08b97f4c6a62838e6cc8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00050-of-01024.json.gz": {"num_bytes": 318172322, "checksum": "11a7cc48539ac97eaec87beacef9d9bbb71fc875a0bff0c9ff096044bff46a44"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00051-of-01024.json.gz": {"num_bytes": 318704544, "checksum": "ac2beee992c2b1ae8b1f162054e843e2b971bbd7cec45a0a7a7b7795fcdc7c26"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00052-of-01024.json.gz": {"num_bytes": 320806303, "checksum": "3a591fe9993c3d98a9e7949e98ca215ce164cd313fe53f3ce762c91b5fec7c53"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00053-of-01024.json.gz": {"num_bytes": 320565764, "checksum": "60e67c8e6f3bfdf8b490ecfe62c79a13c5d04d393fbac712a6cda49fd78e883b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00054-of-01024.json.gz": {"num_bytes": 320425170, "checksum": "d69305c853e9e516f5fd4e2a9afb1939d829925f71102d8aa09387ded5d000df"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00055-of-01024.json.gz": {"num_bytes": 318713224, "checksum": "e01737df8097a1526d6c31d37d7aeb1b92c0a7253b39f6964fcc897bf0eba9fd"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00056-of-01024.json.gz": {"num_bytes": 319441227, "checksum": "fe516c8c0a9e59f9f035ac5fdd13e973d25dd6635eee05d648740d3e8c1fc742"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00057-of-01024.json.gz": {"num_bytes": 319821142, "checksum": "7e058ed9072e968e9c8b92f9b50dab318515873cca6c617b544dacab5a2f018e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00058-of-01024.json.gz": {"num_bytes": 318643105, "checksum": "3479dc5a5b111b7f45f87e5a91c433907af97dbe15b9db1637bad666dcbdec40"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00059-of-01024.json.gz": {"num_bytes": 318053548, "checksum": "8208b0943f59b5914fa13d29108ede31a8d8d34bc6d603a2278ab8b80d28b1d0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00060-of-01024.json.gz": {"num_bytes": 317935826, "checksum": "71324b62706aabd6faee682205cdedcd10dad289579b534d0e53f8d9b92bf2c0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00061-of-01024.json.gz": {"num_bytes": 318870698, "checksum": "cdf0abc5804f0991871de48b249e30b666cb96f2254762a570c39904c5780f8e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00062-of-01024.json.gz": {"num_bytes": 318945246, "checksum": "5ac676e16108446bd2980f9601c787eb754811a68e92ab6403c333820a6b9622"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00063-of-01024.json.gz": {"num_bytes": 318827790, "checksum": "a26f7cfe123cfdf3db7687996d0163212e70ff7635872b0754c03cbd5c31213a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00064-of-01024.json.gz": {"num_bytes": 318914155, "checksum": "858a145617a5902ab02bc77e47ee2f036a6211384c4f2285767c7558eb93e245"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00065-of-01024.json.gz": {"num_bytes": 319794084, "checksum": "52742215df5aaca43bed5405a397571efe7c22107ee2caa8c05e3ed229796efa"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00066-of-01024.json.gz": {"num_bytes": 320294453, "checksum": "5b11cd54de0e95a75e53e4e32f72912cb01053d3fb609de6b7a45afafab414d0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00067-of-01024.json.gz": {"num_bytes": 319468309, "checksum": "4c6c69b3eba9bcd6786d7dce893340f2d7093012ead04f3539352beccd2794ef"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00068-of-01024.json.gz": {"num_bytes": 318800742, "checksum": "ce94afc3c612e9de423a412147505ad7757216100becba2677bf5eaf443c4b6f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00069-of-01024.json.gz": {"num_bytes": 319416585, "checksum": "ff3084a3e5a3960425a5c605274684c42fa638f99045527f77e74d165e52b6ea"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00070-of-01024.json.gz": {"num_bytes": 319165846, "checksum": "04c368b05f0ea42b3a51ed9bc0e817894f205c0ecd74084da015158d509ff2a3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00071-of-01024.json.gz": {"num_bytes": 318017381, "checksum": "e8320e9982fa377b07c5b3e8a4451ac143b05ab7a4a03f748034b37fb998bfb0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00072-of-01024.json.gz": {"num_bytes": 318874499, "checksum": "920f8d5ef2cae6bdbd52f724d0952e04146ff29f4aaec4dbf10bef7b66a98f40"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00073-of-01024.json.gz": {"num_bytes": 317890112, "checksum": "06a41bdb7bf0d52e2fe8e71f594de8d36d77880639ffdfb41e883237f76e8a0f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00074-of-01024.json.gz": {"num_bytes": 319201956, "checksum": "e0267d6782d30f1619a82c49c20be1c8b5424e653c093e4652a5c8ed117c6533"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00075-of-01024.json.gz": {"num_bytes": 320575937, "checksum": "42108758abc3c3197e7dca8293eed3800f3e79ceae80d3208d90c7a9fd205594"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00076-of-01024.json.gz": {"num_bytes": 320070510, "checksum": "c904b6e6041e23edeb1d88b7b69f07a339b7ff9835d0c22e0b6c354519369842"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00077-of-01024.json.gz": {"num_bytes": 319042024, "checksum": "1eb2b70ad4d12b7587eeb1ce86477817ad992c08fecafe5ccafc26af6b5657f7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00078-of-01024.json.gz": {"num_bytes": 319997520, "checksum": "070370654960e02f766c10321546b280e9933531b796c252a94999d645f360b2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00079-of-01024.json.gz": {"num_bytes": 320736487, "checksum": "3aa4f007660706563030b590cef9be992c18ba7ec1876210bc92665ec42c4be2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00080-of-01024.json.gz": {"num_bytes": 320082337, "checksum": "3b54eaf407bb593c2b16df99690446f26497530d21cf433a7d525e0eaebe9c3f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00081-of-01024.json.gz": {"num_bytes": 318008114, "checksum": "d01975cdbd4360331b1a0f55e9b7e731d7d9fc70c7cdd0f33f1c772eff7aa03b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00082-of-01024.json.gz": {"num_bytes": 317829809, "checksum": "2a65dd37027fae03819ea5a5f6c3b16d921706ad758442881dc1d15b08bc5048"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00083-of-01024.json.gz": {"num_bytes": 319265318, "checksum": "e14cf18c687f7eb304df6abef7235e263a5736c799d742524205dead2abfb043"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00084-of-01024.json.gz": {"num_bytes": 319166958, "checksum": "1dc3fa8702a4477e3a3128440b68d4cc17e6d2ce7f3c53da28d50a57b8332020"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00085-of-01024.json.gz": {"num_bytes": 320338078, "checksum": "0222db7b1ae14c9b10aacdb05d055d1432b6d035e3937df5640facd242c52aea"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00086-of-01024.json.gz": {"num_bytes": 318941314, "checksum": "55ddf7a27dc91bf8d932a5efec4aa458122ee337f2cb050e2c4b0ae8e770f3a9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00087-of-01024.json.gz": {"num_bytes": 319218368, "checksum": "c61552d76bedbfa750c599a674d6732fb224c8a1e6c6583fca7ccabb20532920"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00088-of-01024.json.gz": {"num_bytes": 318974308, "checksum": "693fae3d50068ec39ad27a14335372c3e1530138cc65931edac5268dd62b7e96"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00089-of-01024.json.gz": {"num_bytes": 318781044, "checksum": "2d90b9318432a2313dfaec542c8b91431505035cca7416a63e3197ab26ad6e75"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00090-of-01024.json.gz": {"num_bytes": 318569651, "checksum": "ee674beda8ed39395e69c899f666990c5190dfad5494867e51fa727e4d38d86a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00091-of-01024.json.gz": {"num_bytes": 319683433, "checksum": "add2489350310ce500dde6637518c747c156f95f079a34367842bf875a8fdf5b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00092-of-01024.json.gz": {"num_bytes": 318734793, "checksum": "5cfd4f25e9effaa2f7381bfcf49f9263e10619811aeaa32a77d3fdfc13517006"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00093-of-01024.json.gz": {"num_bytes": 319161014, "checksum": "bed8774909bba5ac656ebaad6e5cacca9e5ea12c80a41fd5689e6798c74f3c89"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00094-of-01024.json.gz": {"num_bytes": 320143246, "checksum": "96abe370925f6962b4e75da530b5234eec21fab820d6cb02ae59b6070ab63859"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00095-of-01024.json.gz": {"num_bytes": 319707377, "checksum": "37b68cd632e8f86f364fd61c9581f48ad7602122b7f33c55103ac5bd727f015d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00096-of-01024.json.gz": {"num_bytes": 320159279, "checksum": "fb93c7467f0361c1d4b186d5e25f4bce4f237adb33b4e0ef56f57831b4f97f81"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00097-of-01024.json.gz": {"num_bytes": 319841818, "checksum": "7f4d4a9536e37a0c2b9a1806fcb472784ff4d3840aa57e9603e74233b877fbac"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00098-of-01024.json.gz": {"num_bytes": 321001731, "checksum": "239b9fefebe3815c8d785bd48086013d1a6dcd76c142786502c674d2d874fb11"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00099-of-01024.json.gz": {"num_bytes": 319475885, "checksum": "0a610d25a547839b8b6dfc2fd964e3ca64b23f0edc52d311c89dcb5e8a44a2c5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00100-of-01024.json.gz": {"num_bytes": 319515329, "checksum": "f24d17cbd27296a15f51b9edc713c74a6997bbe82267403fdb6282404c2f4e6d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00101-of-01024.json.gz": {"num_bytes": 318803422, "checksum": "54b8b0c72ffa325abce3dd15bdcd0856b5594500c37f4bc6a6327721ba91e4bc"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00102-of-01024.json.gz": {"num_bytes": 320934688, "checksum": "24b99b4afa3b631a718a487d679026c91e2c936132df01df969e3173b49e091f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00103-of-01024.json.gz": {"num_bytes": 319835920, "checksum": "a2c68654ba81fa55bc24beb4319c8905f7b532fcb6793a6a311344d4f98a82b9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00104-of-01024.json.gz": {"num_bytes": 319402378, "checksum": "27764d82793e35b8a7be3a3fb0470d018243a89283b5501c0b76056de1879389"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00105-of-01024.json.gz": {"num_bytes": 320100928, "checksum": "3bb2499337ebe52b63a5f20ec6ca6283971937962439699bd5e483cf80fed02a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00106-of-01024.json.gz": {"num_bytes": 318707110, "checksum": "83510312aa188431a8dda8746903d70cfc7ffdf5437e44c1f74b7670b78bd52b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00107-of-01024.json.gz": {"num_bytes": 319904239, "checksum": "40d42c39dea8e4898efba1886aa3be67742501f7a51d5bc635b03a2c6c2bd63e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00108-of-01024.json.gz": {"num_bytes": 320050265, "checksum": "88ce3ddae88e8024e76614a1b701c157f66fe39c6f0852a4869c5063876f6e87"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00109-of-01024.json.gz": {"num_bytes": 318053254, "checksum": "865a124b663037f36a5738f25c82f8bea2ab54d4bbf8255ca0d1d00d76f8b250"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00110-of-01024.json.gz": {"num_bytes": 319794699, "checksum": "b17e210c8ceef98219ee12eba5dddd2001ded0d417c93955743c238360d96e76"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00111-of-01024.json.gz": {"num_bytes": 318761540, "checksum": "05be318a057bb33bf9d7faca58569cdb0880fe8eeb0fc3f57f5999d5f2af55fd"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00112-of-01024.json.gz": {"num_bytes": 319121509, "checksum": "858dce8e43b06a0c1e26ab3e4f109814b6cc50c6b0e4d146ec79fda001ad471d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00113-of-01024.json.gz": {"num_bytes": 317916736, "checksum": "2e3968e48cb15a3326457d5a6ad49838d20d38c8138c529eee51f94e6bf269e4"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00114-of-01024.json.gz": {"num_bytes": 319319540, "checksum": "b72dc8207d93848f4fcb265b3e618d0eb8649445f7b9187c5165f4adec3e0708"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00115-of-01024.json.gz": {"num_bytes": 318863372, "checksum": "85ef0bf3cb12bc2fede4158853ed2259dff5d25adf99b43e8c35d7e0b9d4fdd3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00116-of-01024.json.gz": {"num_bytes": 318898370, "checksum": "a0c82c8b48e086be7396338cdda0fed52e8c4753f04fd086b9472c1bedfb150c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00117-of-01024.json.gz": {"num_bytes": 318153138, "checksum": "531d5d03fd8099806d92fbff2a48a0d68dcf46325e732e698e9c142902d152f5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00118-of-01024.json.gz": {"num_bytes": 318966511, "checksum": "24b1c5ebbd07d50043be0d5d5c5427e042bdc53280825260226a2823e9b7546b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00119-of-01024.json.gz": {"num_bytes": 318733748, "checksum": "ce1fb1192b770e625430798aee94c93bd748ed474ff815a7f95cadebb826161a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00120-of-01024.json.gz": {"num_bytes": 319672996, "checksum": "4c2a6874921ac4a626a9c8ac4c6e91dae58f1f5b52e79124b3abf254b7433119"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00121-of-01024.json.gz": {"num_bytes": 318779046, "checksum": "029d3ab92f3e1724e3708790148e63b4c211d2ddfd04e3d194b24145e97c922a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00122-of-01024.json.gz": {"num_bytes": 320861175, "checksum": "4bb595140e5cf92147f99b58d236634ddfafbc0b160b4c88b337255482611ced"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00123-of-01024.json.gz": {"num_bytes": 318338141, "checksum": "d508261be287fa3d27e5f44524e22870269054213b61011ee8a6728a77910cc0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00124-of-01024.json.gz": {"num_bytes": 317655056, "checksum": "7612cb9fdd9f4b3a4f8958087ace120d4a73cf26bd16289bb20fc871f5744f2c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00125-of-01024.json.gz": {"num_bytes": 317524610, "checksum": "049ebe4971811bb1fdcfd10cc264b2074b3ace18536340644e718dcc3cf3affb"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00126-of-01024.json.gz": {"num_bytes": 317902192, "checksum": "d97bddf003b8f647c587fe9a9a9aed75ea604478e0b550d501ad7f07b6061b86"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00127-of-01024.json.gz": {"num_bytes": 319243191, "checksum": "6da4c882f88816a452af54ed217f84d6e4601c11a8e33bd47c49c0a1ea04f49a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00128-of-01024.json.gz": {"num_bytes": 318045852, "checksum": "ea43f63e6ef3bb5723ce75bb51f7183a525d8ccb00c93f49aaf2d9b560f7bdbb"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00129-of-01024.json.gz": {"num_bytes": 318436174, "checksum": "72ceb525367d6e8d1c0fca94d99d4fe5353ead08a5d52bf00e30e3b596fa90a2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00130-of-01024.json.gz": {"num_bytes": 319017217, "checksum": "92f1b2687bee78441eeb4e05bbec2a491469b23c3aad0d951fbbe35a3c27998a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00131-of-01024.json.gz": {"num_bytes": 319237739, "checksum": "0fd07585a82b7d71ddabbc315195c84e2fa78a8319de7dea971cfcc9b38707b7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00132-of-01024.json.gz": {"num_bytes": 318123742, "checksum": "c9f5604ca28ea2a9ae5267db50f6e3d1e576841abe840134b3817f370c057073"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00133-of-01024.json.gz": {"num_bytes": 319009751, "checksum": "7ec982de577e0eeff57dc60346ce35a7b35b3c4f037987316cfc071b0ed58a87"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00134-of-01024.json.gz": {"num_bytes": 319750057, "checksum": "2619d265d76d82f6b84e2686371e5b6d6c08058cbd5765dd2906af9f549af092"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00135-of-01024.json.gz": {"num_bytes": 319068231, "checksum": "5e1bf5b09f2cd132a7747116442d6f26ce0002eaeb9f56fb02bc00e3abee8716"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00136-of-01024.json.gz": {"num_bytes": 317800994, "checksum": "80ebbf64fbd91215da553e3a8d9442380cee6c3b09fbbf8353a0817993d15862"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00137-of-01024.json.gz": {"num_bytes": 318954070, "checksum": "3b5d2ccafe526a19c52ac0fee50109b6a95ac3c8f7f2272a9a0302c4219e82f7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00138-of-01024.json.gz": {"num_bytes": 318452853, "checksum": "2dd88569a62003383a3bf70d68143f16f234535469bdc8ab01a8764f6babb5fb"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00139-of-01024.json.gz": {"num_bytes": 320013821, "checksum": "f32ca62f6a9d2c8a72901e6f2c08880c2d1907f52beb4e8fdc30f4c02c7ad10b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00140-of-01024.json.gz": {"num_bytes": 319510423, "checksum": "7799838d8019d7cd71a505951f155bdfb862b4a3b3b77e182c706a624617169d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00141-of-01024.json.gz": {"num_bytes": 318339814, "checksum": "1601f6dbcbf4e7f1db119b232e862f3c9fe29e9abe5827177458079299ed511e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00142-of-01024.json.gz": {"num_bytes": 318438444, "checksum": "71d891be156e1b608733a3abe8f8dab7a6213c02931117b99889bc3fe8329d38"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00143-of-01024.json.gz": {"num_bytes": 319413540, "checksum": "88fb2e7c3d426a6bb5775041658c07005a469306af0d97df7d68f148b64cbfe8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00144-of-01024.json.gz": {"num_bytes": 319901095, "checksum": "2734ff57f4265653b0b1f292f513017ba791c3091cf8ac0bbf6d75d0074e3386"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00145-of-01024.json.gz": {"num_bytes": 318500183, "checksum": "da2e6747f7230af5941c6bee262a606b4f7792da359dbf7516d82d8301cdf90f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00146-of-01024.json.gz": {"num_bytes": 319315120, "checksum": "6daac97153d51addc8b1e43b686e3d641666df3a106270a141d734079db2ad35"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00147-of-01024.json.gz": {"num_bytes": 320621434, "checksum": "fb2584e0ce366ad30c8110591484b84798e9f06e8a27cd864e7800b8d5e2d225"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00148-of-01024.json.gz": {"num_bytes": 318269045, "checksum": "1c963c0ceb6cd776822352b186ae7e3d829ef334efcba0fbdd9182dde4deed05"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00149-of-01024.json.gz": {"num_bytes": 318576426, "checksum": "6a21397e0104c7fe0fcd9f1d43a8e546000596d896a95eb9b6c4ab92235e6a49"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00150-of-01024.json.gz": {"num_bytes": 318447048, "checksum": "075b113a73e6e21d7cac49391ee559ee8aaa2bb3338f709017077a4007a7bbb5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00151-of-01024.json.gz": {"num_bytes": 315388730, "checksum": "bd47e3ac0209676d8a32490eb20ca8c07ca3c45c2beb88dae18b5c8d925f349a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00152-of-01024.json.gz": {"num_bytes": 319701880, "checksum": "241d9cf003f49d95168ebdeccd8209230507d4dfd0d170fa1b57d2355240a95d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00153-of-01024.json.gz": {"num_bytes": 318370254, "checksum": "3aa86900a749224dfed8a67960c166e43c3b9ef3ac7b49d28129b496c7193e30"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00154-of-01024.json.gz": {"num_bytes": 320064875, "checksum": "3160c723cea6717fa9f5a9eb627d76107040d084a64106973099fa0e8de48758"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00155-of-01024.json.gz": {"num_bytes": 318089754, "checksum": "5b6e76a85bb1093eaba698864a54a938329b04494f9f72c3c3bbb155174da5e4"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00156-of-01024.json.gz": {"num_bytes": 320049467, "checksum": "cc013e8aa7c1cf7fc28ebecc64d893d03b092a09d725b5e626851de0b311c814"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00157-of-01024.json.gz": {"num_bytes": 319931950, "checksum": "2a27b4c29455bcd813a84aa3a54100d16cb6bfed25171aa3c552ea452ae569e2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00158-of-01024.json.gz": {"num_bytes": 319963615, "checksum": "e477f769ea1513cf607932a29d793fdf1722cdea757e00c814dad594329cfac7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00159-of-01024.json.gz": {"num_bytes": 319000491, "checksum": "ff5d09415753c2aa4b51196e8f4bd6c77ba100ab281314aede118f501565cea2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00160-of-01024.json.gz": {"num_bytes": 319069618, "checksum": "e08c35aef8a20dccad80f6bb1579d6d2ce80113c8bf8459730c69fb7048c3cc9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00161-of-01024.json.gz": {"num_bytes": 318750642, "checksum": "13eef84873b58e29894f9bf68a4de72a530c1bfc80a5654262fe71420292b8ad"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00162-of-01024.json.gz": {"num_bytes": 319847814, "checksum": "a8579c6bcc906fe018881a8474724576c3d0f7f1787f1568b79e5accbd9f962c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00163-of-01024.json.gz": {"num_bytes": 320370365, "checksum": "b97a74837ab9f659c13dcb4deb53c600584beb9e5ceed29e99974c4953f644c9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00164-of-01024.json.gz": {"num_bytes": 319894618, "checksum": "9b63afffa2b84c91b749991ddb384399f1d408bd7b6b643e7329e49531ce9a53"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00165-of-01024.json.gz": {"num_bytes": 320166197, "checksum": "5b2414477dc4e2b080b34f3b98672bfe3de6028e7ad83c323a7dd1ee08c05a0b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00166-of-01024.json.gz": {"num_bytes": 319612575, "checksum": "2cda682db53000c14fcb5d251bae4f50c8c4159348f8594c3ef020260f277a99"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00167-of-01024.json.gz": {"num_bytes": 319183884, "checksum": "5c406d7a8a404436039fde7c2019f0174ff8855caff319fa62bb7960d341b41a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00168-of-01024.json.gz": {"num_bytes": 319396348, "checksum": "df6a422d57a2e1443d10d61b13ab2c5227734195c82b43e1ead2db723cdea293"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00169-of-01024.json.gz": {"num_bytes": 319452933, "checksum": "81c81138e7163072e3779dd10ea8af7dff12b705fa008665298e08cfc2699f03"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00170-of-01024.json.gz": {"num_bytes": 317748609, "checksum": "6586ae8862b8ac925f424afb6ba779e95a147323fb83fc8c4bb0813877b17718"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00171-of-01024.json.gz": {"num_bytes": 319052376, "checksum": "8b3cd21d8ffbe963ce935ef9e0b6efc45f4d5abab703fdfed19a1309b700dca8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00172-of-01024.json.gz": {"num_bytes": 319068859, "checksum": "a42f5f5a10bfc84d51dd0855166959462faccd6a182af4c5d2115ff9995f5324"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00173-of-01024.json.gz": {"num_bytes": 319142377, "checksum": "e26514c5d6cea27c0cf7fcc1daadfa6f218ef9e62039c6d6fccfc31660c0c96f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00174-of-01024.json.gz": {"num_bytes": 319134484, "checksum": "75349aa8c734ed894965500eab2fdf59657a63e40e5a53e822ef1e5a12838a02"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00175-of-01024.json.gz": {"num_bytes": 318330467, "checksum": "a3d0d14b28a5a3cc559d6d89e2ec09e49e92aa189e44e68dbb4ea47978e1eca1"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00176-of-01024.json.gz": {"num_bytes": 318584643, "checksum": "dd68b42e5bfc656b71fe5701bacb929edae84055131f1dd65bbf3f3ad734e57d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00177-of-01024.json.gz": {"num_bytes": 319275087, "checksum": "05a8ff159006241cf938ef27b292f65906158ac25ac28919aa6761eaa634052f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00178-of-01024.json.gz": {"num_bytes": 318490550, "checksum": "a3aa38083c85baada29b207240bcca1a0d562a93971b420428d039092e58bd31"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00179-of-01024.json.gz": {"num_bytes": 319083249, "checksum": "12858fecd1dec728eba2c8c4311b17e4f2ac1fdb27c23e9adcd9258c5c4fc777"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00180-of-01024.json.gz": {"num_bytes": 319752094, "checksum": "67e968cb8d3ebec2f68eddfc539ea7402aa72c9274034494a43ea7d207b69a88"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00181-of-01024.json.gz": {"num_bytes": 320476195, "checksum": "c1bd59eb7ca799e31bf037dc7c087c1ad94e4f88a4f12427c454510d97e1c803"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00182-of-01024.json.gz": {"num_bytes": 318538551, "checksum": "dbe7205a1919dca9d6936158d5653a20d239f2e547ec73280956da4f8c609220"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00183-of-01024.json.gz": {"num_bytes": 319620265, "checksum": "46f9e603e04040b59df8da6ee01d1c30588aa7233a00526d6f0fd84c4172ba93"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00184-of-01024.json.gz": {"num_bytes": 318301621, "checksum": "880a02eabae231da388a5782a7194eef0d0211c2d1314db0c56d740647a114c9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00185-of-01024.json.gz": {"num_bytes": 320515340, "checksum": "f522147aed30ebb3ab352c92a9dd24cd2e8b93df1d4c4a6284d89ceaa2858509"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00186-of-01024.json.gz": {"num_bytes": 318374733, "checksum": "5005f1c42038769e225a626a88c10bd4f6af98dcc14deed475954b00c088bc53"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00187-of-01024.json.gz": {"num_bytes": 319116182, "checksum": "cbd7e0f486c6dac13090cd344337da1c336973e7ec75e32b0bd5b18b98f24bf8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00188-of-01024.json.gz": {"num_bytes": 318981305, "checksum": "064ce8c30b7a960b20720c133c3dd3281d27752a66def44d5133ff8f1b8279e9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00189-of-01024.json.gz": {"num_bytes": 317036462, "checksum": "acc052da4501691fdd28f269c633ed826840f2634be49b5e2c5e1273de0cb4a8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00190-of-01024.json.gz": {"num_bytes": 318061662, "checksum": "5a436e97c59b8636ca5081b71ca6fe8f8a3a99dd3f426c79edb2bf53345ee810"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00191-of-01024.json.gz": {"num_bytes": 318556228, "checksum": "2eebc89381ff78ae63f311c98b07853cefcc42fbcc210995095d568a6ff70ead"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00192-of-01024.json.gz": {"num_bytes": 317987733, "checksum": "99de46c4702c06a2303262b185b92fad82e12e189c923d5b76d9d8f96faabfa5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00193-of-01024.json.gz": {"num_bytes": 320294532, "checksum": "bccb7d8fc34d6cd6eb41e2a1c6234596b00a5517fdca7c47562fdee0e675377c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00194-of-01024.json.gz": {"num_bytes": 320852679, "checksum": "bb1e7768a57145fdbca7957ed964648d1deab5edc5dfad4722a81ad411c5e0f9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00195-of-01024.json.gz": {"num_bytes": 319016077, "checksum": "ac520468a5bd933dbac1aa5f7f21ba276bdce15abf99963ef9d73af294e81e70"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00196-of-01024.json.gz": {"num_bytes": 319289881, "checksum": "9eec5740115ab52ce98ac9efbed4fa1c5c06787fe93b4b28f6a1e4df06272870"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00197-of-01024.json.gz": {"num_bytes": 320180232, "checksum": "07a03763b84b4a86b4f71d725927d62c40925823ee454122a00fdb625ddb3a22"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00198-of-01024.json.gz": {"num_bytes": 320004709, "checksum": "a1b250b01289fdaf6dcd997ef31c59c580f81f961aa0fd88ae0d175bd07c02ab"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00199-of-01024.json.gz": {"num_bytes": 321006991, "checksum": "650e57c3dbbf4ed929da8c6c5d78f35fbac4644722a84d98f93342a8d33b2140"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00200-of-01024.json.gz": {"num_bytes": 317913111, "checksum": "42caf6dee42bd73d9e4bf0c7bb16383caa936b2e0a913489b9f0aef57b6004cb"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00201-of-01024.json.gz": {"num_bytes": 317897148, "checksum": "990974a82de2b1c27465f6d097d7a5718c5ff334271e722ab3736e7aa5b89d4b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00202-of-01024.json.gz": {"num_bytes": 319510250, "checksum": "8467066f2417af774363d4984a37968a0189adfe3a581723eab15004930e621a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00203-of-01024.json.gz": {"num_bytes": 319762388, "checksum": "4e7e20980dea2d5e77f380b24580f0df9319a0d1d73ec319e17d8cbe044e53de"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00204-of-01024.json.gz": {"num_bytes": 317418128, "checksum": "2c027c5225ea7ce3c31f5f32dda12b7c892c6fdc9c52da6d0af749171cdce738"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00205-of-01024.json.gz": {"num_bytes": 320157174, "checksum": "d953e79c60be0e2c3b072c2186a845a351392ef395fa95135f47e6b8491c6f88"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00206-of-01024.json.gz": {"num_bytes": 320459080, "checksum": "bc70c34931942ca143f7eb555e86458afcc36110aa9559151f31d781969d4458"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00207-of-01024.json.gz": {"num_bytes": 317361718, "checksum": "fad5ebd7a81bb737e12e9d4c803aea1a9e905d43a3fa87cace32a64eef01e8e3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00208-of-01024.json.gz": {"num_bytes": 319976693, "checksum": "21381c727d945d8d3b4a275e3622bce64b07ed87d7f2371ac28b5d2023359cae"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00209-of-01024.json.gz": {"num_bytes": 319550585, "checksum": "8b74e5f1780c4bf12936ac3a86be7a3d11287866522da8275aa4232c1e3d8898"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00210-of-01024.json.gz": {"num_bytes": 319574289, "checksum": "1594bd49cde9641b49a1ad9373a53e10d65440000363f7532a7d326d17c44236"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00211-of-01024.json.gz": {"num_bytes": 320615302, "checksum": "5b6f7eddfa3a9ffb0d6668d10f398b1d86482b64daa9817ca0af549433071244"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00212-of-01024.json.gz": {"num_bytes": 319395225, "checksum": "db58fa453269c794fedb595c6193dea5a85c72ff8b2d43e77c9bb371b8c86b78"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00213-of-01024.json.gz": {"num_bytes": 320131797, "checksum": "1d21d19b5e36820559590b339c049be29f27505ab4e88572edbdb84b649e0b66"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00214-of-01024.json.gz": {"num_bytes": 320153141, "checksum": "55c9b4ff1cd8cc88738196f867aba620dec3c8b27b9a485c7e75d3129d76e9c7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00215-of-01024.json.gz": {"num_bytes": 320525443, "checksum": "dfe9f44676c1abf0e2875924c094c0d788f8a0172d641d5f810258e948e37feb"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00216-of-01024.json.gz": {"num_bytes": 320100146, "checksum": "57f19f5437b0428d9f40799af14f8bfba8f6c82ebacaea8f6fc7531524a6d4af"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00217-of-01024.json.gz": {"num_bytes": 320688377, "checksum": "fad4f3143aa303c9c35165a15c6d90087c204c586fe20b0c0f45cf4238311b70"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00218-of-01024.json.gz": {"num_bytes": 318896471, "checksum": "aabd471960d6db1e93e1129410d9138d9d9efa3292af7491b3b6844c2bd3f543"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00219-of-01024.json.gz": {"num_bytes": 319298204, "checksum": "f676701589e39802779a0947585638347bb4fe55376a33c6d0afcdc40c5f8938"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00220-of-01024.json.gz": {"num_bytes": 317757045, "checksum": "f3d0994379d244054c5e2db366a081caee28d301aa6b0d9431e7d9eb1cb38c30"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00221-of-01024.json.gz": {"num_bytes": 318568870, "checksum": "8026854c8a8cc1d16b52a898b9dd8a8df7901dd8cdf285f5d937c4d5d45919f3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00222-of-01024.json.gz": {"num_bytes": 319096912, "checksum": "71f76f898864de3ae60f7c0cdbc68d53cbfa04b2f8493c40d55e1cb56727b275"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00223-of-01024.json.gz": {"num_bytes": 319350414, "checksum": "ba01faf3fe41a738c255b5da83daf53a5858144557af6c6f8d6208a049e4245f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00224-of-01024.json.gz": {"num_bytes": 319007151, "checksum": "94200d12c61f7c73a9e3a2bb089a05b017a215348d52018a34e3224578c0da06"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00225-of-01024.json.gz": {"num_bytes": 319502985, "checksum": "0b7ce650e555baa546bb329d7f0567a3dc0a7ec9d49149792032a86321a73d6e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00226-of-01024.json.gz": {"num_bytes": 317983607, "checksum": "40cf6d4b3deb05cd97ebed01405d08ae67be6e896736e4f371d15e5404567599"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00227-of-01024.json.gz": {"num_bytes": 320199564, "checksum": "e65ee475e3b6682b57bfa3f7b9c1cdabf36a7282fc793865df63dbe6a6a3d1fe"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00228-of-01024.json.gz": {"num_bytes": 318852183, "checksum": "8b27f2fbb0233802229fc776cfcb0b6b43af3149d217d0ab00cca0f1286482e4"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00229-of-01024.json.gz": {"num_bytes": 319407418, "checksum": "f2d5199a0022134ae127c88f0ac20d1b2b8a88014a774b5432b41085c83ecb5b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00230-of-01024.json.gz": {"num_bytes": 320787790, "checksum": "e1b040895ac6068dd1aa892ec93d733096afc4adda698379006ef89926491255"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00231-of-01024.json.gz": {"num_bytes": 318220053, "checksum": "648a6349206c50c17d4e3562fd6fcb0a723b4cb40005890173d5de0c7ecc2ade"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00232-of-01024.json.gz": {"num_bytes": 319702777, "checksum": "0a44b7cb4f354e1eede683a697aba4051c1542fd030dd59767065f5f0204554e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00233-of-01024.json.gz": {"num_bytes": 319154465, "checksum": "4070448b7844776db6754bd33791900bf9ac8dbd81e4cd774a3055ada67f6fac"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00234-of-01024.json.gz": {"num_bytes": 319846160, "checksum": "b1e8c73078c347fa062ed408e81bbdcb2f714675bab2c082016e822e91ef63a9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00235-of-01024.json.gz": {"num_bytes": 317722912, "checksum": "d8aa694e870157b2b5411f496db46dc71dfeed01a42973a65499596921198abf"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00236-of-01024.json.gz": {"num_bytes": 318593592, "checksum": "e0c4ff6c8a12128da88777074d0b097664cf2f2395913c4d82b0eecd501946f1"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00237-of-01024.json.gz": {"num_bytes": 318902831, "checksum": "adce772ed699d7e908ae1fe1ddf1d9875305c7875c93cedf1b3ea0bbc21ff922"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00238-of-01024.json.gz": {"num_bytes": 318696723, "checksum": "926f9fc42cd248077afec1f4b88603c646fc5ae47c4ee3e9b8a5f6b8b6ff7f46"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00239-of-01024.json.gz": {"num_bytes": 318321822, "checksum": "439d756b0ffc97ebecc6c48a7dc90da77de7ada05a6eae929db98057ea15bef1"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00240-of-01024.json.gz": {"num_bytes": 318992553, "checksum": "1f57af6ff9477263806c0827c0dd8e494e103b6f54eec2cd5f8f8327b01ee39b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00241-of-01024.json.gz": {"num_bytes": 319345185, "checksum": "493932a44e09f4b311ac5bdb519111fad0982708d4b467688f2b1105316544eb"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00242-of-01024.json.gz": {"num_bytes": 320108156, "checksum": "de5603f1b276f1373011c8884f06af017c71b03c5de3b3bb89cd6d550a0d5902"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00243-of-01024.json.gz": {"num_bytes": 319855563, "checksum": "7c1b74de8ae3699c567edaa6e2d1a1f1ae82f4810e769c710a23cd2dfc536c60"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00244-of-01024.json.gz": {"num_bytes": 318966332, "checksum": "d3ada80bad9fa776374878bc7504138e14c161bc9798ea8114b0d187d4c815f9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00245-of-01024.json.gz": {"num_bytes": 319541864, "checksum": "3fe5f26e32795c49743d1b2497c333be57248c9db2ce12fb93e103d1a9595347"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00246-of-01024.json.gz": {"num_bytes": 318530369, "checksum": "a0bdeb2dcb5dfb46f843c4086230ba918f2d3ec125654cb924ea11e7c75cafbd"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00247-of-01024.json.gz": {"num_bytes": 319496627, "checksum": "0c4099f832ada6b24ef6c1d15267cd3c179f5b3d79e3d813d944e3ebea908c99"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00248-of-01024.json.gz": {"num_bytes": 319132981, "checksum": "608b1cd27ad345f6511fb677c00d56b6e827f288877d68aea1bcad3b02dd040e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00249-of-01024.json.gz": {"num_bytes": 318529093, "checksum": "8fd580be09f913cc3809e3b0e467e2faf657a5db6f71b75aa931043267b9b0f3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00250-of-01024.json.gz": {"num_bytes": 318248903, "checksum": "faeac675c3634b0834939046e60cdfad6a13558d7a6799c5bde25567898d86a0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00251-of-01024.json.gz": {"num_bytes": 319184870, "checksum": "038972e03db75417fc4cb25e54c3aee01e4f022eb0fab202142f539e4d866e28"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00252-of-01024.json.gz": {"num_bytes": 319631399, "checksum": "2fda0c2cec4624c6068556e16630c3551ef3110759bed59628913a9debd547a3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00253-of-01024.json.gz": {"num_bytes": 318275716, "checksum": "b5da4bfa564fcc6c49a573b90e679d60c4e222249858f4e58fdb3727a5f279ec"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00254-of-01024.json.gz": {"num_bytes": 318638865, "checksum": "279eb2978fe94e1570318a247b82487c04d7494ceed74dccb1d7a5734ea84e5c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00255-of-01024.json.gz": {"num_bytes": 319640339, "checksum": "aa0a1ef845d0df7d81d2588d53f29205a4e3858a0888c1b7d9c83eb2fe1d32a7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00256-of-01024.json.gz": {"num_bytes": 320353593, "checksum": "407133ea3b32a9e004b992a1bccade0440a39d0bfbd12993ea78c6526c0864a8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00257-of-01024.json.gz": {"num_bytes": 318165587, "checksum": "72b7a72b8402b22cb51db44c9e7859460366c7c9d33e16a4c038ad07f7ad8f3f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00258-of-01024.json.gz": {"num_bytes": 318003534, "checksum": "e5f9f2f74b7f9958dc9535f04a8965749ca4bd68005a6efa36f480fb487ca930"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00259-of-01024.json.gz": {"num_bytes": 318990454, "checksum": "7cb3c284613537fc6b1a85d7187dfca30b37a7a1a5708094f17486e3184e2d62"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00260-of-01024.json.gz": {"num_bytes": 319514850, "checksum": "0067e36b7156196e2451cdf78dc8832352f2481a4740afbef9046104b6810bdc"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00261-of-01024.json.gz": {"num_bytes": 318747661, "checksum": "b1e4597420035c355abe15efc576751169e2b5e4c38e073c178346a7202d5ab2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00262-of-01024.json.gz": {"num_bytes": 319868329, "checksum": "374f4b951e545968da45b5055af2aa0b128c1d65d6c854f5b8f7e02d22c352e2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00263-of-01024.json.gz": {"num_bytes": 319268788, "checksum": "7168e635a32859a85a152b29bcd1f699257ee4e340517e218ea9b8dac3922210"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00264-of-01024.json.gz": {"num_bytes": 319270640, "checksum": "1da08b65c83e79a0f5b7215e5a4ee58f21383b69f09dd9a3ba95381ba3d56d25"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00265-of-01024.json.gz": {"num_bytes": 318744354, "checksum": "0c908e81d59b2099eda038731b387a0ad86fa3d168eb2955413dde9cf29d947b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00266-of-01024.json.gz": {"num_bytes": 318518406, "checksum": "115e375464931638de4af669b7301b6112d18b23835f2db2b092f47545b1a855"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00267-of-01024.json.gz": {"num_bytes": 318921711, "checksum": "6d66c715137885a46f2472489b21751284ec8ecfde6dca6be3ec1ee75f6cd5af"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00268-of-01024.json.gz": {"num_bytes": 317786222, "checksum": "588865d8f9d3da5a70c958997060ce4792e175c8fc5323f1887787070c8c160f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00269-of-01024.json.gz": {"num_bytes": 319004956, "checksum": "163ec7497602931de2eaffad320704e508e491937a2965e39907a086f640d975"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00270-of-01024.json.gz": {"num_bytes": 319175186, "checksum": "794e0e7ceccf28457a8ed5b0724337545661da16feafd0a53e4823b2cb1c92ae"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00271-of-01024.json.gz": {"num_bytes": 319785821, "checksum": "9c9ec0348f7d4ffc61e5f19f1f60c8382b33ca2fe4b852567cbc3c16024a4627"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00272-of-01024.json.gz": {"num_bytes": 318933435, "checksum": "883d85985237948018b13c20f4d4ee567c6ee36a135b326e8117d73dad4fe37a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00273-of-01024.json.gz": {"num_bytes": 318456664, "checksum": "fdca13067e8e118e538b8de538e164fb5397724045a5b1b02764510c8de90969"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00274-of-01024.json.gz": {"num_bytes": 318418161, "checksum": "27556558fe8a91a4aea4800ba9b7e844336a7638c5b96e652fcdb359f631b04f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00275-of-01024.json.gz": {"num_bytes": 318437784, "checksum": "6ad4e6a3e1cee04aee3051a66531e3f4aa97f7bbb7602c6aa5f46a727b319f2b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00276-of-01024.json.gz": {"num_bytes": 318470946, "checksum": "145a4d85ddf1e72fcdb8477dcd2f70a5554d9cd9349e02e058d3e7837204b6ff"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00277-of-01024.json.gz": {"num_bytes": 319580624, "checksum": "7116de0dbc5c7f6621f7c107dded9d85788937a87f2d56efca32ae9f25fc6865"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00278-of-01024.json.gz": {"num_bytes": 319619699, "checksum": "8dabdf2d26035d30c22204e6f46f292c58f4a4c3b0b77a1826a43341d4282df9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00279-of-01024.json.gz": {"num_bytes": 319344020, "checksum": "c2b7d5bf62be1772c6bb80f597b28d948cf3cdefb10b6df6f777f0ab7d8fb015"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00280-of-01024.json.gz": {"num_bytes": 318997864, "checksum": "025457720b0045e7bf01f9b4b847f28ef94af9ca250675efeee73eeb340a3f36"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00281-of-01024.json.gz": {"num_bytes": 318718146, "checksum": "2979c0ac06570a9ee437521778c514bd8755193b9f1ae6a5a671ef885243f019"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00282-of-01024.json.gz": {"num_bytes": 318434530, "checksum": "a17bca50ec20c364adb899a9073bbe3a1505f81803a58190efc5d4f3f78b58be"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00283-of-01024.json.gz": {"num_bytes": 319317663, "checksum": "9034f524fc5c2e246b22e2dee00b47e0c4da0316bc60d0a11d966c28db917f9b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00284-of-01024.json.gz": {"num_bytes": 318957832, "checksum": "f08b96047e711831dfb8a44d90cb712d3e78c98dd28ec6b937ee83949bbef5b0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00285-of-01024.json.gz": {"num_bytes": 318643283, "checksum": "c5df1f2e2dad46d71f8aadf856a5139020da8afc2ee010d53c0372ea09b2362d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00286-of-01024.json.gz": {"num_bytes": 318064839, "checksum": "16f7fd6abcbc69750b8131bca3e38ddc40bd7c86c48122ad2a9a77cb9cfd552e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00287-of-01024.json.gz": {"num_bytes": 320328448, "checksum": "41e82bd357b47a28f28a4a203d5b54263aadb3c9a08899f78302c727c56d8b38"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00288-of-01024.json.gz": {"num_bytes": 319559271, "checksum": "970b9df224b58ca50b3023d92f6be0c37dbda479155c29c535e457ef6f2bca0e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00289-of-01024.json.gz": {"num_bytes": 318786822, "checksum": "36a6515e7f516335d3fe057bb6ed9890a2aea033e08edd8588b3168b3445b2f1"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00290-of-01024.json.gz": {"num_bytes": 320634782, "checksum": "7d19fc82b9a5aa0e0046cd17cd2c46f356f8a4a7d203d5e03e1f319156f05cb8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00291-of-01024.json.gz": {"num_bytes": 318746713, "checksum": "86d610d4590bca69281348dbfaaec9e704fd6194141c50c71e84aad51ce26b91"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00292-of-01024.json.gz": {"num_bytes": 320049630, "checksum": "d045df646213e29d4e7de4ec8915eb3b65bb962f35b0d74abf00889bd5aae8ab"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00293-of-01024.json.gz": {"num_bytes": 319966146, "checksum": "c66fff1a64b495211bfdcea650ff76115f8c857b9154c1b869062e702714b9ec"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00294-of-01024.json.gz": {"num_bytes": 318805332, "checksum": "ef3d9204ec85a1e65ae48af7924f614403d297a15f232ba41eb0e4fe223e507f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00295-of-01024.json.gz": {"num_bytes": 318898465, "checksum": "2a071fc28b1216f2dc0579528d9b04e597b5cdac9fd14719e312092242da190a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00296-of-01024.json.gz": {"num_bytes": 319406630, "checksum": "ea71e9fd444860d70d3728f7e2213a4bccf3aa31a164c9acfa8df7a0b6619786"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00297-of-01024.json.gz": {"num_bytes": 320312971, "checksum": "ddaeba8aad38b7e9727c579cc44f15b3c82d292e2901b47b785e9c8d3d5cdb9d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00298-of-01024.json.gz": {"num_bytes": 320660744, "checksum": "814460ccfda29b45edaee5f44e3c980889aee2ee52e4e5323931ea489fbe938e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00299-of-01024.json.gz": {"num_bytes": 319848186, "checksum": "3b91fe32d3a731a5be3bf778eedfe13e8a7e26ba9eda51c278c5212aa7925681"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00300-of-01024.json.gz": {"num_bytes": 319647278, "checksum": "1e0424631f7f354bc63b3e71c5c6516c85343dafd3896acb9560eaf93b672799"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00301-of-01024.json.gz": {"num_bytes": 319080252, "checksum": "46c21af013f611729cc06ec033dbae80151987f9098e57fb98e2631f6fe76c8f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00302-of-01024.json.gz": {"num_bytes": 320028246, "checksum": "d1ca8ad6e5bd6cb18db1f1be9154dbc8ba9df7ca02db4c1f8a7df9d40820d8ff"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00303-of-01024.json.gz": {"num_bytes": 319388787, "checksum": "bce87161f77464adfb1fc04fc2993211bcec502d7172b86f726daf7096b04f82"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00304-of-01024.json.gz": {"num_bytes": 318627831, "checksum": "235b8085cbeb7b13f8e1a5f6d2225a9461b7bcd76e21466a189c2411ff4c4107"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00305-of-01024.json.gz": {"num_bytes": 318148428, "checksum": "f13f124e0ea150da13ebeb3390c311b3db54018de0d640579307bbcf2c46068d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00306-of-01024.json.gz": {"num_bytes": 319451712, "checksum": "de5c3fa2cd6a47551ab43268484d017602e2c3e1f66f43f1a1d8f95bac52cad5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00307-of-01024.json.gz": {"num_bytes": 319026244, "checksum": "88769fbf393671db352227a64cb8ba6b4ba60c5bddb4a14294b1ad9a65a750cd"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00308-of-01024.json.gz": {"num_bytes": 318447454, "checksum": "555bcfc0ba4db0551ce5ffb18057027ee695af166856125aeb79f7ce013851cc"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00309-of-01024.json.gz": {"num_bytes": 318147676, "checksum": "bf28e60a7970c548190cf0f4fe56f27ea55a1ad8313fa353a8013f0a0e7919f1"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00310-of-01024.json.gz": {"num_bytes": 318930650, "checksum": "45a68c0ef70ecd10838d604d51fecd26e5199f5372022b9c2af461a71c24c6ef"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00311-of-01024.json.gz": {"num_bytes": 319955339, "checksum": "fb3c4e93166f1cb2ccc8a7b68da0246f0827d3a81bb5614c8c84f1c01c6d53c7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00312-of-01024.json.gz": {"num_bytes": 318554567, "checksum": "0dce2ac88ba7ac5340d551add9fe7b1a30772a6cc082347c536427b48daca598"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00313-of-01024.json.gz": {"num_bytes": 318978931, "checksum": "c5f99dab085fb705769a514626c9af8a26cf846fdaee4b403a3d6f84c892cb66"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00314-of-01024.json.gz": {"num_bytes": 318158197, "checksum": "79de4fa2aed5e3efa71e75d13f08d7c1869aa59f42a819f4429430b3db6c1b27"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00315-of-01024.json.gz": {"num_bytes": 319744521, "checksum": "5a47a89a1537662a91853bbe2a5b3e243f5de74489f820621192cacef192593f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00316-of-01024.json.gz": {"num_bytes": 319861527, "checksum": "1cd34f17f3ae3c8bf8e1636714a9ff600a26799d5ec02ba42abefa5db9d00e5e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00317-of-01024.json.gz": {"num_bytes": 319286030, "checksum": "a3e34af81264a72b523b63fdc0268f450675f7993fa0885eb2b4c747b0d6703c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00318-of-01024.json.gz": {"num_bytes": 319054871, "checksum": "02fa8cf278578108083bc9a3c5cf07b0a9d243f2162397091ede6c85a1df31e7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00319-of-01024.json.gz": {"num_bytes": 319943810, "checksum": "93ef0d7f1610043a6f7634af73e89ee9f3d7e87828ad34558a4d688e6fa6b6dc"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00320-of-01024.json.gz": {"num_bytes": 320037211, "checksum": "06fbd99a3d64df293db2655f321117f1afcf1cda51e421edef9335a25cb1a902"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00321-of-01024.json.gz": {"num_bytes": 318584237, "checksum": "a224e4d902f7368f91d6a72fc9f5730996dc37de576bc2211eb632e3690f1b38"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00322-of-01024.json.gz": {"num_bytes": 319686632, "checksum": "57fba28c7104ff659f8a0f330ae89c68d3a392dd14a78247fa357a3bcc8b94dc"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00323-of-01024.json.gz": {"num_bytes": 319834993, "checksum": "e61c760cd3c42f71a1a7bb6adc4e0bc970bbf864b69e2a4a5d56bf0a14d4e0be"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00324-of-01024.json.gz": {"num_bytes": 319243057, "checksum": "61d21ab1e7729f172ade5ab6c0dcaf07eaeaee6e047ca1c24722c06ddd919678"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00325-of-01024.json.gz": {"num_bytes": 318569583, "checksum": "2192a891ecc2a6aa9f6ea64f1d76ce763e0a3963ae03c95275ccd626171835ce"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00326-of-01024.json.gz": {"num_bytes": 319175980, "checksum": "d35e4d5f8e924ad97520db51a2c361bbc02097721195932b6768e7460df092a6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00327-of-01024.json.gz": {"num_bytes": 319892298, "checksum": "ce967065d3915d466982b5258e07ad2c46b02d7637057e0547586657ea0f53a4"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00328-of-01024.json.gz": {"num_bytes": 318004026, "checksum": "0676d556f46b1f057669d3378c6fc335db6e3ac67a02e11dce3823658730f4c5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00329-of-01024.json.gz": {"num_bytes": 319066225, "checksum": "b00bb4bda957e1287b98c432165448b3899f9155363f7b61bfd0f0181181acfc"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00330-of-01024.json.gz": {"num_bytes": 319268288, "checksum": "d14d1883941966ef3b35203d06e6fa1bb485dd77118bd7b6c811b0d06fa72fae"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00331-of-01024.json.gz": {"num_bytes": 319131311, "checksum": "4d5d41c2b2242b299fb67fa8c9327db8b4f612bdf4ee9af4d4e45aba8cd1e409"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00332-of-01024.json.gz": {"num_bytes": 318827508, "checksum": "68cea08d4805b392bf4c2894a4501ee3fbbe9aac4b1b6533e686ea749ced2dcd"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00333-of-01024.json.gz": {"num_bytes": 320572240, "checksum": "06f211ae2fe1c4eef5e41caceda8ebbc289261057911fcf2583a59c730b7951a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00334-of-01024.json.gz": {"num_bytes": 318121862, "checksum": "46c62769e04ce8acde4562ba24d72e245babacdfb50600da4e6217948ad71d24"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00335-of-01024.json.gz": {"num_bytes": 318692168, "checksum": "dca69a6976e7387a12c8da16b696ed4f604254693a3280be0f90fa694700b595"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00336-of-01024.json.gz": {"num_bytes": 319479902, "checksum": "c52969fad97f1dc0e1e115428e7dad1ac6cb6d804db0cd34f0fc7846b1b50c7f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00337-of-01024.json.gz": {"num_bytes": 319987407, "checksum": "2c570f02aa6a6bac96be1e02663996c87f9a94c160f22101ce8ae1d549ae1de2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00338-of-01024.json.gz": {"num_bytes": 319051086, "checksum": "77132df95b147c471ead74bef16ed4fa11e15209f518dd460110132358816834"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00339-of-01024.json.gz": {"num_bytes": 319473192, "checksum": "7f3ac20a72d395c02ed3cb50052821521dc2d8d97303d00e0d0982e2c29e7659"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00340-of-01024.json.gz": {"num_bytes": 318423485, "checksum": "d1127da89e960d939cfc06cf1985df415b60d4bf02b12b7fab02b796100feaee"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00341-of-01024.json.gz": {"num_bytes": 320087690, "checksum": "f753423f82157e95506566d3653d32af6a181e69ea0e10b4d4eb24b626d3ca49"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00342-of-01024.json.gz": {"num_bytes": 319767100, "checksum": "db7410e6a6ca74163098681038f497faa373e1d81434b45c1a2f273d467c0a2d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00343-of-01024.json.gz": {"num_bytes": 318389429, "checksum": "7ea1e432a1ffbed8f4ad6cb985c5cf1b2584d8eb7d2fa091a2db3f104a3f7210"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00344-of-01024.json.gz": {"num_bytes": 319117212, "checksum": "c7317a81a6224dec9be07b41134ac7a7db4039b7c98b2061b20bb59b82ed0a1e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00345-of-01024.json.gz": {"num_bytes": 318504232, "checksum": "1498efe8280609d9d66c324e332c9433c6351bb7b99c5891a8f27d6841410407"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00346-of-01024.json.gz": {"num_bytes": 316721169, "checksum": "0cbc6b494d653878c9d52a37572064b88356058ed291aa773e5f47259fbfc722"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00347-of-01024.json.gz": {"num_bytes": 319007736, "checksum": "6265505e19a42a01a159297d33b1a91cd0e042a31ba6a1a867404a143ae565a4"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00348-of-01024.json.gz": {"num_bytes": 320167918, "checksum": "cc8b29deb44c8348aa4d05836f89cbae995c946f38d9cb8e7fedbd4762168ba0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00349-of-01024.json.gz": {"num_bytes": 319901226, "checksum": "2a0f2188b43ffedc8b95a8276c7647147587c5e544c9e6475e790f4b5e362992"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00350-of-01024.json.gz": {"num_bytes": 318999223, "checksum": "1fde48c503998872aa71fc524c7408dc84cbc1faa0d885895d5c57708a15fced"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00351-of-01024.json.gz": {"num_bytes": 318935410, "checksum": "72d577eabcd814a7ff61b894b3fe9089f483a793e692d3ab20ce4ee59921f975"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00352-of-01024.json.gz": {"num_bytes": 318655907, "checksum": "8686dc0e4ff7b35cbc4fa6f3abce50c06f8b95378031c132a117e1d458cb4616"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00353-of-01024.json.gz": {"num_bytes": 320619683, "checksum": "cd5816469ef54bfeb0db6b55a78e0d34eb2e1f82448a41f67dfb70061c3ea91e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00354-of-01024.json.gz": {"num_bytes": 319352400, "checksum": "bf082c093423d562da4984b1f0428225d853a05b5f8fb3696273f36ebb5a235d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00355-of-01024.json.gz": {"num_bytes": 318868462, "checksum": "3b8baeca48e55a2cd268d6aef75f7eed96ef10fceca593a5179d52a2b0121f8b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00356-of-01024.json.gz": {"num_bytes": 318903295, "checksum": "4c9a9926a4bad6721807d99cc02a9b6bd28bb0a6254aa1c15527b745c56a06a2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00357-of-01024.json.gz": {"num_bytes": 318881446, "checksum": "84b4c2e05bc162fef4824e97ba7a03b1cecb41eda08a3e0aedd264b66e859a30"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00358-of-01024.json.gz": {"num_bytes": 318521100, "checksum": "aee99528ffd0323fe81e4ed26ed1b9295baa2a3910771dd2a42f4f378fd82569"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00359-of-01024.json.gz": {"num_bytes": 317796778, "checksum": "7b01f2d5ae54f60c2aeb7b96bd366d21e558e2dac48c83a78df9850f37e02f1e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00360-of-01024.json.gz": {"num_bytes": 319502919, "checksum": "5b54f9a050e6f9008a1806101ea553d90eead56c949a5f3f46c8ccb88812081b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00361-of-01024.json.gz": {"num_bytes": 318595505, "checksum": "49f4164d66187d46adff7f9bbac97b232ab7906d812e571c2e0bf028895e7f47"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00362-of-01024.json.gz": {"num_bytes": 318851572, "checksum": "17accad3c0706c54530f128260cacbf986cbbb20427d4ba8d3444a3702a22c55"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00363-of-01024.json.gz": {"num_bytes": 318555337, "checksum": "2327866e541aa6aa73f7289c3ad82a19ff154d39657d98cb78a2f481a8765920"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00364-of-01024.json.gz": {"num_bytes": 318641145, "checksum": "6f52354d804e8d4a1af1f6c2c6b759ae115c4f23a63f1206a73e7e25acfbdd02"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00365-of-01024.json.gz": {"num_bytes": 319212614, "checksum": "8f1834eeacc9bbdee95b1f0a4078eb9488bd1a7c5693489bff7943869674cad3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00366-of-01024.json.gz": {"num_bytes": 319336585, "checksum": "a9cf01b76104eebb4ef8462a924f61c262fa197a7c68a50e48d925cb81586e3f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00367-of-01024.json.gz": {"num_bytes": 319161263, "checksum": "5ac822027d50c3196026fbaffc7d968e1ca702b947688a6f4d268b942b5067b5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00368-of-01024.json.gz": {"num_bytes": 317911640, "checksum": "f9acffbe3c6617e85911ff9dcecec2378b3469ab4546a6973cceb460f9003cea"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00369-of-01024.json.gz": {"num_bytes": 319585031, "checksum": "9234553649cfa5265c5a9ccc88486402f88eb81275067c51d9deef16bbe7211f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00370-of-01024.json.gz": {"num_bytes": 318345879, "checksum": "2fbb410346d31a33e8532602f4e3340fcc75c96be803250e9f0f1a6894ca0052"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00371-of-01024.json.gz": {"num_bytes": 318996184, "checksum": "b069b0c8a830ea841e82077548706f286308ef0420e163ff6d8312c8853af172"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00372-of-01024.json.gz": {"num_bytes": 317989343, "checksum": "bfd62e448d4d9f89353abaa384007b0b72bd860402ade3a9d938051a6446530b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00373-of-01024.json.gz": {"num_bytes": 319770759, "checksum": "e4e176250aceb7362ce38d496556a46409e9872e69f45166afe71aa750de8fcb"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00374-of-01024.json.gz": {"num_bytes": 319212902, "checksum": "28aa4510c3ddb9ee0ac56aab3792bfe5e899531919ccc0214a4b68bbf2ba18a9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00375-of-01024.json.gz": {"num_bytes": 318968029, "checksum": "35326b1f2280e07dd754e89dfa29989d0dfa5c78995d393b36a752d8364bfcd7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00376-of-01024.json.gz": {"num_bytes": 318685188, "checksum": "0060dbaccf7f2f956fb8b57891cb176914ddac1bc485dd86c2fd110c46d174b9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00377-of-01024.json.gz": {"num_bytes": 319291982, "checksum": "99fc38654197e506868e099c15b2cb15b93238dafd33f81a7d069b3e01c3b085"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00378-of-01024.json.gz": {"num_bytes": 319259094, "checksum": "9b8d97f9d57dd97373c4f57eae2b9c01a58e49017ee41d3969e94fb4dbabc260"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00379-of-01024.json.gz": {"num_bytes": 320228224, "checksum": "82913f2d182d2a57f6c93e9b229862cb72feaa6331d04cd4419113e1eb9d52cb"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00380-of-01024.json.gz": {"num_bytes": 319738339, "checksum": "e0de43f754ab97d103a02c708d1cd7e771ba079bd9e1f7c532a80a30bd5182ea"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00381-of-01024.json.gz": {"num_bytes": 319210620, "checksum": "df74823f78564b544677410508e675e2811905c56afe2a60d19d3e049dd65394"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00382-of-01024.json.gz": {"num_bytes": 319810275, "checksum": "f5d5291a695fe2cd228213fa2bf090bf6513c49c6911826aa43ecaefec0622ad"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00383-of-01024.json.gz": {"num_bytes": 319190426, "checksum": "a861ae79a66b72d6cd5e0a030daae52cffb85ba1272c36ae2be04a9b7c0287c4"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00384-of-01024.json.gz": {"num_bytes": 318501845, "checksum": "b8d0f5078ae82980f0f64120530bbeb20f627be0a8629d68885acb867091417f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00385-of-01024.json.gz": {"num_bytes": 319530458, "checksum": "7da119f3f63e25ff63cacd8ba0d77987b2d576be1f4b86e7e45aa3f2d194624b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00386-of-01024.json.gz": {"num_bytes": 318938980, "checksum": "c21f3de56fab26d7fb60bdb47c216b22793f67b8fa6d382520c79b88d1896f05"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00387-of-01024.json.gz": {"num_bytes": 319207426, "checksum": "e28b0884092f75836eed4d73ed24b7403d7b0530fc389386a68887420b0c2603"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00388-of-01024.json.gz": {"num_bytes": 319835376, "checksum": "b4f0db632cc9af66e8aea109c80d73a6281207e29ece131d5bf8b57ff8f81262"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00389-of-01024.json.gz": {"num_bytes": 319346837, "checksum": "413a8d8df1f6cf3094839b57231da5323f33f7115768c65d83f0af1574f71b6c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00390-of-01024.json.gz": {"num_bytes": 318632301, "checksum": "a3e8664fbb3ec2af5a217225dbb7fcf3e93b427e5da1a88e35c04c319d61e4c3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00391-of-01024.json.gz": {"num_bytes": 319066082, "checksum": "e22eed3415c90510e97768be5a685e0a8035e2635ef773c56e9ce2718c278658"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00392-of-01024.json.gz": {"num_bytes": 318356286, "checksum": "ddbf325390648d9d86f1e7901b75c99fe8db538d203de8dfb4c304282f82cd74"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00393-of-01024.json.gz": {"num_bytes": 318048288, "checksum": "974fd05f356c86be2f9109b0272eee69c5b2eaf0b16104cc573846c925d13b4b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00394-of-01024.json.gz": {"num_bytes": 319444683, "checksum": "0d27d6f8c3b935cef23ea60abfa82bd6a4f5e2e061080419dc9c6bc455b9f868"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00395-of-01024.json.gz": {"num_bytes": 318353166, "checksum": "24d9956bd857484ffbabb3ba6f6ac688f48a94b50228238c7c9153a5c6878a7c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00396-of-01024.json.gz": {"num_bytes": 319960396, "checksum": "9425f4f18e1690ded866c4b5313cbac8a6210092dc42f720200b7143b69eabe5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00397-of-01024.json.gz": {"num_bytes": 319030577, "checksum": "dee166674b835b9849d281a87238aa136e14d26edaa72d0ecb6b7e82d556a72e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00398-of-01024.json.gz": {"num_bytes": 317664320, "checksum": "f85e08272f73ce4aa602719d59205db54d230a6b7247830d78f91eac63d753be"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00399-of-01024.json.gz": {"num_bytes": 319623875, "checksum": "85dea0672a0362a08503b70623907c8c92bd105f788fbd7f3816212a9181e7c5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00400-of-01024.json.gz": {"num_bytes": 318840274, "checksum": "a104345698500611cd1a71a6647555300d315490918740a8c6e3b8dcff315407"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00401-of-01024.json.gz": {"num_bytes": 318336377, "checksum": "808327d156e183e102fd75cfbdb7b5a1fbde3740168f59b767ea380608305b67"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00402-of-01024.json.gz": {"num_bytes": 319270185, "checksum": "b6a5f7c1ade628091fe86744a6011147ec32795ad694ccbc82929791b93aa307"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00403-of-01024.json.gz": {"num_bytes": 318038520, "checksum": "108904ab05b3ad23318f8aa0f7ddd00d97aae1872fb157eea73273e011cbec04"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00404-of-01024.json.gz": {"num_bytes": 320933185, "checksum": "cd0c068c0831218849149eaab8f8a98748823911c745ca0ea33ae839bd625e04"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00405-of-01024.json.gz": {"num_bytes": 317694827, "checksum": "d99909ccd59e2ec183b41a7c6d1bd5677798bd7fd784ab681546a7bf8292f353"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00406-of-01024.json.gz": {"num_bytes": 317937468, "checksum": "c7f2bd7a366b8c389e41fdfad4891068c86039e1a5fc3b8a0b993253badf33d2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00407-of-01024.json.gz": {"num_bytes": 320226074, "checksum": "765db6f9f0c8c3d9bbb0499f0010928fe4f90d5915dfdd3b6d09d3dc78ad07a9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00408-of-01024.json.gz": {"num_bytes": 318613788, "checksum": "165e78c858dfaf010307392474d4917846c9d21658558912e5ffc915803bd2fb"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00409-of-01024.json.gz": {"num_bytes": 319212414, "checksum": "5f7d5952aad1ae31413962983971b2b422d77c262ededd2ce1c1e186aeb6d87d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00410-of-01024.json.gz": {"num_bytes": 319023647, "checksum": "24588d41f40e3fe389575b97d41ef761be46bc9a9b3965c5e3f994760f7a4070"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00411-of-01024.json.gz": {"num_bytes": 318408922, "checksum": "b35d4ada5a000f51169557b00e508706d51a7becd33370014ff07c8b8dac1af5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00412-of-01024.json.gz": {"num_bytes": 317166932, "checksum": "d3ed1cae269ebefe4716843bd7954bf7e44ee889f72066afbdcd95f4e1f06703"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00413-of-01024.json.gz": {"num_bytes": 318519121, "checksum": "07fc61a7e164301113201e78c99d40289d88e0b463048e14aa5fe69c7490ccac"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00414-of-01024.json.gz": {"num_bytes": 317417235, "checksum": "c5a7222b2eb8e8fe690f29a0fff7e214ba94e4d9dae62f67281fe25dd385b721"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00415-of-01024.json.gz": {"num_bytes": 319690993, "checksum": "37052fff729bdff124577d5ba041906b2ea7420c5cb28195e6cfca0e41d560c8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00416-of-01024.json.gz": {"num_bytes": 319466518, "checksum": "6e8ce2b9e6e8208ad7e43ce709454cb0b96572d793e0b11c15892f5df18f6137"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00417-of-01024.json.gz": {"num_bytes": 319694381, "checksum": "20892d7a33c31d7967ae0cf595a2108de96a61c0bbd773aebc5d3d083f6ed93b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00418-of-01024.json.gz": {"num_bytes": 319048918, "checksum": "fd795ae8d53e632bb3e89a2becc5b801e10db781b14f2c0ed50b12def5376c8e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00419-of-01024.json.gz": {"num_bytes": 319791424, "checksum": "5a8e56faaa0892249e5694ae01e2e4dcd22d9750a9aeea5ca390117c77b8de2d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00420-of-01024.json.gz": {"num_bytes": 318060925, "checksum": "795ee64f4c9e2e35d9dc0c91ea593c9e41a3924162901fbf782dc7112f8094a8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00421-of-01024.json.gz": {"num_bytes": 319328927, "checksum": "2670b7b6b53e9082c90e4a4e915f72673831ff15e9f55918a1244e0c19c8f963"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00422-of-01024.json.gz": {"num_bytes": 320065363, "checksum": "34df2d1afac2ae4699524492d6b93e4a2a1e551cb4a4ae35fc19353930afab8b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00423-of-01024.json.gz": {"num_bytes": 319349887, "checksum": "a2b19afafb45cf30493ac2a3eb013e136e7213f63bd633374ca0d9fe2780efe9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00424-of-01024.json.gz": {"num_bytes": 317515288, "checksum": "ec2a84fb16dd16f9547f0c3314a91968324f2c537118ca36e982b235e23527ee"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00425-of-01024.json.gz": {"num_bytes": 319092219, "checksum": "1ac0b93c0faae7d446add3af3173637a4b0d638dbd5285b0f4e1bf3abd0d1542"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00426-of-01024.json.gz": {"num_bytes": 318421245, "checksum": "bade501dc71c0b4968a9a7c833751cee5d8f7067a45dabd53aa03534df48886e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00427-of-01024.json.gz": {"num_bytes": 317847935, "checksum": "7aef554aa2b120c4d787395e28aceba743e309f2540fab283e077a1429a2f7ef"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00428-of-01024.json.gz": {"num_bytes": 318822008, "checksum": "cd94547fe1953a1cc074d97558a70d1e55834606379a8f5e6e60e1b15b56fd35"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00429-of-01024.json.gz": {"num_bytes": 318507684, "checksum": "4d3c9245565a808058293558603c657d6e9a0c87b6d2d4b871b856cea2eb3a19"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00430-of-01024.json.gz": {"num_bytes": 319042136, "checksum": "9c5a4fe50db5d0822923fe29a5aa8ca6cb09e3629472b1bf61f670388b6c2076"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00431-of-01024.json.gz": {"num_bytes": 318925124, "checksum": "8f18b35bb952da090ade742753e30861ba39c6c54c8ff2d76b358ca7be475ed6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00432-of-01024.json.gz": {"num_bytes": 318680251, "checksum": "7968c370d0efa4601ab8b5ee68e480b211fb969593608bf7e00a0153f00f99b3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00433-of-01024.json.gz": {"num_bytes": 317822797, "checksum": "f62d7e74434d52c36b22f6a8cd56ed3937ed6aa03f140d0fbdf5e360632d51fe"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00434-of-01024.json.gz": {"num_bytes": 320094364, "checksum": "55d7678c7e197e165b4e09bf3f8ac159853120acbe5801ed6ab3ab0f801c11bb"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00435-of-01024.json.gz": {"num_bytes": 319008936, "checksum": "09b451c8ee06bc06507b3e75a60c544a6b70f27e3d07daa29c59803f785faaf5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00436-of-01024.json.gz": {"num_bytes": 319023456, "checksum": "6fbcb93f9dfe65e12b7efeecc8af7823471787438b1ce90e5f48b68b2dcb1d14"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00437-of-01024.json.gz": {"num_bytes": 319484997, "checksum": "9e70c8c1ccbfe93ec9296811ae496a518dcafbf38c81b7972f885e297da9e726"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00438-of-01024.json.gz": {"num_bytes": 320319141, "checksum": "eaab759d8c603e8a2ad3ebacd99e30338fb904ba307aeaba0d2e0e63679cfadc"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00439-of-01024.json.gz": {"num_bytes": 318410397, "checksum": "7a03a92bf97b6750941c1070f933c68f1b2a3e13fb68b3a21a4726676ea75d34"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00440-of-01024.json.gz": {"num_bytes": 319447470, "checksum": "bc899e436da7b3bf13c1bfa2fd2bbf9d90b42a0c00f2971259a14d858ca3e5ef"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00441-of-01024.json.gz": {"num_bytes": 317582955, "checksum": "4d777860c2750e43038ef709d77bdc403b3b3bcf0f08e3c4562952c9ac70b113"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00442-of-01024.json.gz": {"num_bytes": 319592118, "checksum": "d9e5dc244bb6f0b629b2a929aedf506dadaf5eacc80f0997816b95279552fe8d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00443-of-01024.json.gz": {"num_bytes": 318104403, "checksum": "56133bbd7cf96dbe87d48898b886a024af69ca405d7cea1799bbd30f185e9c1f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00444-of-01024.json.gz": {"num_bytes": 318547808, "checksum": "8be0270c3cc96dd7f7b3aad08bde81ea245feff4a09923277fb0d38a7c095604"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00445-of-01024.json.gz": {"num_bytes": 320463920, "checksum": "e02316fcd355914e4d08ecf37036d4727ae9ebe45bdc5c98279aa3437c2c1eb0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00446-of-01024.json.gz": {"num_bytes": 319583221, "checksum": "80c9b8c47665b2cef6c291b0eefdac5b14be1d7cd4a4c06c2e14cf48b42da92d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00447-of-01024.json.gz": {"num_bytes": 319546881, "checksum": "a18d5aaca1717ec33fb1822a633268003bf88093dd7b48db080503c3d01b6ffb"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00448-of-01024.json.gz": {"num_bytes": 320234711, "checksum": "c41595d2b9cbf0e23fd65df1cb51499ee262d345d79d2625388cf149c3c39f8c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00449-of-01024.json.gz": {"num_bytes": 320043698, "checksum": "3bef99334be9d39f41296f8f134c88f04fe66502da2d2639f0d6d2485338e607"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00450-of-01024.json.gz": {"num_bytes": 318033740, "checksum": "9cd05b1b70ffc3c004b4b4a2f21f91abee1395f3a485efd1aafda550193df9fc"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00451-of-01024.json.gz": {"num_bytes": 318549622, "checksum": "b2ef6cc4ac7c4c69fb1661d7ed9b2ce4da261c72f9e49dc3c934180501ef3a24"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00452-of-01024.json.gz": {"num_bytes": 319317230, "checksum": "89927f1fd79a5b1439988fd37e0377175176d9ed22d14611f67a81e185a336b3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00453-of-01024.json.gz": {"num_bytes": 318952561, "checksum": "427f55bbcfb6c1a0ef12f96cb122f362b975169770ce1d392b763c4b4408cb34"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00454-of-01024.json.gz": {"num_bytes": 317545286, "checksum": "2fc3b172ea721bc92b0f7614e8fea61b0781e6f4f3e6b7263cf0190beef3ec52"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00455-of-01024.json.gz": {"num_bytes": 318975631, "checksum": "c96f688ecb19bdb1592b0124021fb80d48965303442de76751d82fa03ab8f6d5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00456-of-01024.json.gz": {"num_bytes": 320016575, "checksum": "61d2be7a4b9e34cfb994ae2c120ed5a51a6669564046637445a46b9872812416"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00457-of-01024.json.gz": {"num_bytes": 318236935, "checksum": "a74dd51c3c490458ea0e61196d7e0085aff80d50cd149a673f54f661b364a671"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00458-of-01024.json.gz": {"num_bytes": 318495925, "checksum": "adf9cd717f2c79504dace22b5929d4c4064353e869457c20cc81a0b2db390c89"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00459-of-01024.json.gz": {"num_bytes": 318956821, "checksum": "d7be5bcb738a75586125e56a25aa234618528accda620eaac421beab6288b992"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00460-of-01024.json.gz": {"num_bytes": 318968681, "checksum": "6181280df5418fd9ebb52aa26a631100b6c3da0750dc5fbae152a6a44fccb942"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00461-of-01024.json.gz": {"num_bytes": 320810761, "checksum": "5e943c458674371dffb2466274b8f2a9df9902a370901ef97992bdf920cdae0a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00462-of-01024.json.gz": {"num_bytes": 320154899, "checksum": "76b3d1b120cbb7cd71d004440e0c6bd9f9c4395424c568e8362973038017a90c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00463-of-01024.json.gz": {"num_bytes": 319247449, "checksum": "9de2c86d85289113b24c2f7eb4771ec1391511930f5f26a12133d41faf0ce908"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00464-of-01024.json.gz": {"num_bytes": 318150152, "checksum": "85fce3104ef0b247798c1de8d9d616d3de754841fb6c49a01cca5b9da5efa94e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00465-of-01024.json.gz": {"num_bytes": 320342803, "checksum": "ddf312f0b8de8f53ed556483fd998ae308d4829d18195a48869db6bf1866c332"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00466-of-01024.json.gz": {"num_bytes": 318619029, "checksum": "01239a1ff6ffe9032da320c5a7d1a93125d0724851e3e10746821c9452070887"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00467-of-01024.json.gz": {"num_bytes": 317677227, "checksum": "41783d20189a4bcfc33f543597a5473900e692ea13fa522f2724e27e810b4e9c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00468-of-01024.json.gz": {"num_bytes": 320038217, "checksum": "7131b6f4dd423f2efe55c3f598893676300b31651cce7eed32ce633a015f8ca8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00469-of-01024.json.gz": {"num_bytes": 318359701, "checksum": "925bc76c045f25532414f29820adb0cf1a56c54b406333a6f348c29e5efda9fe"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00470-of-01024.json.gz": {"num_bytes": 319329235, "checksum": "9be740483aa7bbaf94dce550f2c20404c89326f6ec4ebe1b7070f85f93507038"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00471-of-01024.json.gz": {"num_bytes": 318792779, "checksum": "0e3d9492f15dc9867bb0dc803bdf45608fbe67255014b4488902d7bf2e2554cc"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00472-of-01024.json.gz": {"num_bytes": 319552622, "checksum": "00484bbc10bace3dfd93b57fc53d6f5fac26b7dd54fd5b5428d75eb9e6dbb0e2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00473-of-01024.json.gz": {"num_bytes": 319466828, "checksum": "5db5d585798e8ed8e4a3bc540871f1185f67125f397a12942d21b24e6b374519"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00474-of-01024.json.gz": {"num_bytes": 320014669, "checksum": "db07fd0e972c1a474806c1b4464ad4cefdd2e8fc15806ba0d259d4f9e594c3f1"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00475-of-01024.json.gz": {"num_bytes": 320379280, "checksum": "e6e36a9eed8be84c928980fffd8177b177182726c9e13b41a47343d431f76a7b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00476-of-01024.json.gz": {"num_bytes": 318820301, "checksum": "0543ed2d0b3aaba0b0fccbf0311836143bd19175c5eed9bf0f024ffb9ce3c50a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00477-of-01024.json.gz": {"num_bytes": 320577830, "checksum": "a62fd62ad771dbcfb7af73841e15a49e9d7239c53dbbbd84de2282131bca9c99"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00478-of-01024.json.gz": {"num_bytes": 319593908, "checksum": "beae9334a8e93e4b036c4a9b3c5b3a75fff17264177184d243d9e6da286dbe2b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00479-of-01024.json.gz": {"num_bytes": 319728825, "checksum": "ae5b475c7be35d98b77d6c4aed5d61cbd1c98544c9a6e73a53ef2911757ab7f0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00480-of-01024.json.gz": {"num_bytes": 319903674, "checksum": "51e0611378455d909e8b0f292eb62038848aa7afaa4f93c9c83061258b211a95"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00481-of-01024.json.gz": {"num_bytes": 319998409, "checksum": "68c640304ac952f544ea88c88d7c994c8d2955b95036f8352a67b57a836fa1bf"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00482-of-01024.json.gz": {"num_bytes": 319047238, "checksum": "74cefa57158d0008a06ae85b2a7a1c04d57a79b7ae3f7b4b3426dbe9918b36ca"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00483-of-01024.json.gz": {"num_bytes": 318775875, "checksum": "e99faa71222017521f1fc9999bbb0832df5c91f8b9f6e2ef501d3f827d3a1e85"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00484-of-01024.json.gz": {"num_bytes": 319190491, "checksum": "4518faae7c9d51a51f0b02cd895cf27e7c87a623b787346c844a8d9f0b52d6ce"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00485-of-01024.json.gz": {"num_bytes": 318974502, "checksum": "1bc8b207583b9f36169e0e9facd258de8eb73dee8bf831051dd1ab04b7726c6f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00486-of-01024.json.gz": {"num_bytes": 318599424, "checksum": "0b1d9900e1921483b85305491f914b6b78fabcd0686a20695e61b89b7380a894"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00487-of-01024.json.gz": {"num_bytes": 318958015, "checksum": "c0c789c5f3b34d170d2aeb72642c70d2fa5eca567e7850d0c89b3d170f3bbf64"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00488-of-01024.json.gz": {"num_bytes": 320205671, "checksum": "6eef7a1ea80be43e84cb0c974215a477c909844899ac694afe1af2e8f4ac171c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00489-of-01024.json.gz": {"num_bytes": 319193967, "checksum": "eccf5d7f682a76e11332f07e7d54a080f76c0be58a98a853a9fe90c815a22087"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00490-of-01024.json.gz": {"num_bytes": 319833603, "checksum": "afe99e32ba36134f23b59a2ee43965bf185432de947740fc19e26eef41027aef"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00491-of-01024.json.gz": {"num_bytes": 318912982, "checksum": "e981151b23b233bd3e5798f78658b5f52a73f69db39c30615f615069cf0c4984"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00492-of-01024.json.gz": {"num_bytes": 320057824, "checksum": "0cc5f7df318e0718fef93d24e7ff904b3e8e2728c4fc0b1d13893c81d8e6e2c7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00493-of-01024.json.gz": {"num_bytes": 317967559, "checksum": "93749543b04a5a7093177d2a03acfc0bf6f26d5b53864ae35839a9421fb48169"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00494-of-01024.json.gz": {"num_bytes": 320426917, "checksum": "e461f56b461a4d5ce353c60889dcb99e10818985d3788440c6119bb145876277"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00495-of-01024.json.gz": {"num_bytes": 319528392, "checksum": "e530f3030ddbf7191bc4082e8209f63eb48733d7085d79a8469ce3611ccb79b9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00496-of-01024.json.gz": {"num_bytes": 317570766, "checksum": "ddec34b528bd5314019d12089e600df27e781d78f43b6722b9c0202ccf385755"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00497-of-01024.json.gz": {"num_bytes": 319154838, "checksum": "e7438a08000fc7a158f887755cc496edcf51c8bdf2bc4a888ddd2c829bf8fa3b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00498-of-01024.json.gz": {"num_bytes": 317955368, "checksum": "ad133d808ca5b6181bae1921ab1261d79630c09bf9d6c904db036f22e6f32e6c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00499-of-01024.json.gz": {"num_bytes": 318286671, "checksum": "cb40879ea08db5a9eb6f2c23756574bda34deb9acf039b992f0ab90fdbb01594"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00500-of-01024.json.gz": {"num_bytes": 318510936, "checksum": "21e5f7468a907f38c3dc0a5c19f09921476f9186beff967e829329f191dad6b0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00501-of-01024.json.gz": {"num_bytes": 319611074, "checksum": "38829434c8539bb9fa9ea32bfba3c6732c5021ffb60c16fc502fe61de83906ce"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00502-of-01024.json.gz": {"num_bytes": 318630954, "checksum": "22d1ca1edae179d2587495fcdf1d3e515c6f547cebafc54996c93a121731fd8d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00503-of-01024.json.gz": {"num_bytes": 318253198, "checksum": "e95689993390086880e630ec4540e0629551076c0cad2c70f5aedd3aebfec181"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00504-of-01024.json.gz": {"num_bytes": 319497151, "checksum": "0cd7b986d247e010fd76fa2ab2b62d5f9eec292b28c1e7bd3e4c577042b598af"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00505-of-01024.json.gz": {"num_bytes": 317498965, "checksum": "f1504912fc53cc3690e26ec3babf736ddbeb8f7d9196dac83f757699310b30ad"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00506-of-01024.json.gz": {"num_bytes": 319684193, "checksum": "9f6defbac132e097cbf7cb7d181cb154bace6af48964fe09d111bc610fdcd2bc"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00507-of-01024.json.gz": {"num_bytes": 318394726, "checksum": "a58f39d0bef19abefc089342d8bb6d75dbb2c663f67127673ec395404bcf15ae"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00508-of-01024.json.gz": {"num_bytes": 319013108, "checksum": "176443b39840826bfb1db2cef2541449a6fd0c465ff9bbf0cb2479f07fb8baa8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00509-of-01024.json.gz": {"num_bytes": 319832758, "checksum": "cce5a142cd7a121eba8c182d499442f4b0a397ea1484c33ccd79b1acbae832fb"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00510-of-01024.json.gz": {"num_bytes": 318762241, "checksum": "bfc910625f0fd6074955906bb86e789b0d0adcd1f8956cb8da276933dceac256"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00511-of-01024.json.gz": {"num_bytes": 319240643, "checksum": "ce53021b90d1c86e2d46293e7053aa174387d7408bf0cf907898be69b1a7befc"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00512-of-01024.json.gz": {"num_bytes": 318353376, "checksum": "e9333c6f73c30c9cb7f31794025eb9129455fac2edd64f8b3f22f879124c6a85"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00513-of-01024.json.gz": {"num_bytes": 317653011, "checksum": "d9450c6f541e82922b37d3b7cc25611707b44884f27825db4dbd65466b59e8b5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00514-of-01024.json.gz": {"num_bytes": 319391160, "checksum": "20b77f5fc2a939fc291f901e8774acfbf04ffaacb08192b724673eadc9f83c12"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00515-of-01024.json.gz": {"num_bytes": 317994258, "checksum": "32ca1f60d0deb395538a93ce5044a48fde05864f2c26af42dc53405b6dc05031"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00516-of-01024.json.gz": {"num_bytes": 318786801, "checksum": "eba4f34749eef4da2b0729abbdfa2ada77bd65383c01213d4f86625670430a65"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00517-of-01024.json.gz": {"num_bytes": 320010732, "checksum": "617765f971b879182db7debf879025f8dad4fd8846b11728ee1230767c031c04"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00518-of-01024.json.gz": {"num_bytes": 318681019, "checksum": "6987893764c56b84fca014532824a05d4187db5c313be4f7bdcb363b7e8cc8db"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00519-of-01024.json.gz": {"num_bytes": 319951543, "checksum": "ba151c4734db52e7c220dbefe380825ac6d66a9c6abb901b8096a87d97a2deb5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00520-of-01024.json.gz": {"num_bytes": 317948056, "checksum": "7e53ed26c3c068b0dedd026219b7cdab79775545ebbf31b5dadadb45364c9985"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00521-of-01024.json.gz": {"num_bytes": 317993802, "checksum": "4d1d4a5583430e373bd2cfd191e59cd8911953fbd73fa924e0c15be76499b54b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00522-of-01024.json.gz": {"num_bytes": 320189449, "checksum": "71d851498785e312acf93861a43169794d4d576f5fe8b960303419316c8c898a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00523-of-01024.json.gz": {"num_bytes": 320443871, "checksum": "587867d619115c2accb69322b197239b79f12de41ae80427fd369813ad8d81af"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00524-of-01024.json.gz": {"num_bytes": 318192840, "checksum": "7324c02db00b06d0f41d6e5ebfa4e4dd6554f5f4849d6de187ebb84162d0446d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00525-of-01024.json.gz": {"num_bytes": 319294602, "checksum": "24ae3495e5b59883967c62b8fb3a4fa7525d33c40957fd5fa3be413d66c24eb5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00526-of-01024.json.gz": {"num_bytes": 319783465, "checksum": "27cd95e7bc6a3f156f1f8f26dc5e490818fc4810562e3964a19fad401cceacd2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00527-of-01024.json.gz": {"num_bytes": 317240081, "checksum": "6b84920fe7e28c01a03800512915c7a9e47816267ac652f9ee0314e3428bca72"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00528-of-01024.json.gz": {"num_bytes": 318320694, "checksum": "fec06589f714ffe1343cb6781898e29e5d0cb789deba3aa4a4ccf86514d3f690"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00529-of-01024.json.gz": {"num_bytes": 318391515, "checksum": "a98c34c04c1b6f0ca3acc9e10fdf4bd0ead2ea7271832ce4972df8677590918b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00530-of-01024.json.gz": {"num_bytes": 318473966, "checksum": "1677d541c7bc10971c711f1eb030faa2e85e0967112ba57d7f04712908e4f040"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00531-of-01024.json.gz": {"num_bytes": 319463272, "checksum": "92b5d82a058554d3396a2b54504f45fa88581cb2951140c0f0bde67ed11bed0c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00532-of-01024.json.gz": {"num_bytes": 318228175, "checksum": "291bb3d7613f7f00b6910a0de78dbab0d87602243c9c83014de341c131200853"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00533-of-01024.json.gz": {"num_bytes": 318966937, "checksum": "a0ce39eac6d6ecad3478373c264e88b2ea20b77fb2049537c229ad3da2769c85"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00534-of-01024.json.gz": {"num_bytes": 318968162, "checksum": "387db79d4aacf8fa4c512fb78023ff94a43d5d597d5a8c2ec6198e62e4b8c98b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00535-of-01024.json.gz": {"num_bytes": 319253588, "checksum": "3ff8f4a926fdfb6201a94d75c17ec5afe662a339a65019eb5e1193c1238bd388"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00536-of-01024.json.gz": {"num_bytes": 319662526, "checksum": "0c805e83d8cfd979701df5714713d062e14853d7e2b0f77c0b414a626686cd33"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00537-of-01024.json.gz": {"num_bytes": 319177095, "checksum": "f9a0ac216e316075e5c2219449a954f989eb160ead2ca07ac9f3813274e18f2e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00538-of-01024.json.gz": {"num_bytes": 320109104, "checksum": "a425ef4dddefb40bac5a8cd3191161a41737aea5088a614410d10d83bbab5e37"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00539-of-01024.json.gz": {"num_bytes": 320600564, "checksum": "3580ea8da9c4aff1296e89136c5d7f1a37d021e0b10f3ebd1e05612c092faebb"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00540-of-01024.json.gz": {"num_bytes": 319993281, "checksum": "ad8dc83bfbe7c8976f08708c5f0229cd4e1a2d80e272b225a8d208133b129dfc"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00541-of-01024.json.gz": {"num_bytes": 318256020, "checksum": "c7452669237323fdd09ce97624791a0261f3ec07d8a5f98e71a4b1252a2805e1"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00542-of-01024.json.gz": {"num_bytes": 318843744, "checksum": "1e5a11c25f82ce717302dbcd9acc1f8b916d83eca88d345d8434b1f88768137b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00543-of-01024.json.gz": {"num_bytes": 320482002, "checksum": "bbf96edf50c913d5162ee154423242e7c8faf490ba229f325bac98a5e3eb9477"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00544-of-01024.json.gz": {"num_bytes": 319059260, "checksum": "22c04506b5744df8c71727fc6527fa2bc495a10a237c71762c66d09625d34097"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00545-of-01024.json.gz": {"num_bytes": 317874034, "checksum": "84a78bb62eb6f72de7a75325870d9ecd419f77c4f6728d29609b2f7ab1b8bcf7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00546-of-01024.json.gz": {"num_bytes": 319891407, "checksum": "28631c527dc398c9626fc60b39ad94ed880b41c71f55b9c7c670f6a1837f98d8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00547-of-01024.json.gz": {"num_bytes": 319361268, "checksum": "273b8598405def0165ceaf9723d1425c9b74368fc22a414616c7ac9327930225"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00548-of-01024.json.gz": {"num_bytes": 318360761, "checksum": "59990568c0ea055fab27f2b9cd028e1c7177df0479712d1e2d8372e9b017ccad"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00549-of-01024.json.gz": {"num_bytes": 317320452, "checksum": "fd1e361f28cf099df6088e26d06d79f7f62bd8bd89b4524b9baa80ea49a1a4a6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00550-of-01024.json.gz": {"num_bytes": 319017444, "checksum": "4424833afcb143f6fdbfc2f5fa2508d6226a4a1df391969b2a751d2d0070158d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00551-of-01024.json.gz": {"num_bytes": 319118159, "checksum": "77b78f94a8bc8f905cf8b1997df1fc3b8c6d77ce65fc28bef68c6083275a832b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00552-of-01024.json.gz": {"num_bytes": 320058125, "checksum": "e7b71167c4ad947232b6acba26e4d3cc9214c25b50b853b5745333bba942f50f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00553-of-01024.json.gz": {"num_bytes": 319220671, "checksum": "ce7891f3820ce065e3bd7afa006e90889428c80bd8e771d66fbbf023bb2a9eba"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00554-of-01024.json.gz": {"num_bytes": 318858928, "checksum": "015a707235f46f179a08d3f6674b6d368dc9612841e2bf39f700f11fef8e64c7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00555-of-01024.json.gz": {"num_bytes": 320490725, "checksum": "041dd2e902ed04dfa143476da03d5fd00c30ce1259c0658150af5b77a5a092c0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00556-of-01024.json.gz": {"num_bytes": 319863694, "checksum": "22e3d9e4dbdf2b1b822a7bc8c889f4747aa16c71f4c91436d028a228bffe4b87"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00557-of-01024.json.gz": {"num_bytes": 318940362, "checksum": "4cb8b113ad9687b7dee590242c5f50fb3ea3a8775c67492a8ce0cb5c15fc26d7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00558-of-01024.json.gz": {"num_bytes": 319797786, "checksum": "ad157a34c6a8d496859f55b00c79fcedf7305d8502ca86a511026f39cdcaca59"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00559-of-01024.json.gz": {"num_bytes": 320156705, "checksum": "816d84753b71fae446428587f41de5b3490e88321f1fa0cfa2ef1fd5eef851e5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00560-of-01024.json.gz": {"num_bytes": 318346216, "checksum": "0b1b3d26316f2c0e973ff19820793bcfffa957c3869f74f62fb40cb6839227e4"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00561-of-01024.json.gz": {"num_bytes": 319571572, "checksum": "4f92594382c897bf94211f1446dbb38c2cc1fff3647acba731dfe0ad89ba4061"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00562-of-01024.json.gz": {"num_bytes": 319453711, "checksum": "2a6ba0c64806add776081f417c8d1afdb324dd8b9aebb603372afd7fc2c4cd6e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00563-of-01024.json.gz": {"num_bytes": 318990092, "checksum": "e3032365b9b86883c24bfe387d810c2d9fd1d0a55ff88acd1f5b5357246b13ba"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00564-of-01024.json.gz": {"num_bytes": 319491917, "checksum": "da6196ab8650fc9f8fa391b821ff070070946412277bd423c40d9fa1de325f93"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00565-of-01024.json.gz": {"num_bytes": 318756269, "checksum": "edeb5b13aa0d65354d78a5ca5d1698732e95f1fcba249c42825a0351d4a34f79"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00566-of-01024.json.gz": {"num_bytes": 318461036, "checksum": "f179addbca50d8612612b0e09138d7ecc89ba7ef2d6e857d7ef0b10223dc71d4"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00567-of-01024.json.gz": {"num_bytes": 319625728, "checksum": "eaa1d0ee28eb17c6ebe3d85c8af8b7adac28a720b2975f86ac83f3f4d2bffbcd"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00568-of-01024.json.gz": {"num_bytes": 318428567, "checksum": "3677e88545f2d76b601995cc3e2b6b12fcf65e350ed7eb4137ab4beef3d475c4"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00569-of-01024.json.gz": {"num_bytes": 320114923, "checksum": "2d8810d8bcfc0fc19d82313be6516b2fef4cf68f56b0448af48b512c98e1ae8c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00570-of-01024.json.gz": {"num_bytes": 319148416, "checksum": "8e5356dc0fa2b4e5fa16b36a1586f16920306af1227c765e5d2f0818e74d30d2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00571-of-01024.json.gz": {"num_bytes": 318223973, "checksum": "c87cf8b88e8e4fc0a664f4b3a381b78b317680253a83a672cb86e02adb43f2aa"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00572-of-01024.json.gz": {"num_bytes": 318322508, "checksum": "2bdc857dfeab99c8f83f0267ed5ed7529bca8ee086fce268534bc0264ff738f6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00573-of-01024.json.gz": {"num_bytes": 319203246, "checksum": "564fc77dec25ce0d47f4e3d8d04bf114dc06119b28b3ab00d6092a799d496e51"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00574-of-01024.json.gz": {"num_bytes": 318397937, "checksum": "dc3f206e1b5da963184da72e47959844bb164335c76e3261f3a189a4b7b022cb"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00575-of-01024.json.gz": {"num_bytes": 319183651, "checksum": "7f0c46955e37d5d52b305f71b4ce4fca5368d72e8698e8b832ac0177f868e145"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00576-of-01024.json.gz": {"num_bytes": 318690625, "checksum": "b37d0fbd439bdc05021a71c192ce5e61ebce27448a17819bb53156d9d5f27e17"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00577-of-01024.json.gz": {"num_bytes": 317926085, "checksum": "3092d1ad70fb2d262ecb33f3fb6ea554af3ddd26498ba42b644c383f6d4bd1a4"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00578-of-01024.json.gz": {"num_bytes": 319190472, "checksum": "d9833fd591a618a167b31b7aaca420f3e719ded98987dbc0f46fd4bfd12564c5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00579-of-01024.json.gz": {"num_bytes": 318958744, "checksum": "a11217af10c85ad828de38847eeddcde6af6899563585d581c20adaed3c9e7dd"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00580-of-01024.json.gz": {"num_bytes": 319893900, "checksum": "71e8be705bfa8563e33392d1c14decd84f52d6a0139b98344f1a0ed9bdc94198"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00581-of-01024.json.gz": {"num_bytes": 320109861, "checksum": "c5f13ba973803ef069762d22bc37ee02a4348af379c75848d93b2685fc4280cf"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00582-of-01024.json.gz": {"num_bytes": 319238177, "checksum": "da815527ca68b5c2ed604d00ccbcc7c631c60f33e3132f79212634a82c266844"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00583-of-01024.json.gz": {"num_bytes": 319375634, "checksum": "a332b791df0801f0b7227117f0ea3971563e8e420ae24dd94b38d532c1ab0573"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00584-of-01024.json.gz": {"num_bytes": 318596018, "checksum": "e6496d31f42921eaf9f85047e7c2eeb5fef46e01e99760fa676da96481d7d5bd"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00585-of-01024.json.gz": {"num_bytes": 320156294, "checksum": "08b978ec05d65edd22c301ddc6ab44174eeb7bef5c5997a84342b6faaa47a79b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00586-of-01024.json.gz": {"num_bytes": 318716838, "checksum": "567ce600ad99e543507fdf27b9009fe1782bc867f44f3dabbeb93fab1208f337"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00587-of-01024.json.gz": {"num_bytes": 320247814, "checksum": "8f5c82f5eaac4a315d8615c9700cd81f3b9c2e1a17376d3b2482f8694dfe2492"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00588-of-01024.json.gz": {"num_bytes": 319546079, "checksum": "bae91422f87091b3974ca92781a14fae8f10c5c41de9c9132f745b3dcb8bc468"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00589-of-01024.json.gz": {"num_bytes": 319771959, "checksum": "babb615d77f80e5ef99aeed3889a26cef5c9918a7fe68b70a503815e69b0b189"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00590-of-01024.json.gz": {"num_bytes": 318926571, "checksum": "61f2ed732f3b2b5e24882f47b4eb84fea28bf89d112f6f173cbb50523a43c4b8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00591-of-01024.json.gz": {"num_bytes": 319669791, "checksum": "3aa2e792ec775a52ee78447b81204867e58b0a46727bab4b7974977aaec2889d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00592-of-01024.json.gz": {"num_bytes": 320393142, "checksum": "1419c263fb74409cb0e39ebd87b1c020ee6863a3a6f2f427be27d3c76b84043a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00593-of-01024.json.gz": {"num_bytes": 320977171, "checksum": "4f16f33217c35a2b155d5b6fe8014c2e52014e63c419e7d3aaf71a35246c1323"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00594-of-01024.json.gz": {"num_bytes": 318211092, "checksum": "c9301ddcafea22d085ae48f551f486e73089a76c7990871f787064c61e4e60b4"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00595-of-01024.json.gz": {"num_bytes": 318978629, "checksum": "349e104763320eaae96ac3bc53c5fa7a73e7dec93b8cc3afaad108a97e7c170d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00596-of-01024.json.gz": {"num_bytes": 318573003, "checksum": "0eb6c25cf57764ec3aa7f74d6d967c52003f872f2f3b140fe6d5ac6360241a8a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00597-of-01024.json.gz": {"num_bytes": 318931514, "checksum": "b42b7b984aad729185ca9b3a6ffa856b2a79165ce2feebe519b10f8ff42c4ab9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00598-of-01024.json.gz": {"num_bytes": 319002677, "checksum": "8306c5971408767b3735288fd0ee7ee7d01d9af4ef4cbec2e57c97b1f78e6d63"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00599-of-01024.json.gz": {"num_bytes": 319637870, "checksum": "844df34f2a263011f9d1d85eaad5a1d95243769e9cec5a104807dd55e1fe431c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00600-of-01024.json.gz": {"num_bytes": 318099852, "checksum": "b05e66568a4472feee31f20918e9813aeae2d881f47b5281ff29fbcfedf4d5b2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00601-of-01024.json.gz": {"num_bytes": 319136069, "checksum": "8dff2d56c9915d73e6154533e5de0ca9d867c5fdedcfeceb3e0ab22f3ba509cb"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00602-of-01024.json.gz": {"num_bytes": 319369121, "checksum": "45b2c1757260395afeb168b545892b315fa0bf14b3d144bfcab1fdaa6d79086f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00603-of-01024.json.gz": {"num_bytes": 319499076, "checksum": "46edc9f556ccae692900b222b8e4843360dd5dbe0798a8ad9cb51c07a451dbb2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00604-of-01024.json.gz": {"num_bytes": 319132921, "checksum": "0cba8c8738ea7ff9a08bd1bab215010b03c6c83fe35206d83344d78005bdee6b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00605-of-01024.json.gz": {"num_bytes": 319315562, "checksum": "0dc0d37658fd672c8d72775bd8855dce9037cf9715feda35a76afb1f0e87bebb"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00606-of-01024.json.gz": {"num_bytes": 319223528, "checksum": "f679e437a3acda1a81013dc0f3fa93fde6c3309905e8142f8699a76bc04b7114"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00607-of-01024.json.gz": {"num_bytes": 319326218, "checksum": "7fe91f86f751b9aa3abf1c5ed0fdab89a76c7fa4eb7ab8b809ef29b0cf4a78d9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00608-of-01024.json.gz": {"num_bytes": 319393715, "checksum": "a5daf706100eb797b5b0770fe0c790856637b22dc849aeda5b445ae5fa63cb3b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00609-of-01024.json.gz": {"num_bytes": 319554192, "checksum": "4434338fe97d398d9565ae940c62539e868fa261be361ede1b5b0feb004160f8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00610-of-01024.json.gz": {"num_bytes": 319786301, "checksum": "6b0d0e0457a721af6c67a31f5016432011e717302cfdc7ee39feb253fbae4754"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00611-of-01024.json.gz": {"num_bytes": 319356910, "checksum": "bfe201b1775270afef3a09fcfc074920cbb01093eef90d46f26b6b813d603994"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00612-of-01024.json.gz": {"num_bytes": 318780229, "checksum": "29248c4732fdfda2ba97ed38192ab391457e20fd70f713ef4a7cf084f9865846"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00613-of-01024.json.gz": {"num_bytes": 320190496, "checksum": "f5cb9be2442797d967b9041e48771196a6c0595933ef2102840b704e355f4d62"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00614-of-01024.json.gz": {"num_bytes": 320245862, "checksum": "89b74d0daea02fb69289ad259bbd0ddb1a64c5d6380848f7d51669be952f8a0b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00615-of-01024.json.gz": {"num_bytes": 316874605, "checksum": "78600c8703d5ebf80c99c089bb7a7c1cde843a66d706fd219eeac304f80e8525"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00616-of-01024.json.gz": {"num_bytes": 320237707, "checksum": "630ee29d4dc4cd5062eeca7877e5c1b204b36eb0b3aeacadf036cdb75c1ce840"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00617-of-01024.json.gz": {"num_bytes": 319739365, "checksum": "d418fd284d06b1d2d9daebea3047ed06286640ac75d23893f1effc2ee9d7aa14"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00618-of-01024.json.gz": {"num_bytes": 318634299, "checksum": "f5d75d129ab6c0f052028cf0139c3cf20eed3a9c5cdb151cd88ae42d5d1a32d2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00619-of-01024.json.gz": {"num_bytes": 319086471, "checksum": "c558908f6e08b0d02f377c9aed1655d80106f4cfe26e955774bb420d19b2f74f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00620-of-01024.json.gz": {"num_bytes": 320665446, "checksum": "977f959e5b5eaa24081ce025d137647fffd65f1a54d2c45db9805a232e0c0364"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00621-of-01024.json.gz": {"num_bytes": 318576410, "checksum": "d07f3c31d7ec1c71b5ab9539a2ed49f6d5f46b48ee2e51800b9e28cee588a163"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00622-of-01024.json.gz": {"num_bytes": 320053075, "checksum": "58b897603eb83f789a1cfc6bf40a091093cbd8a0c20702018c411adc7b07a437"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00623-of-01024.json.gz": {"num_bytes": 320045187, "checksum": "3665d7579b3c57eb21ec9e55850e39307cc6f4ef8aa8b9937076ad6f142063a3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00624-of-01024.json.gz": {"num_bytes": 320136842, "checksum": "35db069ae090e95c5a4d3db44eae73bcb29463c120584d7f6ccbe235983c5fef"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00625-of-01024.json.gz": {"num_bytes": 317314201, "checksum": "7f6ddbbc8815e8bd10c99361fd8113cbbd84ebd92799eb6958cf98af825d2aa3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00626-of-01024.json.gz": {"num_bytes": 320219970, "checksum": "4e2c46d1e3a94957717bbbf1e1e4300bd27ac17e588d426e0ba688983e83f4e6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00627-of-01024.json.gz": {"num_bytes": 320083102, "checksum": "851ce6dfa6a4d1a4e3b8bf439e36db9ceb59eefc60558d429e2fec80655e1775"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00628-of-01024.json.gz": {"num_bytes": 320386844, "checksum": "86d8927f16d0790a07d6c68e745501188d13887df4a137e937ae00497d07c055"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00629-of-01024.json.gz": {"num_bytes": 319476643, "checksum": "c48cff721137b641fe9d5bcf30462c7e4e3a3ae631b7b4e39979c8c77f0890ae"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00630-of-01024.json.gz": {"num_bytes": 317961579, "checksum": "cde626b34c6c8455227fbb18a577877b518f529b6c8e16881cfdf334f2875cd9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00631-of-01024.json.gz": {"num_bytes": 318952266, "checksum": "0401582821f7b15f0b406f7ce00c56351b8e86a3c3282bdf4dd45b2f6146ea22"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00632-of-01024.json.gz": {"num_bytes": 318261820, "checksum": "be48396ef18ce0f3650eca86eb36039f90b51737f9848086494f34fa28d60e70"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00633-of-01024.json.gz": {"num_bytes": 319748854, "checksum": "9d5c342d82fcace21de2900202c3f2af47229aeae9d487a8b77b7f5b86c05f74"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00634-of-01024.json.gz": {"num_bytes": 317806530, "checksum": "00a70705afb91f6570d17257057c15b45386597b917061686f131bd41ddce421"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00635-of-01024.json.gz": {"num_bytes": 320313573, "checksum": "22a1286582d65975ed94f0ba25bf87e94d52a55214d0a51979a3e0fd9f95e3cb"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00636-of-01024.json.gz": {"num_bytes": 318151690, "checksum": "026c699ac6fa30f9e156a957026d8fa8df72daee3407c8fdc5e0bd7d6a3b50fe"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00637-of-01024.json.gz": {"num_bytes": 318665365, "checksum": "9bd931dfc074bc99df31d7fd31a5ac1dc8c8bc75f8e87b763545cd824edcdcbe"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00638-of-01024.json.gz": {"num_bytes": 318521250, "checksum": "4b30ad531f7502ef7bc6398ab286e5c6c63d340c22792da9258ea95b496d1c0d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00639-of-01024.json.gz": {"num_bytes": 319997068, "checksum": "2bfdf36396e49ff625138d29925f54eb12b18d35f6d0bf5ca9e79194977cfb43"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00640-of-01024.json.gz": {"num_bytes": 319355927, "checksum": "d0d0ed7304b5d79318b5230a1ab48d3ed03183f1eb11d96070604a7008cd7b30"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00641-of-01024.json.gz": {"num_bytes": 319002081, "checksum": "1461ecb6b92819bfdc12808a5442d70f94538931f856c91dea602a23ba86ab98"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00642-of-01024.json.gz": {"num_bytes": 317689465, "checksum": "aa0af0169cf13db1f8133e8d76afeeae5f71d63d179794377a55b6c2eb938dc8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00643-of-01024.json.gz": {"num_bytes": 317523344, "checksum": "5c060166e776f8efda48882c118dc0fd5e058d9ef40be578bad31e477114a16e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00644-of-01024.json.gz": {"num_bytes": 318876813, "checksum": "ad98ee119742cb8a6efa1be46e9670969397c7bde10049886d7d6fceb82387ca"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00645-of-01024.json.gz": {"num_bytes": 319981258, "checksum": "8930ae8e14c124218793d2fd1bbfb1b624e918cb092b21c6ca74347abd9dea4c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00646-of-01024.json.gz": {"num_bytes": 319624889, "checksum": "a40705c4f9a4db4d2d698cf96e43b99fa0790b886506300eb4986a26de7063e2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00647-of-01024.json.gz": {"num_bytes": 319240920, "checksum": "7129182faeac82b47127458e92903a209acf8272166024e8313c167d6f358456"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00648-of-01024.json.gz": {"num_bytes": 317305623, "checksum": "3124091a6c438fecbfc948b1a35ffb1462287ae06866b02a6dbb1a6651ccf1e4"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00649-of-01024.json.gz": {"num_bytes": 318998755, "checksum": "fdb286cfe9e9091a57b31be61a56a425fae07d6b44f0b45f8743d7aab0e980dc"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00650-of-01024.json.gz": {"num_bytes": 319612451, "checksum": "ff88c4310f049344b8a3f701bce12d08ef5f9b037e82fef7f1f670b3d51e59c2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00651-of-01024.json.gz": {"num_bytes": 319098081, "checksum": "9c3b1843082aae39b057bbc7364e69cbc39bbdf91d5bff4f52b12cf1a264adf2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00652-of-01024.json.gz": {"num_bytes": 317107981, "checksum": "e6199d12a893ae5d05c5388ae7a679df419ef6a050c8e3ce3c15fe534943a774"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00653-of-01024.json.gz": {"num_bytes": 319623884, "checksum": "333ac93cf1f1f4da0f72c5e57b675052453b42dffe1e4d45ec680f4e3e075d97"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00654-of-01024.json.gz": {"num_bytes": 319055728, "checksum": "1efe352f2f2eba826231a5bff6c79390630b44039b226a5041a087e116b60f5e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00655-of-01024.json.gz": {"num_bytes": 318539829, "checksum": "613c741cfb738017b3fa233512296d9127d661738721d3fccd806aad54d19d84"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00656-of-01024.json.gz": {"num_bytes": 319970377, "checksum": "51fa9b217b6bcf664c472cc2b258813e1f1d7a0f501c29b822221bccafa4e201"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00657-of-01024.json.gz": {"num_bytes": 318548629, "checksum": "c542c6fd2f3284d64f8d53b71ab8308bbba59f7f13e9d9eb20bbbaf13ad4782b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00658-of-01024.json.gz": {"num_bytes": 319845984, "checksum": "b3d8fb6ed2258c463367108e2942742e88eac657c859cc8d128035110fc87e7e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00659-of-01024.json.gz": {"num_bytes": 318887872, "checksum": "02feb4e03020d767a4468251786d4857d5dc833969626bee616c7882bfda9ce5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00660-of-01024.json.gz": {"num_bytes": 319854892, "checksum": "a997d9187a185a29fb3bbeb1e696d32898efba8f5e9d6ed816493669f0c5ec02"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00661-of-01024.json.gz": {"num_bytes": 317599289, "checksum": "86d9189ebc534c99da5a4407624a623561b159f758fb04373a270887d0b45709"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00662-of-01024.json.gz": {"num_bytes": 318138720, "checksum": "9c626f7aebcc4fc9afd533b6c8a372d884d01f508ce49c01ddd830e4e9e8b2d0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00663-of-01024.json.gz": {"num_bytes": 318110835, "checksum": "441d4dd0d5d2ea7b6098a3fe006b9d7afd526188824a3325d44538fc5655942c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00664-of-01024.json.gz": {"num_bytes": 318996945, "checksum": "08ab0739c3565643b6a83d7091936f5d75a4d8418c956146114aa0315f205dd0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00665-of-01024.json.gz": {"num_bytes": 320612903, "checksum": "1ab7bc2d0f7c6704c97848a9325015f06228339bc52cc1fb593d9c56145e7c48"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00666-of-01024.json.gz": {"num_bytes": 319241006, "checksum": "8b1213325ceb2a2c89dffb891a31317e903d08fff911e4ba1ae66fc3bcce9973"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00667-of-01024.json.gz": {"num_bytes": 319650665, "checksum": "14676f97937eb3d0734e5f121c5f63002ba2d2c62b6c41b4b46d2fcab9ea9614"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00668-of-01024.json.gz": {"num_bytes": 319198651, "checksum": "a406fceed5b7d17ff6d5773679c3df50e747215e39926228ddc9a60c6bf9d152"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00669-of-01024.json.gz": {"num_bytes": 319363200, "checksum": "1d3267d77f43d3d720dcd79c40bc3e8c0cd777d421b1b7d0e69e140199e34552"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00670-of-01024.json.gz": {"num_bytes": 320079826, "checksum": "85111c229b8fcc8428b3c13676bde8268f027fe06e1f576a3adcd82bce1603bb"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00671-of-01024.json.gz": {"num_bytes": 319494773, "checksum": "eeeed8d9f63a5c16ab9d62454fae5bef1896973cfa69cedfcfaac4565a793b27"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00672-of-01024.json.gz": {"num_bytes": 318304853, "checksum": "6793ec3ffbc147c36e471e1c06a664ac2143408c9ee46305694708eee0fb38cb"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00673-of-01024.json.gz": {"num_bytes": 319031236, "checksum": "3c886ff71973805a59312d8d43ee9e616bcfafd76c03a64d53ab548036b1fa90"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00674-of-01024.json.gz": {"num_bytes": 318647345, "checksum": "fd7f4efc0c8af611e7e137680342843d0471ca072421ab3c172a169ba2f5d217"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00675-of-01024.json.gz": {"num_bytes": 318313871, "checksum": "3b797b2ad717749a24866a97acb95aace0dd4e91ee7d51dcf1fdd46a9232b794"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00676-of-01024.json.gz": {"num_bytes": 318858652, "checksum": "2ccdf652fd413dc624643d35a76223e8a44e6241997841ec2d13ae11b56400fe"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00677-of-01024.json.gz": {"num_bytes": 319236091, "checksum": "bbf069c696f09e5467b17ba98479948a85101efa776094084e37581e72c01123"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00678-of-01024.json.gz": {"num_bytes": 318996096, "checksum": "3e3dd21861c713bd38d1803c32da1c0bc2496899648b4cffe1fa2e61b35ca056"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00679-of-01024.json.gz": {"num_bytes": 319915466, "checksum": "6ed56468a31564cb25668ceb5df325ff7138dd231afa85f676ac7af5e81e0642"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00680-of-01024.json.gz": {"num_bytes": 318537417, "checksum": "959ce407e7a892495c477b9e0071dff496fd20db9cfb04dd035ac59dd5b2f309"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00681-of-01024.json.gz": {"num_bytes": 320181225, "checksum": "0aa77d778f24bfdc8566b390a7a1ef1d7880a42b98b3e82e9b37ee3ed821a8e5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00682-of-01024.json.gz": {"num_bytes": 319087756, "checksum": "a4da802570ee7bc27e752069612b633edf226078f48d5f55280f73a6dc934127"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00683-of-01024.json.gz": {"num_bytes": 320019766, "checksum": "587497efb7bcd4ca85ec0559e372ea285c1b95e3889d406f142cfe454d8e0e2f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00684-of-01024.json.gz": {"num_bytes": 318814245, "checksum": "6e904f73976ca18aed3375d1c1b308d749b9a4405a333dd0a2cf85360822e205"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00685-of-01024.json.gz": {"num_bytes": 318586686, "checksum": "c51012772c5bae73821b67f72c035f22a40725d42bcf51e439bbdfcd84393ef2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00686-of-01024.json.gz": {"num_bytes": 319648436, "checksum": "890b7408abd0cc04a84be3a3992d05714dbd30a9d33a8a9b05316a980fe51313"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00687-of-01024.json.gz": {"num_bytes": 318909835, "checksum": "b54b20c21ae9834b630a8aac057d47069cf137577d30b91fd1475f5824b61561"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00688-of-01024.json.gz": {"num_bytes": 319381735, "checksum": "422091d5ba0d44c64bb0c84ab4757318414bc01455a97f53190eddda89c2f3f4"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00689-of-01024.json.gz": {"num_bytes": 318995026, "checksum": "ad5080fbddc914c649027d5e2214f1d75e0cf0617eb3ca0b1fdb8ed9129f99cb"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00690-of-01024.json.gz": {"num_bytes": 320745318, "checksum": "d45492346bb4bf519e657356ecf1805b6b592683b98c20c93da2f07c50b06092"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00691-of-01024.json.gz": {"num_bytes": 318575084, "checksum": "43a07e8a98bc99f381558c938fc83acd4a37d565459c0f3f83aaadda816f66c8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00692-of-01024.json.gz": {"num_bytes": 320651368, "checksum": "21a790ef1dcc9c6ffa071d1a2e21e330d6afcb45368dde9cfae8933c6d029742"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00693-of-01024.json.gz": {"num_bytes": 318429145, "checksum": "85558018ee61e33c4f3e05acc2029e69447a5717be880e9a0aa8fa715dbd0c05"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00694-of-01024.json.gz": {"num_bytes": 319562061, "checksum": "894f4c906a33c644ea80c3a00155ced807a62e1bcd9f6e254cb6c88efeedd142"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00695-of-01024.json.gz": {"num_bytes": 318298964, "checksum": "06eb05f651f1d2fff495c48475894420334070df10c051c7253b7afb0bc38291"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00696-of-01024.json.gz": {"num_bytes": 317473664, "checksum": "59ea4f951335553945a644f7628403ba1a99a27e0d93fcfe5db18cbc3dd48ce9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00697-of-01024.json.gz": {"num_bytes": 318839008, "checksum": "f0203b0f2caa3287b8f7a64288af52bafbf033bcdf31dae54e501e4da47b9935"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00698-of-01024.json.gz": {"num_bytes": 318288032, "checksum": "fe2a581cd174429a81424e407aceb1d81b61d9796d74db4590327778fbd5016b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00699-of-01024.json.gz": {"num_bytes": 318696527, "checksum": "edf3aabcdb28fa2feb532b3bd55cd167c2200a6d8e19f05152be194e48acf87b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00700-of-01024.json.gz": {"num_bytes": 318900366, "checksum": "67d89417d1440afeeefd59a0993e4d12fb5731e917ec7f4e65d9319541b4b9e9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00701-of-01024.json.gz": {"num_bytes": 318901212, "checksum": "64d302459e6871325282fd890d2922cb1fb25b47d677ce793bc065acc8d1bd07"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00702-of-01024.json.gz": {"num_bytes": 318913325, "checksum": "f0bb360189166a0bd717bad85edf06943333b1854687839864aef3ee02814795"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00703-of-01024.json.gz": {"num_bytes": 318730274, "checksum": "c4e027079b9cf9b1adae3e285c5cc5dafeee5c74cf3621c424b6df9801d508f5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00704-of-01024.json.gz": {"num_bytes": 320112232, "checksum": "37540f6a00523cbf429764893aa15aae6a57e53c89cf51d82a815feef02b1210"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00705-of-01024.json.gz": {"num_bytes": 319643559, "checksum": "9dae018569fa4bf33674f67ba03732a2f85cfceb53ec2cbb9457eaea607b8dfa"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00706-of-01024.json.gz": {"num_bytes": 319941519, "checksum": "03926405dc629f0664a3d27c700a4fa2f606496f0b52a9bbf2fd2d75faae2f46"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00707-of-01024.json.gz": {"num_bytes": 317628508, "checksum": "fac92295e4c85f087d27e0a6f231d782be7b2448e99cfc42c09c0e1e20964c3f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00708-of-01024.json.gz": {"num_bytes": 318863059, "checksum": "39d4880d3e47e65ab6351e94b015810d66295a86a9f08534260ccbef41fdaf04"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00709-of-01024.json.gz": {"num_bytes": 318412651, "checksum": "044fc99a1307737bc8d6d8a9b67997010309fc695eda6e8dd42e5b6bab2256d1"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00710-of-01024.json.gz": {"num_bytes": 318631334, "checksum": "0b2c93cf298051864b8660e57182b38408ad738cf930afc09afdde26d952f819"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00711-of-01024.json.gz": {"num_bytes": 320587866, "checksum": "f1f6bb9770b76742d0131495879fa38ed8aebe8a0b38463e7834f0697f174ede"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00712-of-01024.json.gz": {"num_bytes": 318191204, "checksum": "b6873a7d375aa29ff39ca17c3bbc7e328292b1671b59a35e7b01c0e992da90f6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00713-of-01024.json.gz": {"num_bytes": 319472539, "checksum": "3bb12a0a806ecb8a5eeaa00188c655f399460609b8a19005a7141bbcb3a7a694"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00714-of-01024.json.gz": {"num_bytes": 320196397, "checksum": "ca6e1fa6f27c9dbadbbaa767fd21dddee7c84ca96bbb6735640ba2631668ad0e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00715-of-01024.json.gz": {"num_bytes": 320075706, "checksum": "1a773eec7d738c0e1e253bfd4533f0c43c0d133e564c3458159e0c47d767689c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00716-of-01024.json.gz": {"num_bytes": 318736413, "checksum": "c17a6b2115e56cc3d6bbbd94e8565fb14287057f80199528e6cba20adf557bf7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00717-of-01024.json.gz": {"num_bytes": 317351537, "checksum": "cdba391e16c3bcb5569d978a8d11518103e7687714710ef4eba4f7c0821d67d5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00718-of-01024.json.gz": {"num_bytes": 318017965, "checksum": "a25c494e4baead0af0afe6eabaa054bc15f80b6ca0ac8dadb1b354d72ffbe63b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00719-of-01024.json.gz": {"num_bytes": 318124432, "checksum": "94f5dfbec85a8c5b22ff1368a16ec2eb7fb4be25c0c8f004096156ae40bfa2bd"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00720-of-01024.json.gz": {"num_bytes": 318235852, "checksum": "c0248326e698599dcad01eca25d747c138881c61b5636ba765b21f9cd0df996a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00721-of-01024.json.gz": {"num_bytes": 318817834, "checksum": "c11df487a966e748cec522fae4ed76abf3e8cc9bcd28c301117fa52ddb83dc6d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00722-of-01024.json.gz": {"num_bytes": 318553851, "checksum": "63d3d0c3f5dcdff29a0a6ef41e3a9df3fb505c73c8554839e3032293a78bae2e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00723-of-01024.json.gz": {"num_bytes": 320174720, "checksum": "29c97bb8ff301080547255af29bb5019a2c1fbc74f0a2711e626461d5a5f0b54"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00724-of-01024.json.gz": {"num_bytes": 317805413, "checksum": "65f8932f3c77b0fee5f2224643a71ff95246720368fe66d45c22df25ea4b9c2d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00725-of-01024.json.gz": {"num_bytes": 319460597, "checksum": "dc785a8aa3a1f4ed77512d51a9139dfb24b356b5499ae67dd5b860101b1e0e4b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00726-of-01024.json.gz": {"num_bytes": 320934004, "checksum": "45d857536d3535d08cddb6cf50d08d89cc28138a5be082465c3a8c27c02ae2bd"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00727-of-01024.json.gz": {"num_bytes": 318393879, "checksum": "e4a02e43eeabbecb81b971f4201212104b6214078cafd9500d5b5f323595f060"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00728-of-01024.json.gz": {"num_bytes": 318826577, "checksum": "cfaa0d0c8dfb333899c73e0c2aa00dfdadd00e5b4a3d477e7518c4141899c8a7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00729-of-01024.json.gz": {"num_bytes": 320390067, "checksum": "528fe99b0c8dc917ac0f02a555603f9ae81e690b4ce1040f65ebbad3390c0426"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00730-of-01024.json.gz": {"num_bytes": 318156386, "checksum": "786e6913b4417a87cd4cb1882e181d8b2e1eb4b4db5b4b9ad2120b5efdf3e2ba"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00731-of-01024.json.gz": {"num_bytes": 320013543, "checksum": "f28fc2794c280fc1de263b9b2a81e42423f8dac3af7c4fbd3b3aff888821ca9f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00732-of-01024.json.gz": {"num_bytes": 318753697, "checksum": "69491eb25dbaef78235f769422e773de7a2578e678ecde29dcaa663f4ebfa78d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00733-of-01024.json.gz": {"num_bytes": 318640706, "checksum": "dfde8960d738b873bcb75abe1661fcaa096d70c76aef21846b173b8adf049bbc"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00734-of-01024.json.gz": {"num_bytes": 319447398, "checksum": "145add76dcd73916b548e7e3b161757c1bdc1f22a0f127019f24827afd6f85e2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00735-of-01024.json.gz": {"num_bytes": 319868149, "checksum": "dcd4ba95672630f89e75b70dc08cb918bbe896f5d32ffeba7d3e4921b27c1f4d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00736-of-01024.json.gz": {"num_bytes": 318404586, "checksum": "4710b1569342b7aa7ca610d8b8cbb2248a1c5fcd8c6ab3b7f875657dff4779cd"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00737-of-01024.json.gz": {"num_bytes": 319915151, "checksum": "7091dc758fd14c206514663eed0ae446178ff38e76c4cb7e711c63d419506e49"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00738-of-01024.json.gz": {"num_bytes": 319709793, "checksum": "afe1a96ced49662b14bc60b4ff8fc1f610bbc6f3c515bb73f2fade7a0ba67678"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00739-of-01024.json.gz": {"num_bytes": 319789716, "checksum": "9e2332cfc994483d4b913c6556ca9c1698b95e81033b7bbc5a4f5271e5cce708"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00740-of-01024.json.gz": {"num_bytes": 319102226, "checksum": "61ddcc3af919b753638dd46f18f790d7783cdc3090dfddbbeb40faa93bed340e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00741-of-01024.json.gz": {"num_bytes": 318717589, "checksum": "aa3038c23a37561f2ba92e95ffeaa3e3641c1a69f8688b724116edd128e9ba52"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00742-of-01024.json.gz": {"num_bytes": 319456536, "checksum": "ea9d23abfed6e3e8ab900291a3bc1faa27751ff94e35378f8c4eb07207036a9c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00743-of-01024.json.gz": {"num_bytes": 318641730, "checksum": "6efcec6cd087be4eaa98491e463d0fb9c1253aca275971de08c56a20be9aa579"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00744-of-01024.json.gz": {"num_bytes": 320264992, "checksum": "71653351253c8f7fa18673a3f956bddebd158978708c5a4c9e9b5318f598e1f4"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00745-of-01024.json.gz": {"num_bytes": 318665967, "checksum": "347dfd824d6f4afe58c6f418ab5d332909038c880f4dcda7f774d3d7a588c3f3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00746-of-01024.json.gz": {"num_bytes": 320005833, "checksum": "812bc3c082e3a65c8c77fc7767bb435f9be9a999961d84eadc9e0c602e5ce168"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00747-of-01024.json.gz": {"num_bytes": 318575441, "checksum": "a4414d376c69ae8dd5e60b206315cf920d5a797c6ef7c08fe0c4b4e28b4eb4ef"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00748-of-01024.json.gz": {"num_bytes": 319266882, "checksum": "f08aee694b85d5e7120652350bfafaa05495e609aa6d2fb0b913ed8a718d7dcf"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00749-of-01024.json.gz": {"num_bytes": 320205042, "checksum": "b3402b16a5cc817d89a19fd3456a50b5b6d5f3f555eea725167558cc85366d12"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00750-of-01024.json.gz": {"num_bytes": 319198252, "checksum": "6b95232f6d53cff8045bd5ebaa87d6e6c511a74dc646d2a960eb87e801ff4f2a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00751-of-01024.json.gz": {"num_bytes": 317855407, "checksum": "badc9d82efdbc8db5dc328e8aa5e80155c52f00b105b136d8c5c948fe237d61d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00752-of-01024.json.gz": {"num_bytes": 320283992, "checksum": "67c32eb497533d6fd20b206c38483d171275029ff525bba3da13b0c62e1ef073"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00753-of-01024.json.gz": {"num_bytes": 321030653, "checksum": "5e95b1cb54d7d7f12bec1559ababcab0c364a0af99e10a42a08357647ef5d3cc"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00754-of-01024.json.gz": {"num_bytes": 319059779, "checksum": "32cb59ad16dfda8a5b52615498fe2e6d85753fa44ab667af2f525a2467508da5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00755-of-01024.json.gz": {"num_bytes": 317737268, "checksum": "0ad2fef2fe37d59b163e29c2287938a768ee87acc34752394809295d0710c602"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00756-of-01024.json.gz": {"num_bytes": 317293218, "checksum": "db737ceace329fb1f8fe1aca38db048a1dedcb5226a4132485f26afecdc6c3c8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00757-of-01024.json.gz": {"num_bytes": 319529375, "checksum": "8b823e97964894189a13df393e1b3978342fb24bd81f07af6e54b7bfa2992796"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00758-of-01024.json.gz": {"num_bytes": 319297548, "checksum": "3f31d7ad99d88dde757a651b12db909a30cfcae5796fe3f85722598d92344ba5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00759-of-01024.json.gz": {"num_bytes": 318154496, "checksum": "a4b780127d6f22aed49d155e234e21a847a60626143a8e7dc6e31a5f204e79f8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00760-of-01024.json.gz": {"num_bytes": 319386997, "checksum": "020e68dc60004d0661de8a22fe2b9fa7f481fcecaef8fb06efa43093a2a9cc52"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00761-of-01024.json.gz": {"num_bytes": 320035555, "checksum": "8d7b5a97770a062276ca909a3bd20365cbaf3931fcbeb8b7e479f5ee03b47053"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00762-of-01024.json.gz": {"num_bytes": 318099583, "checksum": "b8fcbbf9b55cde2ff66ca046884870e1e5f2d2a729a8eedb253c16fe0d7658e0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00763-of-01024.json.gz": {"num_bytes": 318354409, "checksum": "ce2d9e44161b13f6226cfb9f93ad42fa0edd18eeaee923c8ab31c25aec1fc976"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00764-of-01024.json.gz": {"num_bytes": 319181291, "checksum": "53ed1ef77f24bdd7c189aae0905d63be97f48aa3233fda139e59af53baab242a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00765-of-01024.json.gz": {"num_bytes": 318147738, "checksum": "26b9b9ea2f94b322c03d1b83b25ab4e9a1a203fe9923728c5dd91f22d5f8fef5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00766-of-01024.json.gz": {"num_bytes": 317964368, "checksum": "e59fec52abde3fb4cea58a5a4e511f4cc61e21062bfdd1e3ffd60131a847e0ea"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00767-of-01024.json.gz": {"num_bytes": 318750919, "checksum": "0e5eff983e793a3d7cdd1ec85a45d58e5e6ecf7a12cf83a01888e148ab08acf9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00768-of-01024.json.gz": {"num_bytes": 318978892, "checksum": "171509b0bed8854b6de92fe146993be80ab31e0aa56953c7b0a66eeb738ff70a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00769-of-01024.json.gz": {"num_bytes": 319386097, "checksum": "704e7daa85c0e3ac974d51a6e2cf6df2ee053613fd2b77b5fe16d10b29a50a4c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00770-of-01024.json.gz": {"num_bytes": 319623528, "checksum": "e787064473427fe17ba95d9326d009e9723148fb314a7a9605dcb6698854dad5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00771-of-01024.json.gz": {"num_bytes": 318911381, "checksum": "c54aaffd8162b30280e974e81e9d0669357b74394e0da2d1ca2ce613f5715e4a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00772-of-01024.json.gz": {"num_bytes": 319386949, "checksum": "2f9c83681632482df6c65e4c70718c83f500305ee1d061626cdef35bd794a412"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00773-of-01024.json.gz": {"num_bytes": 319962599, "checksum": "f47c487ba09051c9a4bf320d69db9546e98948e3de68050ae2ba025c71e09146"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00774-of-01024.json.gz": {"num_bytes": 320370991, "checksum": "69a1eacfdb6f6fd49ea2b729a7ab291b96fd5bd42f993e2306d044871b069aa7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00775-of-01024.json.gz": {"num_bytes": 320433220, "checksum": "d35934fb537d1283d40897d05c1486f629776fe9e4ef127694ecfd0221f860c5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00776-of-01024.json.gz": {"num_bytes": 318809986, "checksum": "9079970aa1618b6be51caeab7a2cab26e61c30aa53af361a6184ef6249bf65a1"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00777-of-01024.json.gz": {"num_bytes": 319617796, "checksum": "5e200e354ece1713a32a3e1ebcea33412de814dd5843df3523afa1ec9a4d5275"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00778-of-01024.json.gz": {"num_bytes": 318039278, "checksum": "b79309eb335c0c860c85d2b724df52c3613f61b92ab6cd6276c2be8c25a7b01e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00779-of-01024.json.gz": {"num_bytes": 319078058, "checksum": "fc6053d53255e4d4a4c22c42049ce3eabc224320a51c94c1116f3201f87b377b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00780-of-01024.json.gz": {"num_bytes": 317637428, "checksum": "e38c933003910b02beef64af2d330f32af6e6f3b7346fa121e89045c136c13af"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00781-of-01024.json.gz": {"num_bytes": 318792407, "checksum": "b6795b4db199f7a7a92ef195aee3753e5e00df05fad2d8401b2b9feb56d71a76"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00782-of-01024.json.gz": {"num_bytes": 319081289, "checksum": "dc20640bded03596eeec689f1293be55e72d138cf0c576df9768c7631931ceb9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00783-of-01024.json.gz": {"num_bytes": 318663257, "checksum": "ac2b4ee9ab8f25ec010a17358d2f3f1fb9d8d50c9f4b73357429277710e6564f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00784-of-01024.json.gz": {"num_bytes": 319687102, "checksum": "fb93dee8a974f2ea204c240ed4c24e1b64f91ccb421070be305487e4e53ca083"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00785-of-01024.json.gz": {"num_bytes": 318909034, "checksum": "2f298b358cc619fa72097e3dbd9ac91e7dc3f7c5f9c4f2ff6881c988921d2a6c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00786-of-01024.json.gz": {"num_bytes": 319213094, "checksum": "60ebe35e0f23ccc61fc0eedc891ea9deb43001beb8205d31360a05b5d58e31f0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00787-of-01024.json.gz": {"num_bytes": 318335621, "checksum": "a7b0aa4dafdda2f3dc3c1832b71d4a92af08f99a70a315b4cf9f60c1768bf2c8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00788-of-01024.json.gz": {"num_bytes": 319444037, "checksum": "874dda510a01a2f78e51d917d309bcf1a0f21e7e1ca46661f93931a6200b3d01"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00789-of-01024.json.gz": {"num_bytes": 317955670, "checksum": "ec949a05ec7750dacfdf692c1ba118a33454097fdcaa56626fb042eb93933811"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00790-of-01024.json.gz": {"num_bytes": 319033823, "checksum": "0939164a602d7c7140c619130977b6814639122d0038aff7bb840093def5172d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00791-of-01024.json.gz": {"num_bytes": 319366402, "checksum": "fd6ea942b3402b5da4acb1a03bf59b17df402e90c47dbb66fb198ca2f4b5e1cc"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00792-of-01024.json.gz": {"num_bytes": 319218667, "checksum": "9e8af5aaa6d5ed915eae334c6101948fbcc7bcf6c8c6beaf80fd1adecd67b078"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00793-of-01024.json.gz": {"num_bytes": 318865241, "checksum": "675330d6736a677760d854dcdd9a174eb7c1d426f94e34836a048c2139befac0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00794-of-01024.json.gz": {"num_bytes": 319384084, "checksum": "fd4c2623d9cbaed3fefd6bb88c2d88b58fe8f08e9e8ef0cea6bb22cac68dabd2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00795-of-01024.json.gz": {"num_bytes": 317654308, "checksum": "157533ddb56290662e25cb60842327daec23e377e116496338c9313cbf6991b3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00796-of-01024.json.gz": {"num_bytes": 319298258, "checksum": "fd90f055499095efa9cb848dee62406d25820f929554b0e07674d4c95db574b3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00797-of-01024.json.gz": {"num_bytes": 320048871, "checksum": "e089a95e96a081dd76e38acf9506bfc7b86c682892d3a8774e9784019db39306"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00798-of-01024.json.gz": {"num_bytes": 319291246, "checksum": "e29133ab6f83c84a69752a451053dfe20887ea884e09cc373afd89bba7458664"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00799-of-01024.json.gz": {"num_bytes": 319175282, "checksum": "8f3f3a67946615bdf499d64341d200477280947e5be8538748e28db768115947"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00800-of-01024.json.gz": {"num_bytes": 316687275, "checksum": "c9a17dc92658ce5d062af25e5c8610a7fbae501627cfc7324ace7ca6a8d75d8d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00801-of-01024.json.gz": {"num_bytes": 318710698, "checksum": "4b7d1e130fd8ba536da073069221f68d567492b2bff27d8769fb4ef124cec3a1"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00802-of-01024.json.gz": {"num_bytes": 318914381, "checksum": "9f186b8d08f5d3090b7c9eb8a6954cf3202caec7cbf5c308221333cd115af561"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00803-of-01024.json.gz": {"num_bytes": 319111424, "checksum": "117b0590a976805001a879c49c42db55579e5bb9a5d4db9ce20e42746f59d574"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00804-of-01024.json.gz": {"num_bytes": 318186018, "checksum": "ea376d6cc1043dee9a00e1eca1c431aa59755d8966162701817f9cf274a758c2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00805-of-01024.json.gz": {"num_bytes": 320382848, "checksum": "1e69e7896202206f9f804b2497c4d99cca5c1d139efc782b8ede2cb88f68b48b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00806-of-01024.json.gz": {"num_bytes": 319508172, "checksum": "9da7e230c7abed9beaed9d6090efa8ae1029a418dbbf6d04bb4386aafde3dbce"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00807-of-01024.json.gz": {"num_bytes": 319995091, "checksum": "2e3ba0dbe85c004c6a23b4caf340282e0d0004ab574a14bedc9c83c67cc2c0c9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00808-of-01024.json.gz": {"num_bytes": 319880961, "checksum": "f53fd08fea0f874d727422357521176c6810a54abf4fcc7019357b50f1928daa"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00809-of-01024.json.gz": {"num_bytes": 317100774, "checksum": "dbeed220f330b489cc262fbd7cbe84f04ba8a5118ebbd8f48bc7a4f5f63ae7b8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00810-of-01024.json.gz": {"num_bytes": 319625750, "checksum": "fe5dced88ccd54b258c6740d8988e10b128a869ecf28e7096e689c59fa147d4b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00811-of-01024.json.gz": {"num_bytes": 318375975, "checksum": "e4bcc5571fdc4f51b733d975e78ff02939d3463264a02d7e651271ab91c81df8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00812-of-01024.json.gz": {"num_bytes": 319663092, "checksum": "b1e41c198bc69d026ab997fdeaa4e687f7a8ddfca751add9bc85f00481708a63"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00813-of-01024.json.gz": {"num_bytes": 319094357, "checksum": "c07287aedf6854f581aaf83b75c4939aa4b10181977d4c4be97c20989ab8f992"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00814-of-01024.json.gz": {"num_bytes": 319521327, "checksum": "c96203ba5461ef92a7a2b0d4e598efda943b5b3adf42a7268c26f1c224410c01"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00815-of-01024.json.gz": {"num_bytes": 319098749, "checksum": "72f2e65c5b482be0d9e3a3d8f5cdb703cec7a515e927bc4411e2f6ff5085ed5d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00816-of-01024.json.gz": {"num_bytes": 320377295, "checksum": "df95ac17a25cebb854088cca345f60c2634d07f088e45e251d7f9afdb334c0c7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00817-of-01024.json.gz": {"num_bytes": 319007451, "checksum": "bad1cc25de4f66ff36c69284e6b615f68bdc25e45f08e04e33ee463a0c6ef0b5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00818-of-01024.json.gz": {"num_bytes": 319609737, "checksum": "acf1b390f1c492d97bf027f06898f1dd5cf8cc6def41f4d43b38a0c99f4a85e7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00819-of-01024.json.gz": {"num_bytes": 319164157, "checksum": "3d973eb401876c57e9cd1420fc938da9dd7b08f97d4596c66a8c159e2b56b1b3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00820-of-01024.json.gz": {"num_bytes": 320181073, "checksum": "101d5f0079caa840b934c14800ba5cbb7fca22e9e6915b98b4dc5f37c57f5b4d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00821-of-01024.json.gz": {"num_bytes": 320949305, "checksum": "34ba423c93c4262234e6e2005aba0436daa99b05570cff0a58e9d27b65d76896"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00822-of-01024.json.gz": {"num_bytes": 318392521, "checksum": "4a586e220fe34f544dd068f4e1c310459cabd5dbea9a991c21c09f70079eb4c9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00823-of-01024.json.gz": {"num_bytes": 318526893, "checksum": "3b10a8e32a3a8f6541400d697516fcd3fffba3554e8d8a96451f01fc6b729d8b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00824-of-01024.json.gz": {"num_bytes": 318640792, "checksum": "c921270db8004d309f91e3209340c476191793d47b3cfa9d19fdc602d43dfe65"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00825-of-01024.json.gz": {"num_bytes": 319524026, "checksum": "a6eb347db464976ba5d1aaa4fa64e103ba36520dd1e9c103644caf187be471a5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00826-of-01024.json.gz": {"num_bytes": 318469810, "checksum": "dc5f88e6161ac06165f3cd4cb91a00cdff75d2f900e8f53d62bacfd833e352b0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00827-of-01024.json.gz": {"num_bytes": 319391185, "checksum": "66a240be851d6622adf7801d9634a456e83e9edfd135601c0dc1aab48902d7cf"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00828-of-01024.json.gz": {"num_bytes": 319625277, "checksum": "2e989beeeb2a63bfb87a5a401619a8e4155a961b44441cb5f627c29f25962dd4"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00829-of-01024.json.gz": {"num_bytes": 320001237, "checksum": "0653e4052fb7a4ef503bdfbbee332d650492e99c130a85c04250e18d91cfd30c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00830-of-01024.json.gz": {"num_bytes": 319240468, "checksum": "bd56e55e75a8237b5292fa65e5ecb0dfbabef6ef0dec6695b13522803210f40c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00831-of-01024.json.gz": {"num_bytes": 319174603, "checksum": "ca9d6c643127a390823655256a45462ee6e75aa2485141f6530a3bdf6ce4f572"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00832-of-01024.json.gz": {"num_bytes": 318909883, "checksum": "e91c35d94e183515e660cd8c874c12bbf22e1fd683312446f02287b0d032fb68"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00833-of-01024.json.gz": {"num_bytes": 319095835, "checksum": "971d9a4f8bfce564d42dc0a80009acfa7d2f47557ac19836ab426defe1877714"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00834-of-01024.json.gz": {"num_bytes": 318319786, "checksum": "159412a58fb8deb59e039fa0102bdb746065cbc6b4d1d3da892930fbf8b0f178"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00835-of-01024.json.gz": {"num_bytes": 319959334, "checksum": "814518d53b3023e3b8ac22dad9d65dd50d455a4c7db1490022f447f793f4d24f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00836-of-01024.json.gz": {"num_bytes": 317642779, "checksum": "19ad4fbaa3ff5c638b77980300b8c162c21a8237b87d054a30c46aee67d0ad94"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00837-of-01024.json.gz": {"num_bytes": 320687986, "checksum": "190de7948a4b163047ecdfc856e5f78bbff52ca883edfad26b32fbc0b57ffe36"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00838-of-01024.json.gz": {"num_bytes": 319802866, "checksum": "ccb4d342791a187f3bde225e008ff8cf70465f7fd3eacaa8bbce1ec4e52c2622"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00839-of-01024.json.gz": {"num_bytes": 318621894, "checksum": "3ff5cf5b33996a663df5783f3f41a5b5b2f6e08a2cf91e74cad3bf82291192fa"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00840-of-01024.json.gz": {"num_bytes": 319757379, "checksum": "8292e0854c01ca79ef03dcc1752ddc1f0df747ad67551b7c0fa5208b6aa3f822"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00841-of-01024.json.gz": {"num_bytes": 318779722, "checksum": "9eee9e089bd396adf5a276eddca9f6352e07f8c33877f85c1f65968aa0c06128"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00842-of-01024.json.gz": {"num_bytes": 318692591, "checksum": "caf3f40a144b43af08687e41a1eb7d08da1b78cd1600574566e11f29fde9cd34"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00843-of-01024.json.gz": {"num_bytes": 318944616, "checksum": "e74d624534091173546755ca236e5912cc8acf8cfef5f9c197b541ebe76f0818"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00844-of-01024.json.gz": {"num_bytes": 319392887, "checksum": "e47d3f44f996398b54f18729f4e81d88d04b19bc529847e86277a6a91ae74e6c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00845-of-01024.json.gz": {"num_bytes": 319215311, "checksum": "de7cffe64f422b02668137272943537946c15539954b564345d6722c4eb06345"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00846-of-01024.json.gz": {"num_bytes": 318129297, "checksum": "1d5ea0ab8fcb3975735aa421d646cea4544087f60a79ec209b63c93b6318523f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00847-of-01024.json.gz": {"num_bytes": 318134095, "checksum": "6fa4c50808df2aa8efebae3bbf832ba2b0be2f7113633fef720cffb3c50143a0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00848-of-01024.json.gz": {"num_bytes": 318521356, "checksum": "3aeb657aa448af82551c653802c669c985c00b7daa593de07f80733ae5dee84d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00849-of-01024.json.gz": {"num_bytes": 319541694, "checksum": "1cc016f58a4a2c54625214f028df05247ed319b8c1868c96c2efe8147a73d08a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00850-of-01024.json.gz": {"num_bytes": 318861613, "checksum": "eb5fbe6eeb4b0281604df264a5b04a3a0db96ff0d04f252375a788a0d3345c67"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00851-of-01024.json.gz": {"num_bytes": 319356648, "checksum": "ffe1397f1d412979cc66820555ef27345f3a2a48b8bcfe682d48301135e8c12a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00852-of-01024.json.gz": {"num_bytes": 319662372, "checksum": "fa78ed98d602276520e823e17adc7f796320d95e27e08d84d06e66e415b79161"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00853-of-01024.json.gz": {"num_bytes": 317625507, "checksum": "b10cff62fac5191b9cb5e2025227adb838088773e79bfec0937a34bb857e1b1f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00854-of-01024.json.gz": {"num_bytes": 319665550, "checksum": "15441b2a7c09a477389a8fbd7401c549dc8281f2bd44251b1546077301e24624"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00855-of-01024.json.gz": {"num_bytes": 319059897, "checksum": "f6127845b162181dd7157dd316021a4e6b5d41393c66d3e577491cdb74657f2e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00856-of-01024.json.gz": {"num_bytes": 319243991, "checksum": "ec9f0884c5ddf82550105f969222d3ee8b0d4907a0a2540ea6c8c67c2d2e9179"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00857-of-01024.json.gz": {"num_bytes": 318546680, "checksum": "840205fa73336ff51d75008ce8c530164ebcef3b50f1ad8deab879a67acf8d5e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00858-of-01024.json.gz": {"num_bytes": 318306547, "checksum": "e9b3819e9dc98d66a61f8f4e8f6ecb03099c79ae87a175fe1ae484174b173b44"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00859-of-01024.json.gz": {"num_bytes": 319088302, "checksum": "eced8de72f8755fa0dfb690c626cefcacf5fbbce97029d4589058913c31b9339"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00860-of-01024.json.gz": {"num_bytes": 319704792, "checksum": "90a169718609f16abe120c4b63a20adc0bbedba51de14b004d34dabe530339f0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00861-of-01024.json.gz": {"num_bytes": 318444445, "checksum": "d020840f09fa426ee15d19f05e5afd9cf674048e0dc4438dae0b6f02c7227d9f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00862-of-01024.json.gz": {"num_bytes": 318606300, "checksum": "e02bf9d3f1a398972f7d78b9b1aaff9a92146554a1358ea1b16ce7873a9f8fd8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00863-of-01024.json.gz": {"num_bytes": 319273730, "checksum": "c977f143cbb5e61160ce76f1cabf7bea6c158abb7e159ec3362aad1cc7af0ade"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00864-of-01024.json.gz": {"num_bytes": 318143165, "checksum": "bdf20dbde61f0663feb70be419c39c60acdc7ecbbe1430d47bf79ae2e114f168"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00865-of-01024.json.gz": {"num_bytes": 319041356, "checksum": "11c9c068ec5c1b612494c1473b7cace67a55ee66155559b19035df180ee260a1"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00866-of-01024.json.gz": {"num_bytes": 319758401, "checksum": "ab4436f283af0ef2d33b93cf026907cf68255beee9d9dc1d6c542dee9c3f48a3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00867-of-01024.json.gz": {"num_bytes": 318991336, "checksum": "56beb5edbca3b66981f5f8e65f2a13a0f6e99e68ff50cc263cc529a4d8ebf371"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00868-of-01024.json.gz": {"num_bytes": 319984390, "checksum": "b9368d2ae0eff869c70c1a1214126c1d084f56887102d3d46e450b2c934102be"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00869-of-01024.json.gz": {"num_bytes": 319462888, "checksum": "68ab404e0ca2247686eb264a0d7feeb9d2460162434f5babb2b1da82d865343e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00870-of-01024.json.gz": {"num_bytes": 318426018, "checksum": "2d60208a558f6ba92d6c6307e1ab626acd7ff3b7bc25963b09e87e464751c42b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00871-of-01024.json.gz": {"num_bytes": 320233396, "checksum": "ee2517922079c713605dafffe6bc0db0a947abf64ff92c409aa1015b92cdb099"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00872-of-01024.json.gz": {"num_bytes": 319570251, "checksum": "83ca4f125bd628cb28210fb874db717635009e36c60b42237bda48fcb611a53f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00873-of-01024.json.gz": {"num_bytes": 318755978, "checksum": "d94ce49fd17da5f70d1a89bc9e5323daa54f0b8417e1ee5d991467c80c068ec7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00874-of-01024.json.gz": {"num_bytes": 318986904, "checksum": "f634915d1b529d9d728fd96993bb151dc07016767cd44ceeedddec73eaf37074"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00875-of-01024.json.gz": {"num_bytes": 319116193, "checksum": "6367b1216e1c6ab18af66471d866f39caeb9a538209134a9e6bbbcb81bc51db7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00876-of-01024.json.gz": {"num_bytes": 320829257, "checksum": "c9ad4ab8c6e5995aaacd72ebc6654b43b4756804bf3cea808610f9b618f98fac"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00877-of-01024.json.gz": {"num_bytes": 320082625, "checksum": "835ae7d54732c309bc9aff231268474af66653b06ad6ca17b54dab6f4a7d30c5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00878-of-01024.json.gz": {"num_bytes": 318964554, "checksum": "49c761449d5052dd6c408268c77196bffc5125eb5189390f73ba0ce8550f0175"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00879-of-01024.json.gz": {"num_bytes": 318699617, "checksum": "521e1c5fa967a6f29641e7c4c2b210acda0736b32f318e24aef0e587895ed492"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00880-of-01024.json.gz": {"num_bytes": 318723630, "checksum": "dee1814b24f9bbc3aa3430cd80302b08b863eb1b92698158960b6be216845843"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00881-of-01024.json.gz": {"num_bytes": 319839271, "checksum": "9e57ea6a0e3d8a7798a0cb3e6344e1711e8fd879e2e396294718ff360fc7c4df"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00882-of-01024.json.gz": {"num_bytes": 317773196, "checksum": "2e5e5749618e53668222c7d310929e2177772dd7c14592e61dc86f163e353c8a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00883-of-01024.json.gz": {"num_bytes": 320262049, "checksum": "f80afaa4495a2d41ad4d7380b79040569179b24ef5c2df17f75ce8e135d786b1"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00884-of-01024.json.gz": {"num_bytes": 319146213, "checksum": "77338479b420dab9316a4737fc243de84b5e88392cbbb46fa0619045a42432cc"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00885-of-01024.json.gz": {"num_bytes": 319022605, "checksum": "3a67fee2fb77e64aa13fd595d7786b432203f36712ff723ec5999a341834b38c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00886-of-01024.json.gz": {"num_bytes": 318624429, "checksum": "2afe387f2500c57294acf1403a8c27f27f6c7c2d228dee0f1ed70a02c438f838"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00887-of-01024.json.gz": {"num_bytes": 318733911, "checksum": "3fe087b3441f74730ab137ba9486650cfedfe2d724573c3d166565d7d1e40938"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00888-of-01024.json.gz": {"num_bytes": 319926754, "checksum": "dd2df1977458cac34ef1e52059bbc28738e541761d7ad11c0ffc8ef3ca061190"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00889-of-01024.json.gz": {"num_bytes": 319085344, "checksum": "4172244cc3fc4a4e9e09f04f8097cbc678aebaedb9d1fb97b1daae16b0b8ef45"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00890-of-01024.json.gz": {"num_bytes": 319838671, "checksum": "8ffaf34eb8209e7ec250303298f9eebd2833fedcf80414c20331e8dbed42251c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00891-of-01024.json.gz": {"num_bytes": 318169092, "checksum": "daaf74ba5d12a7415da94be0f4454336aa3d86ad5cd300dbe30cef596835ac8e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00892-of-01024.json.gz": {"num_bytes": 319662776, "checksum": "6d99c0419a6c9633620fb0aa7b7610cc5d06696e839a1a52953fd7db7a18e053"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00893-of-01024.json.gz": {"num_bytes": 319541919, "checksum": "5f246aeacef0dc8d40a036bb1eeecf278f66d7215a134fb746d30f3420d18c18"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00894-of-01024.json.gz": {"num_bytes": 319528897, "checksum": "9975fd5d23d25938f00de3fc9240d77c27b4784c2f443b1914652a06d3b59fcf"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00895-of-01024.json.gz": {"num_bytes": 317548307, "checksum": "7af9e2abfaebd4afe05a0e28d3e6e3126800a8b9b7ad49de360e42f2eb2c8506"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00896-of-01024.json.gz": {"num_bytes": 320278601, "checksum": "1941689d6a0e449423faad6e41714f33d5b23cdb1bb73961a888a87678fc74b0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00897-of-01024.json.gz": {"num_bytes": 320161831, "checksum": "3d951cb1ae4a9b3c6ff70555139435febda83d24bb04ea27b229a05424b470c2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00898-of-01024.json.gz": {"num_bytes": 319341305, "checksum": "3227b97aa9ff57b62be2a26fd8131e9ea45f7731673acb43432e529ea4978a25"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00899-of-01024.json.gz": {"num_bytes": 319658969, "checksum": "c746f8bd5fffac933640ff39db0b9d7b022edb28d7a4b3237d8c69fd919b7b48"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00900-of-01024.json.gz": {"num_bytes": 317494627, "checksum": "0327f0c57a668b2b34e72f4c53d4cfaeed787d879843d0bba27b5be58d1ee5fe"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00901-of-01024.json.gz": {"num_bytes": 319683481, "checksum": "886449092779ee26fccd11e0c89c36e449346dc6b1f0a7cb15b6b53c897790a3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00902-of-01024.json.gz": {"num_bytes": 320228529, "checksum": "6960d8539df78e98858ba8cebb2e637b6c2ef20890b5f2af1cbf4621b52c364e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00903-of-01024.json.gz": {"num_bytes": 318961279, "checksum": "4ddb3c9e9276d220f1d4dfc32bb61a090e895e9e3c9f53c169db99a024e7cd95"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00904-of-01024.json.gz": {"num_bytes": 319926290, "checksum": "69a941cbbcb673efdb254c162854fcfff6fe1132182210235b91d1d21ed4d2ed"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00905-of-01024.json.gz": {"num_bytes": 317982280, "checksum": "1d9613f366b91102d018e57894df520aaf1910aa98e06cf369d9676e498610c5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00906-of-01024.json.gz": {"num_bytes": 319012210, "checksum": "4855989c814582f5cc0a5e9b8f9d1f642ae33de81625d4bbafaafb709c1cd260"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00907-of-01024.json.gz": {"num_bytes": 318515420, "checksum": "8f34dbaa454215922a29fea975357e4e705381a65e4dcaf8b0d8c200f9a277bd"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00908-of-01024.json.gz": {"num_bytes": 319286320, "checksum": "536bf0610a2c14d1d59aea0b52fdc29cec19cd7eaa4c3a5e5fec04dee103b29e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00909-of-01024.json.gz": {"num_bytes": 319938295, "checksum": "3bb3943183f579c15d0d30440f6c82d0c9c64d6ded398dfc7c67502d73868781"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00910-of-01024.json.gz": {"num_bytes": 318423425, "checksum": "adbdcf170531c725b54c1e5713676b789589b2fb77310f3e64a0cc30b83602ee"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00911-of-01024.json.gz": {"num_bytes": 319578185, "checksum": "a1342a95ce77013820c36e7d038ed47ca4d40cdf3584a66abc310132435b25fd"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00912-of-01024.json.gz": {"num_bytes": 319154715, "checksum": "4973afcb1d7b4816e3a3df1b9ce1e48a0eea4fe8ead5f83ea753e46a934e5ddc"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00913-of-01024.json.gz": {"num_bytes": 319011218, "checksum": "c9a158f69a123859569e1cdd475355afda32d7e5c48001591f0b6c20dc17d572"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00914-of-01024.json.gz": {"num_bytes": 320027387, "checksum": "61f6c0f839908e7d3105a6926c501bcacd293d1ba50c3b8639ee227c9a8270b1"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00915-of-01024.json.gz": {"num_bytes": 320280632, "checksum": "a74fb91d8f7d79b09017a7f996b6ca5d59e4ecad9fec354ac977c0076d53fc66"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00916-of-01024.json.gz": {"num_bytes": 319278877, "checksum": "cbbb8dc274fabb4435db5fef5da1d91671e1a4c7f3f652742324f9632b01c5dd"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00917-of-01024.json.gz": {"num_bytes": 319616831, "checksum": "31e62cbd6209fb7831078e4a262d1b25c0590f9425c62b2b208d4030ed5722d4"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00918-of-01024.json.gz": {"num_bytes": 318635363, "checksum": "95e5c2f51abc9ef4c0422e91b77f79ff83c8cc38e585df621fbc0dfef48a84c7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00919-of-01024.json.gz": {"num_bytes": 318885096, "checksum": "ea5960d4fbc7d5e7097edbf2c9c706e6b7c7e9d3e36633be9bd68c4038955f10"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00920-of-01024.json.gz": {"num_bytes": 319228627, "checksum": "73b721ae576dcfa83bd963e49530f73d76b788a669e3abc1c02189900c80cf02"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00921-of-01024.json.gz": {"num_bytes": 319557114, "checksum": "710c65cd504e87b5019c01f658e669d1e023473d879913a9522760d33546cf24"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00922-of-01024.json.gz": {"num_bytes": 319356053, "checksum": "f0b54b3c6b51a356debc9414df0438ee525ae5114cbb7c8176634b7493095022"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00923-of-01024.json.gz": {"num_bytes": 319766600, "checksum": "d5b80091c8113c283d91ff5826b46068b96c423c0dc74a646e2c8d1c5d815cea"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00924-of-01024.json.gz": {"num_bytes": 319733540, "checksum": "56a54c7d4114c21c1657df0d295839c2bd4904cd1b651104e2a155c2bf1b5aca"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00925-of-01024.json.gz": {"num_bytes": 318944357, "checksum": "4d396c29cd1d9ba16016fac37c333c0a872f6cb0e9faae7966e53f6e5c879d67"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00926-of-01024.json.gz": {"num_bytes": 320276135, "checksum": "39a64c261a76d5e13f187f12c886b22e2db08fba968bc9d0c1cb0d3c241abda7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00927-of-01024.json.gz": {"num_bytes": 319181837, "checksum": "86db529dd52fb67173588fcbc9f0e52c99ad6dd34e44865150bc6c962de5b3c1"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00928-of-01024.json.gz": {"num_bytes": 318966114, "checksum": "d232df8033ddaa7397dbcfa8ba4ded9421ee9bfc091c725b311fd963b29f13eb"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00929-of-01024.json.gz": {"num_bytes": 320087917, "checksum": "fca6bfe8fe17c867681c58df081f2186dcc6bf22e46ce3783f85b918644c0b6a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00930-of-01024.json.gz": {"num_bytes": 318921677, "checksum": "b8031359e758cd835c44e81303e04ef7b2137d2e1a9472d7e04552c353d883c7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00931-of-01024.json.gz": {"num_bytes": 318978028, "checksum": "bb5f2ea8a2e56c69813bdc08cb243c0763126e7b5f6c5cb57e7f4767d2126f89"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00932-of-01024.json.gz": {"num_bytes": 318627424, "checksum": "f6fd2065ce202d5347243a2b396707bb606be20c1829989bd7dff6d9fb7adec9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00933-of-01024.json.gz": {"num_bytes": 320226802, "checksum": "b303d2ece81c1f7b882703b915765212796518010aea6a108a441dd0a84a6128"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00934-of-01024.json.gz": {"num_bytes": 319908526, "checksum": "e5b05714922d132073122e83933853f52f0046c9f51f985cfbdbd310e8d677de"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00935-of-01024.json.gz": {"num_bytes": 318941663, "checksum": "4296055a31409a778c516afe25a8108f23dfffaf13cac33e5ed834a37c46b37c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00936-of-01024.json.gz": {"num_bytes": 318430860, "checksum": "4634630c012ed184b264ea01c97f7bb3f1af030f2466f1d99d20bb0472f74511"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00937-of-01024.json.gz": {"num_bytes": 318008229, "checksum": "131cc9a2fef4ebe81749f1844b7c4b194b97de7db4f5253ce59207e68d8b4df8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00938-of-01024.json.gz": {"num_bytes": 319099506, "checksum": "fff55e3b2ff8b53e56ab99def626a7334ce67d2414351b2e83d84298052dd9b6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00939-of-01024.json.gz": {"num_bytes": 320457851, "checksum": "8431e38c86516ed88d5c028f4a1dad32b02bcccdc03f9687d18f8312e493bcb7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00940-of-01024.json.gz": {"num_bytes": 320607829, "checksum": "a68c577555781adc777c09c68f623431469d67e9b66af7b0813f09a512b7d777"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00941-of-01024.json.gz": {"num_bytes": 318923471, "checksum": "807ffde4034b6b95a5eacb71f093686586ca11e417517894cca99dfe7b12563d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00942-of-01024.json.gz": {"num_bytes": 319880902, "checksum": "d03d04f619a8f3afbefa6d67986f50d5ee264c45de36c0ba67b069e343e002ad"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00943-of-01024.json.gz": {"num_bytes": 319079341, "checksum": "e482c4dee03a34a1a5756e6def26134c9a3f18ee386f5569d6cbf16d3875a429"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00944-of-01024.json.gz": {"num_bytes": 319436318, "checksum": "6241f9f35640598c05bc5cd00d8cc024dde59c0065c8935da229a8a583de32fd"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00945-of-01024.json.gz": {"num_bytes": 318998098, "checksum": "85f192c1ee9734da0f1dcad31c2b8111076977582e139ecc1ba959bf2df6b262"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00946-of-01024.json.gz": {"num_bytes": 321951470, "checksum": "44bccedf6a8db115bb6563d6775ff03c67511ce4e23a2de77e79edcb568c9fa1"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00947-of-01024.json.gz": {"num_bytes": 318689631, "checksum": "36f0bfa191ad7d51452d51249c724150f8c3774142df3720f176f2772f42f3fc"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00948-of-01024.json.gz": {"num_bytes": 320347661, "checksum": "f4a7afa90b6d81a4cdc99100b75b4d3174c4d5d670042766c3e0418b7a97ef80"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00949-of-01024.json.gz": {"num_bytes": 318054841, "checksum": "f39d0c9bfc0a562ede67b8cfc57e6974a8a999e2bbc1b6940f107169b4f06e4a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00950-of-01024.json.gz": {"num_bytes": 319722042, "checksum": "bf376260e5a838b3b901ceb22f922829619be710718446ee95c24400cbc73495"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00951-of-01024.json.gz": {"num_bytes": 318315382, "checksum": "987cd895f63bb74c9d4ce229ee853c7bce53c75c324366a0d06377c36030e39f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00952-of-01024.json.gz": {"num_bytes": 319247792, "checksum": "d218dda02748a22821c2ecccf1cbb136dc8772a25ddfacc7ab354fc089470e87"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00953-of-01024.json.gz": {"num_bytes": 318411551, "checksum": "698768f3d7959b33fa74a3827e995b0c184bb3b4c46eba667d7dc3365fdd07f3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00954-of-01024.json.gz": {"num_bytes": 318809810, "checksum": "651d9ff43d5a3f7f5945ccf26b9410018248bf64956f3485c50b0df9034fb2ee"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00955-of-01024.json.gz": {"num_bytes": 319761211, "checksum": "29fa5c68fb8d3719e5f5f17568ce888522de64499554b5f0f4dafafb4ee5b40b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00956-of-01024.json.gz": {"num_bytes": 319255736, "checksum": "333a90a9c13f71e41a7cdd4784684bc142c79ef99155b9d62d062db318798b93"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00957-of-01024.json.gz": {"num_bytes": 319504417, "checksum": "730c90615fca09c81d9644cfae40d325851bb9bbc1af696caaadd67d8282ab5b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00958-of-01024.json.gz": {"num_bytes": 319066016, "checksum": "bb565af6529720ba2a3e989769b33d978ef49cb2aae49c60f2ff98a981414280"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00959-of-01024.json.gz": {"num_bytes": 319887940, "checksum": "8992783693dd0ad5ce07427f6b5739c818f13952d90bb61312ec98f9c813f313"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00960-of-01024.json.gz": {"num_bytes": 318051437, "checksum": "4773edbc822ff8d51ec13af6c371214aea7545047d9babeeac0b29180d52fa0b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00961-of-01024.json.gz": {"num_bytes": 318373291, "checksum": "ff33854746566f7d3b4ba9eadd1329ece48c034345fda000d9af73cb26d197af"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00962-of-01024.json.gz": {"num_bytes": 318572513, "checksum": "a6d07f7caf55fda0df74a22b454d196fb2e29312d433bc5506b00448c22b579c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00963-of-01024.json.gz": {"num_bytes": 319488084, "checksum": "453f666c6578376508b1fe8bd3fb8ea5bf030aca5cfedf383cd23b27de15228f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00964-of-01024.json.gz": {"num_bytes": 318905670, "checksum": "74f64ed6583e6a4df4b3c3f8a76263a2d63905d51d5680d9683d86f5039d5b56"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00965-of-01024.json.gz": {"num_bytes": 319452844, "checksum": "88016c1a0663b89dc3d76689c827c82a6d128401ae05f7b70c8727d75302cd47"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00966-of-01024.json.gz": {"num_bytes": 319334588, "checksum": "dd9300bdc27513dd62578e1cf3c8302647b49c61185c282a684011d788c43d17"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00967-of-01024.json.gz": {"num_bytes": 317872396, "checksum": "90747ee63ac7d8176fde1f2afce8deb7e39bf19e682e17d0fcc1711d09d5f1d8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00968-of-01024.json.gz": {"num_bytes": 318988069, "checksum": "2cc785d650013d35d5d31b1e85c5530b197687c69117881362bf6b98f47c22fa"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00969-of-01024.json.gz": {"num_bytes": 318324244, "checksum": "83750d93c788ad32a256862b8173db3549eedf52ac131f09f662f1fe0f46bd13"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00970-of-01024.json.gz": {"num_bytes": 319494164, "checksum": "e0e46e185851ec569dc13a18519988ad926bdcd9bf448eff00aebf6df141f5cf"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00971-of-01024.json.gz": {"num_bytes": 318714665, "checksum": "941c9bf116353230417950d292c38b12b00935184162227eaec01870ab7f4510"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00972-of-01024.json.gz": {"num_bytes": 319518275, "checksum": "de30e19a155a6f4303afb0311416aa84cc3baf5a09cef55b8e2adc2a4f478f6e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00973-of-01024.json.gz": {"num_bytes": 318092574, "checksum": "f70bf6727f1f308d93684ca41e9c2c68dfbd737a90da6375b58f162e8470fdea"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00974-of-01024.json.gz": {"num_bytes": 318555677, "checksum": "109fe184ac9498ac571cd9c6cb38ae5ed566b0e98e8b7718984656a70cc6b224"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00975-of-01024.json.gz": {"num_bytes": 319045215, "checksum": "03c4257851857450f7397ac3d627a60ffc98708ad5aac6e1f73e6ce818fe7be8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00976-of-01024.json.gz": {"num_bytes": 319172031, "checksum": "7d98fa662aa9d0ff7ed50cc72195bdda2147212b34a3d22f0f757a4eb158d5b7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00977-of-01024.json.gz": {"num_bytes": 318650530, "checksum": "bb8ccc07ecc6fd39ae97136418efc543efe5541e85910a7f333ee5cebaa3b595"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00978-of-01024.json.gz": {"num_bytes": 318609909, "checksum": "40b49f3fbb2fce73bb1851304b290fc7fb400d13c2448ac7e5e559dccfda7ce5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00979-of-01024.json.gz": {"num_bytes": 318881197, "checksum": "b29f96cfba574428cb66f54b20c4a848bc83438256167afdaed576a3931117a0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00980-of-01024.json.gz": {"num_bytes": 318506081, "checksum": "a15996adaaf41e5615cb5c7fa2ef1b4e3003836542d0851d1c6907522f534fee"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00981-of-01024.json.gz": {"num_bytes": 320000305, "checksum": "38e282b433c4e3dcc9fc2b056f6ddbe4eb857c5137f7c51301d53ca259d6bdc2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00982-of-01024.json.gz": {"num_bytes": 319959158, "checksum": "97d5e58088a87a15b71db975d5e09b69daf497b7dff3ef809e1b8292caa27905"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00983-of-01024.json.gz": {"num_bytes": 318921242, "checksum": "f062e04f89132576ac1969fdaa43db761a0ff7e4269a6f173d87fa011a4c289b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00984-of-01024.json.gz": {"num_bytes": 319577980, "checksum": "e52a6c08d5243717f21120b4c3ebc8fcf77168928945adf68bc665392a6e8d11"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00985-of-01024.json.gz": {"num_bytes": 319812101, "checksum": "8b4f5645ae0e0b190af4ca5335c57735ae919d3c6402438af506c7907f1d1494"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00986-of-01024.json.gz": {"num_bytes": 319582409, "checksum": "3654109968d918aa4d8db17cb7057111c42894cfc7eee093df13036cfb3ac6fa"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00987-of-01024.json.gz": {"num_bytes": 319957581, "checksum": "4b9e6febb461940b993c50945a2ed06736c6786aa8f758565ff545814ebfddcd"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00988-of-01024.json.gz": {"num_bytes": 320346479, "checksum": "2891565dd75fd4354777b4f4f393983180584ee9c64b5d9b4557dbf26a3c4cfd"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00989-of-01024.json.gz": {"num_bytes": 318546717, "checksum": "929d0236c9fb77d638e0a18aa97b00004316bbb0ef3c4323e39f61aaf7c0af53"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00990-of-01024.json.gz": {"num_bytes": 319606761, "checksum": "6ebd2552ecdcce7b194d4f6d5b5e66ede9d65da4e4999ee8ec4705d847e473ac"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00991-of-01024.json.gz": {"num_bytes": 319117521, "checksum": "1b3496964d0a895b347529ddb7b712d211c9419317fb41cdd6e20bba43f39f05"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00992-of-01024.json.gz": {"num_bytes": 317781551, "checksum": "9f9cfb5f9152b9a60121b03c24d944129c1ee43e862112fe3896e2772fef99a2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00993-of-01024.json.gz": {"num_bytes": 319341839, "checksum": "fb329b7470ae127efe1be4adc960b06eec4f55bbcbe1f3f0f0b794d70a8aca14"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00994-of-01024.json.gz": {"num_bytes": 320357337, "checksum": "bbe9a60c3c2b3b5b11a5d531d1d85f0a90ebe3dbc79189b3825e169ae302932f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00995-of-01024.json.gz": {"num_bytes": 317824612, "checksum": "26643091ae3425b63036453ffca7ed82c85c24b6a24264197e6516b68a39a4c4"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00996-of-01024.json.gz": {"num_bytes": 320453890, "checksum": "db33809437e62bf1f086f40e4d66ad0133db7c7d406b2ce52ce5d9c9b0809961"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00997-of-01024.json.gz": {"num_bytes": 319469732, "checksum": "3447b74f09dc4d63dd04d6bbd4382147071504338e6ea428b37c3a5174877537"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00998-of-01024.json.gz": {"num_bytes": 319562604, "checksum": "270a1c19e6321541398836d3d982c2e396db99abf94317912714251d1f68e8ac"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.00999-of-01024.json.gz": {"num_bytes": 318895764, "checksum": "d68f8f4d85d91679c20e972b2b1955d41a8f6601873bb311a2621f4b3f3152a2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.01000-of-01024.json.gz": {"num_bytes": 317697031, "checksum": "68b47464ca3e97e9d3f4075b656f804c1bab667f231701db9cce1f0b0a921088"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.01001-of-01024.json.gz": {"num_bytes": 318915840, "checksum": "582216879b058ccd4d0ca2edccaa2db49b64459371f8798a1d9c66c06a0cf908"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.01002-of-01024.json.gz": {"num_bytes": 317811256, "checksum": "6864299a7d0174f92abc696dc293524291623891b86cd69132348fdf78760a4e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.01003-of-01024.json.gz": {"num_bytes": 318605529, "checksum": "4ef35b7546266f99eae5f332cbe3e284801c5d7b39f840297d67e71c036edf62"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.01004-of-01024.json.gz": {"num_bytes": 319379897, "checksum": "040dfa80eaf8355370d8a50692bc3ad03a1d57272af340d70031a4398f37b9ee"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.01005-of-01024.json.gz": {"num_bytes": 319515177, "checksum": "012ac70ef2715181ec1fb578a2366d68e786d3a9ea41c59c08d7c494b89b429c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.01006-of-01024.json.gz": {"num_bytes": 320078217, "checksum": "46030d85d8333ae224320fa54e487f3770de7de280cd0001344136b0bd87c431"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.01007-of-01024.json.gz": {"num_bytes": 318526753, "checksum": "dd432d865ef3dba4b5af30e42b11ace96900bd7b97af053ea892292e75bd142c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.01008-of-01024.json.gz": {"num_bytes": 319407137, "checksum": "165cd3a688be6f9f5a4cedde198a9dda4f9d3dbc1d275d1e99411f3ee96a0d62"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.01009-of-01024.json.gz": {"num_bytes": 319763066, "checksum": "e44e86d497f8471e53531374b0e6ee61aac54996b6af64a4af0f5620673f9f7d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.01010-of-01024.json.gz": {"num_bytes": 318653930, "checksum": "61115f16e718d3a2b66574cc17841aa5d02739762138abe3c9a7f325cf9f2e31"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.01011-of-01024.json.gz": {"num_bytes": 320037079, "checksum": "65e18df845f1e6cce1bb92a45f71274dca94d3f0ece1d556116085b5c0e6338f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.01012-of-01024.json.gz": {"num_bytes": 319753418, "checksum": "cd5a8ee1bc7d9ad58e98aa6fe56d60501115592519a19efcf9fa370668c6327b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.01013-of-01024.json.gz": {"num_bytes": 318657671, "checksum": "986ead2c1b37f4094aa6f7a7882824ff013e6393323d5290d7f3e9215589d07b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.01014-of-01024.json.gz": {"num_bytes": 318028602, "checksum": "3c82c0611fb1fb0f635eaedd2bbe7cfc9d53d1ae967a9cbd0416def046e4b104"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.01015-of-01024.json.gz": {"num_bytes": 319164504, "checksum": "5eb5cf76022b12d8751a2fce5c4d4831066785a68edd7b3cd3dfc10017f91621"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.01016-of-01024.json.gz": {"num_bytes": 318474894, "checksum": "a99d827be814e27d948264d6ae55c6a032a664f3ff0ef6ae94bda90f7faf29bc"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.01017-of-01024.json.gz": {"num_bytes": 319516762, "checksum": "7eac25ebb9383a4592023634b852d88a128604c494972a8fd9e2b183fbb303a2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.01018-of-01024.json.gz": {"num_bytes": 319433935, "checksum": "35adb751748043a36f22b412d3ea0e01166037cd96216f516abc547e9d2609ea"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.01019-of-01024.json.gz": {"num_bytes": 320305440, "checksum": "54c4d52564221e48dc5354cb51d447658707ab8edaa3d6d8fec5ec379a29d462"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.01020-of-01024.json.gz": {"num_bytes": 317445661, "checksum": "edf1c6ab9900d75b91738fc7e9e3db8cdde3f9ef2234ff249833b5cdb04c65a2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.01021-of-01024.json.gz": {"num_bytes": 318134525, "checksum": "1c5e670ec9d815637e9bdbd75289c7ef7f3ecf384e32f403ae8a9fe2595cc983"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.01022-of-01024.json.gz": {"num_bytes": 319809162, "checksum": "9def881764ca614c88ceabb41032d3e145f06c843a7ceebd87dba6b93c974a6e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-train.01023-of-01024.json.gz": {"num_bytes": 318155801, "checksum": "552a6a2be423c0ecbb767611074200c5b85c1cf76c8640c79e3be5e967b293b5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-validation.00000-of-00008.json.gz": {"num_bytes": 40471190, "checksum": "1f25b6af12da84115301d4ee93ea5246c8fea5bb4a2008472794d95b917cc97f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-validation.00001-of-00008.json.gz": {"num_bytes": 40675053, "checksum": "db4c23d7a336032de37dfe2f3ed39653c8afd94004d4e8d9c73c03222299292c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-validation.00002-of-00008.json.gz": {"num_bytes": 41175078, "checksum": "4bf6b248b0f910dcde2cdf2118d6369d8208c8f9515ec29ab73e531f380b18e2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-validation.00003-of-00008.json.gz": {"num_bytes": 40728516, "checksum": "082b72c1ec600502df2e4403df6884390c85627ffdf37a5b700397c9a1ac6b8e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-validation.00004-of-00008.json.gz": {"num_bytes": 40920200, "checksum": "37c2ce46864db0b6f1fe89220ebf4ef811ea10485c8336f1712227bbbdb530e1"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-validation.00005-of-00008.json.gz": {"num_bytes": 40921460, "checksum": "00b164e59df49df5dc1df170db99bb0d9207a6329cb9272ed8b6ef7a55058359"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-validation.00006-of-00008.json.gz": {"num_bytes": 40549809, "checksum": "86896a9baffe0ab9df39a2901f0e515009989ca1fec9a42583d718ce16166b5a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en/c4-validation.00007-of-00008.json.gz": {"num_bytes": 40446172, "checksum": "0bf87534c7050091c60466df50f174c3147d052ec7dc645da9574c902445beaf"}}, "download_size": 327104523018, "post_processing_size": null, "dataset_size": 1658004128680, "size_in_bytes": 1985108651698}, "en.noblocklist": {"description": "A colossal, cleaned version of Common Crawl's web crawl corpus.\n\nBased on Common Crawl dataset: \"https://commoncrawl.org\".\n\nThis is the processed version of Google's C4 dataset by AllenAI.\n\n", "citation": "\n@article{2019t5,\n author = {Colin Raffel and Noam Shazeer and Adam Roberts and Katherine Lee and Sharan Narang and Michael Matena and Yanqi Zhou and Wei Li and Peter J. Liu},\n title = {Exploring the Limits of Transfer Learning with a Unified Text-to-Text Transformer},\n journal = {arXiv e-prints},\n year = {2019},\n archivePrefix = {arXiv},\n eprint = {1910.10683},\n}\n", "homepage": "https://github.com/allenai/allennlp/discussions/5056", "license": "", "features": {"text": {"dtype": "string", "id": null, "_type": "Value"}, "timestamp": {"dtype": "string", "id": null, "_type": "Value"}, "url": {"dtype": "string", "id": null, "_type": "Value"}}, "post_processed": null, "supervised_keys": null, "task_templates": null, "builder_name": "c4", "config_name": "en.noblocklist", "version": {"version_str": "0.0.0", "description": null, "major": 0, "minor": 0, "patch": 0}, "splits": {"train": {"name": "train", "num_bytes": 1029628201361, "num_examples": 393391519, "dataset_name": "c4"}, "validation": {"name": "validation", "num_bytes": 1025606012, "num_examples": 393226, "dataset_name": "c4"}}, "download_checksums": {"https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00000-of-01024.json.gz": {"num_bytes": 396728190, "checksum": "06fcf4d9bf6ae45fac94245952f000c924d2a0b5cc8841c916b3ee949333410d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00001-of-01024.json.gz": {"num_bytes": 395686133, "checksum": "8a0b64c5efb1db1ebcc0a664c801221049f5812652dc1a727a0e9f8d0df0cd0e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00002-of-01024.json.gz": {"num_bytes": 397762165, "checksum": "087fabf9563297a6eab8bc39b68c0c6d15169032001d3a17c9bd964080759f2c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00003-of-01024.json.gz": {"num_bytes": 395307518, "checksum": "1e5b89200528320e354f60be0868a3ab6dbbe667a6b16b48e4739b988a6360e8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00004-of-01024.json.gz": {"num_bytes": 396280504, "checksum": "8291badbe84854960c0ddac3d6c226cb519268d1b3fd267bd72cfb4f10800de1"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00005-of-01024.json.gz": {"num_bytes": 396636600, "checksum": "c74226ceada7d78e3e7a2ad931d0a99df93f4cc4377ec69d4f1fab4164c3d845"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00006-of-01024.json.gz": {"num_bytes": 395364336, "checksum": "4e52e99dfc4e55c41226978b4dbf48fac2f886b9b0446bc3bd576f32bdd7cfea"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00007-of-01024.json.gz": {"num_bytes": 396428805, "checksum": "283ae93ecc3f8daefa9c47651ded763dc5f339ddc619c8cb5e32dce9cb9cfe4c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00008-of-01024.json.gz": {"num_bytes": 395030041, "checksum": "d3fc7fffdf9c2172d233bea3bb7dc485d753319e6196672d0186b8ba04a1d903"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00009-of-01024.json.gz": {"num_bytes": 398255693, "checksum": "61e10cef5c2cab162fb1d26f97fd9d76b30c9ee989c01ef8597d2a4e35b303da"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00010-of-01024.json.gz": {"num_bytes": 397825333, "checksum": "f72040887c2a2c17564c2c6a9a4b5ff95fce6a0eed4f0800cdeff8277af651ff"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00011-of-01024.json.gz": {"num_bytes": 397877458, "checksum": "ee34ff11164e10a86f76593205cb13986c70ea3d3a8849174a6dfb5b4ec91262"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00012-of-01024.json.gz": {"num_bytes": 398317059, "checksum": "7a3ef558efaca3e5d19e9ad02b47dd61f9639dd806130b62d66e9c3341c0edce"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00013-of-01024.json.gz": {"num_bytes": 398518794, "checksum": "f5a6c18992ab2b59a9c02469d20768bf5757624e03bcaf92957ce736a3a9edb5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00014-of-01024.json.gz": {"num_bytes": 397026214, "checksum": "c174b625c1534c69814f8e4879169b58af96f801dbb433113740af0d78535abd"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00015-of-01024.json.gz": {"num_bytes": 395621683, "checksum": "4e8e52a602d4eb4b27104780f4a36617505505fb66a82f36e90631a4e668f5b9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00016-of-01024.json.gz": {"num_bytes": 398138551, "checksum": "a3e7a95b16f09e09e45f1c3bed3524415581e21b065d8efcc66cece705dee4d2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00017-of-01024.json.gz": {"num_bytes": 398720813, "checksum": "79cdb89052e8dcecd1f1319e47f4c4ae1d350ab81777a9ba8077cebdb558e795"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00018-of-01024.json.gz": {"num_bytes": 398538940, "checksum": "8da6aac3a794ce326b5a3971fb75a2ee848f008940d4f1bedd724ce7c5874278"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00019-of-01024.json.gz": {"num_bytes": 396834319, "checksum": "b57c93502949dad9001e89847947f6c65943927eb519e16de4eaf5590b235faa"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00020-of-01024.json.gz": {"num_bytes": 396402861, "checksum": "05e14c7e21df3d4af7be7a597fa22463868464d6475282376536e12e82367401"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00021-of-01024.json.gz": {"num_bytes": 397560852, "checksum": "756d15d8b07414dffd7cff3efde606aa62cf8f73b85d8e1cd17408d6a339414b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00022-of-01024.json.gz": {"num_bytes": 397210987, "checksum": "60aa08d9c5d813d5f2448d910bc23a705cdd0828a9403c18ec223e53623889cb"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00023-of-01024.json.gz": {"num_bytes": 397563062, "checksum": "bd865213ffb2b40c2cd3eb16724b68c0f37e29f68215990dc84d91852c7c0d72"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00024-of-01024.json.gz": {"num_bytes": 395799120, "checksum": "08ff3615ecea3eb5b55703e123475c95afbecfe7107eedf05750147c9ffd12ef"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00025-of-01024.json.gz": {"num_bytes": 398336372, "checksum": "e3e30b97e585fd881b3a1b006775854a11a2b967d992e7eea886338d8beefb13"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00026-of-01024.json.gz": {"num_bytes": 396819084, "checksum": "fddc9e1a8405c5e05e63ce98b19c7833c0fd46392b4b55532b317e7f81426590"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00027-of-01024.json.gz": {"num_bytes": 397912380, "checksum": "d3e597b3a96b993840e47adb761cce2f2ae1c96aefcbd6c250198dedaecde15a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00028-of-01024.json.gz": {"num_bytes": 399078461, "checksum": "abd6d2341b6c61cdb89b80a8b9bfd938bb6d8a423a89e6a9f997c22c6479d537"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00029-of-01024.json.gz": {"num_bytes": 397303107, "checksum": "ee35a3af1056cdab79b644f6352150aeb6fb19a630cd6bc893a072e35fbfbad2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00030-of-01024.json.gz": {"num_bytes": 396602401, "checksum": "1d04d4bc295aee2ab80b24f587f8c483599db7d5a8157acc99a1d8b001f8353e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00031-of-01024.json.gz": {"num_bytes": 395941329, "checksum": "cf1dd244555511245c0e6a5b1dc9c24f747b8377674aa3690677ce08ebb8c26f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00032-of-01024.json.gz": {"num_bytes": 398049663, "checksum": "c83e5572647eba5ab14fdc4dcba8efb6981740b99b8f634e2c6b1942a051c249"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00033-of-01024.json.gz": {"num_bytes": 398044404, "checksum": "b76815aadcf4ad802071428864ce0b406cabd73dfc2be5e20b44885ec6a85419"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00034-of-01024.json.gz": {"num_bytes": 396885224, "checksum": "da00d92418fbdb9799d8f16977b3a33f67cb98a31808544cb68cf3b42ea9adf1"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00035-of-01024.json.gz": {"num_bytes": 396185021, "checksum": "265ad43ce00666c83fd441d35ff29ba1ebf7d62442cc3e3c176091b4c725ea9d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00036-of-01024.json.gz": {"num_bytes": 396702503, "checksum": "4733156df48f2dd0f2e859fef28f56d12a84e8012085ca9318073ae647b0fcdc"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00037-of-01024.json.gz": {"num_bytes": 397582277, "checksum": "7d62d03c3496ee2e17ab6b9635710efef9e4cefb88ddccdc16ed720a414c38c2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00038-of-01024.json.gz": {"num_bytes": 396186761, "checksum": "670affddf8fcca6933af3f5b30efd1bf490c3e38c3e90f2e8e9a464994d613f1"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00039-of-01024.json.gz": {"num_bytes": 397056953, "checksum": "4acbd97f9c8fd9a930a6f4284a11cfe37f6cca3b5858ae3c2cde747dae35e0d2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00040-of-01024.json.gz": {"num_bytes": 397809786, "checksum": "d350e48a36bb1ba3125f72a07ed8024d26eae6d89ecac686ac0bdf3d5d89e1a7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00041-of-01024.json.gz": {"num_bytes": 396944358, "checksum": "817a58dc40440b8b1f54d129db08ae9124e0293e5a0e45f034fbffb2140d90c0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00042-of-01024.json.gz": {"num_bytes": 394327995, "checksum": "6bd6bc1269c2dd81db466ae9c41f76b8b8cf71cc7bd6e131452fa1a1318ff459"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00043-of-01024.json.gz": {"num_bytes": 396476043, "checksum": "f3525d9c861d984ea0cdacba7fddffaef058d8f95aa99ef1f09f9f0792fde5e3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00044-of-01024.json.gz": {"num_bytes": 396893614, "checksum": "292ca2b6b9ba41567fe7cc60e5424aa1f3e431ac874d06ae8eb98794563a7d35"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00045-of-01024.json.gz": {"num_bytes": 395885483, "checksum": "ea2c8fac41ededba7da8bf2bb48463d83f148e5c0970a689876d4932ab18a3c7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00046-of-01024.json.gz": {"num_bytes": 396963386, "checksum": "97672d9bca357cd2721f51301aa37d37a271dd3ca7487244c057570b995da66d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00047-of-01024.json.gz": {"num_bytes": 395856712, "checksum": "52c517670ba4eefb262cb71373d6370f86ddeb0aea7391a47a22d52a55bff7a8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00048-of-01024.json.gz": {"num_bytes": 396091027, "checksum": "49f5b68e29c55eb50da941eab1cf446c7d8c9d0b30290318977edb39ef0b887f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00049-of-01024.json.gz": {"num_bytes": 396892998, "checksum": "82a51eb6f301c00d927ca7920338247038cf4e9e0072d74c02bac897701f5859"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00050-of-01024.json.gz": {"num_bytes": 396308050, "checksum": "d72f92ecd27b716cd90cc4abe562d25fe6d49740b4a3d1fb9beac2526a61988e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00051-of-01024.json.gz": {"num_bytes": 396137777, "checksum": "a956e4d086077f7ab309ff10b0eaf4833e4d3ed74435293e96588f4361e1536d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00052-of-01024.json.gz": {"num_bytes": 398302544, "checksum": "5a54f7faa07661ea6a5f0585ca49ad66c8f7025fd9627b3af832dc886d50f78e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00053-of-01024.json.gz": {"num_bytes": 399616791, "checksum": "7f8fa496d50a0b7c399faff4c1864e24717b3f9c86b2552536c8f91e3e0cf9d6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00054-of-01024.json.gz": {"num_bytes": 397332881, "checksum": "ab862f26b4fa38b6c16d8cfd0d63a9f0973827e45915e85aefb95d4e182b7b9c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00055-of-01024.json.gz": {"num_bytes": 397075146, "checksum": "cb67aa9229bec8b88e496829aa0a60ca1c3ff4a2293632cf7782b69aa71aebfd"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00056-of-01024.json.gz": {"num_bytes": 397827600, "checksum": "2f63e3ec40d32237d4a50c873b966d7fc2c16ef5c04a2bcfc33328b128654e7c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00057-of-01024.json.gz": {"num_bytes": 397533583, "checksum": "7c90bf39bddf8ad0c6a8bb3dff02caea8bbc2abbd76047c5d523930d2a00dbc9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00058-of-01024.json.gz": {"num_bytes": 396411363, "checksum": "ee6059f3c8a2df34858a0110a06ec4e9673555fa56c1a2b40930337ba5b1b39c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00059-of-01024.json.gz": {"num_bytes": 396735510, "checksum": "d9dbe2421edba1820294e757d88aa25455db42ce8992f8933b51cd84cfc35a36"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00060-of-01024.json.gz": {"num_bytes": 395694553, "checksum": "b05d6502fc95587fa7047fac64978d6be13761dcc6954629332812e5937c2731"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00061-of-01024.json.gz": {"num_bytes": 397740757, "checksum": "39303faa5dc33995dfec683b44fc24066ecccdf6b5001b9c0644d8e9899d45f5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00062-of-01024.json.gz": {"num_bytes": 397358263, "checksum": "fe27dd467cc2c34abe5b0bb34473ee68859f2198eeb78304e1d2e54460a67383"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00063-of-01024.json.gz": {"num_bytes": 396826654, "checksum": "1da2c414bd03e5547d8c9c7447e42b8dcff5f6ca8ba35c53076f2895e8ea63f6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00064-of-01024.json.gz": {"num_bytes": 395781869, "checksum": "af96de4d6b5bc1ab0527efa33a73d7eb788dca15829acbb7291ce72ad05e6c66"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00065-of-01024.json.gz": {"num_bytes": 398192274, "checksum": "7f46ccfc1703fee106e932bc9a1bc5dedf7de944172cfa34ec9b31413bf0bbda"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00066-of-01024.json.gz": {"num_bytes": 397133438, "checksum": "dd3b67d8578927d7474dae76bdca35f35a2aa125fc50873e4a9f6e73d7a81831"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00067-of-01024.json.gz": {"num_bytes": 397204214, "checksum": "4cdc87a7c9fea33e15d638e5c921f45149212769bfba5f59f0a5943398ca0d55"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00068-of-01024.json.gz": {"num_bytes": 396489592, "checksum": "64d175c23574998f8c5d28ce3d3f3934144b1fd4f6527ede1aa3420c28bb90d0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00069-of-01024.json.gz": {"num_bytes": 397697351, "checksum": "3329857f531c9fa22d98bd567638f0564f73062da1478ca84385246f71baabff"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00070-of-01024.json.gz": {"num_bytes": 398449973, "checksum": "bd13494aa03a95d943a01f3436f62c46ee3390b30f6ff0fec0636f3c0b09fa1b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00071-of-01024.json.gz": {"num_bytes": 395498960, "checksum": "5e69529ae82c305acbf1f58a7021b4e3fc67285a871dcbcaaff0781d0e721070"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00072-of-01024.json.gz": {"num_bytes": 396170387, "checksum": "9b9c7e11b9bb2cf6ea0fcdfd58754f522a95070feae74c29559522e12e1b41f4"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00073-of-01024.json.gz": {"num_bytes": 395915819, "checksum": "87a2069589fee8de23730b8b994ba59d63d5128175b5326ba0a8c8ac9e01a3dd"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00074-of-01024.json.gz": {"num_bytes": 396986018, "checksum": "e073efb3f00db65c1ee14e8bfa6e8c807f7827d0f3dd4d4026f823bc6f61b1cc"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00075-of-01024.json.gz": {"num_bytes": 398555103, "checksum": "a1793748c7979e241ca34291c843ca3cc90dd7643f04810b6cd324220efbd6e7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00076-of-01024.json.gz": {"num_bytes": 396357420, "checksum": "7b1cd69788ca9a7e614de70a8b908183f41f316eaadf3b0236a7c4e126db9844"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00077-of-01024.json.gz": {"num_bytes": 396666167, "checksum": "aec828d3c2a1f7fa970de328a8fd1a85a90493dbcbec4f50816ccbc2275a1fac"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00078-of-01024.json.gz": {"num_bytes": 398167446, "checksum": "e14bdf5af810574aca7c6f3daa67e503f24ab1705435a62129c66c248667ee97"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00079-of-01024.json.gz": {"num_bytes": 399696096, "checksum": "b63756f81b8b19ecdc9bf227045df10840cbf973b60bd8ffdf28f58a53cdb028"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00080-of-01024.json.gz": {"num_bytes": 398755610, "checksum": "dfc118f680b79260e7ece75f27c0459484eb8458f2422df9f1918f726b54ccb6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00081-of-01024.json.gz": {"num_bytes": 396606787, "checksum": "17d6a503947f5132728f53ea62fd093f55bf2dc6a32316a5c0413353cf13eff3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00082-of-01024.json.gz": {"num_bytes": 395714484, "checksum": "8ca41818ee6a0ffd5b00714779289c18cd97d620258c5d3d741c482b72344300"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00083-of-01024.json.gz": {"num_bytes": 396807173, "checksum": "12d87c0a948f32f788497858751c3ef22f289136e6ae58518a97a2e976f5cdc8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00084-of-01024.json.gz": {"num_bytes": 397241529, "checksum": "7c3da4ca4d2b2077f0ab7be511038255732fc88d954f2f17cb0f3ab144216206"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00085-of-01024.json.gz": {"num_bytes": 398357369, "checksum": "26df55183e78f8d69fb16e21d07edf98659b69bcb3c48f340da6a5bc44007f4d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00086-of-01024.json.gz": {"num_bytes": 396997317, "checksum": "09f0641e9075cb88800d0eaae3f7b99b047552edbc71d1fd2d8594f645d22c2a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00087-of-01024.json.gz": {"num_bytes": 397978000, "checksum": "c9437ef5f58a46b8a6d8efcae37fa658da3f2c4f1cad0f9cf47fbcd09bb82f8c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00088-of-01024.json.gz": {"num_bytes": 398468913, "checksum": "be187fc14017f666b84ed7049c169c1a28654441c2f523eee8b655b3b9d9ba8e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00089-of-01024.json.gz": {"num_bytes": 397071121, "checksum": "637c3f964ee2c750a0a175f2e5d24b786a37d37701f10616b448804d68b72f4e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00090-of-01024.json.gz": {"num_bytes": 395753807, "checksum": "8eef7ff1a8080aebe5226cc3539baac46ab64d93f8e3ffb6e8b7ab3346e151dc"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00091-of-01024.json.gz": {"num_bytes": 397039764, "checksum": "a2904ae5bf69b393a697afd62ae9b8a560c1f076e8a141e6f3feef29cb5d1352"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00092-of-01024.json.gz": {"num_bytes": 397058578, "checksum": "eb4d7e2712a9983bc1581133fa8eaa2e1d28b314861833bd8d810d615ec1ed81"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00093-of-01024.json.gz": {"num_bytes": 395855981, "checksum": "5c9a7573a5644d89d46666306d333ff1e4af3213f287cb9adb48ef87a023d479"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00094-of-01024.json.gz": {"num_bytes": 399516118, "checksum": "de7ae1508815e48ba031762c084cf6946b084871463821407090d23c197c6474"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00095-of-01024.json.gz": {"num_bytes": 398236235, "checksum": "616cef1f21ef078ffb9fc2b4148735668debdd15a8bc1be281183ba3659e9fcd"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00096-of-01024.json.gz": {"num_bytes": 399526010, "checksum": "eb754381b8a6f3c74dda5ee5852958f7b69c707a3908cbaa9410c972e002a0cb"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00097-of-01024.json.gz": {"num_bytes": 397935028, "checksum": "6d6d2ca80708b7c6ad4240a042dddc2170060e8976c2e7b4ace446d2f2395076"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00098-of-01024.json.gz": {"num_bytes": 398645934, "checksum": "568db6971230fb42df8973ecb5a2a6d77204aa8cf0bdf47b386c04370da8dfd1"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00099-of-01024.json.gz": {"num_bytes": 398110916, "checksum": "9bacb381e3b06976619e816e40ac2ccd3bcf3cb9ecd30c294b388cfb75c8bf77"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00100-of-01024.json.gz": {"num_bytes": 397631228, "checksum": "7d515ac0f767736600a216ebe7280b9751f16e70df969ba601d1aaae15f201e5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00101-of-01024.json.gz": {"num_bytes": 395102356, "checksum": "87c5c81e154e136f3e090ba91682ad54fe678653f86f6f32002ae5ec3c9aa743"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00102-of-01024.json.gz": {"num_bytes": 398926159, "checksum": "2df85a9ac13812c3870180901dbba99b52e53fc045da019160a3f06d0dfa5e95"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00103-of-01024.json.gz": {"num_bytes": 398383820, "checksum": "8134d12e84ed4a58a5f8f6eff8a4349f7d6ded6a1d7539b5c23193571569d6c7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00104-of-01024.json.gz": {"num_bytes": 396628542, "checksum": "208f0cb3365b0243d70e7b4e52ff977e9b11d8e451adea521a5bf6e10cd40ee0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00105-of-01024.json.gz": {"num_bytes": 398737797, "checksum": "855ac7b8cb621a240319ef00197d2f20338d17db71a1aec68fb66930bc17c59c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00106-of-01024.json.gz": {"num_bytes": 397281064, "checksum": "544d5d91d066f2450bfe622ce55bdfe16a300aee9c05aaffae8a645966bc695e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00107-of-01024.json.gz": {"num_bytes": 397919761, "checksum": "f4af405c0f19c9139d93b3073f3fe328be998c9dc6f74afc7e21ad068964b92c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00108-of-01024.json.gz": {"num_bytes": 398810219, "checksum": "bdfce29353c6caa33b178bdebbf7e48526c391bc6c71180e3fa378b723879563"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00109-of-01024.json.gz": {"num_bytes": 396605124, "checksum": "ed6acc172bc9af0e31170f5533001a8fcd344e6732a4b3a714b7ad43740f25f4"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00110-of-01024.json.gz": {"num_bytes": 397491755, "checksum": "428b6c91f12c4f7032fa692bbe887f1a4c02635eb88b91d876da4c71f3da5e4e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00111-of-01024.json.gz": {"num_bytes": 395754897, "checksum": "a723863559edf291fd8a6c2736cc1cefed70dd3c8625b967df049ce0d373f68a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00112-of-01024.json.gz": {"num_bytes": 398567649, "checksum": "a90ddc9ccfbca20b9c75bd2b7d63ee6abd03236a0f0dd2827eb9f7350d9c3931"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00113-of-01024.json.gz": {"num_bytes": 396706569, "checksum": "479052b6b9edcc2bbda40b982976e7e28d84fad7b2dce46b017f4e3d1f61e0d2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00114-of-01024.json.gz": {"num_bytes": 397384355, "checksum": "a95984e4c261a3057d1bc51939aefd9413853111e19030b19c5d26f778be00ba"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00115-of-01024.json.gz": {"num_bytes": 397702826, "checksum": "5eaf7fc2c9d4b2ee3e216c215da7f4fc7558e89d6993033b95a940a78061ab05"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00116-of-01024.json.gz": {"num_bytes": 397252590, "checksum": "268033cbbdf3be9790cb6010791693f1b490af06f9fef91b0b307420a4e30a08"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00117-of-01024.json.gz": {"num_bytes": 395506730, "checksum": "cb80908eee1054ddaf7e2e5d66c9a41505025c2b6dc7fe6aa287db0a9f3829ff"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00118-of-01024.json.gz": {"num_bytes": 396452136, "checksum": "d75bf895c88ff2e9c4031c1f65b067222cfbb1a937d685ab4dd33369f5f5ff7b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00119-of-01024.json.gz": {"num_bytes": 396777389, "checksum": "2c00362f4d99cef2bae2f13f17b79ec56a5ef8aca18ffd56a12fea2308e5017b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00120-of-01024.json.gz": {"num_bytes": 397730478, "checksum": "e31296949f7ce2e2a74fd2443552cb64b9f3cddcca691097a56992f51033fd11"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00121-of-01024.json.gz": {"num_bytes": 396593647, "checksum": "c2f0f81e3c835848a47532d8fd1c215a624f47740196a7bb45b5099916853014"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00122-of-01024.json.gz": {"num_bytes": 396576172, "checksum": "72edb7581a623e20f26cae4885f3b9d7f329581921253ca4d7ceedfbca17b7b9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00123-of-01024.json.gz": {"num_bytes": 397378329, "checksum": "4f045ce7bd077b7f878012aead8c51073022448de66d2e35a755d4c8c4a6f59d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00124-of-01024.json.gz": {"num_bytes": 396545003, "checksum": "dc7949657328520d31a27d8e267c2ab07cd4e8639036d4b1bb59454c309f862d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00125-of-01024.json.gz": {"num_bytes": 397630505, "checksum": "530bd95e5ef9a1d5989c595e60e0ab11583e0f42d16b2bd37c49ed09a67af207"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00126-of-01024.json.gz": {"num_bytes": 395483747, "checksum": "d9df071edec6959ba842509f72ad43be3ea3f529b60d48f3dfbf390908887a5f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00127-of-01024.json.gz": {"num_bytes": 397295159, "checksum": "02b61f5bc7d1d241484c4f04fd517960ae755a69f35192bdd5bb471baeba5614"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00128-of-01024.json.gz": {"num_bytes": 396276865, "checksum": "0c7d618df232c36ba018269ddf3b2863cd6d63bb7fabeaae33fd508715bd8ce2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00129-of-01024.json.gz": {"num_bytes": 395314703, "checksum": "03443afda032187d2dc2e696ce6eaecbf2219e6dabbdd593379e97c0e00e3112"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00130-of-01024.json.gz": {"num_bytes": 397411481, "checksum": "8969873d5efd3df0cef1742e4bc67f2df7a5b5d9e641f7a12e77c7e8e96a1bf1"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00131-of-01024.json.gz": {"num_bytes": 396925311, "checksum": "31adc39ea4eda8667662608bdad6bb32bbc82b1ee1ad53ceb4df50924a933bdf"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00132-of-01024.json.gz": {"num_bytes": 395826124, "checksum": "d2f035ba2c388fec2d847bd43449c885eadd0bcab5fb8afdf031a53e72c4ec32"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00133-of-01024.json.gz": {"num_bytes": 398892794, "checksum": "b7ed60983058a5f9f0ef72602789f50359f415ecbe60dc967e7a869866d833b6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00134-of-01024.json.gz": {"num_bytes": 398206890, "checksum": "9ba78624879aabb72bae0b4119fa2625793915382031ed897a0b4c3f2863b8aa"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00135-of-01024.json.gz": {"num_bytes": 397161888, "checksum": "9fa6fee55f5e8f887dcc64d94cc65ada6f283a580edc7926cb159b80d0084ea8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00136-of-01024.json.gz": {"num_bytes": 396185585, "checksum": "81a1fcafcedfdd9bcb32d2467d9c963cc7d8b2f32e13e52ee04db41b0d3f5483"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00137-of-01024.json.gz": {"num_bytes": 396933735, "checksum": "c7558304b614e1cff13b0f6e967fc5ef77e4953a1eea1f39ed925c33076d7723"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00138-of-01024.json.gz": {"num_bytes": 396371698, "checksum": "3e896da8bf296403f7b4061ba0b24d3c3978993de4854fabd688cfce9fbf7bba"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00139-of-01024.json.gz": {"num_bytes": 397289537, "checksum": "1a5ffa3aaf565ccf4db7444983643ad06e386938a0a2d313aecdb972c36111e4"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00140-of-01024.json.gz": {"num_bytes": 396983259, "checksum": "4047916916fd9dd7b76a8cbc595d52803344467135f744b23bd10296004a47d7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00141-of-01024.json.gz": {"num_bytes": 394947050, "checksum": "7edfc9e5870d80d470e3797e8bef5183e9d170eab410ab50957e946dde2e8199"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00142-of-01024.json.gz": {"num_bytes": 396852755, "checksum": "4affc3a24616858fab84211e3825e90a1ea7d9c8f2cfabbe9a5c9b24c21a116b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00143-of-01024.json.gz": {"num_bytes": 397579248, "checksum": "d5aa9ba68e9b30576bd640f647d4069b6c56db276cc5229573440e4a38a7f1e9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00144-of-01024.json.gz": {"num_bytes": 398800367, "checksum": "fa104e63eb7a8a6b066a5f00bf05b3ea095bad35a902bc728251f096173f1417"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00145-of-01024.json.gz": {"num_bytes": 396709510, "checksum": "b615ecd58821b1697c82094cb3435375924263827c342ab1b87e53907d4aa63b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00146-of-01024.json.gz": {"num_bytes": 396042389, "checksum": "6004c782f3235490865b6634b2c4840a989745b70ef2da674e75c62aeedf8a6f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00147-of-01024.json.gz": {"num_bytes": 399840661, "checksum": "5e8b46726f7ff2c3dfd381fb252f1b4bddf9436fd9ffd10fa300cb0fbe76998c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00148-of-01024.json.gz": {"num_bytes": 397098215, "checksum": "0851cb274aff2ec4f781c82af11c94f8938a797aca5097fb0089299cb4c75aff"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00149-of-01024.json.gz": {"num_bytes": 397540697, "checksum": "7cadf4ef9b0e29d9e8f68474464dc072b78e909a0f03c74e61b67912ff9b551d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00150-of-01024.json.gz": {"num_bytes": 396347701, "checksum": "521e4f67d12ae47b8f2a02b6f77e0c85cdf9a0efbcb45602d09ae116110ebe66"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00151-of-01024.json.gz": {"num_bytes": 394890490, "checksum": "2255bf3e1940ea28da9656028dee26865a9ee682cbaab4d5aeb34c081062f8fe"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00152-of-01024.json.gz": {"num_bytes": 399584675, "checksum": "f8ca4aaf5706ffb0f5518c7461d9045d18c645df068aa436137299e5ca77df82"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00153-of-01024.json.gz": {"num_bytes": 395606567, "checksum": "24f0e81dc3140f063ac89173fc262b01f2420133025b114f29632262cdd2e7fa"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00154-of-01024.json.gz": {"num_bytes": 397925578, "checksum": "5f40a87b15b0acebbd324e7c5cd2c0f31f911558d57f774f278634db94f2d5f7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00155-of-01024.json.gz": {"num_bytes": 395428741, "checksum": "36281c154f187a09a83822878da815cd9b7f659a41cd90ac64653b437e798c72"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00156-of-01024.json.gz": {"num_bytes": 396799274, "checksum": "0fb66965107e54c9fed0013962763e874b940b0e174d775b21fa5e688fa53b33"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00157-of-01024.json.gz": {"num_bytes": 397321211, "checksum": "014d1443a4940fe95089bf87e245817d3a90c50e3e371a703098f5b9c3f6c759"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00158-of-01024.json.gz": {"num_bytes": 398736992, "checksum": "f912d27d68318fc0089fbaf8e0481ebe8dc5d2963cb89ed315f3bec637460bfc"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00159-of-01024.json.gz": {"num_bytes": 397250687, "checksum": "1bfd02a301b09bfd53058522d0613e1fbecb788d3173eb30b58115cd1cbdb477"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00160-of-01024.json.gz": {"num_bytes": 397492158, "checksum": "149a7bd76e9ea41185d99d21df870ddd4f32857fdd628cee927d6bee7d6a527d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00161-of-01024.json.gz": {"num_bytes": 398383574, "checksum": "0c385b4c9b33574cdc75070309a0aed46aa7b2e3b8754a7692035a3c5a04f916"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00162-of-01024.json.gz": {"num_bytes": 397126197, "checksum": "5c012b2a6bbc9413914ed1420b6150a5549cd74185bf2788d8809005034d433f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00163-of-01024.json.gz": {"num_bytes": 398201223, "checksum": "79448c338e86cea2609399705268fc6011cb21c4f0aff82e3fb7660391ce85c4"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00164-of-01024.json.gz": {"num_bytes": 397914908, "checksum": "dfb89631dce146ab4713a03f184e864472eb133b2cd04db8b4bccab688e9e287"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00165-of-01024.json.gz": {"num_bytes": 398142696, "checksum": "74acc88d6612aae7bdf5187d3b9eddcdb04cf60f1cc350661ffa50219a747f9f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00166-of-01024.json.gz": {"num_bytes": 397533050, "checksum": "757d23402b3a155cfcb6b30bdc305c8014c9b64ba4e067753664670c2c5e9534"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00167-of-01024.json.gz": {"num_bytes": 396241119, "checksum": "521bd7a9dcfa0390c35e50a3d0cde3ea627ca538dfc419a97ed83b251d8a3005"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00168-of-01024.json.gz": {"num_bytes": 396041761, "checksum": "dc540ec27d5999f6a4c71f075ae1ec64ea84415c720cd2b6ef3fdac925e576da"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00169-of-01024.json.gz": {"num_bytes": 396350882, "checksum": "36d5d35075a82038dfdd5abd29a839f4e9ab79d51f0bbc635d3dcf3f5f1e2732"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00170-of-01024.json.gz": {"num_bytes": 396885157, "checksum": "db9a3f6a7e085007eee381357ea9e4d5d6f702580d38220860967ec441ba3525"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00171-of-01024.json.gz": {"num_bytes": 397266368, "checksum": "7f8098cb6532bc888d3c1f0ea5072cf8419ce1689b9ffe1c370ca20071e7e1c2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00172-of-01024.json.gz": {"num_bytes": 397140430, "checksum": "90ae7e2551b1f3bf2e5ccf4fb3fac8fa3512add5e299ba7c90319611baf8c840"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00173-of-01024.json.gz": {"num_bytes": 397069631, "checksum": "a86f5ab72e1a9b1d491988154fd6400e6ee8c74378a9e64276df438a3c4edf9f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00174-of-01024.json.gz": {"num_bytes": 396743897, "checksum": "451cfe8e14c17113a2f6673ece27e01f8d54bed1b57d1b20cb84f125879939ec"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00175-of-01024.json.gz": {"num_bytes": 395780705, "checksum": "3252e9781545bc3f9f19ac6e8fdb87d81cdc5a94838798daf6037c9f4f473db4"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00176-of-01024.json.gz": {"num_bytes": 396205053, "checksum": "49d1648d37150b90632a6459828eedd82deb2fce7f108bf4e1b050f2f9ad1668"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00177-of-01024.json.gz": {"num_bytes": 396248718, "checksum": "99346ccda762ae85038a10baba937ef8ef668a0beab483c4005dce77e331768b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00178-of-01024.json.gz": {"num_bytes": 396634813, "checksum": "8d3bb1610ce79cf359d75f32e7624b6203140ed3eb276362b040615e9ffd4b54"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00179-of-01024.json.gz": {"num_bytes": 396524113, "checksum": "971e5c9499425294cf5945436b2ee419379a75bdd72d4cd6a33b1d17c17de298"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00180-of-01024.json.gz": {"num_bytes": 397938782, "checksum": "dd6b3e60219788b82ab3fc63a9e65f38f64aa2f7b294135ec2d16b36350f1f40"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00181-of-01024.json.gz": {"num_bytes": 399155769, "checksum": "c6a806d627a9d197789bfc6257a92b0223ca51e724c3c2ad10fe2397dbe30848"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00182-of-01024.json.gz": {"num_bytes": 396136228, "checksum": "2c48e3237253eaad9afc121e6946a9e1856bbe82c5a7cb287b05cff3e6ea8e8d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00183-of-01024.json.gz": {"num_bytes": 397083292, "checksum": "52645e03ab47da01bb40226eb90042be914f1170688ae940314871e16cbb1037"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00184-of-01024.json.gz": {"num_bytes": 397402964, "checksum": "1edbdb41edeabc108f0147e18b439a75e390e0a843ed915f1cbf73a7c7f7867d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00185-of-01024.json.gz": {"num_bytes": 398411052, "checksum": "ef071e52174a19597e567696262470906275c2cd1cbbb0b1e98864999ea2d463"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00186-of-01024.json.gz": {"num_bytes": 397122443, "checksum": "0d87080bc08f7f8a1952a7df57ce2bdbf61e40c05b61937c8c19ae0ecd952b1b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00187-of-01024.json.gz": {"num_bytes": 397244868, "checksum": "4aed75ea9f885fc3dab599c19c7bb98f7d57ce2b2ec11ac8ab3258fa479fc0db"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00188-of-01024.json.gz": {"num_bytes": 395677432, "checksum": "342882e436ea826cda9fd38c0caca68bb35444a2a07596f8de0e53a3e2169f59"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00189-of-01024.json.gz": {"num_bytes": 393653750, "checksum": "22ed9e389f6c8410c9bde898d97ad798c236c2da4d0b2c76b86d013f8686da03"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00190-of-01024.json.gz": {"num_bytes": 395437920, "checksum": "b3f9ba5834d4f0280d6defd3bd50fdf961bee6be4c71ed47046cf4e115acab01"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00191-of-01024.json.gz": {"num_bytes": 396944861, "checksum": "4e7ed636a60edc44b5ba709dcd83bf4263ad8d5a06a02827d3d27191bf3731a3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00192-of-01024.json.gz": {"num_bytes": 396611165, "checksum": "4fea34466d9b470bf0bc44455183b2c61994c4e71e4bfb684dff3b5e3870d1e4"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00193-of-01024.json.gz": {"num_bytes": 398283211, "checksum": "4c4e6d31f455831330971ed1e0c33221203401b817adbda5b53de16f8299a9ba"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00194-of-01024.json.gz": {"num_bytes": 398915952, "checksum": "dfd0b1ceb2a437da8cd38c9c791af809e94f2e36ab4399b2a45a5b916f4ccaa9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00195-of-01024.json.gz": {"num_bytes": 396352694, "checksum": "0ccd90ced34b3ff28c21d015a87eca3f31eae2bf31f11f25ac073139f9d50c22"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00196-of-01024.json.gz": {"num_bytes": 398582922, "checksum": "f22e59765cec074a0c687c500f4e6348250d0e418d12dcba211e39c133aaf290"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00197-of-01024.json.gz": {"num_bytes": 398839554, "checksum": "95fa68cd75d77a1b5bb526dd5ef16a2f04a3520604f734baeb6e2d95608b5973"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00198-of-01024.json.gz": {"num_bytes": 396202192, "checksum": "f0e6343e8105178b38f75eade6774aa6e85b62a271622fcfcbe2745f1cae11ec"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00199-of-01024.json.gz": {"num_bytes": 398029364, "checksum": "4c58736410c8d3c7174ce011e2f281cb16e4949d756ff4ace86b4a9d4795c04e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00200-of-01024.json.gz": {"num_bytes": 395867629, "checksum": "1cb798ee6609e670053987d881d130d5b73db19d9f37fecff7a6da41152aba05"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00201-of-01024.json.gz": {"num_bytes": 396858169, "checksum": "7357eb22b2aa75c55885252c62d12e08cf8f7ef285c0052cf1d706c3f0f74fef"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00202-of-01024.json.gz": {"num_bytes": 397955766, "checksum": "8901d0f27c4c11916cda7cf806cd00000771b6351954c8503bc312cca5ad3a10"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00203-of-01024.json.gz": {"num_bytes": 397737882, "checksum": "ed51917fc8936701b681cfc49ef95b2dab451ca597e76b34ba90be9405a1a0b8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00204-of-01024.json.gz": {"num_bytes": 396094006, "checksum": "88692bb8da78347cb97c0e0849d1a10a97b1686cde1f75626236b89bd507e2b0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00205-of-01024.json.gz": {"num_bytes": 399027636, "checksum": "fb17fe19d1f0fcaa43fb31a3ad9b105b3d93fa287351c7f93fb599edb7f40bc3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00206-of-01024.json.gz": {"num_bytes": 399406254, "checksum": "668d2a9927080b686a4d728236e4cfc780b262f9045dfe9575cfc48cb69d6adb"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00207-of-01024.json.gz": {"num_bytes": 396291803, "checksum": "928f451dddfe42bb2ca791dbc61c36ddc618006ef709eaccbc2beb665c8427e4"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00208-of-01024.json.gz": {"num_bytes": 397807368, "checksum": "11e8627b758588056b61d31de07c50092222013a38ba802b7a9ae34b6b8b84a6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00209-of-01024.json.gz": {"num_bytes": 398085408, "checksum": "d49d31d1719698ab7a2b9ee91d887f3192c8fc1b6108152a75b39de2a0ad25a6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00210-of-01024.json.gz": {"num_bytes": 397670254, "checksum": "049b3294c3e22e6db6c115979a4a55f0650966c600ca17250e91b241cc97bbd4"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00211-of-01024.json.gz": {"num_bytes": 399643598, "checksum": "7772f26fd90f47033670e7f1d3f6fe092116486bb9a991577f9560b54ed3832c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00212-of-01024.json.gz": {"num_bytes": 397390768, "checksum": "7a24e4a70f43f6227fe6491fcc7bb6b2a19cae203521c803bedf8882c995d7e6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00213-of-01024.json.gz": {"num_bytes": 398657925, "checksum": "21d0ee8d1a01957b56ac503aa88c6f3269b4e4692762a3f929fe0e7069be8c0a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00214-of-01024.json.gz": {"num_bytes": 398282324, "checksum": "ede2d9824d8f99dd578a36ea82caae942ebcafd99f308cf5d0ff8aa4a56f0a05"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00215-of-01024.json.gz": {"num_bytes": 399178235, "checksum": "82516fa361dec02c7ed59ea2d0510d9ee4187609b449dca649a04141b12bc037"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00216-of-01024.json.gz": {"num_bytes": 397630870, "checksum": "4a6d5e60354b7b93f005010c6fc55c0a81596e98a116cdeec99e1ab4e58fd03e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00217-of-01024.json.gz": {"num_bytes": 398628848, "checksum": "02dffb623b628a3a3ea38084fe6bb840aafab8419feed3d1f2bd3598cfa80aab"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00218-of-01024.json.gz": {"num_bytes": 395087998, "checksum": "e1e9a7ac7a922d6a9bb90f82cb48dff11ab7208dac08511e9613cd2726ca67ec"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00219-of-01024.json.gz": {"num_bytes": 397622792, "checksum": "955afc7d45a080ae137e9dc25ba3d85629a6a14c3d9bbe4065aa37d710345b7a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00220-of-01024.json.gz": {"num_bytes": 395112655, "checksum": "a3560918bec20087e9908009a362957ecb06401924789e20b36c26e363db5ae7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00221-of-01024.json.gz": {"num_bytes": 397132000, "checksum": "d8459bb5b6fb6b341b24fe517cfc5dc099765ad70c3383bae913229e06cf99e0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00222-of-01024.json.gz": {"num_bytes": 397138513, "checksum": "20d3c6219921dc9c2928d637000e488635fd9a12b5636de5a6a7e52c1b67d781"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00223-of-01024.json.gz": {"num_bytes": 397167661, "checksum": "43a18accd194646893324537991e0162f6f98a9cec5ff59fe8fb510d81d707bc"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00224-of-01024.json.gz": {"num_bytes": 397905941, "checksum": "a516485cbefdef2e31a493cd8827a5f936f10674ff3525b71d414e17f48241c3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00225-of-01024.json.gz": {"num_bytes": 397218123, "checksum": "791c85c78c5e7f3557855a1fc71acd860521710515b89f92e54e02960549f46e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00226-of-01024.json.gz": {"num_bytes": 396619135, "checksum": "52a36037696e6245efad80e00d1f123c36dbd79e7ff52b1fb99f579e712d2b30"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00227-of-01024.json.gz": {"num_bytes": 396654998, "checksum": "e31123ab579fe95bd50afa10d52a51e9c15a4af28c06583fb5aeac4e3418f129"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00228-of-01024.json.gz": {"num_bytes": 396899165, "checksum": "86481361fff334dee3183fac8ab3f346e44ab3e6e7b35bbd7e6e062b2d2fa0d7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00229-of-01024.json.gz": {"num_bytes": 397489378, "checksum": "bbb717711fb4c78ebe8a0476296a21a50285ec41d9fb9f08d5d66d899577e04a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00230-of-01024.json.gz": {"num_bytes": 397462301, "checksum": "054414aac29b5c8faee71a918f2586ad3fce8ee44c71e7a2e2af4b91e0169523"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00231-of-01024.json.gz": {"num_bytes": 396097584, "checksum": "8136e320fccba75a493954fefbb560f92532be44a6e0990404edae659d48ce1e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00232-of-01024.json.gz": {"num_bytes": 398984795, "checksum": "3d9362aab157beef3b5fcd4a0a0236d59de635a565b1c86423f45b26e8b437b5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00233-of-01024.json.gz": {"num_bytes": 397258012, "checksum": "e1a532922477d17f7cbea7db72c2391d26b4db580e526ebd5a90be23607a8d31"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00234-of-01024.json.gz": {"num_bytes": 398350453, "checksum": "c464829565bcaafdba165b2d886be4580f3c0a516b5417853ffc4fe30049cffe"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00235-of-01024.json.gz": {"num_bytes": 397147353, "checksum": "573a6a1d33ccc6c5b605d381f04d73989504bb6d24514b938e92c3d4f61501e8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00236-of-01024.json.gz": {"num_bytes": 396963006, "checksum": "21318462014bc185d0da7cbd342fddd07521401ca2b73e47eb5cb4bd42a82bbe"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00237-of-01024.json.gz": {"num_bytes": 397087111, "checksum": "49459c97b078726bf8377748d4bb2066bdfa47e2717315a9b3c8075cfc4b9b10"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00238-of-01024.json.gz": {"num_bytes": 396984031, "checksum": "befb46e9f928876edc580c60ea4242f63cf6df77c6c107fec6e4280d279e348d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00239-of-01024.json.gz": {"num_bytes": 395915197, "checksum": "dc5ab17e04e4f2678771094af67909dcaa8be36a6cb047cfa66e75f986c91312"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00240-of-01024.json.gz": {"num_bytes": 398321096, "checksum": "25b92f7a499e9aaf0496a57f6292a7f65941b34dd6c78f14b08358d180070029"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00241-of-01024.json.gz": {"num_bytes": 396626980, "checksum": "1ae21ee5585ec718763a3c7bd70d9338aaf77d0e02f92a41f6ed213d1eefa5b4"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00242-of-01024.json.gz": {"num_bytes": 398220596, "checksum": "c29f98174a0c02a817d5cfa3ebb2a92d5f49df8a34fa40abd360f1b39b4bde05"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00243-of-01024.json.gz": {"num_bytes": 398250083, "checksum": "819387c95ea7183b1f9e1e78d077de65023c4809198ef3a0c946f46f8b6c19b4"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00244-of-01024.json.gz": {"num_bytes": 396943969, "checksum": "7a0b0b984d7afc4181827705212f917cf4ac12412f640a2c8120513763cdb390"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00245-of-01024.json.gz": {"num_bytes": 398365865, "checksum": "a424157137a5eeca89819d600deea2a1619ea8f5ae1ed395c88ac600a85e3afa"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00246-of-01024.json.gz": {"num_bytes": 397285385, "checksum": "73029f721bdaccd9d126e871973e70a551f48f077f5903656b305ea9885c4798"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00247-of-01024.json.gz": {"num_bytes": 397132841, "checksum": "b223cf1270d2c728592ec65b09599bbdef8d64f7df2eb525e114f86268500daa"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00248-of-01024.json.gz": {"num_bytes": 396316645, "checksum": "94102d9bcc086ed5b203bc0c6b830dd245c9bf6c695b23b19922b2a98eeb6a52"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00249-of-01024.json.gz": {"num_bytes": 396644237, "checksum": "36be793f4d76070ba1c696b3274e6dbab43f415c8fbaf752145cc99af6558680"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00250-of-01024.json.gz": {"num_bytes": 395860541, "checksum": "313febcf026d2cd1495fdd3d5ba3b492ce5d5749153e189672b6d9dff3e26a61"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00251-of-01024.json.gz": {"num_bytes": 396709140, "checksum": "7e2480b3d5869ba35007c40e18585f3fa208cdf8e004078cc8de4fac36773507"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00252-of-01024.json.gz": {"num_bytes": 396508847, "checksum": "25df46ae56c0d4a6f945922e31fc697d12e0b7c525be9bc2b8eced802641488d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00253-of-01024.json.gz": {"num_bytes": 396364816, "checksum": "6b2125b9eab9bf893e7f8913a6beedbeeef5de53893fbd6172f706e33bab5177"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00254-of-01024.json.gz": {"num_bytes": 396122930, "checksum": "7947e5152c5305863e2d664622e3de49f9386b4384eb09630c5bfcad21fb458e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00255-of-01024.json.gz": {"num_bytes": 396929803, "checksum": "a1ec8c609ac969c24e2524f0f3dc31ef43ca0147ffe66569d3135e4f28394325"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00256-of-01024.json.gz": {"num_bytes": 398432943, "checksum": "3fd0373f5a8974a3499c436d96ea73be95f5619b8388dc316f51aff01e9ecad7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00257-of-01024.json.gz": {"num_bytes": 396003748, "checksum": "516cf3626076f083962983b2d6c596ef355609492f2e81c6c3cdec01acf8c5d7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00258-of-01024.json.gz": {"num_bytes": 393890690, "checksum": "700760a7764f890c8aae337e7ee458c8467eb9048347edd237e341dd2bd5d236"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00259-of-01024.json.gz": {"num_bytes": 398130606, "checksum": "d868f8ef5e1cc971ffd00908bdc7eace32ec151d7405d7cac5fac22df9ea10c0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00260-of-01024.json.gz": {"num_bytes": 399765969, "checksum": "7d5eb3b88eb8a0291ae70c1997458cf5aecac645397e50a67fab3d1193064353"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00261-of-01024.json.gz": {"num_bytes": 397418895, "checksum": "ca607c9e13d7cfb73a29ee3131f77e6bef3130d8627037cef9f57ed459185f0a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00262-of-01024.json.gz": {"num_bytes": 397925991, "checksum": "ca789394ab4398c41490ec6147a41ffc8847155ea9ff74d7ff8b3402ed0634e8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00263-of-01024.json.gz": {"num_bytes": 397082336, "checksum": "aac81d1bf0ade80758c14d01842b9b06c89ebf2fcdb9a06b1472bf2f70bbc348"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00264-of-01024.json.gz": {"num_bytes": 398101079, "checksum": "3cf56a2989b5c3f26ba94124cc534f5c9ae9770bdc6a3431dd745603b480ab19"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00265-of-01024.json.gz": {"num_bytes": 396949669, "checksum": "d4f252a6c2f43833d6d89bf69337449b4cae5dc88fd08fb20b35fe7194a50ddb"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00266-of-01024.json.gz": {"num_bytes": 396242007, "checksum": "71c745968d8ee4a0d64f38930a76e65d68ea094ba3e0b963d5d6878f65f51b34"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00267-of-01024.json.gz": {"num_bytes": 398342031, "checksum": "706a560c862979594265925c3200d4bd0981a9eaa279841f2cba673634f7074b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00268-of-01024.json.gz": {"num_bytes": 396399468, "checksum": "eb3dea553c37f220b3b9b5f377d5a4ef94243b3c0b6b46981e3e5b7ba5b4a935"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00269-of-01024.json.gz": {"num_bytes": 397181296, "checksum": "4f0feae035dacaeb720ca3b6ea17685144895a0d78cfa358e30983f8d6c4ec76"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00270-of-01024.json.gz": {"num_bytes": 395712883, "checksum": "6e0f6de1e5a5c6d4bf23d0539ee72ecc2b4285da2b0f1ec2cdcc443d2e22aa88"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00271-of-01024.json.gz": {"num_bytes": 398066980, "checksum": "4c5cd1ef1917ed762d7d8c5c54e1da05db74e45721697df8b0626e0aeac96966"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00272-of-01024.json.gz": {"num_bytes": 396667308, "checksum": "77a33c37a5d88e419e2b31cf560d53f129a38e5bc2306b5baccc187b7e94e589"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00273-of-01024.json.gz": {"num_bytes": 396020214, "checksum": "b18e40c00b8e0e02dfac40ea0519964e231c8a2f28bc1294b044fb090f41a9fb"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00274-of-01024.json.gz": {"num_bytes": 396300833, "checksum": "34c8945a6ebac564fe87881d6968d05363a89985f297692a3df7104128b9c26c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00275-of-01024.json.gz": {"num_bytes": 395206463, "checksum": "1e41d7e2a6117224dc23fbaae8e9d20df9d7744adb4687d2b0e570bf8d9e47f2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00276-of-01024.json.gz": {"num_bytes": 396667995, "checksum": "45973b91c2f1140f79265a24f484fc6d6653f43f83d5bd2d18954892dfa4dfae"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00277-of-01024.json.gz": {"num_bytes": 398134029, "checksum": "b7da91889b6695cf01bceddfc139b23f9465bda5cad54088b84a1f5a4d7a4f9a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00278-of-01024.json.gz": {"num_bytes": 397422615, "checksum": "e794a2903bda1f3c082e8f590383c714a518c202ecb99eda5513d6b320f70e86"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00279-of-01024.json.gz": {"num_bytes": 398776175, "checksum": "a5528d3e33151138ef9bdc2433744f1797de2b20673a570de5bd4d81b306354a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00280-of-01024.json.gz": {"num_bytes": 396208086, "checksum": "1be2d8c3d0eca510fac7b06a5401b2b8873bc6dfbf85a3c736301756f9681309"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00281-of-01024.json.gz": {"num_bytes": 396893734, "checksum": "1db3e9017561d38a91c417ffef875b7a948c4f64c51b90b0983c71bc9d950903"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00282-of-01024.json.gz": {"num_bytes": 397411883, "checksum": "4e23d39fcec2c310cbde3fdc5d9c185046086877ac03bbf9d772b092614f93da"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00283-of-01024.json.gz": {"num_bytes": 397906911, "checksum": "850eb5e60b84bca4d2f10b2e511fdb2661e3d08444a07db1782ad85c754fe808"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00284-of-01024.json.gz": {"num_bytes": 396043261, "checksum": "fea24050c6aec13eb706a6f3854b4debde62b1b842f2992fc027820c66218b0f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00285-of-01024.json.gz": {"num_bytes": 396961329, "checksum": "6052f82887cd2362320f72f6545d2e5b5a775e9bef95783c9b9995ecb7a5ecc4"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00286-of-01024.json.gz": {"num_bytes": 395697481, "checksum": "f4361838b5b679c8306447364166c1c3083af392b4c8793399c122af09c7312a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00287-of-01024.json.gz": {"num_bytes": 398773520, "checksum": "9add91f23f31ff8c5d8d84e6a0af75fc6fa08ceef8ccd9b633d8c49aa1d0104d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00288-of-01024.json.gz": {"num_bytes": 397684645, "checksum": "64dc94555a122353c3a3c9999e67d17b0e4b682096ba80be2258c791ce1c2b9d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00289-of-01024.json.gz": {"num_bytes": 396655864, "checksum": "2472c76b1cbcfc3cb82126795673126e8f532119a03722a304396ceee9b7db3a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00290-of-01024.json.gz": {"num_bytes": 397415313, "checksum": "960b71edbdc6a6a62a0d3cc1069bbbfb11893cc017aba543e10c9a23cb759d1b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00291-of-01024.json.gz": {"num_bytes": 395617977, "checksum": "96e582d7a750bee597331f373ec2e16d3a9686f48a49d39765d39550c8cbbad8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00292-of-01024.json.gz": {"num_bytes": 399332500, "checksum": "cd6ec4941aa5babbe274684945bf899447ec2459b8f7076ec8c74d2b3fe794c5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00293-of-01024.json.gz": {"num_bytes": 397021546, "checksum": "d0d0c4d80e75c5d02103b49027d9e2e6f7db74c12f8b53f600d7fe420b2d0a7a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00294-of-01024.json.gz": {"num_bytes": 396272726, "checksum": "caf5708a6989f867ec6c4c56f338aca9f3a43a1806a27ef473d9b0f219001cb4"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00295-of-01024.json.gz": {"num_bytes": 395233811, "checksum": "a7b5f904e34c0b370238e6beb19149d4bb96d0cce43a1eca3bfaf181952ede53"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00296-of-01024.json.gz": {"num_bytes": 396480926, "checksum": "4fcf284d98c2f7b63e47573e9d084eeec2516fbfa62be42c3ff94e1cf518e313"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00297-of-01024.json.gz": {"num_bytes": 398883718, "checksum": "c1cb458076497e7dee645f50281d1af2fe5dad556d28a2cbbd73abe6537c8a9d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00298-of-01024.json.gz": {"num_bytes": 398733629, "checksum": "4a612c715025292e62860fb0018e9fa2d3fade692342746d044be6297e25a034"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00299-of-01024.json.gz": {"num_bytes": 398155026, "checksum": "d33f4043fad9551f92084a45b7f54d920ded9d6fec271cbbf85f71b021f9ee4f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00300-of-01024.json.gz": {"num_bytes": 398612975, "checksum": "61b1181b796a2f40db3cb6954f2890397c3722c486dccd4075d74679cf61a70c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00301-of-01024.json.gz": {"num_bytes": 395385748, "checksum": "95a78e9d3cece0620430c85822fedf4021ebd88ece57d6714933c268d3b6af6c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00302-of-01024.json.gz": {"num_bytes": 397620059, "checksum": "321aed402a5e779febe9766294ad040a3f8dcf57bae68648c03d3c59023aafa3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00303-of-01024.json.gz": {"num_bytes": 396549027, "checksum": "4198f6a2b5bdaf90ac4251f013908123a5964429870ccd6b245a9069278c4e17"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00304-of-01024.json.gz": {"num_bytes": 396596460, "checksum": "74a6440e93d18d0d6d0622ab7d8832d7ccc91c03297faf20c8090d16f7c042d6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00305-of-01024.json.gz": {"num_bytes": 394881271, "checksum": "654deec494bba4eece19c27140426049574cf529c93ccb422fcc09fe4496af15"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00306-of-01024.json.gz": {"num_bytes": 397760377, "checksum": "e0840cbc94db6cfc35df66d413a11261756392dd59b0fdf89d9ff166ec76f3e5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00307-of-01024.json.gz": {"num_bytes": 396671816, "checksum": "31ceb8cfcd09fda621a9a483b09dfb43f5436e867363f6736ea3f710a6af10fa"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00308-of-01024.json.gz": {"num_bytes": 395961013, "checksum": "8c1e5acc3f964eaa5aff300731a74dde84ed0671cd764b121ea638fb08c3dd0b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00309-of-01024.json.gz": {"num_bytes": 396035179, "checksum": "7d555942b1bcb2518aa5ff9c0549d98fabe7bb563cdc6c73d3f11e6a0bc502b4"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00310-of-01024.json.gz": {"num_bytes": 397140669, "checksum": "859eeb7a9d2ed03d5299bbf7f1c3e719236477950d7601112a458ea5a2adf7c9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00311-of-01024.json.gz": {"num_bytes": 398170419, "checksum": "1e7661637b0a4445119ba403e4f8ede129c829fb7d1907ca7660870b536b8b29"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00312-of-01024.json.gz": {"num_bytes": 395605627, "checksum": "87a3ccd2ac9deff1ac4a5dd02bba269a48692d4598c5899630e8d2e4136dbb99"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00313-of-01024.json.gz": {"num_bytes": 397081206, "checksum": "c6952116cf573a6e20c849cf1b7d8d0edf3b9d00fc7e717e7bacde915c4c52a8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00314-of-01024.json.gz": {"num_bytes": 395555727, "checksum": "762066fd85c596ee01b3b8070708517cc5759bb1e3c4bb65f4645fd62b550d13"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00315-of-01024.json.gz": {"num_bytes": 397871218, "checksum": "814f19cc5e81144f5bfd7037f5f522dd5c44faf150c10337c675174a5965a5b9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00316-of-01024.json.gz": {"num_bytes": 398577523, "checksum": "27643c7c3c0a1a78c9003b936ea27785709a2df80d09817278a179eecaedc352"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00317-of-01024.json.gz": {"num_bytes": 396388623, "checksum": "5f840180e2017c41c6b1c865784788dc3b002478a9ecb43c3859174af788ba5b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00318-of-01024.json.gz": {"num_bytes": 396173471, "checksum": "2aeab99fbc84a2640a05081e2c7438451e75f76cbece3cbe5d82e85463a61966"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00319-of-01024.json.gz": {"num_bytes": 397912127, "checksum": "fda805ed19f4b996b048386f4bd73924dc965a069e85b8b4452a54a1372375fb"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00320-of-01024.json.gz": {"num_bytes": 398765416, "checksum": "bce244d024c076911c1c6dbd35609be5442c8b0440690e2cbb342ac64bdc494b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00321-of-01024.json.gz": {"num_bytes": 396005962, "checksum": "763584ee096223b8aeffb1576ec6e4f3bea674ec4de40fa163c2f2221b3701d9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00322-of-01024.json.gz": {"num_bytes": 398615672, "checksum": "5c12ec1d0c450fb7515c586f24311bad145050dfc64180d65bacbd346c2ce9c4"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00323-of-01024.json.gz": {"num_bytes": 397861187, "checksum": "93326f43273fb963593e0b1caab1e9588387291c23d5c14b5ae40b46b199998c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00324-of-01024.json.gz": {"num_bytes": 396679008, "checksum": "6ebfe6e28851e6d79cfdbf370602373fc2136e88936eece302ecaa8ef8251827"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00325-of-01024.json.gz": {"num_bytes": 396358086, "checksum": "51190fbfd48479842ec3c7d910b5519e01ff797ca0143c39be142c1650c5e893"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00326-of-01024.json.gz": {"num_bytes": 396490692, "checksum": "f4d9bbfd1bbc6e939fce9a2df26e45c79be73dbe2650fe79af395bdaa39cd121"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00327-of-01024.json.gz": {"num_bytes": 398354656, "checksum": "c70c824b6c16e5fad922ec9b8d363d97bed90501522b641b0eb0f66b8c086325"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00328-of-01024.json.gz": {"num_bytes": 397326336, "checksum": "7e6008433a0e5bc6eed28a13b9dba17246e7d65ca96c31092086c3546a3a397b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00329-of-01024.json.gz": {"num_bytes": 396390524, "checksum": "f379d844a35172424554bb82a65c790c354b76c0e7abfd868225d1968017d1a5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00330-of-01024.json.gz": {"num_bytes": 398259199, "checksum": "ea15be4a83c3de66c42410e13e5ef9c93baf86099a8eded1c1d10b0cd5ad0f29"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00331-of-01024.json.gz": {"num_bytes": 397618860, "checksum": "7b6aad6224ead9ee3a0c860cfd991301ef5e97093b23c76d713e73f4911d0e44"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00332-of-01024.json.gz": {"num_bytes": 396743573, "checksum": "bc5333d383020d2296aa0f6ec940ab586a367efe50d1c597f9db55ca72fa66e0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00333-of-01024.json.gz": {"num_bytes": 397460128, "checksum": "095b3a85a9598009638622ca21cb00142efa0d68196c8c3a8bb922cccb465e8c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00334-of-01024.json.gz": {"num_bytes": 396900262, "checksum": "6f005575f4843b84f4512e1b7c1b748edf497e4e9f55eaae47f9b4637161ccab"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00335-of-01024.json.gz": {"num_bytes": 396106895, "checksum": "66bfe399d0859f71c20db01de53ca7bf997b33afcd3d181f181d9f265a2c2fa2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00336-of-01024.json.gz": {"num_bytes": 397732616, "checksum": "1f1e0435de870b98b119e91edd4a0d32d078dbb810f919a70b85360cd860f0cc"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00337-of-01024.json.gz": {"num_bytes": 397834763, "checksum": "1db4bcdaa6fca612c3f1b38dad6d5402679ca21aa6a545850d61bcda10103697"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00338-of-01024.json.gz": {"num_bytes": 396712179, "checksum": "810c104a8862699c490fc8625a7be4115872fe2de4d8c061e095dc5a81eb4d19"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00339-of-01024.json.gz": {"num_bytes": 396838831, "checksum": "9bbc616d5c4aba46475957a22544dbdb0557f8de31cdf919718fbfe55bc70ac8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00340-of-01024.json.gz": {"num_bytes": 395587861, "checksum": "48c8411ee2b5fc8cffe1589ed204d0ac8a12b5b3bb1857373f84bae984d49e8b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00341-of-01024.json.gz": {"num_bytes": 398093153, "checksum": "4ff8ba83e489580da2401aaa23ca3329befe8fc08b6f299b612950c358688604"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00342-of-01024.json.gz": {"num_bytes": 397248009, "checksum": "c72e063f95d10ce661b4bc97538eccf6da6ad493b7e54da555a46e4a47aabbed"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00343-of-01024.json.gz": {"num_bytes": 395939409, "checksum": "249eb2080c55402aab34a31a442b06bcaa25d2df3f4319ea1a5f50dc6bb709b0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00344-of-01024.json.gz": {"num_bytes": 397608807, "checksum": "8cc57604fcc5fa920b0d16df6e8d8b7f4ca88c0c76c86f9ac81f42a615b330e7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00345-of-01024.json.gz": {"num_bytes": 395751274, "checksum": "13fbc76e49a8b856f7563b945bef10d786a86caff63b4cebea50416ca34932ad"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00346-of-01024.json.gz": {"num_bytes": 395516794, "checksum": "61d43da2e3e7770016ba7235eaa74a1e6a180e64cd2cfacefed5c34e8b72eca7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00347-of-01024.json.gz": {"num_bytes": 396180000, "checksum": "4a0ca2103de168d05d0090c8800d47f216cc167a9cfe9e736403aedf040c5e46"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00348-of-01024.json.gz": {"num_bytes": 398461180, "checksum": "a56396961496499ac289a85d126b916132e787d0dc4fbd9961aca7dbbc7cfcff"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00349-of-01024.json.gz": {"num_bytes": 398049366, "checksum": "ca012572c575f6a8e6ad6453296ff93f22118995c17928e76b655da44ce5810b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00350-of-01024.json.gz": {"num_bytes": 396532962, "checksum": "bb35d17862201063b46d8745dc182756d1bb09e809c4c355452ab1967e655491"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00351-of-01024.json.gz": {"num_bytes": 396576223, "checksum": "19ea45ab2fe5487d2a69cca7c9a1db7a09c8d5dfdf130412bbcd241cc60a61c5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00352-of-01024.json.gz": {"num_bytes": 395956381, "checksum": "bb5869b8649fffadd5f1945ca9a79588e84081a8fc45b7e4cb5507149b5be2d9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00353-of-01024.json.gz": {"num_bytes": 398903623, "checksum": "cb16a7ecadd28a8b5622c4e581f463f0ae2fe20a3e6582fa6885d76e7523715a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00354-of-01024.json.gz": {"num_bytes": 397316693, "checksum": "42aea18548695c458ddc229d8c837356845609aca3bb64ce6e07b185443b9468"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00355-of-01024.json.gz": {"num_bytes": 396240550, "checksum": "1577d76807548d83427293b9f534a3261fb72a345569f0491a1fd2691047bd92"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00356-of-01024.json.gz": {"num_bytes": 396132315, "checksum": "b6e17a39292e082e517082b23b381305ebe889c2530fb5eb74a2683d36d07a86"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00357-of-01024.json.gz": {"num_bytes": 395948117, "checksum": "524ebed10c881f52f155db5d6690806f5a97aa8f811deadae916323b50427ed5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00358-of-01024.json.gz": {"num_bytes": 397397242, "checksum": "8e23d852bc3a0dda4684d5fd511003ad6f18232e5f54e32638c8db62e9d18c6b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00359-of-01024.json.gz": {"num_bytes": 396141321, "checksum": "345c34dafbc59f5e93355c8b2e6fcde6bf59bc9e1ebbf5cb962d54228e6d3204"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00360-of-01024.json.gz": {"num_bytes": 397258644, "checksum": "51db06055d95e2b43fddebf8c2b7d76b7572745f129d89fe005f8e5d3f12b758"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00361-of-01024.json.gz": {"num_bytes": 397913411, "checksum": "2c0f6054fef084d3e7cd10e2de0b1d3a48dc716af1e9146548195df128bdaba9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00362-of-01024.json.gz": {"num_bytes": 397722576, "checksum": "664b390b20498eb6e78fc09604b3a947fc1847a01e3eaae4c7861d1dde3b90fb"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00363-of-01024.json.gz": {"num_bytes": 395416894, "checksum": "c57529884c6d4977a279a097c0dfbcc31d52048cdcf64950182c743583d7989a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00364-of-01024.json.gz": {"num_bytes": 397028679, "checksum": "ed4f252d63c679f6e3f35847e0871c3360e072b0d6963f662d7e808b6615457f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00365-of-01024.json.gz": {"num_bytes": 397574891, "checksum": "68e8e44a531d98897245fee90ad349f4fdee891b2f68dfda78a1dedcc9474326"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00366-of-01024.json.gz": {"num_bytes": 396905692, "checksum": "9e88b888d85633671e009ed7093763b934a42054ed6a1252222dc64781a20e22"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00367-of-01024.json.gz": {"num_bytes": 396802011, "checksum": "2abaf3f3946788258b8543fa2ccccc0c20e6980b9d26a38decd356e67f575fa1"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00368-of-01024.json.gz": {"num_bytes": 395630737, "checksum": "b4960e3395d8a1bf8350f57e5f6280b00443a4c6b85e6fd47478fbbfc1733caf"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00369-of-01024.json.gz": {"num_bytes": 396228047, "checksum": "08e8210426e6c6ef9746675592a3eea4a92eff9aa4bb7ffc6bf6ba54bc411f72"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00370-of-01024.json.gz": {"num_bytes": 396548482, "checksum": "10e0305ac4d1e410d749637e0c03386d969563f8eb73bbbc376fc1d21025e4ee"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00371-of-01024.json.gz": {"num_bytes": 397344482, "checksum": "03df0f4aa5c377f6b45db3c3b863240bfb1211ddb226bc055433fbcd9ee8e873"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00372-of-01024.json.gz": {"num_bytes": 395872223, "checksum": "9b70549213cb01595179928cdb020daaf7bcd2085c5e947d111f3cc66e406d2c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00373-of-01024.json.gz": {"num_bytes": 397399096, "checksum": "945c204cdb107669a8d1252a91323eb300c902bdd6c6a8167a90805ec02cba9b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00374-of-01024.json.gz": {"num_bytes": 397755002, "checksum": "8353d4383f73caceb5d112f260b37d1349dc7898af2d05b98ffe17d22aea97ca"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00375-of-01024.json.gz": {"num_bytes": 396534763, "checksum": "a3de41388a6d8ce3b605c6586e47b74a565dd2f54175551987bda0a0ff95036f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00376-of-01024.json.gz": {"num_bytes": 395594630, "checksum": "7cadf813f2b31a1bfe44fdfc84aef4eb65e889c2616c56b189890734c22b731f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00377-of-01024.json.gz": {"num_bytes": 398241040, "checksum": "15df154b52cb4d9314dbc4ac26ca4b4df7125b12131d538fd480f8a6b3fbdfc8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00378-of-01024.json.gz": {"num_bytes": 397217224, "checksum": "208ce680427f62d78dad857bee91122a79f968589b4e44f2f89919e91f4dea30"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00379-of-01024.json.gz": {"num_bytes": 398504097, "checksum": "0052fe7f27e720423b6143f401b8618428d913b22fc2af2950874785e2ef7528"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00380-of-01024.json.gz": {"num_bytes": 397494149, "checksum": "15c4f07a2629c7bd79b243c97367e3e18de02b5ab09eccc0f85b1eba0e0b071a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00381-of-01024.json.gz": {"num_bytes": 397190859, "checksum": "77c71b4a79ac2f462040ea0e8408fdb8f719fac0f09fadb760ed00b709e9dea5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00382-of-01024.json.gz": {"num_bytes": 398126420, "checksum": "aa44d029398c33f733065c489ab3ded9395f6e53263407173b6e9c27b6fb9c45"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00383-of-01024.json.gz": {"num_bytes": 399108296, "checksum": "f507161fbe96f8abe9dedccba2458448719e6b153bcc1256ecee6b4b9c82256e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00384-of-01024.json.gz": {"num_bytes": 396156787, "checksum": "83c236bbc8508fb81992c837751a4d8ad4b9bc138dd1f4bb5c1fcc68203e12da"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00385-of-01024.json.gz": {"num_bytes": 396878483, "checksum": "df45b4749951a46695f88789fc536617ee3470083e55562292f606e09185e4a6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00386-of-01024.json.gz": {"num_bytes": 397495799, "checksum": "a8240c9e7266e47bda8880e38ac8a5afa8541aed4b989d6642b31497716a51ac"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00387-of-01024.json.gz": {"num_bytes": 397062301, "checksum": "e6fd54ea6f17d5570fa4cc97554813a7a33bd4e44cbc456b27b0c87c1af22c60"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00388-of-01024.json.gz": {"num_bytes": 397074091, "checksum": "fdc2a134df4a669deb839f26947c86b7e7a4bc7596a6a1c25562cb97fbb6b089"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00389-of-01024.json.gz": {"num_bytes": 397056868, "checksum": "e7390f0007582a3460fa67375b2628c85a1aa85954796d8e6584fadcb35761cc"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00390-of-01024.json.gz": {"num_bytes": 396404332, "checksum": "820a97060abd3172852f38e1636706c8389adad8495de56f4c3a2c3ba6008235"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00391-of-01024.json.gz": {"num_bytes": 397125489, "checksum": "68732c5ab9f4b6945e79ce2a1b45b97a97822d6a107aa79aa9135f29d91173ab"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00392-of-01024.json.gz": {"num_bytes": 394992472, "checksum": "c9d1e8cfd481631a76544e5880ceee9990e7553c88c5978a91b48ec8aa47717d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00393-of-01024.json.gz": {"num_bytes": 394778146, "checksum": "7a5ec4f0878f676a3ac2c417f512186066d793f28d611f97135c3626b3b60fdd"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00394-of-01024.json.gz": {"num_bytes": 397024190, "checksum": "44e32db5a39684ab1789cfe97b6e9cbd3c539390e7a4c8ec9298e7177945452b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00395-of-01024.json.gz": {"num_bytes": 396537190, "checksum": "601ec281240753ac5793ec7cb83802a788c4d88e56dfd83e6c875cf2ef9bd8f1"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00396-of-01024.json.gz": {"num_bytes": 398049705, "checksum": "b1024b69e191b2c7073f5f4f3ea51e8710be54db8603ce8aaabbfb919ea6694d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00397-of-01024.json.gz": {"num_bytes": 396670567, "checksum": "11357bc600f9b0c443f124c7fa4046d10cf03e19016e5ba8cdde884d2ff76c9b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00398-of-01024.json.gz": {"num_bytes": 394706629, "checksum": "778eca6d845b9a7d49e22941b959a95e5e4d2d9714720f27b810230d136acfde"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00399-of-01024.json.gz": {"num_bytes": 398257272, "checksum": "27c2a30af83975d32469e85fb2e27953a3aa9f97514f621063325cb9af1829fa"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00400-of-01024.json.gz": {"num_bytes": 398732278, "checksum": "aff9a39748526a03d3476288cdbce122c3683baf113362e9085895609d03c3c8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00401-of-01024.json.gz": {"num_bytes": 396372632, "checksum": "a6af262bb962eb1c45d2003ee1bb2be1a3a12cb3e53d4ffe58b4b68dd852957f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00402-of-01024.json.gz": {"num_bytes": 396783625, "checksum": "db9aca12012da21fc5a0619a47e9c3075959786d6d6d74f6a244af1cb33c402d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00403-of-01024.json.gz": {"num_bytes": 396950960, "checksum": "b3566f7b9251f6aea9343d1344151f10fc104464f92e8f10a97742defffc2244"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00404-of-01024.json.gz": {"num_bytes": 398481154, "checksum": "897904040b5887620b9996cf89656f5bff329a430a8c3dfd6802d0c879675376"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00405-of-01024.json.gz": {"num_bytes": 396065216, "checksum": "45e0108549ab06d9a8ad5c45dc53250798d0e58f7e940080a754106801250009"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00406-of-01024.json.gz": {"num_bytes": 395637879, "checksum": "bda70f3a19b19e2ffdd1c3a26b959945b447acd450cab49e72ce727d2218af5f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00407-of-01024.json.gz": {"num_bytes": 398356109, "checksum": "1df9e8b4715d9a3f02a0b06aef6095f81d38acd1be0b4fa402acaac0258c3116"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00408-of-01024.json.gz": {"num_bytes": 396041456, "checksum": "e89ebf354280543204e78f4308a8f8751cc26094524628cd8e9cb691d9911b82"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00409-of-01024.json.gz": {"num_bytes": 396254329, "checksum": "15729474174d6a5adb5935f25afa6de2f03a8dd2f73b780e23795ede92f5762d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00410-of-01024.json.gz": {"num_bytes": 397850848, "checksum": "98f1b8fc845e0005b76d7eac70a430ce98e6989569344ea92266f8391b1396fe"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00411-of-01024.json.gz": {"num_bytes": 395527322, "checksum": "52b2e31f2adb61c8e703c6758016cbfc650f8104dcd5f78867c81434be155ea6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00412-of-01024.json.gz": {"num_bytes": 396155992, "checksum": "7b6b4192f9bec4fdeaf9d6dcabd9cbba6b4c8ebb42d26730fea21bad139823c0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00413-of-01024.json.gz": {"num_bytes": 395766377, "checksum": "775d1fac6b1708ba0384d922640b2f372b3ee146fc79fbe692ff69a7c6c699b1"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00414-of-01024.json.gz": {"num_bytes": 394860848, "checksum": "0386d8a8e0cc9d5d613b1f84085791de57ad05751d94d25681d86dff5cec1afb"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00415-of-01024.json.gz": {"num_bytes": 397566065, "checksum": "1957b0d185943b1952dc66e78f0a7d449f49f8f55fc0978bf77e8dde10f4714d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00416-of-01024.json.gz": {"num_bytes": 396297306, "checksum": "3f8796934edb79d172e682511a5ed7666aa09ff541ce55e2c66406bdb6eeda9d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00417-of-01024.json.gz": {"num_bytes": 398314475, "checksum": "8da08075b966c04aa7859275eefd34c78cd2b9edc366684733d027ad6d619ba7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00418-of-01024.json.gz": {"num_bytes": 396296110, "checksum": "efe43733ebfc7b65c646aee68b883cf40124c1446a28e70ff2bfa9e1bb1377cc"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00419-of-01024.json.gz": {"num_bytes": 397614415, "checksum": "c0f02d78715de9c3ea0c684dad36a506386081fed2011ec298ca0ee623c7792e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00420-of-01024.json.gz": {"num_bytes": 395133656, "checksum": "6237f5797a35dcdd89a0b70cac4dedcfb3fe418560f8dbbf6cad685f11c870b2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00421-of-01024.json.gz": {"num_bytes": 397061849, "checksum": "ee37899a6a49269026633ec79577491ff4b11e219e0236dcba68eb168279067b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00422-of-01024.json.gz": {"num_bytes": 396539584, "checksum": "e5914a4b97c27da82eaee2f4f67a165de946bb38a00d6126b1527f5eb1200417"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00423-of-01024.json.gz": {"num_bytes": 397715346, "checksum": "b99e628f8790a7baa8ee7828e31f2ec72374f9a8390c1d64c9b8092b10d9c7fe"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00424-of-01024.json.gz": {"num_bytes": 396335469, "checksum": "9cb3b9eb00760bb68f3df4b66b96f1e5798c338231500472fd64c49cd87c6599"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00425-of-01024.json.gz": {"num_bytes": 396714466, "checksum": "f28d4901ccde8eb7afcede9732ab94fd18c49e0e3731659ef587058d6ea2ab28"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00426-of-01024.json.gz": {"num_bytes": 395566563, "checksum": "9ab75a89a425ce974fd36e936476a30db913c2d7c9ca6e5522b91ffbcbbe30cf"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00427-of-01024.json.gz": {"num_bytes": 395379035, "checksum": "5e1ca658bea5ba5506afbb9ae5a5da4d35cdc3a215478c68e11652a7d5d918f5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00428-of-01024.json.gz": {"num_bytes": 396419259, "checksum": "d740b37b576bcde0e1c8eee27c3bfb3b58c1a0d3c5b471001804b2a37f277ac9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00429-of-01024.json.gz": {"num_bytes": 397116774, "checksum": "d1c10b0ba72aa2d4cb4640d1263c32868190942b1e93b4bb4e9798e25f10ba67"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00430-of-01024.json.gz": {"num_bytes": 396634586, "checksum": "11dec038b4c1c35d32d000915812b6ec8da9abbbec2e15f7493551198b6a1ef3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00431-of-01024.json.gz": {"num_bytes": 396704705, "checksum": "efdfdef444cf68fc05090107033ffe2ac906b6efe2fc138e90f47cd4bd0b6204"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00432-of-01024.json.gz": {"num_bytes": 396264701, "checksum": "fa649c2e2dbc992408c3a60327e5d5ace4697c84010446bb286e544eb6c604be"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00433-of-01024.json.gz": {"num_bytes": 396887722, "checksum": "3d5fd3fbf209dfff2057143a3dcf7eceeccb1e85967a9a85a992f465e3522335"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00434-of-01024.json.gz": {"num_bytes": 398856291, "checksum": "ab6dc5343b052da901f4671c1cb3173850fbc6bbfac2623ca14936b2b83d9667"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00435-of-01024.json.gz": {"num_bytes": 395888569, "checksum": "26abd1e2263af02f998705501bd02ead2edc3d7f68fadc7b198e7fcf4dffc454"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00436-of-01024.json.gz": {"num_bytes": 396976077, "checksum": "a5dadf6ec93e8dcd62b0e1de3cb03c866147bafe0da8e631341663ccc03bb801"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00437-of-01024.json.gz": {"num_bytes": 395809168, "checksum": "7f98e98270f9b88570b5e498511ee65d07428db604af349ef9107dbcf65ac4e5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00438-of-01024.json.gz": {"num_bytes": 399136723, "checksum": "0e03ec507b90b38d5b6d7dfe27d40e127efdc9a0bae349bea2e743375ea29b9d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00439-of-01024.json.gz": {"num_bytes": 396435416, "checksum": "5f868ba66ea32a23be4a926fda0a86d0d2ab4948326e1ebac615fa16a2a6864d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00440-of-01024.json.gz": {"num_bytes": 397487165, "checksum": "d30005787e7472313982cf2860e0a0764900b82a7bf616da27e6c1c3298eb215"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00441-of-01024.json.gz": {"num_bytes": 395968030, "checksum": "181461b447d88040130c3348ae7d22f220e0f97ace030d6f54301a9a3d483fc7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00442-of-01024.json.gz": {"num_bytes": 396909150, "checksum": "0854cd3454047e0c6a0746ef21e0cbbb22fbdf4349c2e668f4fa1e49add183c1"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00443-of-01024.json.gz": {"num_bytes": 396271897, "checksum": "2493db29dd3cadef3719576c34213496eff807df5ae8cf538f13e84d403fec77"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00444-of-01024.json.gz": {"num_bytes": 395540084, "checksum": "5e717d9e0c1b6f728df0f206e422a0958a537dddf31fffa4d699e5bf4b3c2b16"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00445-of-01024.json.gz": {"num_bytes": 398750991, "checksum": "b8af9d413da48fb5f9a9174b12ad253b2eb2c1ed7709cab710d66710841568e3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00446-of-01024.json.gz": {"num_bytes": 397575547, "checksum": "2bad5a914cb9f2e5e99d76afbf85eef66c18e7c1cf2e11c5d455792ae86ab441"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00447-of-01024.json.gz": {"num_bytes": 398035036, "checksum": "d834925674a33ed5eb8fcb335fd81b95e4ab882010e434e3fb9323e0f23be2bc"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00448-of-01024.json.gz": {"num_bytes": 398658613, "checksum": "16f3ac40180e47b9b97998f5d1d7c0e9336e2fee5612a3397fd161937f7a2b07"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00449-of-01024.json.gz": {"num_bytes": 397934476, "checksum": "09dd3d5a529f62b10d1ec97f37ed142315190fb437be3f50987ee955b11f7672"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00450-of-01024.json.gz": {"num_bytes": 396444119, "checksum": "8a25c11e0adc5fdf50944767fbfbf01a9c35b3c0e07205c7c06288d1f68b4c10"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00451-of-01024.json.gz": {"num_bytes": 395963541, "checksum": "f3ac2e295ca4b3ca1f55c8b500ea2588f1519163cec381297ad4bef390fbbe1c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00452-of-01024.json.gz": {"num_bytes": 396594911, "checksum": "25a57709e934077c2972f0f8a1a9db7afe9b7558ab023bd6ee5224b2f8cd770a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00453-of-01024.json.gz": {"num_bytes": 396745507, "checksum": "75c1a4803bb58efe5df885bccd13596d46dd1f3ea30899a7e83812167b990bde"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00454-of-01024.json.gz": {"num_bytes": 396193342, "checksum": "c151679573ea5f5b52e26e8b50da7e14760d1ec15c63a5b864b648190efd48f4"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00455-of-01024.json.gz": {"num_bytes": 398096160, "checksum": "7f86270b13ee4133adaa06de809f26ef581229407813fca05db521d9d36880dd"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00456-of-01024.json.gz": {"num_bytes": 398965570, "checksum": "d5b292189c5d318e0ad622eec1e764993084d0477147f51f29acd637935fec5c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00457-of-01024.json.gz": {"num_bytes": 396672892, "checksum": "8b490f615b3ed701390ed671d5645dec4aa3fc576a032da8f9d434087c1eb8c0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00458-of-01024.json.gz": {"num_bytes": 396911580, "checksum": "8bcadc16baaa4e36fe17ffc0862c264230385e18bbd861671ad5fd8cbb86404d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00459-of-01024.json.gz": {"num_bytes": 395969213, "checksum": "b8ff8371a01d7bd1782044058ee0f53d4d1275ebca0870ba16104c1c4b12f07c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00460-of-01024.json.gz": {"num_bytes": 396928338, "checksum": "23dde1fe55277467d6d2385684b71e90e9066e6a3c349a1da30a1487e87c8539"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00461-of-01024.json.gz": {"num_bytes": 400009637, "checksum": "34b98d46d207c5b6ea7416fab6f3cfcb1444cdc19376464ae9abb9296fd14c3b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00462-of-01024.json.gz": {"num_bytes": 398107677, "checksum": "2031735c0f38ce43e37a5bb1b9728fc37c758fc4af71758c3d3b9535716a3253"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00463-of-01024.json.gz": {"num_bytes": 395503017, "checksum": "7820184904183fad9a61b6c638df9de11d4624bb3aca08885b842255172cecee"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00464-of-01024.json.gz": {"num_bytes": 397493281, "checksum": "b39b1b1e6686014a3c62e74912ec3b915dfc161b62e2d1108410354e6dec760a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00465-of-01024.json.gz": {"num_bytes": 397080149, "checksum": "a65cc7f590cc498da334d5a8653e818421e09e5e6ce2e8bc2a29ac67a02c3d43"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00466-of-01024.json.gz": {"num_bytes": 396633690, "checksum": "15d891873ba02923893cbc8c42adc0468bb39161f898a810037cc2e9f82e0796"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00467-of-01024.json.gz": {"num_bytes": 395045117, "checksum": "711686ff5478ec35ccaaf1549b7a33b941e322585f702257dfe2d31630245ba9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00468-of-01024.json.gz": {"num_bytes": 399486439, "checksum": "59c4599c8610f4c54778daedbb358f5e26fa527f8f94c3364b70565ebc90571e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00469-of-01024.json.gz": {"num_bytes": 396170105, "checksum": "4263dbb03135c2d8b16fb323208f98fe1a1ff1223e76a7ba085f881411a0ab95"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00470-of-01024.json.gz": {"num_bytes": 397479432, "checksum": "2db90de8f4d2bde9af453478ed4667166f636af701bb487095311f99b28e59bd"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00471-of-01024.json.gz": {"num_bytes": 396679096, "checksum": "caea3c4744adb89f006d9b0d9ef93241a55c1fc165cb0cd62b6d07fa3a40cdc0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00472-of-01024.json.gz": {"num_bytes": 397080237, "checksum": "34995676d953f4c95f8bd4f54fba8f92b86189cd73298ab77ee2702611b86e5e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00473-of-01024.json.gz": {"num_bytes": 397881706, "checksum": "c0fc6c68ae509d8273e7ca0efbe24f1452a57dcb000f44f550fe9600fd305e62"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00474-of-01024.json.gz": {"num_bytes": 397705270, "checksum": "50aeb620f8c03a2e4f2346a0c79a4509adfae084ffbeff0b86d8892b858a821d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00475-of-01024.json.gz": {"num_bytes": 397201717, "checksum": "4fa508d23abd417bdb0b0e7a61f9aedfb770609214cd85b10b4bde7ced7f12b4"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00476-of-01024.json.gz": {"num_bytes": 397522775, "checksum": "27da6164865687041e4f53d9ecec2edc877b147da5b424acbac2c69480132a08"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00477-of-01024.json.gz": {"num_bytes": 397323156, "checksum": "e40115fc4901a3930494652ce9ee7abb0c3f41abc6d6c58c81fa75a0ee752db8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00478-of-01024.json.gz": {"num_bytes": 397380721, "checksum": "79a16b7016aed0eec375ca383eb316765687f12421f786b2e133faa5690ef197"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00479-of-01024.json.gz": {"num_bytes": 396828680, "checksum": "08185ce3c3e5b01552be7d8f08ed5b27a6b1b121bb2d7d70a78b7074fee02fa3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00480-of-01024.json.gz": {"num_bytes": 398678311, "checksum": "37a5804dafb2f4aff9e393af5b127c3577ab8a5dd23f1e41f2304b25a4c428a6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00481-of-01024.json.gz": {"num_bytes": 397654112, "checksum": "47ce12535b753d8936ce3b569675e76cb6f638bfb74a93caf201f3ffc409d71a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00482-of-01024.json.gz": {"num_bytes": 396387301, "checksum": "1d07828a199bb1e1c0c8342ba99e484093557188370d1ced90803c2615d24b7b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00483-of-01024.json.gz": {"num_bytes": 397178863, "checksum": "b6499612fac654798010e11c27ee8a25fc05d1dbed8aaf2338fd0ea377dc4732"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00484-of-01024.json.gz": {"num_bytes": 395826769, "checksum": "ce197ad5a226249bbba53c34b9f3c83508b542853748c3094a5b98befb537f2d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00485-of-01024.json.gz": {"num_bytes": 397100006, "checksum": "f483044a4a0418b695e0b989f0fd03bfa79df01b649991f2356443bcb29d0820"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00486-of-01024.json.gz": {"num_bytes": 397658615, "checksum": "297beef7b85dc128a6a58d834c5fd1b24bd7fe84c7a317500461720c742235f1"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00487-of-01024.json.gz": {"num_bytes": 396904673, "checksum": "06751938694fad1645ed575208e8e2c1efebb7165b4feb2d0ea871dc348741f8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00488-of-01024.json.gz": {"num_bytes": 398019631, "checksum": "eb58bf8b011fedf15835841317e445e9e757c9939b4453a013233f020f98a697"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00489-of-01024.json.gz": {"num_bytes": 395822836, "checksum": "b339e33e7affbdaf691852d3668ff79adf8476a3c33eb86ad9f4ad4a6ebbf3dc"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00490-of-01024.json.gz": {"num_bytes": 398410737, "checksum": "4d8356cf804474538772c5520e77e75ac750dce3e6b103c9feab49ccd46a58ff"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00491-of-01024.json.gz": {"num_bytes": 396607853, "checksum": "1757097fb884d03aa288a05870016b1c2b9f1700ac5913d85c9821cf2e367702"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00492-of-01024.json.gz": {"num_bytes": 397612443, "checksum": "92e98e431a378e0402d81299c49209c66d39b0ba7ae63711f8d6ecf542f5fdf7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00493-of-01024.json.gz": {"num_bytes": 395595466, "checksum": "d839e1763aa6ebc7cbcf1b870d947ba45b0b4ac95b0adbe4941a0b121690a311"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00494-of-01024.json.gz": {"num_bytes": 400397068, "checksum": "31caeb5f0ef694c06ce434df44c01f4a91fcd48e4acb4f1bf167eae6e59a02de"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00495-of-01024.json.gz": {"num_bytes": 396458630, "checksum": "26291dfcae5145cdc306317ecf95851a3f693b4a7c6e132e55384ec69d85ef3c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00496-of-01024.json.gz": {"num_bytes": 395037560, "checksum": "b32344b92f81006ad9e2e471f5ef8133e87924c5150145b13d51c3d7a0f68c46"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00497-of-01024.json.gz": {"num_bytes": 396247929, "checksum": "0396f0bb16b06ff130e955f260233ec868ada1daef6e8cbd480ce388628d49b9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00498-of-01024.json.gz": {"num_bytes": 394798084, "checksum": "28d43d4e7bbce4e20167741ea2bbc3f17981aa51f9c040cfc41c522e732c6d32"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00499-of-01024.json.gz": {"num_bytes": 396699883, "checksum": "c6f6deff919b375fb08c74e159c25aa66362e4cddb0700f9b1e0e2701293ae70"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00500-of-01024.json.gz": {"num_bytes": 397014521, "checksum": "7ee22957fdfad0880f132f47860612331afce7a48975b9312233ba8ddf537bed"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00501-of-01024.json.gz": {"num_bytes": 399063718, "checksum": "ec94186b620037002819cd40347e6aaf67cb847848483790cd687222c9addbbf"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00502-of-01024.json.gz": {"num_bytes": 396938850, "checksum": "a218de10cee75c4bb5a7102fbe208e6e65142ba5f960ecdc2b56b6f85fa30840"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00503-of-01024.json.gz": {"num_bytes": 394631309, "checksum": "8189de9454986f63253fa1ad44c63d5c2f692ff4bc3a848c7c2fd02e08f4e1b9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00504-of-01024.json.gz": {"num_bytes": 397884411, "checksum": "b7b268545c27573840bf8a6abb7361c209f92f9b5f0f8028fffd49b0c773854b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00505-of-01024.json.gz": {"num_bytes": 395784113, "checksum": "b9f1610be9f045c15e43a7343bd2918743a71585a7122a4e781533dd39a73132"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00506-of-01024.json.gz": {"num_bytes": 397939195, "checksum": "f07b77d1be71c5922321e8683140f9a63a90903f1fbd1515d908807e12fc4597"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00507-of-01024.json.gz": {"num_bytes": 395925741, "checksum": "23e9927e9e83fd03e9d99c3fac05f1bf63d6c296a2b02d1aa208798d27d8dc1c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00508-of-01024.json.gz": {"num_bytes": 397426015, "checksum": "f4b8a74c610cea50a6b144337f65fcfed11fff21df6683503f25d4b82e29a4e4"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00509-of-01024.json.gz": {"num_bytes": 399072341, "checksum": "c3069ae9658273cbaeaed1730f171837c8d3042e31d1093cf0f519f601309a41"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00510-of-01024.json.gz": {"num_bytes": 395859781, "checksum": "e5863648f64423397ca1a7838df18aeddbb3d5d3a2551321fd99a480508fa86f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00511-of-01024.json.gz": {"num_bytes": 396948832, "checksum": "a2209ec05a794f083cf163c102c6ddd8d5e5627674686950e17e586128a81e60"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00512-of-01024.json.gz": {"num_bytes": 396585426, "checksum": "1c6fdb002dab490e6ddd7fe6023b2124bb944b7ebe95ee3b7faca9a92f4b5de3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00513-of-01024.json.gz": {"num_bytes": 396789970, "checksum": "83b02c0cf9ffea9d021adc102269c30a33ab3a803d331ba8d39aaa9b3b7acb43"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00514-of-01024.json.gz": {"num_bytes": 397131474, "checksum": "783f25460641cd3532c3bb3920c7d3f0c68b5e674d44cba33b1ed755608cf8ba"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00515-of-01024.json.gz": {"num_bytes": 396127068, "checksum": "61e5b9947f77d929442f23fe84465d88044631aa1eb6438a0b86372cba7286fa"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00516-of-01024.json.gz": {"num_bytes": 397526020, "checksum": "539b032f528d1ec3a8e8420514ef2118f05482297b052f6d28876a8bf776a080"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00517-of-01024.json.gz": {"num_bytes": 397748661, "checksum": "03b85a51aa7bcde672cc017fcbb0f11976cbd1447fc0ccb4f4bc822b2b04b27b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00518-of-01024.json.gz": {"num_bytes": 397915751, "checksum": "80dec6dc7d15459c113c16f23978c38cdc1157ca18468d8a00e0d2192bb2ffd9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00519-of-01024.json.gz": {"num_bytes": 397847480, "checksum": "7125e7915fd03c6312cfe448e4e7a8629249765c13d8558b17c240c2aef713b4"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00520-of-01024.json.gz": {"num_bytes": 396232144, "checksum": "27974f9766c18fd0b652c94eafa3493243c8e1b25b6e850e857ab6246b193b48"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00521-of-01024.json.gz": {"num_bytes": 395111538, "checksum": "61406e92a8f9a6ab800b3dd25cbac842e3487a4c7db7b1bb2070a41d627367a0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00522-of-01024.json.gz": {"num_bytes": 397690206, "checksum": "b2e29801d120132a5fbbd3662a54290e46ff5e178b3146ebfc2169facf72e7e4"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00523-of-01024.json.gz": {"num_bytes": 398274007, "checksum": "79905dbc45756c9f1c225120709d39cbf3caf435e322a531a4add690a1d0440c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00524-of-01024.json.gz": {"num_bytes": 395689218, "checksum": "1dc3086cb869abb13862970186f6a77cb29b687cd49518173f639c148d937f6b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00525-of-01024.json.gz": {"num_bytes": 397979085, "checksum": "6958bbc6029c00229fb0059d016a6b7a2bd21cfdc69392893423d2657c35c7c5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00526-of-01024.json.gz": {"num_bytes": 398473877, "checksum": "895f42c4e7569f0db3832af13e56499f65fff74e93fc0cdf60c1c4b4b08881c9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00527-of-01024.json.gz": {"num_bytes": 395879939, "checksum": "e84e72048b56878b1ff904ee83d92c208e15b16663b99a9d763edc23c2e0e55f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00528-of-01024.json.gz": {"num_bytes": 396472889, "checksum": "badcc3cda339c61936591e9333787ea032c42d7ff2288fdaff791bdc8504ce96"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00529-of-01024.json.gz": {"num_bytes": 396983038, "checksum": "ad20643f9d50c7c508fa136ceed0039ce39708e0e7a5e743c1981f1000bc3c4e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00530-of-01024.json.gz": {"num_bytes": 395774249, "checksum": "9453fa3fd296150b436f0146171ea8317512c6735ee9434622a83765a5d9e310"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00531-of-01024.json.gz": {"num_bytes": 396171120, "checksum": "3e3c230ab6beda13e4dd4747c7c6291e57b1ccb4a96ac2edb46ffdb4c3cb05b5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00532-of-01024.json.gz": {"num_bytes": 396200411, "checksum": "e9b52c3dad233fd1c4310cf5f76c2e6d0788ed084abcf931f99ab7002976d75b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00533-of-01024.json.gz": {"num_bytes": 395580851, "checksum": "e135cc4420d9f4d17ab523f7db8c559021a46a9a6bcdd21a6c4075047465906e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00534-of-01024.json.gz": {"num_bytes": 397459281, "checksum": "bb4f32ee1c1bedf4582b0f4f9ec7644be73fa25bf18cca7506e3c26e98818bad"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00535-of-01024.json.gz": {"num_bytes": 397344480, "checksum": "3766ddf8313c5cee08a575fa96bdde06a5b293f1964e58293ea583d72bd18e20"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00536-of-01024.json.gz": {"num_bytes": 396588089, "checksum": "56d236a4250f9488d80b93c0c005962d018da256ea5632c7e16ae26c54188749"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00537-of-01024.json.gz": {"num_bytes": 397606873, "checksum": "d7ec24ef99de2769937b89e0ca7e291eca2bd0438d501d9228d5ab035f49d83e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00538-of-01024.json.gz": {"num_bytes": 397608864, "checksum": "1a60378a0f1a200b11f85577bbd0f373ae47022eab16fad53da492ca1ed35bfd"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00539-of-01024.json.gz": {"num_bytes": 398377669, "checksum": "787d263107eb09e852b015c17d1d0f54d8b93e78292c0c1e60cf99f27535c608"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00540-of-01024.json.gz": {"num_bytes": 398516980, "checksum": "dce03ef0813ef66e27df8730da7e341b49bf7e684bffd3a9cf700905501d1d72"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00541-of-01024.json.gz": {"num_bytes": 395557685, "checksum": "e4035222d65124bd3e33372b76b65c2dad9e696701607ceeb5968d483595645c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00542-of-01024.json.gz": {"num_bytes": 395725875, "checksum": "4e7ae0b1c0c4d514e0208e21336d095fea5970475077d6690a917faadb2b72b4"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00543-of-01024.json.gz": {"num_bytes": 397625187, "checksum": "a96ac467b6ace74a08f7dbc4bb8e3fc57fae36abc8975d6b60a7b7353ca9ca88"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00544-of-01024.json.gz": {"num_bytes": 397078230, "checksum": "337470c84cde5d02bc6a89003a6796de9e63db269e7800637ef2d220d75bd3ae"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00545-of-01024.json.gz": {"num_bytes": 396145060, "checksum": "da65d66aa4cfff77c754f8017eedd92cb82494b9425c2d5c5491d64603b2231e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00546-of-01024.json.gz": {"num_bytes": 396093007, "checksum": "399f7b70d1c1b45ce315f396d5fa0db2c69e41c522b0514e19bcc6802b953b1f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00547-of-01024.json.gz": {"num_bytes": 397457696, "checksum": "47fc8fd82271e6b1fb074512da45dc005e22cb7f0aca3b7b621ea87613aeff9b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00548-of-01024.json.gz": {"num_bytes": 396246097, "checksum": "3108770b39746852d7c048d9a8777722480505bbf4592732c7d1f231e2505c55"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00549-of-01024.json.gz": {"num_bytes": 393096516, "checksum": "9bb2b88775593afe4060349985ff4417a37f1ba9b4ef33399c58644c01a92b89"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00550-of-01024.json.gz": {"num_bytes": 396631619, "checksum": "cbb55d645d145ecc2ff9b96524463f82d5548c0bdf42381fc6faaad256e7ead7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00551-of-01024.json.gz": {"num_bytes": 396806780, "checksum": "ece03d7f12daa39473b6b8d5faed08a3f751efb9b1ee99f69c5188633d4a0f43"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00552-of-01024.json.gz": {"num_bytes": 398608968, "checksum": "7fbbde9c39d67d8d7f9f16c0848188b743c6ff5bc44e6339d5fd88c32e1aafef"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00553-of-01024.json.gz": {"num_bytes": 397696672, "checksum": "85f9c5c5fbcfd06f715b520a1a3a63a014b1831d2f65de5f02cfea49a18ddf63"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00554-of-01024.json.gz": {"num_bytes": 397122204, "checksum": "78e3d43c3d2b71d8483788a085cd5706648767de7a2fc4aab707d6a05257ff00"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00555-of-01024.json.gz": {"num_bytes": 398704893, "checksum": "113e5fd99ada6ca96c086487b6e4012bad711d1d482d580e22d3af5b9d118572"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00556-of-01024.json.gz": {"num_bytes": 398099675, "checksum": "c7a816f8f2f74b4554ac17ffc41e67ebbcabb7c8b0c94292b4569bea372bea3d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00557-of-01024.json.gz": {"num_bytes": 396538561, "checksum": "7af6d2c9886481a0d393e026739b5ad7d0fc358ecc216d2fc124160402d4b50a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00558-of-01024.json.gz": {"num_bytes": 397660839, "checksum": "c1033428189671d4e1ba55c822040f307748c6ec31b80be3e4ed8e7a4325066b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00559-of-01024.json.gz": {"num_bytes": 398754128, "checksum": "69c9f88840166363f2b7ddaef05ac9d10441fd184d8451abfde76eb105572342"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00560-of-01024.json.gz": {"num_bytes": 394988981, "checksum": "a2dc4fc315a0db8f1a868d631d2941ab2806f44c2ae698e94bb7e8308bd67c70"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00561-of-01024.json.gz": {"num_bytes": 395801300, "checksum": "dc1b2b4594e3fc7f8795f7649d1c524405edce56d617f1e214692565de8c8937"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00562-of-01024.json.gz": {"num_bytes": 398322250, "checksum": "c23404fef6a6b5b887cc2dddfe341e983939ae36078d62842919a3739c96b43a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00563-of-01024.json.gz": {"num_bytes": 397584845, "checksum": "c909fe429772c8198f904496ea6cf239d669c6c787889cefcb7623e08a988db0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00564-of-01024.json.gz": {"num_bytes": 396436964, "checksum": "8e7cb1863057a3b9929af4da29b4e1cca1f71c254f5eba91a657d9e8c1fd6dea"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00565-of-01024.json.gz": {"num_bytes": 396486039, "checksum": "23ba56e78c4edc4d58fd7fbfcf784b29037204a641e43a9894c95c68bdb982fc"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00566-of-01024.json.gz": {"num_bytes": 395358745, "checksum": "71259a300ff096b49e3461c91824a8185037ca85ef2018dff2617f335ab304b6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00567-of-01024.json.gz": {"num_bytes": 396405726, "checksum": "d9b56ed523376681dd81cb9831727467461bdfb87c80d3932937338370093033"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00568-of-01024.json.gz": {"num_bytes": 397509797, "checksum": "c650aad13a48d5b0c51162ad19c9eb3135559d0a3318dba701a90e8138a8cd24"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00569-of-01024.json.gz": {"num_bytes": 396514261, "checksum": "d71e4126c2deffae8ee55077cee9dd2b70ce27adec767bce06e02afb23b42416"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00570-of-01024.json.gz": {"num_bytes": 397072833, "checksum": "519a32e1bdf7f5b97e1a438242a79218317e04e44021dc61aa65c526d35ce8ed"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00571-of-01024.json.gz": {"num_bytes": 397170114, "checksum": "919a9659156cafb26b87190fc00b9d33c4fd536dd35544cbef8e5ddc018ae365"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00572-of-01024.json.gz": {"num_bytes": 396475017, "checksum": "3d7e4e548f01c9ad5fc99b4342cbf9a9004737058dd93aae8b7d95b2c00856bf"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00573-of-01024.json.gz": {"num_bytes": 396749955, "checksum": "032f8e37328c9f0fc046e5a6ff5a79cbb744f3100c4cbea78e397c449471bb10"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00574-of-01024.json.gz": {"num_bytes": 396036505, "checksum": "8e795341527712be32a69307ce8cbd2d6195c6b2fea596d326a279734505198e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00575-of-01024.json.gz": {"num_bytes": 396722381, "checksum": "45a43576cfc61842bde146eaa566b4f22a128c3c2eb8f30c59a6b6cae4bcd4e7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00576-of-01024.json.gz": {"num_bytes": 396163377, "checksum": "38429d2d6176ee42ddd495e052c01735a9a7f0076cde107d24a0a9c7a26bf2a1"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00577-of-01024.json.gz": {"num_bytes": 396813305, "checksum": "eae77c319bba236feaffc9f74eaa38e911fa48eb06f4794c9b1a6d17edab91a7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00578-of-01024.json.gz": {"num_bytes": 397797226, "checksum": "1dd2b3d7e99fde8903bc12625568ec4fc6fe653737b3af5e9c71432e311cf5f0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00579-of-01024.json.gz": {"num_bytes": 396012631, "checksum": "d9322e66701b4ada3788b91a07e87b03af6c91eb4cfaaefee23c0330987a1840"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00580-of-01024.json.gz": {"num_bytes": 397943129, "checksum": "23deb32e1b0f07a55a5cf1572cb8e313ce716c748a07f58bd90cbae97290d0a0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00581-of-01024.json.gz": {"num_bytes": 397614648, "checksum": "6193f8b848c7930fc04b9f2429dbccf36f1b291271b3eaf646c655433bf3ff9f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00582-of-01024.json.gz": {"num_bytes": 396659280, "checksum": "40997ef02c7040356cd1c5acd8e6a5121e00b31253713cad4f529ab2922affc9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00583-of-01024.json.gz": {"num_bytes": 397686445, "checksum": "5cd21271e4ae036f8d1e0c320330a6c93a8b1ffbb9293a80c56c2d7f123f9ee7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00584-of-01024.json.gz": {"num_bytes": 395500815, "checksum": "c25befb7c735b2340b092a04375d2109c1b876d2b0057dd8d4ed4beac87118ad"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00585-of-01024.json.gz": {"num_bytes": 398413461, "checksum": "073f632e95c218fdf17274fc21915c94f56bdfbb58a6b1a0550de249ce4d2129"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00586-of-01024.json.gz": {"num_bytes": 396849745, "checksum": "647cbe9bd7709c0d8a01485096fd88ad0fc09b27de324eae141a8d841536b71b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00587-of-01024.json.gz": {"num_bytes": 398567154, "checksum": "557af97a8d2b2656149bc25ee5b362116d173e6a48911b860ec10d512b4b763d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00588-of-01024.json.gz": {"num_bytes": 398086388, "checksum": "9e9afa15ee3534e497c9fc7c8cd967388183193dade3d1ec82a8e2b0e82c5118"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00589-of-01024.json.gz": {"num_bytes": 397335823, "checksum": "ed8a1d0b9c55f465b5d4a4e5ea022f6d17aaa8b82569be7cfec55629c1bf26c6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00590-of-01024.json.gz": {"num_bytes": 394931693, "checksum": "3fbe539fcf64f0d914c19b383de9953b0605d4a69f48801145f0db1972f9c6b6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00591-of-01024.json.gz": {"num_bytes": 397828770, "checksum": "9165de8866384d3d03c3876c39c96706e33a24b9f95acc09999c2dbfb85cd9cf"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00592-of-01024.json.gz": {"num_bytes": 398782493, "checksum": "433a9cb730d7ab024b56ad662a3ea53633f7ff26c625051c4c02f252beeb87a6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00593-of-01024.json.gz": {"num_bytes": 399264489, "checksum": "4a7e5f40aa8b692cfa0519d33a868e9a05e579ad430204bc13c48b533eadc5ce"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00594-of-01024.json.gz": {"num_bytes": 396629833, "checksum": "521d5e90550dbc97ab26a18a0b75da81e38ce2083ff5fd93340fded2e54e1ca1"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00595-of-01024.json.gz": {"num_bytes": 396916313, "checksum": "30c9be1d99ce0a41b214fdbd5115988c82ca317d4aceb30c19fbca05e0a409e0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00596-of-01024.json.gz": {"num_bytes": 397013253, "checksum": "b16bd9d7d893b4a71056575fa0799bef96120c03cfc6e2a88c292469a67f2614"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00597-of-01024.json.gz": {"num_bytes": 395980036, "checksum": "3bd15089b6fff342df2b3109d7ebadca35cead4f44ca5b1b55e55d8892aab82f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00598-of-01024.json.gz": {"num_bytes": 396295935, "checksum": "6252d951a9570baea9767cf3350a6d09ac5a5fc34ba80eae3b5c40adb8361ab9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00599-of-01024.json.gz": {"num_bytes": 398608239, "checksum": "b265a385cdd5e64d1fb2ffce739e72f2fe2cc8944621f20e2084dc52b91cdd9d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00600-of-01024.json.gz": {"num_bytes": 396563743, "checksum": "43d12028cbe738e8f450911f6a55dcb00f8742cefc2a2c4da5f9e9220b0572c1"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00601-of-01024.json.gz": {"num_bytes": 398256993, "checksum": "9368dcfc581e6d572d899ef25b129bc0268901a2fa009500174a0985bcf330df"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00602-of-01024.json.gz": {"num_bytes": 396202546, "checksum": "3cc57d7afd161fcd411f73da8369d98db4c6d8e30643ee01450adef21e8ea3ea"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00603-of-01024.json.gz": {"num_bytes": 396338425, "checksum": "cc21fc5b8ed6e5115bd8924954d685ed52cd5b773ab63d37188343443c95851a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00604-of-01024.json.gz": {"num_bytes": 397597307, "checksum": "d24f6d807ae35037e695e19917ed446f74448166fa464c862e31fe7ba2bea196"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00605-of-01024.json.gz": {"num_bytes": 398278313, "checksum": "99166183c752aed8d0f2cc9c010f1ebdd4fb93d40e936fd6c082eb3542baa956"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00606-of-01024.json.gz": {"num_bytes": 396590468, "checksum": "657ce79340c15524a5897459a6cf712fa4127def2445f7eb3de21c9b46db3794"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00607-of-01024.json.gz": {"num_bytes": 396603228, "checksum": "3705441435f18d1e4aeea9e794e1216fcd29b48213763a554808e3d3697951a6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00608-of-01024.json.gz": {"num_bytes": 397280580, "checksum": "be0bef2c16e9bdd0387276402dc99fe5a9a0a7a105a44e88bdb783139f2de474"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00609-of-01024.json.gz": {"num_bytes": 398284528, "checksum": "3a7c7a8cb01f6d7589152a1483682a5fa99e119490f3e70d8a02f582f2e2b19c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00610-of-01024.json.gz": {"num_bytes": 398872039, "checksum": "c349aac5b64227397ec2870992ac9e4fac9fe39f1fd4e0a7b8c727e171655e14"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00611-of-01024.json.gz": {"num_bytes": 398736440, "checksum": "63ca5eb2d27632b3b4dde8e40f9925e71e21ef737262bcda7a99324a67e0fab5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00612-of-01024.json.gz": {"num_bytes": 395170895, "checksum": "3b4bb3e14ee981a9edb9828ce40b86b5d83dfafcc1a5e0e02642cb40924bd6ed"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00613-of-01024.json.gz": {"num_bytes": 398443337, "checksum": "e95adbd7d55024b7e62145860f217a6f04f5fcef79ac23e92dd9e14f9a0b2a30"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00614-of-01024.json.gz": {"num_bytes": 398854661, "checksum": "def8cb789f8f79fa169e855816c5e4bc7d5c253e565502691a9abb826d7436d4"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00615-of-01024.json.gz": {"num_bytes": 395505189, "checksum": "6775ca6aa4f834289396a438906b90936ed0ff6390213dac2b0861f40d7761e7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00616-of-01024.json.gz": {"num_bytes": 398999454, "checksum": "6cd5efddacb09cc80ec1eb79f93b562044787903b3cb1c879be2acec64a9dbdb"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00617-of-01024.json.gz": {"num_bytes": 398570431, "checksum": "26d1f587377446e8b1499be7a3b6776d437baa40353fb04c591203a420eb0cc2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00618-of-01024.json.gz": {"num_bytes": 397064982, "checksum": "e59a87fd1cd3d87fff4b15c3a9331521d7587ac7f4a7fd51ec3906b484ef9ad0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00619-of-01024.json.gz": {"num_bytes": 396676338, "checksum": "8077c3a15d93579d0fbf00bd9d117bf4f50092c5be3acf46c7d4433ef7be9dfc"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00620-of-01024.json.gz": {"num_bytes": 398186471, "checksum": "ee3fb91d7797ebf1daf8dcb81563b7dae7b161d97732efd35e3eb6ebea732ee2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00621-of-01024.json.gz": {"num_bytes": 396467968, "checksum": "386adb83129a7306ef4da37c1cbedc39b3971e7633d516d406a982f307577e67"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00622-of-01024.json.gz": {"num_bytes": 398293882, "checksum": "b708cad0e04c56174d0feec84d7224a4490cb8db023d38e57398cad89b78568f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00623-of-01024.json.gz": {"num_bytes": 397396780, "checksum": "c50c4568c6f103b3e6a3702cbd915ecb530df954df808156bc38a98f36a0b944"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00624-of-01024.json.gz": {"num_bytes": 396971282, "checksum": "11351ef83c9fb883d6c0f484af5c10f0d686b7ac4a2f08fae9ac3d9837df0a0b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00625-of-01024.json.gz": {"num_bytes": 395882440, "checksum": "dfa97ea7949c9bbf7af43d43ac5c8d0034bdbd1ad572895159b7c7846ab89676"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00626-of-01024.json.gz": {"num_bytes": 398292846, "checksum": "fbc9c23dc286ad6fd7f01f344de97ef5789733af581de278488869bd36f3b246"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00627-of-01024.json.gz": {"num_bytes": 399890427, "checksum": "f43bbde36b8bd34ed9998b99b42c85434b8bbc8bbaa1cf5b38cec6393099c23f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00628-of-01024.json.gz": {"num_bytes": 399589466, "checksum": "c50058a4937912b678d33d34ff91e2287e8701365f4f71fce61f9002652556cf"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00629-of-01024.json.gz": {"num_bytes": 397355095, "checksum": "051c4631d0587b6f65827410ad2f2121c05c849a009274415bc5e7f72db42d44"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00630-of-01024.json.gz": {"num_bytes": 397860559, "checksum": "07b48a86a8a3245fe5b78f6943c8970c839942b8d86abf173507225b0d1520d0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00631-of-01024.json.gz": {"num_bytes": 396161304, "checksum": "70a03f0308105de5266c4a40803b51f99888b362b71409719b7f71f73761b590"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00632-of-01024.json.gz": {"num_bytes": 395620184, "checksum": "c6923984c419f08bb4e6effc27dd25dd986513034338debc9b238592dad9f607"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00633-of-01024.json.gz": {"num_bytes": 397572527, "checksum": "900fc701703234031e825a1eb2d11b364f1dda97eb0c7943e17ef278695f7bea"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00634-of-01024.json.gz": {"num_bytes": 396215174, "checksum": "0cc838e395581933123fc57c6690afbdd2be1b67d213336d9b8c08b3876f8458"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00635-of-01024.json.gz": {"num_bytes": 399176005, "checksum": "5a3daa1bd0be8c997da56257f063a7d1c7b2b271648a46615b26ca4beeb42863"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00636-of-01024.json.gz": {"num_bytes": 396035356, "checksum": "9d21ce1c8b5a7c1330cc95b1f45286fb8578d5dcec0686724ff6e25a97f38a7e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00637-of-01024.json.gz": {"num_bytes": 397214839, "checksum": "83cd34e1ba09c268b515fda7699e12bfa2531fb7e60e2f861946ffdc01e54a04"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00638-of-01024.json.gz": {"num_bytes": 396292535, "checksum": "82a7bae9a7d35fa707bcb6d90f7b244f1509e112dfdbd604c9be1f8b8ce7150b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00639-of-01024.json.gz": {"num_bytes": 398009954, "checksum": "b6d7ebd102c67960413caf5fcdc5b4aea728b6d3d6369ab8dd3cd6bee6c769de"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00640-of-01024.json.gz": {"num_bytes": 397558496, "checksum": "151c55d019fd84fdc0eab73d24984e5d88ac964c86f89a361a03dc776a22b5b4"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00641-of-01024.json.gz": {"num_bytes": 398031508, "checksum": "e0e87304a8ac408adca2badf2564ec52caf155295ea303a121c30f3b1ce797b7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00642-of-01024.json.gz": {"num_bytes": 396594124, "checksum": "73d08c99b6b96d96b82d88267b2a392a7dda2084ba5142b8eefd0d23212702d5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00643-of-01024.json.gz": {"num_bytes": 394552252, "checksum": "ebccf3b935d63c30f626d317af250b6bd0f04ef5e1cced829287ba64fbb0d25f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00644-of-01024.json.gz": {"num_bytes": 397586341, "checksum": "674c0965a9a880c057b6f2dbb785a4a6ae048954d44ba4f5266dd5e65095d06e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00645-of-01024.json.gz": {"num_bytes": 397950976, "checksum": "7ac8d4dacd682a2977818f01d860c3dfa5a5e5a78f7d2d95be0353a675452e93"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00646-of-01024.json.gz": {"num_bytes": 397511840, "checksum": "452a9cc03facf9151552f914f9a8a3507a96fd8ea40f7d04951a29ecbf6aa1e5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00647-of-01024.json.gz": {"num_bytes": 396692070, "checksum": "5a795a238203444596c711bcedc634e653e5240c9a800a9884c51f878340b494"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00648-of-01024.json.gz": {"num_bytes": 392707626, "checksum": "9cc366c37950624df6af318ee52a97d32a40e278fcb519cbe8545b04bee3204e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00649-of-01024.json.gz": {"num_bytes": 396283284, "checksum": "4ddeec31a30b5c563838b17e1115ad30041e08c70a94f299ea324ee4b71fd82b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00650-of-01024.json.gz": {"num_bytes": 396349662, "checksum": "f5bc63114ec9d73d6cea7f8e38a95031ae2bcde849b27440afd840a3e72aac13"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00651-of-01024.json.gz": {"num_bytes": 397187042, "checksum": "7199c0242b2654509af187c9c8bbfc22cc5067aafa1ff69949b1f0e5b718425b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00652-of-01024.json.gz": {"num_bytes": 396263026, "checksum": "c9e62b6df7213ea5b71913fbf736403f33c51e5a868bf1035cebcc39d80635bb"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00653-of-01024.json.gz": {"num_bytes": 398689010, "checksum": "f3bcc9eca4d71043e920db6399a032f916c23b1da329d2ef86434a74f8e7b318"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00654-of-01024.json.gz": {"num_bytes": 396938678, "checksum": "fb41df26e1f68e1e9d12ae8740535ca66e80910320be2270d680fec40d6fe9a7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00655-of-01024.json.gz": {"num_bytes": 395995226, "checksum": "018b40ddf6d88c4c346c8018439d16f6ca66ee0720970e84ddc34b1010ae35d7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00656-of-01024.json.gz": {"num_bytes": 397860049, "checksum": "8f3847e9bb5a8145e2959b340f86cc06f85e6646f32d5d785c5c90ec11a9f404"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00657-of-01024.json.gz": {"num_bytes": 397142407, "checksum": "a1ae8735a39bd099dac2e50c22e312f1a010f2644774ef53c995f3437c0a5524"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00658-of-01024.json.gz": {"num_bytes": 397827609, "checksum": "f6154377cfff2453392fb899f81514a7c0ffd40dbc35d8842d61a115d0aeef35"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00659-of-01024.json.gz": {"num_bytes": 396861858, "checksum": "4299633524667921549573c469a73e33abae89d107375d5ccc6a6d987c2a2a26"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00660-of-01024.json.gz": {"num_bytes": 397773823, "checksum": "44eaf6c1739d8a9c13c54750c473ac04aaf9d2223d8893cd8094f1769b1f6f8c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00661-of-01024.json.gz": {"num_bytes": 396311257, "checksum": "18edb60444b660c7cc68dbe59ac71989be0e20ff13639725a5f05e4d4d512514"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00662-of-01024.json.gz": {"num_bytes": 396176936, "checksum": "7b60541181fbb92f361fbdf0bee80d086c75279610aab792a7b3877d49a3e1bb"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00663-of-01024.json.gz": {"num_bytes": 396274985, "checksum": "59e057ee5f5e8c7267138c18c5c88f3ca24d30f86c484e4bb0c0a4eb5169c4a4"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00664-of-01024.json.gz": {"num_bytes": 397483935, "checksum": "585f45d3ac3f88c3bf1c86e01daa46537f8f5c5165521412de0e67393cb6da33"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00665-of-01024.json.gz": {"num_bytes": 398831104, "checksum": "e403d2f4ff6e74abc9639749f93f77cc868453908c10821fea7fafdbcc981a06"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00666-of-01024.json.gz": {"num_bytes": 397668116, "checksum": "f9bbafa396a466b24630a259a01804b2857c1dde2fa3cec60b2967a88ad9f528"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00667-of-01024.json.gz": {"num_bytes": 398123165, "checksum": "ed693d5ecb9dfcaf545e831b5769b877e927125794cae61a0ec7821c3c85dfe6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00668-of-01024.json.gz": {"num_bytes": 398152096, "checksum": "51c33c07d503743704f564bc6a372c2f6f8f13a1ddd00b0b9a2c44c94cc57444"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00669-of-01024.json.gz": {"num_bytes": 397927981, "checksum": "d356b5268ba39e38ffccd20e95803f3218407e0a1ca3b4d1165ff82796ec1bae"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00670-of-01024.json.gz": {"num_bytes": 399074605, "checksum": "bb96ea8154ae01275a9197709820e670c4e6212c740e92a7f1cfb7c618a49bea"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00671-of-01024.json.gz": {"num_bytes": 397864381, "checksum": "afca3dbcaefdc368e996259fd595b77fd98a885ec005a93069a01b83227c827b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00672-of-01024.json.gz": {"num_bytes": 396077133, "checksum": "3da96ebd1b28b55b03bbab8e85f78295cffdad9020f869cb456da27058ffa090"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00673-of-01024.json.gz": {"num_bytes": 396943842, "checksum": "6a4c344a8af68a95e20d58b64fff8fe616c2a406cf26f642cdfea65fce5883d1"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00674-of-01024.json.gz": {"num_bytes": 396975969, "checksum": "e6b0f7727d78143fa180abb76e617b37660b35f6323f19bf1dcbc78fb9374508"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00675-of-01024.json.gz": {"num_bytes": 396692800, "checksum": "e4ed97b19c6d83e618a3fcaff75460d828ca419b1e62842a1493b0ec4c9703e5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00676-of-01024.json.gz": {"num_bytes": 396514400, "checksum": "a5672f1561ab85f071395de43e702791aaacff77a9f67f6ec9e14b12aba675b2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00677-of-01024.json.gz": {"num_bytes": 395939125, "checksum": "3dacd3bb90b5e645d1b9a962d8df87f571b0fcf227996068535bb98a68f9191d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00678-of-01024.json.gz": {"num_bytes": 397022852, "checksum": "c1a0ef31342161369b7fb709be17e3c86191c1a52cb04b704fc58190818302c3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00679-of-01024.json.gz": {"num_bytes": 398325372, "checksum": "47ddd1056ad977407f61b2eac3ff803d17b1aa8fa0719279bf911caf49bbb7c8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00680-of-01024.json.gz": {"num_bytes": 395502228, "checksum": "cbb93f322d684ed558cbf8d92b9f83958ba772fe4177093a334b4596343f3cd4"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00681-of-01024.json.gz": {"num_bytes": 397981781, "checksum": "9ec2dec493733846a1ec9f68ff5130cd461d7ab9c07b22d4aae94463bcf03146"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00682-of-01024.json.gz": {"num_bytes": 395265758, "checksum": "7731cb9a2898c730a650e5d1b358886ed562228928aefe55d991cfaaa61a9a99"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00683-of-01024.json.gz": {"num_bytes": 398783283, "checksum": "6f2bb48070e809ac17fc90e1117d63bd8c7cd0079d9e44c9f262c4ce60f5d373"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00684-of-01024.json.gz": {"num_bytes": 396160769, "checksum": "fd07413637b97b68cb3a7a6cb86c4656017b7841728e806485ae196294e79f8c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00685-of-01024.json.gz": {"num_bytes": 395594461, "checksum": "939925a9169da729891fbeef926f420b80bcc60e0f170bcf9a2095449a22d424"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00686-of-01024.json.gz": {"num_bytes": 398275260, "checksum": "13836c45719ba10f2d581cf17cdab1daa4cc207a49db2b4786b451605842ac4b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00687-of-01024.json.gz": {"num_bytes": 395256765, "checksum": "0c0d0e6c1e3cb9a024c184a8510066a005c031a15af74d117d0e736a358a91d0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00688-of-01024.json.gz": {"num_bytes": 396635904, "checksum": "2462e084563f8b8de68c6e826289949ff8ebf8cfaf323344c07ab93e56373539"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00689-of-01024.json.gz": {"num_bytes": 397749444, "checksum": "d03746220f3374c80102ed39d8f6ae0daec40fc1b23312c08ecdee82a65ac6df"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00690-of-01024.json.gz": {"num_bytes": 399380060, "checksum": "217d032ecce8d0b7e448befe83aa051a3bfab8cb0e167d043b6abc833f5e9b4a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00691-of-01024.json.gz": {"num_bytes": 396975651, "checksum": "354fe9bc07aefc55cbbf8752f53ad69d45761da928bc8deb6fee1de9e244e93e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00692-of-01024.json.gz": {"num_bytes": 399720848, "checksum": "21f88940b6cbceefd66ea5e8d466467806370ae24a5833ca308cd840daf5ff8d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00693-of-01024.json.gz": {"num_bytes": 396787846, "checksum": "c8d28980ffa1eff4459d2fbf0043a1f8eeaf840a3b1d1ea4989b2192c7a82041"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00694-of-01024.json.gz": {"num_bytes": 397945967, "checksum": "1936570da24c4bab9fe0559826f1cc509c4ab6eb3679e26d697efa6e7e5c8a81"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00695-of-01024.json.gz": {"num_bytes": 396349049, "checksum": "8e497506f84513272a8a0694e7d4efb004b1e3b515887e3b5762f59b6c659dc3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00696-of-01024.json.gz": {"num_bytes": 394901418, "checksum": "9e1d6cc187ff67ee734bbadc6cbd57eae05634a448edfde184fa8d6fc3259836"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00697-of-01024.json.gz": {"num_bytes": 399142528, "checksum": "9584496113a8612620748aaba35e185b8f47b7c96b4ff0dc7bfdd6024a3faa14"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00698-of-01024.json.gz": {"num_bytes": 395923784, "checksum": "83a3c57b3870ed9beeaf3ec8ab694e0be458106f3128b14b2a44a036e89d32b1"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00699-of-01024.json.gz": {"num_bytes": 397137494, "checksum": "0befea64fe749d79592e337bc359bcef70ca8816d0126ebf89d4b8fbfbdcbec6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00700-of-01024.json.gz": {"num_bytes": 396554785, "checksum": "34739b543636aeadb6dcce3e7c97ca49026cc9897c13add6b592fe60e5c40338"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00701-of-01024.json.gz": {"num_bytes": 398091188, "checksum": "c9bcc7c9e91de707ee548e67452d6970af2e19bef91f966b19fa71504e5305fc"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00702-of-01024.json.gz": {"num_bytes": 396039798, "checksum": "fcda5f8ddc5ed163db84aa70c565f8181731af9a29918a2ece0436d3146d7125"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00703-of-01024.json.gz": {"num_bytes": 396889704, "checksum": "c80445d442a766d2e87ecf5804e87bf7f8b23c2238476fc2b51f657400739306"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00704-of-01024.json.gz": {"num_bytes": 399465260, "checksum": "0bb73674d579523fcbe079fbea7190138911711f023404ae46ea7b685fc09c73"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00705-of-01024.json.gz": {"num_bytes": 398579507, "checksum": "97d6fd9cea2a47913c6ee9d1e34c3440858f25f3d670cc81c8f83f2346fce6e2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00706-of-01024.json.gz": {"num_bytes": 398761590, "checksum": "2f4836001b8b80066ae09b6e385ed0048770c13ba2410e0f0309ab4b9200e37d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00707-of-01024.json.gz": {"num_bytes": 395576626, "checksum": "8e0c0c635a7a7c32d4fdb1a7906ee95a9f334a55b2ff3881cdc7d5e816a9c817"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00708-of-01024.json.gz": {"num_bytes": 395930921, "checksum": "e6978b92f333230972e2b4c31cb86b5286fb899948c7680c7a9cbe75a9d60296"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00709-of-01024.json.gz": {"num_bytes": 395734676, "checksum": "13071a3527071f06570c6cfa485073f2f3980c83cac782db6bf66a75dd865df3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00710-of-01024.json.gz": {"num_bytes": 396501107, "checksum": "6562cb3675a42a58b8c8b2a232043adf532fe49420e30c3c237a6d8889a8de30"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00711-of-01024.json.gz": {"num_bytes": 398422179, "checksum": "f38b59c4739d3c15e5bf5dbc0965d1a5dcc0f49a3c89eb7a6822003aaa1ae7c3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00712-of-01024.json.gz": {"num_bytes": 395905103, "checksum": "500b4914f3c42d5e24ced7d36dbd3143c49e4fd5dfc3d53a172d1a55ae738889"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00713-of-01024.json.gz": {"num_bytes": 396009909, "checksum": "4f50bfa762db1435a89195fd180615e9f569c1668e128d343c87c40ac5cf60ef"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00714-of-01024.json.gz": {"num_bytes": 396963447, "checksum": "fd9eea7dfb93916a3798a8b69d29fb5d4bf0fec448b8a24427f729e7a41205e8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00715-of-01024.json.gz": {"num_bytes": 397474378, "checksum": "3c61bcf6f24e21d2584bb4ae008230540d9a375e35f3c4ba1668621b80d85c5d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00716-of-01024.json.gz": {"num_bytes": 396285471, "checksum": "c554e562a369d9696219ea8b0e363907c50f626d7c410a26515e07de801da74a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00717-of-01024.json.gz": {"num_bytes": 394827995, "checksum": "f8b4678c21d93c19d50cb576f0910050d24dfd606238bbf8013c45f98defda12"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00718-of-01024.json.gz": {"num_bytes": 395517823, "checksum": "1bf63affd6914d98e197b6e1ce526cae7754ecdc750184154d3cb8e3bdd21a9d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00719-of-01024.json.gz": {"num_bytes": 395561934, "checksum": "c04b162d984ff2ada9f39aa6c0fac04a1531fbde05175f856d2e3ca2797a448a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00720-of-01024.json.gz": {"num_bytes": 396227762, "checksum": "25da2ac7c1f3cbc361807f67e8826ffa95f4caa25f81f66832cbd0a08f1a51f5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00721-of-01024.json.gz": {"num_bytes": 397716450, "checksum": "28180c6396deaf34e2a197f5cad1b53ba1c9532db8b5c21dd7d81332b2793181"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00722-of-01024.json.gz": {"num_bytes": 398022279, "checksum": "9c3a8038a7f9431b90f67ea0d3b77353d0508b09865f49af575b6aaf5e32d6b7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00723-of-01024.json.gz": {"num_bytes": 398064523, "checksum": "4b18959f604bd5f379a73b52947261cb8d63f2243f5afeb5807a13669ef4a800"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00724-of-01024.json.gz": {"num_bytes": 394747045, "checksum": "615f13a1b2a6942931519b7a7f6aba286f6045aad65b041c2c6643ce906de1a6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00725-of-01024.json.gz": {"num_bytes": 396726374, "checksum": "4099a416eccbb56818efda68bd027c993c1a5fa1a8e722bc268041fd3f804cfb"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00726-of-01024.json.gz": {"num_bytes": 397361407, "checksum": "152d5e2bad0de3b6b48fb26066891b160ea79c4c382ce6aec6047196e3b08ef6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00727-of-01024.json.gz": {"num_bytes": 395542925, "checksum": "ce1d46b0cd7d9e4075db3feab71d2f72939817ebf45819e73ec277c9cc07307b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00728-of-01024.json.gz": {"num_bytes": 396647931, "checksum": "c859626b14584c1bab396c867ad5eb11ff3af39628206b03612ee2d2b3058497"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00729-of-01024.json.gz": {"num_bytes": 398272080, "checksum": "758fbdc5bf6d66a36d69d31141742b2a917bf0341494b844f22ab82cd54e7ead"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00730-of-01024.json.gz": {"num_bytes": 395977662, "checksum": "56a7fcb59ece26d4b19be0bd5e6c2d0f05e4b1b23e8ce7b4fab064a29b229c02"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00731-of-01024.json.gz": {"num_bytes": 397530948, "checksum": "bf0f4dc8796a737daf80b977a6e3656cb1e244fc40d6df92852da45e53e6cfdd"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00732-of-01024.json.gz": {"num_bytes": 398314575, "checksum": "1862bcc85d48f59283eae56836e5598f20287ce36a185252abb24bcfbd1377cc"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00733-of-01024.json.gz": {"num_bytes": 398547748, "checksum": "476389cb582df3c214f3f5a45268bdb47b581a432c08723bd811daa5f5990083"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00734-of-01024.json.gz": {"num_bytes": 397380175, "checksum": "2b6fd36a8f8bc3edfcd8a486de44d2f3132f7b8f4bb2d4c93453dbf1a1b6667a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00735-of-01024.json.gz": {"num_bytes": 399584382, "checksum": "3e0a067fef0b40edcd23ce6680efc07253660b8c00699630bb7629b9d803a198"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00736-of-01024.json.gz": {"num_bytes": 395312038, "checksum": "e4f92413c837d269481ecc0b5d0fc87548bd2ae718ef7f9bff18674ece289bc7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00737-of-01024.json.gz": {"num_bytes": 396820243, "checksum": "e61680c57505f027ef8cbd28a45e706936befa2ab40a24a63e638019a1717b63"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00738-of-01024.json.gz": {"num_bytes": 397691872, "checksum": "d3acc0c9c76ef2df89f49896744dac53f488f830d3d42f0c481f2321ed60fa67"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00739-of-01024.json.gz": {"num_bytes": 397912166, "checksum": "18d281ed9831f28c4c54256a844ab2cff7a5b681da1b7c8eab2565b106381aa9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00740-of-01024.json.gz": {"num_bytes": 397093867, "checksum": "6a65230910384587f5e7f34b52c2a6d9a86a8b1f7a23d26f890b6e810c051815"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00741-of-01024.json.gz": {"num_bytes": 396371058, "checksum": "26eb40e98075ab716b4edec76d1723a679e648258d6812119b46f7522dfa9b07"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00742-of-01024.json.gz": {"num_bytes": 398346941, "checksum": "466043ec98eb806916806cff7495f0bae89cfeb2835204ea34328030b92a27f2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00743-of-01024.json.gz": {"num_bytes": 397366055, "checksum": "d98d31aaadf95dd0d1cf0548db515c8e77c95bbc4b611ae9ab5650429c171889"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00744-of-01024.json.gz": {"num_bytes": 398722902, "checksum": "a43c80ab3bd8d12d12b4ea41d9054b90214fd3ea2ef957f317d6ed6fa7b60e34"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00745-of-01024.json.gz": {"num_bytes": 397562514, "checksum": "1e6dad94e0f90bfa0fdc5557c58873aaa95fa9ce1c7b70a1fe76817289cff78b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00746-of-01024.json.gz": {"num_bytes": 397731351, "checksum": "21fefd6cffa9032c9ca7cec91cd775c83bbd37419ae236eeec9589f8bc4be0dc"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00747-of-01024.json.gz": {"num_bytes": 397781450, "checksum": "b84c74bf1caecf92777fb85129bb009eb3a27fbab1b97af567f36a8bf100e704"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00748-of-01024.json.gz": {"num_bytes": 397425031, "checksum": "fe9bb225f6d03b44e552ec985c844e5012e90c4ad99f699ec4ed4297db91349d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00749-of-01024.json.gz": {"num_bytes": 397925850, "checksum": "3913b2955fee02e2ba716d843559bc4bf4e85a2884ae4495446a379f857a30e1"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00750-of-01024.json.gz": {"num_bytes": 397089489, "checksum": "773486144d3008cb3207c3c8b65fe6081c9e64dda09728d3586bc82e6bb73fca"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00751-of-01024.json.gz": {"num_bytes": 394819424, "checksum": "d728b117a7b74150b03ed7d562514c2e45ccc03b0bceb120eddfa8333166a923"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00752-of-01024.json.gz": {"num_bytes": 397199683, "checksum": "6c10c3f4e3737db6a70375bd605139de61ae8b09a1aa91dd1cfdb82c183f0cb3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00753-of-01024.json.gz": {"num_bytes": 399197199, "checksum": "101c4ed5426b586a4aeeb7dbd377306eae9eec2eaf934e79d25583abff70b15b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00754-of-01024.json.gz": {"num_bytes": 396415619, "checksum": "732f4dedcf1266bcabf15a6a1cdead617ea37d428d8cfbccb5a9dd7521133075"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00755-of-01024.json.gz": {"num_bytes": 394564662, "checksum": "a23f1bb1de23554efff68e730d85802a6491936fb54e256744af641f97ec155b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00756-of-01024.json.gz": {"num_bytes": 395577258, "checksum": "2f4275994a103dca517d4eb3656009c8138930079e00303c7b8746ab6094fd19"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00757-of-01024.json.gz": {"num_bytes": 397161772, "checksum": "ab16360173283b22a7e19d181fbf55a6a8d07f0d9007b51aa159c1e81661f5e1"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00758-of-01024.json.gz": {"num_bytes": 397545456, "checksum": "ff5a6292bc557aa9895de39697e8aea5843fa5a00c83c7983eaa36640d446ecf"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00759-of-01024.json.gz": {"num_bytes": 395470957, "checksum": "66a64accfa6c281d2bdfa7b6846397f56c2d4f8a22ae8925a07af853e42f5521"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00760-of-01024.json.gz": {"num_bytes": 397328304, "checksum": "46778c90bcc6da96cf02e66956a1bcabcb9a95bad538cfc0d5190db473a278a9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00761-of-01024.json.gz": {"num_bytes": 397706141, "checksum": "4825f25d6e1d13c70e6e65ce13ccd7b1922344c48ee2806952f3ba1b6e26d3ae"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00762-of-01024.json.gz": {"num_bytes": 396983663, "checksum": "25e1645f05d342b5f872ca809b36d516c7336c22035bfa86cf295d0865e08789"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00763-of-01024.json.gz": {"num_bytes": 396355038, "checksum": "d4c3a92808f0bfb042423cd4166abc57d20603ef07a0f0912058a718a38f26d0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00764-of-01024.json.gz": {"num_bytes": 395434042, "checksum": "aa4384f587fd64c24fad9a27defb0345eb44cc536b3d45c710017d225c191ded"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00765-of-01024.json.gz": {"num_bytes": 397204482, "checksum": "cf419554f6c4f6201ebe92e7a232013e5949910f3d54f5cf3d1d65845685c7ca"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00766-of-01024.json.gz": {"num_bytes": 396420917, "checksum": "32076dd8004ebe35f46d6e790fd6330ad1d7df2b7ae3c4ede325b0da73a673ad"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00767-of-01024.json.gz": {"num_bytes": 396840905, "checksum": "08e5fd0fc1578a337f3dafdb3c718ade437256119e1968e9f958a8ea9d052c81"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00768-of-01024.json.gz": {"num_bytes": 398085225, "checksum": "3579e0756bb6cbf1eddfca27de5cf067a212d683134bc6f8c26a79b7d802bfce"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00769-of-01024.json.gz": {"num_bytes": 396879117, "checksum": "0913c93203a084521212e473d08c1d11e8136a8e37f1891330fbce0397bd431b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00770-of-01024.json.gz": {"num_bytes": 396386647, "checksum": "6c12ab51c92b9c92336a6142a1a4e2f7c3725beb7e61dcb004551d13e8d5488e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00771-of-01024.json.gz": {"num_bytes": 396279989, "checksum": "752deaefbf22dd1b1adb36561e8524c1dc555fd105bf3acb78611be9bce72318"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00772-of-01024.json.gz": {"num_bytes": 397850815, "checksum": "4f1969284d1f448caf0bff5d05eeb995cf2339801f6a71e01286f4f7f387c564"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00773-of-01024.json.gz": {"num_bytes": 399466666, "checksum": "20ba552cd30349bc8a2c0b6a8701d4587a005e7ebdf6e3f2a3bf95462c304447"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00774-of-01024.json.gz": {"num_bytes": 398051538, "checksum": "1f66196e8fbf0ebef977f235d2aacb7245f4033b53ecf75ada2f8007465a629d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00775-of-01024.json.gz": {"num_bytes": 399284061, "checksum": "97df92baa605c34ce857d380f1ca42f9e2a0de499ccaa9bab26a5c449451d1ef"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00776-of-01024.json.gz": {"num_bytes": 396710162, "checksum": "4b1ec54b82c8e5d969d3000ce547f4c20df16d9cc0b889b2b58c8839e9d8e27f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00777-of-01024.json.gz": {"num_bytes": 397265441, "checksum": "03827ccc3c5bebbd12a04019e9797945c55becabf7f9c1f3fe5353513f5c5a38"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00778-of-01024.json.gz": {"num_bytes": 396050013, "checksum": "54aeadf4fe16949b2ee9438feabe979570e7587bb07b3c57e47422f662191936"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00779-of-01024.json.gz": {"num_bytes": 397124991, "checksum": "913e268b5474a8b4cf1426f5a0a06c7f437eeabbc35f0126481328b419f85bf6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00780-of-01024.json.gz": {"num_bytes": 395196367, "checksum": "4c1a4f296916c30103a5dacacf8a167e43bb424d085ed3491b19f0ec1985d9f9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00781-of-01024.json.gz": {"num_bytes": 396578403, "checksum": "a54f26c233662299ec8f0ae1bd266879e93cf4676707b0955114a1a80e2fcf61"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00782-of-01024.json.gz": {"num_bytes": 396142106, "checksum": "3713c6b725afd833063402e6577bc0ed003a87720f700f9272864c2360bfd260"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00783-of-01024.json.gz": {"num_bytes": 396470511, "checksum": "fe9d904a07ffb2581b6734c8dd847435b867d3043ce4b4840b1c54374919d757"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00784-of-01024.json.gz": {"num_bytes": 398156228, "checksum": "af762a9ff3eeb7ed4a56f54702911f0c190b97f8efaa02cb89b1626a1c44c9f4"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00785-of-01024.json.gz": {"num_bytes": 397185035, "checksum": "6629e1827aab88f55d53de24625f8362daccf910663db8584d959aa44f8043a8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00786-of-01024.json.gz": {"num_bytes": 396556703, "checksum": "ce51603900ea0aad8981fbfa8d05d684bfef5360413dadc6933246c2dc81c413"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00787-of-01024.json.gz": {"num_bytes": 396214799, "checksum": "6eed5802b89d63eea115cbfd9e00f6d1b4970bb3600a887b904b548181a4acef"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00788-of-01024.json.gz": {"num_bytes": 397965162, "checksum": "eaa948fdaa744576f006bd70d54f129968772a479fb0bd8e946d7605857545d2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00789-of-01024.json.gz": {"num_bytes": 396280999, "checksum": "e0b80ec73507f96310abf070e5cd17d5a67ffb4a337820a8b79a02afe81a0b99"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00790-of-01024.json.gz": {"num_bytes": 396224660, "checksum": "2b4a06fb6f68c773da34f8d4c33d7746b6a3206bb242042841e5e007fe3cb6ea"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00791-of-01024.json.gz": {"num_bytes": 397681975, "checksum": "1b167c20d0414d970cda74cd357cf07d69abd1d3fb0f57222028b369551d513b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00792-of-01024.json.gz": {"num_bytes": 396210611, "checksum": "ab55128753a1e58d1032b8fd747c48158a721b12e85990627478f22b78e156ff"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00793-of-01024.json.gz": {"num_bytes": 397534599, "checksum": "e7476bde08e0065c523d09932cf2cf6ffe8ba023ae0ee435238efb5dd6f93d7c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00794-of-01024.json.gz": {"num_bytes": 396536137, "checksum": "6228922504b2d3ebeef4735abdff06cc786d6533a6c150d50f34042aeeae1544"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00795-of-01024.json.gz": {"num_bytes": 395235406, "checksum": "9dae151c15898d7991417596a364e30f00e0ff6280f1505953e6de40c2e228e2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00796-of-01024.json.gz": {"num_bytes": 396226178, "checksum": "1dc8decde490324087fcd06e4b1e17117606f2d61a80d506d89a12cce11ba291"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00797-of-01024.json.gz": {"num_bytes": 398556774, "checksum": "a454758e8cffccc88f83517a241f2457e683647949cde6aaf1e217de42f6a52b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00798-of-01024.json.gz": {"num_bytes": 396109677, "checksum": "3daa6b8602517b9873db96522a2852d940d52cdf0fa86f259ac41a9cd688751f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00799-of-01024.json.gz": {"num_bytes": 397930210, "checksum": "09dec669699a437d6fb78b3f2705028fb380b2eaa20ee73b77270216a48b8a95"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00800-of-01024.json.gz": {"num_bytes": 394545441, "checksum": "726f99301047519de253e3edbaef5f4a4f95e3850b1b98e01c7864499dad7833"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00801-of-01024.json.gz": {"num_bytes": 395867151, "checksum": "a97ef657bd8ea718427ffc686f55fc1786f0834755fce3ea3ae8402d9f75c11b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00802-of-01024.json.gz": {"num_bytes": 398573429, "checksum": "20ee1f30272a0d5db74e8589be12c17173580cc9f14b039b3d33f3197816ef95"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00803-of-01024.json.gz": {"num_bytes": 398084513, "checksum": "31d1a8f6965d3a8cb7e28fa8bf2cb9a5609d4a129dbc630a8e2a939f475b2003"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00804-of-01024.json.gz": {"num_bytes": 397815811, "checksum": "edb758146d462848bdb113df90fa4b9f451eca6658cbd2cab147c8b0eaf88a70"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00805-of-01024.json.gz": {"num_bytes": 398641802, "checksum": "b916bafa7269ad4ed09c58c74dc3f098b529444609dafc57e6e4056aa6496ee9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00806-of-01024.json.gz": {"num_bytes": 397993720, "checksum": "92fcc5881ca81b808c14f8c9960d873be70f857f95fd1e777b1ae1d4c62bbbaa"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00807-of-01024.json.gz": {"num_bytes": 397743279, "checksum": "79aca62194176964b66a90dda7631d01acc2a6abea1ba19a90076139e390170a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00808-of-01024.json.gz": {"num_bytes": 397076817, "checksum": "a469391e432dac6967e841d46eaeabe9429849492a3df5e91431777fe9b9f164"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00809-of-01024.json.gz": {"num_bytes": 395533122, "checksum": "1278d928e105ea7d9c397ef1da79dcc8791dfad9177727aba098bd451734ce45"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00810-of-01024.json.gz": {"num_bytes": 397468683, "checksum": "5c6f3e7550827de9d7028decd82320a55722785394ea4951ee78f3ffadb2d4e0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00811-of-01024.json.gz": {"num_bytes": 397348260, "checksum": "8c1ece72814dd82bf1bb663b76a40c58129c08540195f9b2134eff5837faa366"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00812-of-01024.json.gz": {"num_bytes": 396753479, "checksum": "b3770924d0576f7cd1706771c411f0f288277c6c6c922dc7af4017b665109a88"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00813-of-01024.json.gz": {"num_bytes": 397977743, "checksum": "864040da6f03f4d2ed2a9eae4daedf304e0d27196f0b522cee4e8fee55f9ea71"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00814-of-01024.json.gz": {"num_bytes": 396168620, "checksum": "542986bb3b75ffcfc853af11a80edb6a31e12527d2588f1c5b2119fe35d3f150"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00815-of-01024.json.gz": {"num_bytes": 397639162, "checksum": "a617c2f27306ce5de74ab756cbf74707fddeb0aa92277b66d0cd65be230f386a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00816-of-01024.json.gz": {"num_bytes": 398296204, "checksum": "174a2e77e6562384cc4e7459ebf536db5cf4b530e4f1d7714e60d082ac7a19c6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00817-of-01024.json.gz": {"num_bytes": 396112543, "checksum": "95af2c4f32efb4ed2a41cfa38dd2be09d51d4b0dc53ca8763309503f0276d56b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00818-of-01024.json.gz": {"num_bytes": 398371592, "checksum": "67789e3525f2daf6af2551df12a50341c3ef51c89a9c714a8def76209b5b7460"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00819-of-01024.json.gz": {"num_bytes": 396751420, "checksum": "07431a263e2bb92c048fadbab74ce1399f76fc57a04d7f9e90cb33aa60a4c5e9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00820-of-01024.json.gz": {"num_bytes": 399213859, "checksum": "83c03df95869973c2ed46c909c0e92e7ecd75317c06b09e447a62b592421d1c7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00821-of-01024.json.gz": {"num_bytes": 398408628, "checksum": "b5cb8c52a8713c5291ccf29c171e9bd9b57a54211392a19e8f31182d1053a032"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00822-of-01024.json.gz": {"num_bytes": 395429180, "checksum": "8c47bf7a0d2b9c84d255df0e7da058fba2b4ca6da3c20cbdfe5a686e01cf5c45"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00823-of-01024.json.gz": {"num_bytes": 395437149, "checksum": "62818e45f34e70728494c74daa583e30c70aebf91c2f057470039f6d35059691"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00824-of-01024.json.gz": {"num_bytes": 394503147, "checksum": "e9fd88994b23531ba26e6859ec1985798a2ab9b300c2fdb1e202ac553ab305b0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00825-of-01024.json.gz": {"num_bytes": 398841091, "checksum": "77ad5a9ac5e3c1d1180981bffbbdbf8a429854001d990258c615e0e16c8a9f6a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00826-of-01024.json.gz": {"num_bytes": 397404278, "checksum": "06a39374c1cda19cc4b034c4877e1fd3bdc84290fdb621fdcdc77f3c5eea9a47"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00827-of-01024.json.gz": {"num_bytes": 399316947, "checksum": "fd27a73b130c1cf8256f22212e23799d0dd31281cd29bcf9bb658bcda457b66e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00828-of-01024.json.gz": {"num_bytes": 397514415, "checksum": "3e7d199d05f885e8bba769d21a55a3f2ef2114b66ed738428ceb506fdf272ff2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00829-of-01024.json.gz": {"num_bytes": 397251538, "checksum": "91650563e9520b2d1ec2cd726304b781b4156ffb68bc172635a53f425fa6bb0a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00830-of-01024.json.gz": {"num_bytes": 397653118, "checksum": "893ef017cbf7d46c99d9c69ba74344cfc2800bb23faf93e7400c0c282422945f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00831-of-01024.json.gz": {"num_bytes": 397299276, "checksum": "4eb3c91e52547f3b4af586f5bbdb0cdaf6a345b202a09c6aabff5c5f628b2948"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00832-of-01024.json.gz": {"num_bytes": 396915924, "checksum": "9fffd46fc1f1bce010484f2850102e2e153c5695c277efb67f65811630c2493d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00833-of-01024.json.gz": {"num_bytes": 397652261, "checksum": "3b89df9375a906c96eb1e21a6572a07de2f5d875996c01c744933984edb1af1a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00834-of-01024.json.gz": {"num_bytes": 396070735, "checksum": "b758b4cbfdfb799a8615ec9c3678b27dcd9b1d63af4f272879e0dae84cac9d63"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00835-of-01024.json.gz": {"num_bytes": 398028152, "checksum": "6e07f1e6a099aa496fef3015514fe5f3cc665c742f8a783389c7da4ce0e0e72d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00836-of-01024.json.gz": {"num_bytes": 395941604, "checksum": "6bef1291a741ea5976749456185a3e3a03c3fcc9ac00370f28672ab39c552db8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00837-of-01024.json.gz": {"num_bytes": 398655070, "checksum": "b0b7e1c826302417630c3e1b1877bf106beefb5a7a11feb9bbf1ac3712714fed"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00838-of-01024.json.gz": {"num_bytes": 396374435, "checksum": "3e9bdde8b73397a5fce143e91c92f9e66f46b45edfb30da1cac400b9aa7b2ecc"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00839-of-01024.json.gz": {"num_bytes": 396388725, "checksum": "4154322b97c600742660125e6458787e603cf1a44b49267f4d1c569387fd132e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00840-of-01024.json.gz": {"num_bytes": 397564603, "checksum": "f9560028196fc934378389e355101e5e7f8fde9e5c921722704a18b24ebc5804"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00841-of-01024.json.gz": {"num_bytes": 397001678, "checksum": "0dad99ac959765280e6bf6d9d1a1468ef9dc9cc781e8f5bb832f7295e4e79f69"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00842-of-01024.json.gz": {"num_bytes": 397139167, "checksum": "e81fd683da081349629a0a7ae8ff7813351ed23caf4ef87041b64524034abc83"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00843-of-01024.json.gz": {"num_bytes": 396044889, "checksum": "d8e3a5b4148c7e86dea50ee5ba89ef55629d3550fd926c41754e5a26e7e52c36"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00844-of-01024.json.gz": {"num_bytes": 397365441, "checksum": "c4d2ffe853b55464961b707b6d0264d6852817077204a0380c906184c077012c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00845-of-01024.json.gz": {"num_bytes": 396477802, "checksum": "7b3c4d435eca57a0fad05c106ec5928750aa01d95047618a3bc84e5342e912c4"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00846-of-01024.json.gz": {"num_bytes": 395983616, "checksum": "bdad2ba411291435ac0cdd083e46aa8369499f014a788fa85ed8c419fe9cb2de"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00847-of-01024.json.gz": {"num_bytes": 397646062, "checksum": "3f6bddcefcceaa4184161432e4f0b9292ae4fe7dac3079d4191a31a38f48c7bf"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00848-of-01024.json.gz": {"num_bytes": 395958111, "checksum": "5ed10d926e5fd1dcbc777df82391eb3ba57276c7303d488d6f3591022d20cc4a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00849-of-01024.json.gz": {"num_bytes": 396960036, "checksum": "ab82adc6f66ab0403cbbb38859009a460e6c8c38c789bc2b2420da8b87096a9d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00850-of-01024.json.gz": {"num_bytes": 396603592, "checksum": "5a6aa59a01504f5655d429dd5cb3ebc39e3994b22cbaeb5b09ceb29a26b94031"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00851-of-01024.json.gz": {"num_bytes": 396511886, "checksum": "f1954da7e217d893a0237a0f431dd2a9071723e543bf0f4943ce38fab048a44e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00852-of-01024.json.gz": {"num_bytes": 397626831, "checksum": "f5cdcd7ec4f3c855a1006f9278ed4df50574a3fa7aa1c5a2e255ea5fa1a770cd"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00853-of-01024.json.gz": {"num_bytes": 395811873, "checksum": "24b1033da877ebddc09cfe2d3325868448dab9083b5147d6cfc4fa63ab402a94"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00854-of-01024.json.gz": {"num_bytes": 396513614, "checksum": "419952e0bc38cce474190c0b9ea581ccbce77da5e045dd60f5ff1fa1d2833d19"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00855-of-01024.json.gz": {"num_bytes": 396493352, "checksum": "3d2b529871c625fc9c1c59b9d5cede2a77e609041f1ea044d68ac16e9fa6a30c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00856-of-01024.json.gz": {"num_bytes": 396852729, "checksum": "a3b56e6171fc2b14ebe67f6a71af688ea6135597bb8f8cf83e2fb460727aa5eb"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00857-of-01024.json.gz": {"num_bytes": 396428653, "checksum": "de550a5d608bffde45c149bc0d4c1165cbd3b5baab3d3529f006a02aba6d53e7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00858-of-01024.json.gz": {"num_bytes": 397039613, "checksum": "11374c2685676ac2eb3dd0d281b44b512ff1d2968ab320d9c857b44304eb8ab8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00859-of-01024.json.gz": {"num_bytes": 396515194, "checksum": "64879e565e5c467e630566ab75524bb300d58798c814637ffebd15646544cd5e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00860-of-01024.json.gz": {"num_bytes": 397764125, "checksum": "7e22be61b3413c8fca2414087655b7ef7bef2ab5ee373fee74d13c8fb991675b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00861-of-01024.json.gz": {"num_bytes": 395314420, "checksum": "29c451c69c8c05f6eee2741b9ef6c241f551257a45da8342a1d6bb341f80314a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00862-of-01024.json.gz": {"num_bytes": 397763845, "checksum": "679668616899f548fb35da32c3e5f121002670cc3296c0c90f5bf45eb3ea1d79"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00863-of-01024.json.gz": {"num_bytes": 397356206, "checksum": "43c5b3af2173d4293396f336ec363aa2f31580b65128f44ca8bb891f2022859c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00864-of-01024.json.gz": {"num_bytes": 395463092, "checksum": "77b7b6299955f4869e5db994fa6b20fe3007cf8cf2b6609442fb1ed49284cee6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00865-of-01024.json.gz": {"num_bytes": 396909291, "checksum": "7eca0e82842b52f99640ab574e4b2446309aba6ac262f980fc6d249a337d06a4"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00866-of-01024.json.gz": {"num_bytes": 397587651, "checksum": "931014d99ab2a765ebf90e876694647c265ca5e6bf2b459eb027d6b06643a8ac"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00867-of-01024.json.gz": {"num_bytes": 395992645, "checksum": "0976a5389aed40e4bca89cf22382cf121390c75bd755437be474c097c8fee0ed"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00868-of-01024.json.gz": {"num_bytes": 397789857, "checksum": "6ffd848d165290a746a21767e79a9f046b70534aaf7b14fc01f9365e4e3f7d93"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00869-of-01024.json.gz": {"num_bytes": 398124116, "checksum": "5fb85058bdf40c0ee6cf748cda7483b1b3cfad18c26a90c2150c2a3f30ceeeca"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00870-of-01024.json.gz": {"num_bytes": 396432487, "checksum": "89d50aaa3620eac4ad593a403ea637b2ff090361ead05c3aa8c7a3351c66ad65"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00871-of-01024.json.gz": {"num_bytes": 397484772, "checksum": "490f4104981a9ab3ef04600a4865b9a2a18239e335d7fb7fff79ec1b7a225318"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00872-of-01024.json.gz": {"num_bytes": 397240896, "checksum": "d344994866bc49475f66e9937636afa787e1ff560e3f62dc1a0e4d0220d6ed39"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00873-of-01024.json.gz": {"num_bytes": 395450398, "checksum": "5d3b320aab1f7f09450531649666ded1aba8a9bbcf0f47992c43cb40a6d7a929"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00874-of-01024.json.gz": {"num_bytes": 396365056, "checksum": "346aae20204537ba2f4a865ca80b5d1c6da1e3a3b78d306d7570a69f185cc4fb"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00875-of-01024.json.gz": {"num_bytes": 396679348, "checksum": "ba81f9c1650d30853edbb9886dde84658c254dee5a3ac1062484f7194cd413f6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00876-of-01024.json.gz": {"num_bytes": 398278881, "checksum": "88fb38aad7cadd76c818dbe7a372144dfe17d110f7d2123a80d14686fb43a6dd"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00877-of-01024.json.gz": {"num_bytes": 397051868, "checksum": "049e4a62056c98284b35d10a74ad5ef7014265a6dccb99a71f93a409933a685f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00878-of-01024.json.gz": {"num_bytes": 396132123, "checksum": "bb7b97a82bd6d31612de66a03af35d404b15808b925e7fd94bd0a8e9e928b927"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00879-of-01024.json.gz": {"num_bytes": 396520374, "checksum": "2a56fed53aa022e6a7956f604d54d99af89a15b6c7fc6b037f94d347f1d15f51"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00880-of-01024.json.gz": {"num_bytes": 397004524, "checksum": "1cadef434909d4508a9a6bf40d6a9323256f3089615a5d2963c83040d5f549f8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00881-of-01024.json.gz": {"num_bytes": 397336334, "checksum": "0e36dcd0eb1773eec15ffd0fbbe8951343bb6961dd1838b51e74da2e055db176"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00882-of-01024.json.gz": {"num_bytes": 394949798, "checksum": "78c99406cb921c2b8f5b86e4e7eeed24c799678732e5a5450db6b12b7ceeef61"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00883-of-01024.json.gz": {"num_bytes": 398647721, "checksum": "f0e7a0a9970c7fdb5f629771e76bb06bf62b79e9cbf5008e866f954dd436401b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00884-of-01024.json.gz": {"num_bytes": 396040500, "checksum": "05272a55eb2840f94a7dcc30a8d09b957511b983b0fc3fa618a8995bc594d055"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00885-of-01024.json.gz": {"num_bytes": 396460591, "checksum": "27511aa50410260d261866dc970b897b10a95dd4dfd92b0bc3a5fc41e6c75335"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00886-of-01024.json.gz": {"num_bytes": 396149133, "checksum": "e66ba9c7ceca631a4b43ecff1e151524a209368f298ca83624476ee9144cc3cd"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00887-of-01024.json.gz": {"num_bytes": 397164216, "checksum": "95e341054bd8a21e7f49e4a5aaa5fbe51517ff631e66e67ff1cdaea6e3178002"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00888-of-01024.json.gz": {"num_bytes": 398216402, "checksum": "6fef57de31fa1692d8a4021b317554688657fad3f55dc144e2971d63083e7879"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00889-of-01024.json.gz": {"num_bytes": 396976936, "checksum": "36da1bd0eaa27ca6e8510a3c005695fbbd7b0fedf63f077e3787590d4b1af625"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00890-of-01024.json.gz": {"num_bytes": 396903125, "checksum": "6bbbe5db2c0938efe5f8afe7b30765f45cedc9fd4209bb7826c489381175bc5e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00891-of-01024.json.gz": {"num_bytes": 396404354, "checksum": "47601b1b1a0a725c32ae0c32364f7ac188b7e8c68d29a2dffbe1a4dbe39393f4"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00892-of-01024.json.gz": {"num_bytes": 398144052, "checksum": "a7b6bdafa5a226c22ccdf97c873e4915ed8dd8b59e2820a4dc62f600b4710175"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00893-of-01024.json.gz": {"num_bytes": 397990484, "checksum": "12f08cfa1fb4f94a3d7d9584cc3f5ae9fa518cc095e4cb07939d02ecfb7ffd9b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00894-of-01024.json.gz": {"num_bytes": 398271782, "checksum": "004bf46ac7c8d7770b458ec341322f5cef643926aff9255954f08faa1dd43d53"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00895-of-01024.json.gz": {"num_bytes": 395489909, "checksum": "3ea14b3dbd7a4c9cb7aad83d1311d335714aaea5b2dd0374debd63c56d02dcbb"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00896-of-01024.json.gz": {"num_bytes": 397589097, "checksum": "c0f1c7e54bf7a808f66d2acc9aec79f1ce936ba480f5d1e379c6853714413175"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00897-of-01024.json.gz": {"num_bytes": 399215096, "checksum": "20958123acf2d578448a5166f1209b0452db33ed395cfe512015106bf99ad31d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00898-of-01024.json.gz": {"num_bytes": 397044516, "checksum": "46c5145069d861c04b2ac1afe80c4c4453f91869f6cb6a1d9f7b648f1b08942e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00899-of-01024.json.gz": {"num_bytes": 397687759, "checksum": "2a3923d8ff2ce0eab5978a8e0198bc2d1512cfa19c69e673e048b8eaa72f82b6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00900-of-01024.json.gz": {"num_bytes": 395192267, "checksum": "9cc72deeea7fbc0fa3782c41938d66315923dd9f53d89f47c00f85f93e454ce5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00901-of-01024.json.gz": {"num_bytes": 397806320, "checksum": "8cfff74f280636416f523c271f75e5704a570db4cddb8a70d033158868c21347"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00902-of-01024.json.gz": {"num_bytes": 398450537, "checksum": "7df8804eb5ecb79177001f9ce3c66f0ad20cccd8151e817816e9342d07c392be"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00903-of-01024.json.gz": {"num_bytes": 396733151, "checksum": "89551a52d1e97b4ec3007f8c43191c1ae1475d0ba5b48d20818a12c85b0add74"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00904-of-01024.json.gz": {"num_bytes": 397497719, "checksum": "2bcde59dfaa642722969d1401a4ce43a35c57930bb1d664371efece1e2e91c32"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00905-of-01024.json.gz": {"num_bytes": 395760696, "checksum": "ec844272b0666a455dfe0cab065e00df44e8da2156a03797100418307c96830c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00906-of-01024.json.gz": {"num_bytes": 398496346, "checksum": "ff68909d470edef08929a91068e1de02841c16a000fbbd17ef042cb76f1fff37"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00907-of-01024.json.gz": {"num_bytes": 397085405, "checksum": "a9b26676af61a6a1355225bce5bbcd67aeaf0fb7dc2209f30235b275536baa85"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00908-of-01024.json.gz": {"num_bytes": 397037103, "checksum": "e86688677a46103b0b224333faf1b4f89da062e4ec0ee35752c91ff9772697c7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00909-of-01024.json.gz": {"num_bytes": 397394775, "checksum": "93082177607900bfce7fc53f1665a831093bb50caea33e014f327181579c0012"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00910-of-01024.json.gz": {"num_bytes": 396668466, "checksum": "dcfe639607c18a309e2c91864a6912dce3851abd62bbed3ba16390899e637327"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00911-of-01024.json.gz": {"num_bytes": 397926997, "checksum": "aa995c38d953237b1d6d53be7237958a00ca2dbab4a753c7c4404849fb416d5d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00912-of-01024.json.gz": {"num_bytes": 397810240, "checksum": "e3f17ac285e8c9b04713713a957602a63e176f476d4a67018012e9cf2a3e5a84"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00913-of-01024.json.gz": {"num_bytes": 397143597, "checksum": "4082ab833be47cf881693ea4442e3940625e0d2c1117e15234886fdfa779bce3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00914-of-01024.json.gz": {"num_bytes": 396398347, "checksum": "7c62dfd17b21ff64af640e4aca8fea0240998596d11ca551a3ab045d5041fcac"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00915-of-01024.json.gz": {"num_bytes": 398622100, "checksum": "69abe67cda4b1613d5f741804ccdb294cd5f457027818d9366db8cf2f5f40871"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00916-of-01024.json.gz": {"num_bytes": 397387266, "checksum": "6effa83cbf3345fd7e41e432ef82156bb1334f2cf17589bce313aebee9727131"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00917-of-01024.json.gz": {"num_bytes": 399730979, "checksum": "f0d0ff1ae76a84c07647fa1517410533862f1927fa85dbf38017dabf4607bc1f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00918-of-01024.json.gz": {"num_bytes": 396895902, "checksum": "84cc56e725be31047d0b6a025cfacefc462f4a1a546feaa34af95a6f25a4e1a7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00919-of-01024.json.gz": {"num_bytes": 395247578, "checksum": "daa3156989ddaa9a7eba228848697ccf6a385679359ab765881d2293bef107aa"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00920-of-01024.json.gz": {"num_bytes": 398305242, "checksum": "2a9e02ef643962f6009e42304b983c87bae7b74c1edcbf8e6808b320ea7ea776"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00921-of-01024.json.gz": {"num_bytes": 396446011, "checksum": "f83526ad11d81820fce4231e3303d613dbbe56a8fae878d9442c8d7e98023437"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00922-of-01024.json.gz": {"num_bytes": 398010331, "checksum": "e47cb9d7550644ef807c3ea9e19ca4aa1df54eb908b54651bf0e17f0ded9157d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00923-of-01024.json.gz": {"num_bytes": 399160018, "checksum": "470401e5b0777096806113a36dcb92b8d453d6e8f5f4f0b15df2788e382ca03f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00924-of-01024.json.gz": {"num_bytes": 396880756, "checksum": "c86e546c68bf8458951fa723c086d6efa5b210f53cd4fcb2de4b9efc7a71a275"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00925-of-01024.json.gz": {"num_bytes": 396806561, "checksum": "5d9b1105c0053dc9530c911046f4da458f41d92c771282d0df8a3a22838feaec"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00926-of-01024.json.gz": {"num_bytes": 397479994, "checksum": "c3253305ac4ef226501e4fd4a6acfc6067a76c084ad852eb2a9f5916aa3d51a2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00927-of-01024.json.gz": {"num_bytes": 397083225, "checksum": "8931df0ee597f72ea3592d0a4d236ce655a92cf4e7eb9298145f496246c18c21"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00928-of-01024.json.gz": {"num_bytes": 398000839, "checksum": "5e29e75231bdb413dedd1211bd87e9fc3f4ab8bba41999afc1ddcddc16f4599a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00929-of-01024.json.gz": {"num_bytes": 397731309, "checksum": "03f7a9199b7927a6d78a8aa4eed32c250d32dc409e3bb2847d7db948ee63d46c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00930-of-01024.json.gz": {"num_bytes": 398133003, "checksum": "b22a79dc228697394d0ce25b7d31112f9e1a6508cdc4b57af35e84e65167bfeb"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00931-of-01024.json.gz": {"num_bytes": 396694508, "checksum": "dbbc65db3d442f9ace85498a3b27bb598c20cea171b3de17d409f9b989c262d5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00932-of-01024.json.gz": {"num_bytes": 396255463, "checksum": "02af4162b084004e99dc6862c88749545593e342a83523597cada140e57a0ab7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00933-of-01024.json.gz": {"num_bytes": 399013035, "checksum": "dc4d3b4f03c36a8f1393ba15195c3f64b128862b812839689fa387e708ffabaa"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00934-of-01024.json.gz": {"num_bytes": 396593138, "checksum": "02a5a8e02b2636c9e912a9ef8a79ececde4f4fc92bea74e59791d181bec104cd"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00935-of-01024.json.gz": {"num_bytes": 396748502, "checksum": "05d1d6290580d5c74b906ab03fe6773ecaaa1ff3be84dfdef48d1a2e7f5e1120"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00936-of-01024.json.gz": {"num_bytes": 397737673, "checksum": "351d3543b1457da9719061948a1b4bdd79be8a0b786ecd6a9a8cc0db49cd2181"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00937-of-01024.json.gz": {"num_bytes": 395377872, "checksum": "d431b01bddcf911d7da5bad74a78d0d1527d60d9720f77868ef08e1a65850986"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00938-of-01024.json.gz": {"num_bytes": 397193715, "checksum": "bff5e755b174e3608ba72b39898a2bb5e9ca6d3362b70bd66143566aeff52690"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00939-of-01024.json.gz": {"num_bytes": 398044482, "checksum": "03facf22c376f03a8078e99d1dcc1c22ed5d7e179de472019cae894f40c7a4ad"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00940-of-01024.json.gz": {"num_bytes": 398894204, "checksum": "3d3a2125262ee8ca498cd54db52fe626d010a2a93c000ea2b45f931e491ea9e5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00941-of-01024.json.gz": {"num_bytes": 396758197, "checksum": "b3957de08e7779d8ec23af02a6d709189796314c70a99f46c90d0bfbd14ad561"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00942-of-01024.json.gz": {"num_bytes": 398181993, "checksum": "74aec8dec794c79683dfe43d8aece4c1c47c5389aa6d4bea847ac461cb5ba21f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00943-of-01024.json.gz": {"num_bytes": 396271547, "checksum": "231f63d05f81d249f618768c9f712cc31314dacf55a6004902a0e7d0bfb13724"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00944-of-01024.json.gz": {"num_bytes": 396603419, "checksum": "d5661730f3ed6cc5bbc5d935a6f1ac7d241b40c52dc83775a421e7a1a672f518"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00945-of-01024.json.gz": {"num_bytes": 396596660, "checksum": "3b5aeb0786dddf0b9cabe2ca071283b276822e2861d8688e38f927595c159b02"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00946-of-01024.json.gz": {"num_bytes": 399900563, "checksum": "6d5549970af2c6987583477991552e1944b411642782c07d17eb52f91e714a1b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00947-of-01024.json.gz": {"num_bytes": 395391489, "checksum": "f5544ecb42c385cd5d5120c82140e4a36051f6a401d89ce30c8f2fc08cd69804"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00948-of-01024.json.gz": {"num_bytes": 399257562, "checksum": "1448cca7f1b9824adcf8437a33d14a7e95b705396611f82e7aba9a69e0a25118"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00949-of-01024.json.gz": {"num_bytes": 396371965, "checksum": "a7eb228f1d1ff2744af3d1a1358a94611cd92c25d81edac0e209b9f81c8a0a60"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00950-of-01024.json.gz": {"num_bytes": 398022110, "checksum": "8651693d2180e518039da487f638c532c53f6d79a33356922b2d8706aa6a83cc"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00951-of-01024.json.gz": {"num_bytes": 396224338, "checksum": "c46bc8aa1621153fbd913b5d0b23a82352a28b36ec997c4df4b92dcc6ef26895"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00952-of-01024.json.gz": {"num_bytes": 397581207, "checksum": "02775930e3c420978a9d2785ee0137c3963dba7bc34538b2155eb38dd6ee89a0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00953-of-01024.json.gz": {"num_bytes": 397045599, "checksum": "9d54940cb594de6e0f8593f64293e96375f0a5c56f3569c72720476bcef1f1a5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00954-of-01024.json.gz": {"num_bytes": 395457873, "checksum": "3c12a1c3061164f345d9e402bed28be9af84ef56d5df1b22a3cf9f818ed47ae8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00955-of-01024.json.gz": {"num_bytes": 396450938, "checksum": "45db78bea4fae6cd69d900c581fccda873d2aa9f24ac5e9dfc18b486c15c3788"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00956-of-01024.json.gz": {"num_bytes": 397120474, "checksum": "7db7ea23446bd8a66737546c5daa0c2dec7bd5c4743f52eb53685ccbf54d9b17"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00957-of-01024.json.gz": {"num_bytes": 397403279, "checksum": "89de2950bc3f7dd4f95d8a0b7cba19e9678bfbc23175bc22d9f9599ec1ad9cd0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00958-of-01024.json.gz": {"num_bytes": 396861933, "checksum": "f325478647cbec9d79bff2266672144147276a82f665d3014c5d2fa9c112c387"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00959-of-01024.json.gz": {"num_bytes": 398439950, "checksum": "70d786bb337c012269caf6aeea3bf9604d279d3e4335294c72ca6cb5a9fbd951"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00960-of-01024.json.gz": {"num_bytes": 395684257, "checksum": "e1d170b0a4d6954a920ef3923688a7dbf40398609ed2ae04b2635df9ceb07821"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00961-of-01024.json.gz": {"num_bytes": 397526287, "checksum": "47b90e3747f35bf67c872d65d843f6dd9bfca15dcb769b31bf3586c6645858bd"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00962-of-01024.json.gz": {"num_bytes": 397473683, "checksum": "d0ddb2c104f515144265bd3eed526a65ada46f848183688b420694751b113272"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00963-of-01024.json.gz": {"num_bytes": 397964876, "checksum": "74725b631c1699b1166589eaebb66374c031b170eab3ab359230cd4a23a8ae79"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00964-of-01024.json.gz": {"num_bytes": 396523661, "checksum": "fa0d49a2cc726628d9a1b5ae2ace52ee90401af8ae15add27c3f4566dd99a79b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00965-of-01024.json.gz": {"num_bytes": 399289514, "checksum": "11fb1878a8b204181f7f776a764f5e9e577d0fe62d4b2e4ce2164ce9fcc30b8f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00966-of-01024.json.gz": {"num_bytes": 397411408, "checksum": "5646014ca3c99f53bd13183187b1e6e8f84cb6c846d6f1f3a3c82edb4accc47e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00967-of-01024.json.gz": {"num_bytes": 395095282, "checksum": "b799b17f36d85235eaf1bed9f4f760a22b75fca736744218e44fae5917a2286c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00968-of-01024.json.gz": {"num_bytes": 397189410, "checksum": "8d9748f5a92a9e0b836fe74b962bd2da04b62a0a2943ea5e440cef19166a5479"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00969-of-01024.json.gz": {"num_bytes": 395651742, "checksum": "f42c71219641fa302692698b4944864f27b7f87d4477a86babe23745dad72715"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00970-of-01024.json.gz": {"num_bytes": 396180197, "checksum": "383d9586f27579b4a97c5901013b3e025f10dc813047d65158d6621430803aec"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00971-of-01024.json.gz": {"num_bytes": 396574555, "checksum": "d2c9700fbac454d3b3a42b2a3c4eb0111eb7cca7cab3d545b0912aba60415c91"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00972-of-01024.json.gz": {"num_bytes": 399639122, "checksum": "5d59e643bf20156a28e5e9dfcd811c5a6c3779e1875f375db09a0fa1871dcc90"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00973-of-01024.json.gz": {"num_bytes": 395456709, "checksum": "8b22e82588e30f30f664895b9716cbb0cf38d5ff4331d3be31ab25663c634a00"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00974-of-01024.json.gz": {"num_bytes": 396693438, "checksum": "5fba4f9d634d968f15d5d4fb29d253646494e3e125aaf1c2f8fab38a7e60180b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00975-of-01024.json.gz": {"num_bytes": 395697641, "checksum": "b4c5fceb9fa2397a9b7c75249bd3386b8dbf999d5b52521051a86e067d698448"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00976-of-01024.json.gz": {"num_bytes": 397172005, "checksum": "093aa01a944a222828656d31dacd8ecd57a24a51d361a8742514bb6af009dce9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00977-of-01024.json.gz": {"num_bytes": 396182407, "checksum": "1beef6e248c00abee5f8952641b12d3f5b12d58adc05c8d461c0a073a6ca9b39"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00978-of-01024.json.gz": {"num_bytes": 396180428, "checksum": "0f2bb125af300de2c9fe347899673a4bd2842ba8298146bfe94c9eddc41893cf"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00979-of-01024.json.gz": {"num_bytes": 396479117, "checksum": "1fe9d0e54b9be79722e6483e386801263ca51d6e9ad925dabbb58a38c4df877e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00980-of-01024.json.gz": {"num_bytes": 395119279, "checksum": "0f262ff2d4701497f6fd6d4f9d3cb1aa3a730ad6bef1961d890a3b0cb4747ee8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00981-of-01024.json.gz": {"num_bytes": 398285798, "checksum": "a295b85e63c176cecd9f5222ba417eeda307e41847eb38c61dec9b83101a8256"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00982-of-01024.json.gz": {"num_bytes": 397811687, "checksum": "2a3a0e0f454dd72a68ed1dd71c508a9b24fb2349ffdfc588cbfcef728cbaff05"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00983-of-01024.json.gz": {"num_bytes": 397069906, "checksum": "5b4256392755c4dd79cd37cd6ede645a9a549c4436acd27495e974ebe1d80bc7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00984-of-01024.json.gz": {"num_bytes": 397670152, "checksum": "68d4f5dbb3fa349a6811edce8056eb297e771cb9c9939c3a84d30c6ba3ad9dc2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00985-of-01024.json.gz": {"num_bytes": 397949975, "checksum": "6ba478b8a1ebf3b1dd67ed7b4a055cc9cc3c01bc90c1852aea8f5a99f6c07e69"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00986-of-01024.json.gz": {"num_bytes": 397730984, "checksum": "a39a23589cc434e573613e3ead44f33adb005c2c13cea8b33601647c97300fce"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00987-of-01024.json.gz": {"num_bytes": 399173506, "checksum": "eab46d9d0a0cf05dc5ba475017d98f02f1cfd756c8e707d9823a0463713ebf23"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00988-of-01024.json.gz": {"num_bytes": 398674037, "checksum": "88749d380aac85314df66448542b696e9ae6f61f1b27dc395556737f59ad9024"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00989-of-01024.json.gz": {"num_bytes": 395313344, "checksum": "bc565b662396e3ab4e108635e01873014515663bd5216926a59ae80f6cd4273b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00990-of-01024.json.gz": {"num_bytes": 398567254, "checksum": "e9b9bd97a30ccac353a2386babbd01c3a3bbede8c07bc28d17aecc7ef5af6330"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00991-of-01024.json.gz": {"num_bytes": 396958611, "checksum": "505ab5458d5e52d656048284fd22cc0fcd16e49ba19331669239be37645cb04e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00992-of-01024.json.gz": {"num_bytes": 396102263, "checksum": "59ac5b2b04f224be04a4ceac6a16e29a33681f19cd40cbce3d3e8eb961b9f33f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00993-of-01024.json.gz": {"num_bytes": 396935362, "checksum": "c804f2311de9f7ae5691280e16261b9f8385ef9a71929b2111dfade532b6bdd7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00994-of-01024.json.gz": {"num_bytes": 398832432, "checksum": "594727bdc3756e678bd4d156216712ed6c8fc98d3f8e9594cfbed10b2e414554"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00995-of-01024.json.gz": {"num_bytes": 396699737, "checksum": "bb3c73c6d48aebf9c60cde56944faa5bb6727db4cc48ae23d67650742462c42d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00996-of-01024.json.gz": {"num_bytes": 398059244, "checksum": "ac1a7e6e2c2a5468c704f5a2318b5617dd4ce140b98271e2034e00015db6cd76"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00997-of-01024.json.gz": {"num_bytes": 397439167, "checksum": "ce9664b29c86c05d3541aee377acdca7a32ef8f0220e0b4b6bf18276b692529f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00998-of-01024.json.gz": {"num_bytes": 397383159, "checksum": "1b4db1b59255f106dd2af7510112eef6d6b611d9f9e000a0e585b623fdb8ae98"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.00999-of-01024.json.gz": {"num_bytes": 396339114, "checksum": "ee5e1508704b03f0a9cb3c4bfb578c08fb83a4d20760e3b40f101c58cbbb3ec7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.01000-of-01024.json.gz": {"num_bytes": 395172166, "checksum": "f8cbf0bd9c2b90e588942048848fbfa1a20cf775364cb9c84b4d5dd7cf19e603"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.01001-of-01024.json.gz": {"num_bytes": 396629363, "checksum": "7cad3f9a28e5988ef91073c48e9d85ea7030289690f817545cfa9f1165dd33d9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.01002-of-01024.json.gz": {"num_bytes": 396507390, "checksum": "b4ae1017913509855d6d8d4413ff3de4a8d519d91f354b6e5b5267219d20658b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.01003-of-01024.json.gz": {"num_bytes": 397652598, "checksum": "0c115446c159d27e6e1354173ebec29e6dff5f38c4d2ddb46c07c450523309c9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.01004-of-01024.json.gz": {"num_bytes": 397408971, "checksum": "f0b559a832a9ee50225fe1417d936d6b898026d80a105b976deaeae75f9e30a0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.01005-of-01024.json.gz": {"num_bytes": 397753911, "checksum": "e001c9285ade7de6ac23716b596ddcc733f05bd6abd7e1a67874894c93fbd43a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.01006-of-01024.json.gz": {"num_bytes": 397962701, "checksum": "acf13433824104e4bfc3a8aaf8805eb16712cd97b2dc1d48e7d771bee4bd41c0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.01007-of-01024.json.gz": {"num_bytes": 395966285, "checksum": "4c6069f6a95d036fd3e05a4246db932ad5ab89b9470274f23a17df0b77b9b717"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.01008-of-01024.json.gz": {"num_bytes": 397075505, "checksum": "9b3b9c0cd4ee02e18a5d22142183874586da8fd23b4f97033e354f9681d150a2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.01009-of-01024.json.gz": {"num_bytes": 396881470, "checksum": "14d2d7cf2ebf3b2c73bad4a6099fa1d2b1cb341b100976b03232fb664a7d020e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.01010-of-01024.json.gz": {"num_bytes": 397471393, "checksum": "01e6f56bebe0c874d82135f551a6b917759c41af48d127df181267dc9b8f6486"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.01011-of-01024.json.gz": {"num_bytes": 398092801, "checksum": "ead5b6b13bd09136fccd9548c224398401bda0ca7ff62ca4db852760760f13d3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.01012-of-01024.json.gz": {"num_bytes": 397831436, "checksum": "daa2d1507f9b56de0c4aa9d86d93259c1e6f73f0cdfd553ce075a16807dbcb56"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.01013-of-01024.json.gz": {"num_bytes": 395098326, "checksum": "c2b21a1a56e9879335c72008919e8f7998dcc1e8df2258fdf2196ea86194e3cc"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.01014-of-01024.json.gz": {"num_bytes": 396164077, "checksum": "0df125946c83c66c6961eae2aa45ad7eea7038d808281d633ce30686a8245e01"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.01015-of-01024.json.gz": {"num_bytes": 397895284, "checksum": "f6f6eee8fc113b7e717654b9305cc5129c3ee1ce9f263b91f0202762f078a526"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.01016-of-01024.json.gz": {"num_bytes": 397723033, "checksum": "48426df1f4665d3179251904c96a0e73c041ed5b57885b4dd852809e632685b6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.01017-of-01024.json.gz": {"num_bytes": 396761053, "checksum": "f33cf2d744585e0338b29a5a5638752123b7b59f9ae3b723cf7e7b536f9f80ed"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.01018-of-01024.json.gz": {"num_bytes": 396562520, "checksum": "72adb0869cac573282c4bd938cdff556f659540dd4a0a6663711974cb2dc147a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.01019-of-01024.json.gz": {"num_bytes": 397564701, "checksum": "3b64235effaf41ad61698b2c28f4d73ced1b6ec6b6d79e0f52314176fa0feb12"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.01020-of-01024.json.gz": {"num_bytes": 396053080, "checksum": "b16b9f815823d176f94388d4c482652ac656aa763ec738ccd8c8a2a3bdefc1e9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.01021-of-01024.json.gz": {"num_bytes": 394731398, "checksum": "f4c0044abadd339055bf13843938eef4c066856757250fc15f77060fc0881ba6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.01022-of-01024.json.gz": {"num_bytes": 396548645, "checksum": "5ecd8432526eda57065e6161f0618a19cd5993c7dfe86575775f1bf01836f750"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-train.01023-of-01024.json.gz": {"num_bytes": 396863581, "checksum": "c6cd29b8f6067152ccd584ded81df1f9cb905515d48815b8a546d104ec7a3565"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-validation.00000-of-00008.json.gz": {"num_bytes": 50774357, "checksum": "7cd6c8b1072af3f3ca3fa160d9411960908142743b101f7229223e6658acb42c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-validation.00001-of-00008.json.gz": {"num_bytes": 51252663, "checksum": "d36ef5fc04b24117a19d992de06400e5f290f11786be99be9de68818f7495694"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-validation.00002-of-00008.json.gz": {"num_bytes": 50860289, "checksum": "ab8b3dee7c0698c3cc3a74f159d85495b6bb9529600ef9246bec218ae6775e28"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-validation.00003-of-00008.json.gz": {"num_bytes": 50141661, "checksum": "54d62c9359000b99713a8a0a0fdfa415f1c09824555526f01dc7217b068542ad"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-validation.00004-of-00008.json.gz": {"num_bytes": 51141505, "checksum": "c11e31de558613237533b41354ca29f0635b599a1c9232517dbf4c2cb1197319"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-validation.00005-of-00008.json.gz": {"num_bytes": 50797157, "checksum": "20d39c0f52c34a3148c0a235238ed3849576ed895c3a43cb47b0159bf233c7d5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-validation.00006-of-00008.json.gz": {"num_bytes": 50158887, "checksum": "754a2b7f134bf45f17db7450d5c0eaf2b8824e4a6072be7b20db434f9cb7968f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/en.noblocklist/c4-validation.00007-of-00008.json.gz": {"num_bytes": 50232244, "checksum": "f90c1d79c51ee1a009dc05930fc40e9ee4c3840ca2412cc129855156aaddc279"}}, "download_size": 407016751197, "post_processing_size": null, "dataset_size": 2060282008734, "size_in_bytes": 2467298759931}, "realnewslike": {"description": "A colossal, cleaned version of Common Crawl's web crawl corpus.\n\nBased on Common Crawl dataset: \"https://commoncrawl.org\".\n\nThis is the processed version of Google's C4 dataset by AllenAI.\n\n", "citation": "\n@article{2019t5,\n author = {Colin Raffel and Noam Shazeer and Adam Roberts and Katherine Lee and Sharan Narang and Michael Matena and Yanqi Zhou and Wei Li and Peter J. Liu},\n title = {Exploring the Limits of Transfer Learning with a Unified Text-to-Text Transformer},\n journal = {arXiv e-prints},\n year = {2019},\n archivePrefix = {arXiv},\n eprint = {1910.10683},\n}\n", "homepage": "https://github.com/allenai/allennlp/discussions/5056", "license": "", "features": {"text": {"dtype": "string", "id": null, "_type": "Value"}, "timestamp": {"dtype": "string", "id": null, "_type": "Value"}, "url": {"dtype": "string", "id": null, "_type": "Value"}}, "post_processed": null, "supervised_keys": null, "task_templates": null, "builder_name": "c4", "config_name": "realnewslike", "version": "0.0.0", "splits": {"train": {"name": "train", "num_bytes": 38165657946, "num_examples": 13799838, "dataset_name": "c4"}, "validation": {"name": "validation", "num_bytes": 37875873, "num_examples": 13863, "dataset_name": "c4"}}, "download_checksums": {"https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00000-of-00512.json.gz": {"num_bytes": 30085821, "checksum": "6666a680b0a34eb8756dcb5fd2b12f0078237f3502e8a513bd3e5b71bb92be00"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00001-of-00512.json.gz": {"num_bytes": 30065900, "checksum": "61c3f9ab763067f76d9bea349d86efb97af7539d481b5d2807f362204971c327"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00002-of-00512.json.gz": {"num_bytes": 30028880, "checksum": "3aa4405d957ed42d10d643efe7c0f51b05e8f29cf4ad8783448083c1cd3f2a24"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00003-of-00512.json.gz": {"num_bytes": 30136880, "checksum": "f6eb49e4c0d691e67fe96ddeb3f8370c5e63a7297a31a8da0c58f5cb3a9f6061"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00004-of-00512.json.gz": {"num_bytes": 30110499, "checksum": "6e0908780f555f4b74c6a5055e2c9708333a8466f0b8723a8ea38cc04828ce44"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00005-of-00512.json.gz": {"num_bytes": 30097927, "checksum": "a333562df3fcd4c5ccf51b4c00e11f6619ac4a28a878383aefad277bd30131a6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00006-of-00512.json.gz": {"num_bytes": 30013820, "checksum": "7c436cd0993077187988239cf74c3e64de440dacad62ba4b02bd4ac0a8d219b6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00007-of-00512.json.gz": {"num_bytes": 30557005, "checksum": "dc9e43681c404fef1741e9608295b8dfae0953473993f3fc44fb83af07a6b82b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00008-of-00512.json.gz": {"num_bytes": 30369535, "checksum": "8de7a4005acdb60436b4e5d7274084e28df3aee31a5457c6837452094544c541"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00009-of-00512.json.gz": {"num_bytes": 30033048, "checksum": "32310a6c74cbee1dbb8b196e0cfad41f79e88e48d8f04c88692d42506113b903"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00010-of-00512.json.gz": {"num_bytes": 29948345, "checksum": "b7df217de849e26ecce5ed7a35b6e6238fcc1c08e969023f209307842dd496c0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00011-of-00512.json.gz": {"num_bytes": 30558885, "checksum": "82e5428aaeecf27141a7105e48b78dc02516ae6ebc3d6cd4ef13963316279e1f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00012-of-00512.json.gz": {"num_bytes": 29888513, "checksum": "f3d7e496b7c85ed7d020c8f8a24a0b27f9b2535abdb22b45c08441a29398c44c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00013-of-00512.json.gz": {"num_bytes": 29936292, "checksum": "bf04d82f0cdddc09ce4aecd9f71910b9858badaf6456253d43d89e6a8c56cba7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00014-of-00512.json.gz": {"num_bytes": 30169338, "checksum": "15b4611513154de0dfc1c9d470326fd053adf70de814ecfe8ba7ccee66de947e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00015-of-00512.json.gz": {"num_bytes": 30071363, "checksum": "887bdea83bdefc50786c93e8014d1d49999f8090ff15168598c884cd0724fec2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00016-of-00512.json.gz": {"num_bytes": 30451660, "checksum": "288ad0d553d54052354be506f87878fa7c54b0fa65811c6e456b3262e1d117e1"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00017-of-00512.json.gz": {"num_bytes": 29940254, "checksum": "b13ad58ae9f38598cb9d560e3ab34c1d0200db73fe86da12230e50086b532463"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00018-of-00512.json.gz": {"num_bytes": 30282186, "checksum": "5a67e71955ab2d8f6531bd3949cd8ab71f4ff91863ea5a6ec3e7b33c31a05dd6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00019-of-00512.json.gz": {"num_bytes": 30373907, "checksum": "a70682315a0cfe0af815c7b2abbcd63310fabbc33ad6e19daad19f1f51506955"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00020-of-00512.json.gz": {"num_bytes": 30104199, "checksum": "980e544ce130a06e9e99ec906342eb0ab8aeaa96ac26eca01c56ebb463f5d688"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00021-of-00512.json.gz": {"num_bytes": 29733696, "checksum": "a69729b8f3ccb9db12476a31917783c1c6e036e7bbbb4089f430362aef71f467"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00022-of-00512.json.gz": {"num_bytes": 30012894, "checksum": "589e698fe450e22cba47813a5a28da5393e79702a528f6a8469f72f6d630caad"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00023-of-00512.json.gz": {"num_bytes": 30024851, "checksum": "2a7b036c38fb4d2df6535631018c23d001931e5bf8d8a815fd5b2f9343ec4529"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00024-of-00512.json.gz": {"num_bytes": 29906809, "checksum": "7e512306cb6ebb0b0c3e96ceb16dade9e1e1f484e754bebd0078e7f545fc5b6a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00025-of-00512.json.gz": {"num_bytes": 30332268, "checksum": "b636b91fcd9a91ce05b8cbeea6f591a0e916175ab23b0cfaf688171c8a98ae8c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00026-of-00512.json.gz": {"num_bytes": 30288490, "checksum": "9e2f8e2a37dcfe66873cc5355740448ef75a1de2deeb2d8c047c3c3a7ee485c0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00027-of-00512.json.gz": {"num_bytes": 29897688, "checksum": "882616d1e8ca66c0b6e7aa2ccb18d9239021603ab1b9486638a9a3447ddebe0b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00028-of-00512.json.gz": {"num_bytes": 30201690, "checksum": "0312b12f50c64fbe7b894a28e0940089ad57af95df8116cd7d43c0435ec2e79b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00029-of-00512.json.gz": {"num_bytes": 30237920, "checksum": "1e8677140186b219d32e764889dcc344ccac9db51685363324d1bc13ddef2bb7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00030-of-00512.json.gz": {"num_bytes": 30048903, "checksum": "43558e81c291cbf53a5b6a016aecb0e07e26a98b8fb32f4a000037b281afa363"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00031-of-00512.json.gz": {"num_bytes": 30294528, "checksum": "c33ae8a2fad7e5264d093fbe89ed1611357110a4f0f26dd5a93a4dc15560f205"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00032-of-00512.json.gz": {"num_bytes": 29868168, "checksum": "5dc2a8f96db8da87607efc0b708e6a2172530f0c9b43665dc01286109b5c55bc"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00033-of-00512.json.gz": {"num_bytes": 30105916, "checksum": "c4cdc2b39a86eff251f903d7f3d39605b721615aeffa6a2753f3588b7dbef6c4"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00034-of-00512.json.gz": {"num_bytes": 30126174, "checksum": "6d874182112b0881dc929c0182a30ec4f9f1633372a2b822200a7b1faaf4f1bf"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00035-of-00512.json.gz": {"num_bytes": 30084101, "checksum": "5bea17f0cd4dd888f5d8a2d4092138e4777d80493a1f410d618d4cedf353b914"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00036-of-00512.json.gz": {"num_bytes": 30095974, "checksum": "6e7f42f3012d8ca7500c7e2ec82d27c26b3cd8bb5b8b66a7fc8355d77284f433"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00037-of-00512.json.gz": {"num_bytes": 30239345, "checksum": "54ee45bf25152060679bab3e5fc6f5cb5a3add6acd2664cb152f88c223f83239"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00038-of-00512.json.gz": {"num_bytes": 30247683, "checksum": "f738a2f0f156f7bd897d9d822748d4192a5fe46b566c7288ed5b840c4ffeda64"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00039-of-00512.json.gz": {"num_bytes": 30057005, "checksum": "60235900d69579334660c153c4fe384c08f14f4e729a06a1e8247e8b4ab8a213"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00040-of-00512.json.gz": {"num_bytes": 30185136, "checksum": "5a059d64fd6a1b42a2faeb4088db327c47f9e8328737ab74a0e0457f84433374"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00041-of-00512.json.gz": {"num_bytes": 30314653, "checksum": "2cfdc460c8dd0fb4766191ef2aec0af856af7c95d11eb3f1d731f63b71db4daa"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00042-of-00512.json.gz": {"num_bytes": 30123256, "checksum": "64e59b8ebde3c12b0a1d218a302252b96aeb5bb4976927463101a9509579ec22"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00043-of-00512.json.gz": {"num_bytes": 30057043, "checksum": "edd200b97394f15f9cf0a6289406a83b42c3d6f961456f031f5814db4f6d482a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00044-of-00512.json.gz": {"num_bytes": 30029900, "checksum": "1b2980f21ee5cffb271591adc8eaa414438841426442f194b5f4b703356f4e5e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00045-of-00512.json.gz": {"num_bytes": 30367170, "checksum": "83967210891345b831956722e8dcd29cf55fb17b786c85c2dd2778528ab4d1c2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00046-of-00512.json.gz": {"num_bytes": 30105866, "checksum": "6921ac4854e2eacaeb4be07669faab85f2bab33f744c7efae1ce17be25176bb5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00047-of-00512.json.gz": {"num_bytes": 29957618, "checksum": "e8eba2ba9f51e76a06a2df43b6b120c47b6e41f61e46a2e3331518ebb2d0c84b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00048-of-00512.json.gz": {"num_bytes": 30329887, "checksum": "6af9c44a53d7eb9df9d86ee4d895fb9f7f2b9b3863fd30aae325e79fb792a10c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00049-of-00512.json.gz": {"num_bytes": 30116207, "checksum": "57dc1e94f73b55e0be5690b01d61188a62186ea9f5f85b556ecef3bcaa36fb92"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00050-of-00512.json.gz": {"num_bytes": 30236341, "checksum": "eb75bdf0e63e798838b3d7abfc6a3bfab5de2ba39af833c38048dfe39c1175b1"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00051-of-00512.json.gz": {"num_bytes": 30357091, "checksum": "f48b1f5e07311ca9d69787019a56ad849932e6868d1f7778681cf7e4cc9fc562"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00052-of-00512.json.gz": {"num_bytes": 29944959, "checksum": "debf9490c057f11e404898b4a57cb424c1eb523fa90bb7899b1317f970481638"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00053-of-00512.json.gz": {"num_bytes": 30240416, "checksum": "9e847a5c6eb80e5c045fbb405729c695911674bd8d29b1d0be0791303d02f41d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00054-of-00512.json.gz": {"num_bytes": 30174556, "checksum": "65a80db1cdde9153e08277ad2d9074dfba1682c0f771fbb9f4aa8f88ca557f43"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00055-of-00512.json.gz": {"num_bytes": 30134394, "checksum": "beb8d280d322520ded21aec92ae087867d0bce64aac4e243a127a88f143ff578"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00056-of-00512.json.gz": {"num_bytes": 29891026, "checksum": "82fceaec35a2456487a59ae652d72f41a940d2d6bafdc4f05a6e02bcd7ed4dc9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00057-of-00512.json.gz": {"num_bytes": 29920525, "checksum": "e4fd55ba5fb2825ef4209aec87706ecdd3db040242c6aacfc82f350765fbeff8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00058-of-00512.json.gz": {"num_bytes": 30060421, "checksum": "3cfc894a1853e3d1f2daa314873b7919fa52b7208b590637f8face6536305770"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00059-of-00512.json.gz": {"num_bytes": 30038488, "checksum": "4f06ab7b5ce8e8c696445db4a3e32896b6396e3f67d7414a593e7398d752e564"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00060-of-00512.json.gz": {"num_bytes": 30129718, "checksum": "7923385ee0c6801073feb10437ee3c59e5f5dfe82c2311ad8c4ec670dcc0ec87"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00061-of-00512.json.gz": {"num_bytes": 30130505, "checksum": "5cd682e148b8488775622098214fc2009ef9c95355f46341bd78434f1b560fa2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00062-of-00512.json.gz": {"num_bytes": 29968130, "checksum": "53562fc23501f3a1d11c8ae6a59e719d6f4e67db8b8ea1d55e2b1b80849afd08"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00063-of-00512.json.gz": {"num_bytes": 30116532, "checksum": "008cc5c0cb7d60e84ffdfe2132f6bb49aafbb31083fd026067b3859326ca64fb"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00064-of-00512.json.gz": {"num_bytes": 30236194, "checksum": "8f9eee169071e80c94c248f1c37b7fa631bd75a7f6e401f6a963aecd8815910b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00065-of-00512.json.gz": {"num_bytes": 30077312, "checksum": "8c5e18ea3575cd350e98d062ef88d3fd1df068e4bd410be8732723bda03656c0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00066-of-00512.json.gz": {"num_bytes": 29920862, "checksum": "e377b8112dc6ff6834607c27b927636429e887f4ab8edc0824363941b7bb311d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00067-of-00512.json.gz": {"num_bytes": 30278223, "checksum": "ec2c2ac74cc3f4f814d645410cccda266151949dd36aae518b8082b948b47edb"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00068-of-00512.json.gz": {"num_bytes": 29940464, "checksum": "ddfc16a17cabf48a2c59fa8ef25ccd12d899d3462d08b45f2a301567ccc105c4"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00069-of-00512.json.gz": {"num_bytes": 29903118, "checksum": "66d9d1791cda56607b2561199503cef216df86b28d4519d5862905671a4ec4c5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00070-of-00512.json.gz": {"num_bytes": 30082323, "checksum": "8072d3bd5e19c005493c0332b73ca5be253397f54be90be1bb7b2ef8df7ad117"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00071-of-00512.json.gz": {"num_bytes": 30128276, "checksum": "b7c68af5a6dcac3fbb3dcbe12123d1045a79baf657a8b3bdada60c1a97404c48"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00072-of-00512.json.gz": {"num_bytes": 30458419, "checksum": "cfe5c6ae2ad1531271b0039042e033bdd7caf9604bfa219980ca27513cea755f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00073-of-00512.json.gz": {"num_bytes": 30366974, "checksum": "a132f5e85376b0d0a06c6ae6af9c226dcbc98394461578c4fbc6cd439ba6e721"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00074-of-00512.json.gz": {"num_bytes": 29987779, "checksum": "f905e808b50908a7d2a7f0944e7e6c01ffd97ec16e5f0b6ed7169a60d66b0100"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00075-of-00512.json.gz": {"num_bytes": 30070204, "checksum": "b57458683803936f6bc03b06fc26be9d1a09ba09517b5c1518676f468e404595"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00076-of-00512.json.gz": {"num_bytes": 30129238, "checksum": "81e88ec53e39d6191e40e5852564f592b745abf99c71ff78302292632f636792"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00077-of-00512.json.gz": {"num_bytes": 30051399, "checksum": "218b0f6e219e42113e35d99458861f8511266dee6c17d9e2780a17af8877f822"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00078-of-00512.json.gz": {"num_bytes": 30144230, "checksum": "c0a337619559362e0e1cd0fe87c9ced5c987313a7f3cb65eb44f8b861c41c616"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00079-of-00512.json.gz": {"num_bytes": 30544297, "checksum": "27e257efda6adbce01585b3b6cdeefa95d31f607012fed5dd4310bfb5a790ba7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00080-of-00512.json.gz": {"num_bytes": 30188866, "checksum": "26411f1a0a7b299d0bf6cf78db04b0bcc617894cd87d59e54614f3258dd393ee"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00081-of-00512.json.gz": {"num_bytes": 30418881, "checksum": "87a659f6b24560a754ccbfb6aee019484e48e3ddc7955a6c7a18aa9098952cfe"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00082-of-00512.json.gz": {"num_bytes": 30086460, "checksum": "708fe5108042b957688817625c84059c11700b18ddcea3814b86b6c8c66af8a5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00083-of-00512.json.gz": {"num_bytes": 30138639, "checksum": "8d8681519538afdb7622b677ca5d3ae2a643382bae9639e3ad90c82d36477653"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00084-of-00512.json.gz": {"num_bytes": 30228150, "checksum": "db708760b9d45e0b20c8dde9b0008f01761d9bb0f37a194845b4d097a60e477c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00085-of-00512.json.gz": {"num_bytes": 30004564, "checksum": "19ba55c7cbc44ae30a6497373fc15b548e5c45667f790c392857f6fdaa7e2bf6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00086-of-00512.json.gz": {"num_bytes": 29696360, "checksum": "4cb07dd259a084818f9a79a4fe4fb7b24ea1adda0cd4fd405ba003e7bd481f12"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00087-of-00512.json.gz": {"num_bytes": 29927300, "checksum": "7c3c07dbc9c57881a3c1abab85a927f1ba609c58da9dcec22d7415079cd336b6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00088-of-00512.json.gz": {"num_bytes": 30038333, "checksum": "59158c87d7e9e5011516f98dec1313758072ca6685c7ad9df5ee4a075d9ff8a2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00089-of-00512.json.gz": {"num_bytes": 30223506, "checksum": "d3f39f7e90b4a82257779290a3f2de5619049d69b2169577f1e3c81791d85419"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00090-of-00512.json.gz": {"num_bytes": 30266969, "checksum": "88ed3237aadff809cec186fa378e176774d3f32aef1a6d8bfdbc530f64e8aed4"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00091-of-00512.json.gz": {"num_bytes": 29885840, "checksum": "b9a247993a8eec31b3f853d1329ae79da29397dd27eb4acdc196b71c091335e3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00092-of-00512.json.gz": {"num_bytes": 29942337, "checksum": "3d83cc54c06cad8effdb7a38ed6666b5d912e6fffcf4c82471af064b0aabe05e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00093-of-00512.json.gz": {"num_bytes": 30129376, "checksum": "d72ed9855fa86ceb4089435da3d78e8d4151b92185f828329b534d1adf3821db"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00094-of-00512.json.gz": {"num_bytes": 29613450, "checksum": "f61f74aa65a81616b97cbc34a8be1b563f83f69709642b8156eb76cdda02103f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00095-of-00512.json.gz": {"num_bytes": 30469526, "checksum": "926d1ba2e4b191e75b0bce0cbe4c15f95f244445ec03a6095c009c34e36f897e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00096-of-00512.json.gz": {"num_bytes": 30126036, "checksum": "e74818ad94e408498644dc71f1ed967f356f539418222f1dfea467a21c99badc"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00097-of-00512.json.gz": {"num_bytes": 30374980, "checksum": "d9cc8827ee38bddd1a31e48b2b0064a567520e3c0f2e1be745acef57d267e4d5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00098-of-00512.json.gz": {"num_bytes": 29928579, "checksum": "090ad37fd9eaeb53308599f2da1053b19b1c6478adaea5a8a1c35d6c35340111"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00099-of-00512.json.gz": {"num_bytes": 29901456, "checksum": "c0e7d9a7cbc3b9b940077508441e471a1eb70e822479fcad726b900e6c196382"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00100-of-00512.json.gz": {"num_bytes": 30033459, "checksum": "b62033de618191de3200205e6e40725baf045e403060d10417211d47854d6bb0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00101-of-00512.json.gz": {"num_bytes": 30280468, "checksum": "8726d092785856ec690dcd8a9edcd968cd04af1cfafe8a83192e3c0782f02b4a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00102-of-00512.json.gz": {"num_bytes": 29805195, "checksum": "248edf4dd6c9a1137c7b45ab0b5a05a5fc93fd14cec17a5da4d758b9f7b359df"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00103-of-00512.json.gz": {"num_bytes": 29995494, "checksum": "d66b75c3f08a0db141d2c0162eb3dbc351e656ba1ba480e77eda051435d1390f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00104-of-00512.json.gz": {"num_bytes": 30318447, "checksum": "09bd2068c20d33783f39322c95756fd3dbd0da91f4380fae3822cb33b7d06779"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00105-of-00512.json.gz": {"num_bytes": 30209523, "checksum": "0a399ecb1116890e1a0189cd2842d64d8ed53213b1623ae38229a6ac4f5c1c76"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00106-of-00512.json.gz": {"num_bytes": 30476739, "checksum": "540f682a7c977d20f920b5af1ec7e40c14a0d54f1718b43271e22dece9cdce16"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00107-of-00512.json.gz": {"num_bytes": 30203291, "checksum": "0dd51deb74ab391c54b20862f7df561f74d00be2ee4fc13987f91771870c099b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00108-of-00512.json.gz": {"num_bytes": 30265100, "checksum": "172b09a108b154014077a415f644cd16db6a66f178bf780c120a6c4fecc3c0a8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00109-of-00512.json.gz": {"num_bytes": 30342649, "checksum": "214a8f147f2d77ec0f3889b0a2d782e5d44230878359e695e9523561e6723a1d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00110-of-00512.json.gz": {"num_bytes": 30152418, "checksum": "dc0d34ce7918b80ecef3528ec2b063edf7b12223c453ac7fb9d39232fecd81d7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00111-of-00512.json.gz": {"num_bytes": 30160329, "checksum": "d0594cb69d26f0e853575d86f92b1aa233b5bb236804a2f496a792fa031014ee"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00112-of-00512.json.gz": {"num_bytes": 30428351, "checksum": "2b0542d973bab88e696fb9efbe042167600da397d776ef65344dce868bbcb0b9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00113-of-00512.json.gz": {"num_bytes": 30200133, "checksum": "10dcb929692795fefcf4623040191d9cb6199fbb3b164648b62b9867e8392379"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00114-of-00512.json.gz": {"num_bytes": 30205273, "checksum": "f16631d5bcbbe133a01675286ca7667400ecc7e6df13d728015381d21ec71cfc"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00115-of-00512.json.gz": {"num_bytes": 30164849, "checksum": "bed27819db4bb7e02cb42cdda18acd232659a2eaa43eed910ba26d686cb3f837"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00116-of-00512.json.gz": {"num_bytes": 30117752, "checksum": "4eb4bec7adac3c2f431d356212f8a9d47136f0011f5f9e71dd29d82b1b823e2a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00117-of-00512.json.gz": {"num_bytes": 30062588, "checksum": "79639624734885b3051b10f052f5486d7124bbc4bcd18d99348f3683ee2fc54f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00118-of-00512.json.gz": {"num_bytes": 30125828, "checksum": "e922a4a5332a4182ddcf6ac8ba910024fe4fa878b524f7368b27373f75bbfe44"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00119-of-00512.json.gz": {"num_bytes": 30156741, "checksum": "a44aba8779b99ace2f212789389af058d12dfb0706221b296676d5e10528dd78"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00120-of-00512.json.gz": {"num_bytes": 30489925, "checksum": "82bec41bbea7bc5ddb67b3bccea51122da7d0922768f8bda7a0c9d489bd20cdb"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00121-of-00512.json.gz": {"num_bytes": 29606989, "checksum": "b49238f5b75aaf876657826cfbd4346d250f564a86bdb010aa1e85b44a969229"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00122-of-00512.json.gz": {"num_bytes": 29770557, "checksum": "0803ccbd505db47cd09b20d86cc6ad459c7a8d1c583a5ee756b0397369d8b6fc"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00123-of-00512.json.gz": {"num_bytes": 30248121, "checksum": "d73a1bf285a0355bd61a25891cd8c5fd9da66535ec515dc7e1602a769b994727"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00124-of-00512.json.gz": {"num_bytes": 30131013, "checksum": "65d2dcc7e63a28e1911717d149b907d0c74fda6e36db2840353a0290f7880324"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00125-of-00512.json.gz": {"num_bytes": 30348971, "checksum": "5dee3c7afe0364ccb8e36647d01e78ffe61690f29f29aa033efac9a0413c2a47"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00126-of-00512.json.gz": {"num_bytes": 30370074, "checksum": "1dc04b3755291842711623d1d6cf042e2d66987103a0c708f01c9136a8c42db6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00127-of-00512.json.gz": {"num_bytes": 30320846, "checksum": "e31a27ba25bdf13e6f929fd38d53409dd3f50be78ad955b69b1956709de5aedb"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00128-of-00512.json.gz": {"num_bytes": 30076235, "checksum": "122ee9d293428a7a823c17b3a432b5b2198fa2a68bbb246b97e981bd09f78f0c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00129-of-00512.json.gz": {"num_bytes": 30569486, "checksum": "918bf43ce3ab54d535dd02cbcd09f1081890be3287e23fd81bfa032beec61ebc"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00130-of-00512.json.gz": {"num_bytes": 30280169, "checksum": "ab0a53e8c10dfdd139281175b5fcfe3090fa238fcb383e27b1dcdfdbbe8a879c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00131-of-00512.json.gz": {"num_bytes": 30338899, "checksum": "e54771e12a6f3583c3accf9bcc01b598819231f367e7f80cbd44cf6683c5c852"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00132-of-00512.json.gz": {"num_bytes": 29969011, "checksum": "f69d7052ca7657fdebe547a6e196b109285d5d4e4f1a68f3900a37ba6fecc22f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00133-of-00512.json.gz": {"num_bytes": 30179558, "checksum": "cf2130dedafd8f47e97661a5b1555813433e3f7293b5c5cb222cf551d90a0604"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00134-of-00512.json.gz": {"num_bytes": 30080257, "checksum": "1a32902fc21633ae8d41e4e5518804f4c719dc8729b866ebc32d3c36fdadbc10"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00135-of-00512.json.gz": {"num_bytes": 30284972, "checksum": "6e3a78e7a530d91ee4578caf462a4c685a5f221f0cd8eb9639c9067e2b655a7f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00136-of-00512.json.gz": {"num_bytes": 30130265, "checksum": "defc57340cbaa5f325994a91b5134789c84a76a4ca7b9fdbf993b0e634735f05"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00137-of-00512.json.gz": {"num_bytes": 30146793, "checksum": "7ce5035f452eb2e1adeff36d0c6d6d65c245d139a86ef48bbe10c5275975183b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00138-of-00512.json.gz": {"num_bytes": 30180265, "checksum": "298849a53a8ea0e68d01cc137195bc36d686077bed722e1198337a1dee3c51cf"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00139-of-00512.json.gz": {"num_bytes": 30398387, "checksum": "ef2ac4b8f195141a79a357d934d5d97bd4d2c64027ec7509b5873a4ae32fcb9d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00140-of-00512.json.gz": {"num_bytes": 29652990, "checksum": "290f1c99b696e345aaa6ac6d5a882a87dcf5d3939b08ba859a359d2459498785"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00141-of-00512.json.gz": {"num_bytes": 30083642, "checksum": "fb6a38388a25261d86fbd8ffea63e06bcbcbd6846a4eb6f13fd09d7fe5a1fbc3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00142-of-00512.json.gz": {"num_bytes": 30131064, "checksum": "b61ccf6166ea4b777629bdc07d543f299bf7569deab18228ec5bb9edc8cd3eb5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00143-of-00512.json.gz": {"num_bytes": 30244435, "checksum": "22812c50efdfcf2c0fdcf593639dfea09ffee8068321c30effc669c8234d4f3b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00144-of-00512.json.gz": {"num_bytes": 29725094, "checksum": "79cfa65a3115193629d16606643d90dcf27d3108c320cc9e364ba19fdb9fb1d6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00145-of-00512.json.gz": {"num_bytes": 30335033, "checksum": "e836f0bc9acba85fd1721d19cc24054e97defb0d12678bdc0d086f40deb9b1a6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00146-of-00512.json.gz": {"num_bytes": 29905680, "checksum": "bf684871a235078390d6c6bb03fc2d5bbffec2b095806df652a19baf5e67135d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00147-of-00512.json.gz": {"num_bytes": 29852459, "checksum": "0e716de5b3b09ec287b039be0f0dd6edd7d541aa6d3f9d2be18768e1cd5f4cd8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00148-of-00512.json.gz": {"num_bytes": 30364788, "checksum": "4cef624e6b7c2b73dbfb47227e31681223a5a9369c4b7daef8606b796f010dd1"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00149-of-00512.json.gz": {"num_bytes": 30096278, "checksum": "fb448ccc7412f5ca8667004a70f3dd6e1b5e6cb7f6facc06564bd22b1d815593"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00150-of-00512.json.gz": {"num_bytes": 29776995, "checksum": "1e14268cf723bc7336b33896537643d21dbefc1f05ffd5201feb5fb1130f9683"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00151-of-00512.json.gz": {"num_bytes": 30205172, "checksum": "797224cf74063fbcaec741535278ccce141e6dbbdd69a2191d07f89816ab14fa"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00152-of-00512.json.gz": {"num_bytes": 29845034, "checksum": "77eeb2353f544c714deea68d4a781b498c40d7c1e27db3aade4987b381ca29c0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00153-of-00512.json.gz": {"num_bytes": 30258796, "checksum": "0fc581e92e70dda031d72a4aa0bbd65b1e9b28884f0ef5dd5e895cbecb270609"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00154-of-00512.json.gz": {"num_bytes": 30249734, "checksum": "ba10dd0a24bded170541e23078264b82b35bc99e402db594e2335e31905ededf"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00155-of-00512.json.gz": {"num_bytes": 30198742, "checksum": "fe285ac893126062bcbc20df75a9f65c57d3a7391354fa7e62b7f6a7122d6e77"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00156-of-00512.json.gz": {"num_bytes": 30168323, "checksum": "d21826b71bc85dbc496dd947ae9ee79d62885cffb3fa7c47409feee6ab247f17"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00157-of-00512.json.gz": {"num_bytes": 30241978, "checksum": "fc41765301b62849eda0b7b08f792e45f03db458fb92063af70c43d7cd0d0bb6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00158-of-00512.json.gz": {"num_bytes": 29959715, "checksum": "1eded3ce0bc099c7e198e9277719d578c3fb6c425bb2110cb0ca6ce469d1d19f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00159-of-00512.json.gz": {"num_bytes": 30109595, "checksum": "eccaab5b694c2f0017fe1d423637872d5587f6deb316796f7c0ff5517fa28178"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00160-of-00512.json.gz": {"num_bytes": 30201741, "checksum": "4ceee71372da6112101665f5bbf942a85f065feaab924c6e3f83498169bbe255"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00161-of-00512.json.gz": {"num_bytes": 30176266, "checksum": "6ed829daaad190b2d50b626d840edb750a063afad95315ffe7604a193183a489"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00162-of-00512.json.gz": {"num_bytes": 30018118, "checksum": "dcf8509a55213425a41706e5209ad411afb715fb9cd8c1a8b8edca23fab7d6cd"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00163-of-00512.json.gz": {"num_bytes": 30236016, "checksum": "d93cfaabcc7197637f233896b5799527f27d5b2dc60f0f0411ee51f05f09c500"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00164-of-00512.json.gz": {"num_bytes": 30150055, "checksum": "cc7de5ed3c774ff1dc350fbb5167dc1610c4f9a0dbc7c5d60ed4cf08aaf23ce3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00165-of-00512.json.gz": {"num_bytes": 30348056, "checksum": "b41c4a3b7b4e96262fe5c87d06fbeb000dc48cc1d304a475bb4f4e1af84a9afb"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00166-of-00512.json.gz": {"num_bytes": 30015834, "checksum": "0a0821b7628b9b019995a9f34223e2960ded84331ce1bb55089838becb8a170a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00167-of-00512.json.gz": {"num_bytes": 30282254, "checksum": "1285af56d024efe2166fa892878d471948e1d4c996922c7673e3c0f7f0f76bef"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00168-of-00512.json.gz": {"num_bytes": 29815124, "checksum": "29ec54ed647725ca3b9aec3bae341151a8e2b708cf21cd87b4389329298442b8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00169-of-00512.json.gz": {"num_bytes": 30346843, "checksum": "1791e3f8371a63f9f849b7bf430e70d3f4011dbdef572c166cc5d49d06162fd7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00170-of-00512.json.gz": {"num_bytes": 30175685, "checksum": "de8f82986addfc64b88fd3041d7ee6fdb64e6f770758146dc4c9309df348e965"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00171-of-00512.json.gz": {"num_bytes": 30145505, "checksum": "0dda47f679666862de6343e1109ed92866a42e8fa129ee69e9f0b73f18b6aecb"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00172-of-00512.json.gz": {"num_bytes": 30009998, "checksum": "2990dae6c16b7d60652439bed8b80ee4cf93972f33d8511d3d6aabaddfeca5cd"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00173-of-00512.json.gz": {"num_bytes": 30062185, "checksum": "e154a969bba2bf9430e0c8307561de78599fd2bd527cb1f15bbaf8f8e88cdf23"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00174-of-00512.json.gz": {"num_bytes": 30055129, "checksum": "e714ae153e8a927c88fe577d4c27017985d3ed7f3d0f5470f9a5f25c2e901a9c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00175-of-00512.json.gz": {"num_bytes": 30091082, "checksum": "5f47c663d1e15d94fb0057d303048be990c713f3285ada2c6233137b1d84d60f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00176-of-00512.json.gz": {"num_bytes": 30235767, "checksum": "20b05e4e99e5a05f6a4c29b304803b895bb8816caea6203643723ca587d66128"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00177-of-00512.json.gz": {"num_bytes": 30071950, "checksum": "29294e4b224df4695c9342c6f23d5495de9a0ca6a1be7217aa2211506e8ac7bc"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00178-of-00512.json.gz": {"num_bytes": 29932121, "checksum": "6022ed3b2ceef02324e40d3c7407622c95ead2cd3d3c41ab15ff9dd218265673"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00179-of-00512.json.gz": {"num_bytes": 30119251, "checksum": "42fa0aa883d9db4303a4981e4e308b2432b031fbccc98c3e1994ec775ba8023e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00180-of-00512.json.gz": {"num_bytes": 30175456, "checksum": "6fb2ebd61524846f6b1f746f9c6356045623beb4b685fe265a23446037c9cd9f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00181-of-00512.json.gz": {"num_bytes": 30029564, "checksum": "b779d721bb135fceaeddebb0dad1bdb43c9067a5e8595b3d544dfa7a084eb9f4"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00182-of-00512.json.gz": {"num_bytes": 30437016, "checksum": "b388fc0e862d7f6bb5b879ff7c69c301038faf5b542f6b40cbea4e2096a41e6a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00183-of-00512.json.gz": {"num_bytes": 29994048, "checksum": "8208eeca7bc76f8b1786c95939d321ca0c7ae190b1f12dae86738810e412aa8b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00184-of-00512.json.gz": {"num_bytes": 30338616, "checksum": "49859e75d999f65de99f9236e649a81989360f0328ba684671057b0dd7cf5e79"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00185-of-00512.json.gz": {"num_bytes": 30088874, "checksum": "ff6d32fdd471d3076a9367c175baab84a5d699ccd6dcfe00c755f0b714ca6074"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00186-of-00512.json.gz": {"num_bytes": 30193681, "checksum": "82508ed104fc57de3062258eaea57854ab9e1934437a88dc0d8a9921f3641bbc"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00187-of-00512.json.gz": {"num_bytes": 30171163, "checksum": "409d6576b25ad27455c755e5484e3f51d5d9788962efabe1c32e06bb3febacab"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00188-of-00512.json.gz": {"num_bytes": 30060432, "checksum": "fae94de96fa2962ef51e2ea90a5f760a5cee5de249bfd9f56d7c7b4e5c20f6de"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00189-of-00512.json.gz": {"num_bytes": 30180741, "checksum": "25293d5cba09980086f380d9e9ab44543adbbdcd05ed08601248b3a2b16d118c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00190-of-00512.json.gz": {"num_bytes": 30207152, "checksum": "ccfee160de15df5d88f0ff5a898a0c5b2d0ef4ebd6e6832715a9ef8a9904f88f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00191-of-00512.json.gz": {"num_bytes": 30143987, "checksum": "4c579619e465d9d97451801147202826a3855e772ea6dc4e9968e43ce2b8c05d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00192-of-00512.json.gz": {"num_bytes": 30072097, "checksum": "9c32ecb6d4ec9feb27c5b642879b464e68ca8804db161219503f624e7ca1166f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00193-of-00512.json.gz": {"num_bytes": 30172886, "checksum": "8442ddc3843c72aa169ca67801ff865ff85e4183beb38faa664f4f1d1c22a5d8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00194-of-00512.json.gz": {"num_bytes": 30037105, "checksum": "2942ecacb22cb9a2953c68f21ddf3368cd47ab1f2b2d8e1f5c76b1c849b28d91"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00195-of-00512.json.gz": {"num_bytes": 30014854, "checksum": "9e5c6815a5734403a7062bb27b2565d433a3520a401c836ac3f16e743a1dd949"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00196-of-00512.json.gz": {"num_bytes": 30020510, "checksum": "792712f0073c158b5f96f7a99d97970fca3819b69739d34d7d2b7f4b8b407b7f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00197-of-00512.json.gz": {"num_bytes": 30072566, "checksum": "3ece37e2d0d0b26fbd839b5d3facdfd70844945a06867fb68b141f6b1378462b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00198-of-00512.json.gz": {"num_bytes": 30036679, "checksum": "c3f37a9b89987dde4578b394b5c3916c2d4fd87e0902309b4c81af19b1d2d5ea"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00199-of-00512.json.gz": {"num_bytes": 30195178, "checksum": "ae01bb5515097a083afd498d8530e788d99671e7cf802c4402957d6252b2ec77"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00200-of-00512.json.gz": {"num_bytes": 30064374, "checksum": "2399d4869f3a8bb4a9adced5ec548a9a3fde1d4fbc4e3abd9a0a3b495fb9a8ef"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00201-of-00512.json.gz": {"num_bytes": 30136711, "checksum": "5c922040697bad8d7807d79f34f2b667eea63ceefba89b2d413fcd4d66497607"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00202-of-00512.json.gz": {"num_bytes": 29962983, "checksum": "e4df518d612a8614de73d5944a31d22ad06ec9ecd26fb52e500df71fe363c1be"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00203-of-00512.json.gz": {"num_bytes": 30178998, "checksum": "e84a98a176451fc82d940a64cdec821e320a648780edba6466b74a1966eca47e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00204-of-00512.json.gz": {"num_bytes": 29988832, "checksum": "c6dc56388bc7c57cbdee8280895ab80da7b4d49c9a0101a685229c50cad2e2e1"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00205-of-00512.json.gz": {"num_bytes": 30229414, "checksum": "e7e5175b6a7372377ba3a0db439911e189db459787d48588183ac1a0198c5fa7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00206-of-00512.json.gz": {"num_bytes": 29914929, "checksum": "eb263433133660ebe219cd5817dea3b546ef2fba0e15396b2768d7091117cdea"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00207-of-00512.json.gz": {"num_bytes": 29912800, "checksum": "7f8a5f62ba5912b64af5b02bd987b4d81727223ef8eff110022e89d01961366f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00208-of-00512.json.gz": {"num_bytes": 29900590, "checksum": "bc2af142244601bb7a96859dfd9885196940e675ca217cfc7c73ac9c614ea938"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00209-of-00512.json.gz": {"num_bytes": 30242768, "checksum": "fa51a4337faecfc790ca925802f87f10761552e16578b880ced80497f62bba60"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00210-of-00512.json.gz": {"num_bytes": 30039857, "checksum": "3adf7482ec6a3ad106c8edca3645a94032c33f84fcd26bd9876f2b8a1f6b5722"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00211-of-00512.json.gz": {"num_bytes": 29846856, "checksum": "8e931aaa9c1f069c0eca0b4605277610df9d2d0c07a0dbe6191fb7081b0e642a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00212-of-00512.json.gz": {"num_bytes": 30022172, "checksum": "21c8bba1c83544c27977b22b077fd77f8df9cd06bc4eb5e9e9a532c511498d36"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00213-of-00512.json.gz": {"num_bytes": 29877918, "checksum": "b64ebaa088df5c6230e69f207267a038705c38f4d327970e9117979e1c13d1ed"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00214-of-00512.json.gz": {"num_bytes": 29906552, "checksum": "55d833a2b78ad564e6532d1acd14511e8b48d703030e3bbc92d7c835c1ed38c7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00215-of-00512.json.gz": {"num_bytes": 30075441, "checksum": "999c77c136d3df83601e33c823f389b133f33c4c0b03736ceace617b526cb293"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00216-of-00512.json.gz": {"num_bytes": 30507152, "checksum": "0b23d4e57eaa101c78bab46151add537668d2722bf0c50470c1b434ec3389ae1"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00217-of-00512.json.gz": {"num_bytes": 30044236, "checksum": "6abacfd53e231a38c714d436018cef9a58f53320026c2ebb27d6caf08f02d7ac"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00218-of-00512.json.gz": {"num_bytes": 30047926, "checksum": "01120ef69493d84c44d112a41c69a851edaf89232679366e812f240fd26a0e47"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00219-of-00512.json.gz": {"num_bytes": 30349211, "checksum": "c4fc219559f0f076f634fc6812d4b13c229908c1ae45c3b74c059fb3b8124f63"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00220-of-00512.json.gz": {"num_bytes": 30063445, "checksum": "11f712439d54ef062cfa1225328fc4faaef5f6c9c0b0d87a0a81d25a71350e28"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00221-of-00512.json.gz": {"num_bytes": 30115660, "checksum": "9a344857ef4f9d141b57df38e25f717153b773436d72c23e10289ffe67c315eb"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00222-of-00512.json.gz": {"num_bytes": 30134562, "checksum": "227cd1847a948e388b404b5cda9289f05510d4e22f0ae5ec4d5a87a8f7f98a45"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00223-of-00512.json.gz": {"num_bytes": 30120819, "checksum": "e0029aa6b612a98f76e37d82107fcb90f2b57ae8d52beea172b5153b76334f20"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00224-of-00512.json.gz": {"num_bytes": 30371365, "checksum": "1ce5242d163ca12dbb22655eb841bf80750b552353af4f84973285d823d0add5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00225-of-00512.json.gz": {"num_bytes": 30319212, "checksum": "71cb82bb95107a7e0b7777a5fcaa0f76b465ba828ac47401babcf7289eeb2335"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00226-of-00512.json.gz": {"num_bytes": 30020940, "checksum": "b7b8d98ade41f52ece23e896bdc4c19ad034a92ba18adb5fac85c7271afbfa65"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00227-of-00512.json.gz": {"num_bytes": 30109958, "checksum": "b2ec382f44caf4e8e46fef2faf6bd2e4000420e6da2eb12a5d9f6e7efb4e1564"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00228-of-00512.json.gz": {"num_bytes": 29940895, "checksum": "ff86264683d0fdf9d689aa30e7889c4ceed21098b7c60a220db92d396614cb1d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00229-of-00512.json.gz": {"num_bytes": 30080588, "checksum": "3a5502cedd61501055eb16adb6ef861c75880524c5468a69cd346bc03e98e219"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00230-of-00512.json.gz": {"num_bytes": 30376399, "checksum": "6d3a4171a1febe9149f6900e3cca5a38046ca9d59214b548a4ef9de7de754bbd"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00231-of-00512.json.gz": {"num_bytes": 30031670, "checksum": "a2c8d9bb3eb260d5d8a7dcafc4703540332e2896e5127372d380d7efbd567a3a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00232-of-00512.json.gz": {"num_bytes": 30132612, "checksum": "c9dec917eff4d72c684d6f8373ca66839061e29d25f0aa5fd6fb7de5c30df469"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00233-of-00512.json.gz": {"num_bytes": 30178285, "checksum": "1eb83b8eb7e72b2b3e55420436bb17521b989d0627da46f8cc61fe9f420fd464"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00234-of-00512.json.gz": {"num_bytes": 29991258, "checksum": "5e14e2a9e8c0aba73feb9134c694e99baf57357bb524877322ff5181eedef1f2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00235-of-00512.json.gz": {"num_bytes": 30045172, "checksum": "50a118a072498b5338802cceacb97a9aa9242252e8d76d305cf5f0d928fd4af6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00236-of-00512.json.gz": {"num_bytes": 30403542, "checksum": "7d7605576975232579e422a1b72625ad6f9d714d27770725dc7b99ba258e1985"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00237-of-00512.json.gz": {"num_bytes": 30242989, "checksum": "22d152fa02c5a959e978ea4887dd873dfef7267af0a577b4d796ff0cb52d5c56"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00238-of-00512.json.gz": {"num_bytes": 30214634, "checksum": "6d0af6f396fa21867e899a7678c633e47bfe79bcbda29b8072c5d32ab20a9aa3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00239-of-00512.json.gz": {"num_bytes": 30255546, "checksum": "d35a93632638b6283053b121f0f30d47ea20b2747d871c3dd0beb13f4ffbcad9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00240-of-00512.json.gz": {"num_bytes": 30347604, "checksum": "fd052d532fcfe811d96f8433f79a684f68f76ec42bd959c76ae3b63aec0b2c3e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00241-of-00512.json.gz": {"num_bytes": 30135691, "checksum": "12c80c41dc4d6313bce4a171999ecda93ffc59f2c70cca363bce214cd12dc9f7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00242-of-00512.json.gz": {"num_bytes": 30229834, "checksum": "fca5b81914ac0c5fe0b0c1a554a1e62c64af5c98740df1f8ce8f48f2a62b6a48"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00243-of-00512.json.gz": {"num_bytes": 30053753, "checksum": "ba41c505579524e9d244354a70060c9a0131007e0b129f03e628bb7b7b512ca9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00244-of-00512.json.gz": {"num_bytes": 30216889, "checksum": "54a391c1d2de7627e739f3cd94eeccd50a80d56a40606f7c5392f6098df456cf"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00245-of-00512.json.gz": {"num_bytes": 29887569, "checksum": "c3263ea7e16e0036961dad28fef57ce4f0495219e59b4e800af82b67b3c6c506"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00246-of-00512.json.gz": {"num_bytes": 29906815, "checksum": "a3dcc92aed81708434edee84397010eae4ffeaa38b39aaf3919256f72deee625"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00247-of-00512.json.gz": {"num_bytes": 30074896, "checksum": "019e983a95908651bfae83e37bda5200b3888b03ab235fc8db2d5b16742f028f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00248-of-00512.json.gz": {"num_bytes": 30108081, "checksum": "6f68835ec02cf899f8f44a795b1e3117956ff5bb6c8946435d9861ae7a112df3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00249-of-00512.json.gz": {"num_bytes": 29957882, "checksum": "9bed6b7f56d93fa3973d4f177dde0973fa0eb6fe17d8d85279d865531613f963"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00250-of-00512.json.gz": {"num_bytes": 29822284, "checksum": "1848bef8d11360df55a576c64147e519327b1178f77d3ec14ab9522b33b1c423"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00251-of-00512.json.gz": {"num_bytes": 29956462, "checksum": "425f69c361a8671cf571df577ac0cfafb4894de494360084b7cbe9cb8869bc3f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00252-of-00512.json.gz": {"num_bytes": 29733712, "checksum": "7198e831e75eff1e116513f9cbe098c071f051c545b41d1943211a1d996a3c67"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00253-of-00512.json.gz": {"num_bytes": 30450662, "checksum": "0452804e723c919bd3c84217bb1dfc8764112fd70c5581f84520df7592f28ae9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00254-of-00512.json.gz": {"num_bytes": 29944765, "checksum": "dbbff2253d70094537de481344e5706315271fdfce7ebaddc8d277ed05ddfe24"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00255-of-00512.json.gz": {"num_bytes": 30321363, "checksum": "79173dd85d535cee71afb52f7775bbf7289509bc555efe21a8700d36f7e5da25"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00256-of-00512.json.gz": {"num_bytes": 29982818, "checksum": "bacd191568e72da06c564fc7476225ce83440de6aea6c85ebe7f5279f1c15846"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00257-of-00512.json.gz": {"num_bytes": 30338592, "checksum": "998287203665559c27a66e889611ed716b7a389e403b2e857086f548b2c47b39"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00258-of-00512.json.gz": {"num_bytes": 29911193, "checksum": "ed9829f41a71cc187d0ddfeafc9cbde8e362b52914c988708a1a5ffbd3c152af"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00259-of-00512.json.gz": {"num_bytes": 30227794, "checksum": "2fe86814499a3379601a179acca1d440b3c79467827ce9ef9787e1ab311904e0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00260-of-00512.json.gz": {"num_bytes": 30206902, "checksum": "c4efdad05d3f5e9f27884399ab0ec82081c26486e87f0ed5408a9eb80b223daf"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00261-of-00512.json.gz": {"num_bytes": 30035514, "checksum": "e47675a956a626a32b1870c61e6f98c3cfe9cc571901cf477abae982b4e63c96"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00262-of-00512.json.gz": {"num_bytes": 30406718, "checksum": "ae19c1389e26562322f745bafbd7839e7a95b3169743d48baa7ae7f2db2a0b5e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00263-of-00512.json.gz": {"num_bytes": 30266531, "checksum": "289c9fee87f12ea22ad5329f80cb379e5e9c22c5cb6639077748958228c62bf7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00264-of-00512.json.gz": {"num_bytes": 30100823, "checksum": "7c65dd5d90c6df49ca2dcbfdbf1b9fbb0789cb32043795942d88c5f2d7a99869"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00265-of-00512.json.gz": {"num_bytes": 29957109, "checksum": "e3a1b501b2cc3f5f2667ef179d7876db602daedefd0cd741c0898679b24984e6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00266-of-00512.json.gz": {"num_bytes": 30196603, "checksum": "9337dd8240f168da5f6a8b57c5c169a2a400a9a160eccc8a6e44e7b32004ff19"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00267-of-00512.json.gz": {"num_bytes": 30304605, "checksum": "513eea4e78c399cc045e25f13bb5f77ddb6c9b606522bed8216945c529894e8a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00268-of-00512.json.gz": {"num_bytes": 30312562, "checksum": "0503c5bf6848213c5fcb81a5c94307fc010d910a8989e104ad5fedca58c76f7e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00269-of-00512.json.gz": {"num_bytes": 30045257, "checksum": "59bd3011d12d7d70b5fd64bc2dd2016b1a9ca6f0d210dbb3e6c202bbbf74ced5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00270-of-00512.json.gz": {"num_bytes": 30027628, "checksum": "8d3ecf4c61acafc49b624d08b6aa31340643e030f6c2248f689e8a17d355359e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00271-of-00512.json.gz": {"num_bytes": 30014730, "checksum": "b2e4820a0a7287786f802b3b40602c8ca77c7813b5f50db8a336b89b89bbdf37"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00272-of-00512.json.gz": {"num_bytes": 30145705, "checksum": "20c73e4a9056a5201621a4799b86c323c5136af43caa63a74298a5c3bee890a6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00273-of-00512.json.gz": {"num_bytes": 30165945, "checksum": "8f07a91b6b40444635d869b94558fa68e3593626808bc6122d4e17403cf76101"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00274-of-00512.json.gz": {"num_bytes": 30097947, "checksum": "9530522c841d8f09ccb89f4f0238f7b9048c211e85b27449fb3c09d3bd2bab7b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00275-of-00512.json.gz": {"num_bytes": 30296359, "checksum": "51a358db81805a20df4f920baacf3adea05209282f800fbedfc7fa49638a072e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00276-of-00512.json.gz": {"num_bytes": 30311407, "checksum": "a51253cf73fb200053eb5fd5eca398a7a070fcaa27fc99b23389d09eef7fe5ba"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00277-of-00512.json.gz": {"num_bytes": 30372345, "checksum": "cc4f6d9040d8c4909d4ea5b661a7e54ba4775ff1c7c55db1ff686a56d428e2a5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00278-of-00512.json.gz": {"num_bytes": 30379507, "checksum": "1052defa657524e1211e67d775a32243b164eda431c4c6ed351f0c6727f21b16"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00279-of-00512.json.gz": {"num_bytes": 30195406, "checksum": "6f4fdc92c516ad779fd521afba7d8d5bcd40672e63028f43f70fff4d7605f5ba"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00280-of-00512.json.gz": {"num_bytes": 29902057, "checksum": "c26f89efd0977465f45fe321036d88e2d6ca3ee1edc4bafe4b40ad1895cfc0e3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00281-of-00512.json.gz": {"num_bytes": 29779702, "checksum": "094139d741b7a47faaaaf50093ab4edbef6ad1943985c6f453ce45a67a95b190"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00282-of-00512.json.gz": {"num_bytes": 30063500, "checksum": "280d69bfc795f1502a9e744d53d1a189051a1e771042721f8e6f74f6559e25a7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00283-of-00512.json.gz": {"num_bytes": 29956350, "checksum": "505e49b7eeab46c77a324959eeff103f8899da1efc4d0fef5c0e6c6f8879a721"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00284-of-00512.json.gz": {"num_bytes": 30146285, "checksum": "9b075f2cfdb9a90fcdc7f779a52b0c5dad36385214844d4fd9df1e528ae78b6a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00285-of-00512.json.gz": {"num_bytes": 30160056, "checksum": "d9b9f3cbb9ce2a0a0a1a2f7ce91e98621d48a7a900c278aeef437dc6c0a7cdf0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00286-of-00512.json.gz": {"num_bytes": 29844025, "checksum": "6de9ff1013484662305e414725be2d0a4a1873a941250b95b80b5dea8919cf95"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00287-of-00512.json.gz": {"num_bytes": 30089218, "checksum": "444ff132c4a5330653b7319d34b2c7f4ae3b960d8b510cbd7389e3881f65ac5d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00288-of-00512.json.gz": {"num_bytes": 30092170, "checksum": "46dc5b3b84e4387ad718fdf96b751354d7048e898ec664e0d3bdfc21ee841ec2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00289-of-00512.json.gz": {"num_bytes": 30365397, "checksum": "b42e35746112198143ac18509e4f0148772db75e19f5eea9ed0d7e2849dbba48"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00290-of-00512.json.gz": {"num_bytes": 30275920, "checksum": "25d99877235c4b9dacd5d1dd7e9d16bba76cdf6cb1725fa617209142873dca0f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00291-of-00512.json.gz": {"num_bytes": 30125784, "checksum": "51da68b6f2751a83e2534c342b6e9d69c419fb606b44c42b872d69f5f726df3c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00292-of-00512.json.gz": {"num_bytes": 30201021, "checksum": "1e0a42b5e7ea7049c3c86b96d37c5d1c36f3ba2e2dab02145a897ef056fa6a87"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00293-of-00512.json.gz": {"num_bytes": 30124224, "checksum": "8c744f5c6eb92c0de70649cd773c0ad147bc7a1487b2ae7f1107bce9d19da601"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00294-of-00512.json.gz": {"num_bytes": 30074708, "checksum": "b3cfa4c4408c1a9f39b48e18a62e112ec3c132b226efe0850f9e58e2a517aa97"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00295-of-00512.json.gz": {"num_bytes": 29990007, "checksum": "012f63e147d22e34249e930975a2d8958a8d0b17350a9f6e368d702189b40d5b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00296-of-00512.json.gz": {"num_bytes": 30093755, "checksum": "5573859cc485ae4535b83fd408dcc6a82f644832c93e6125db9a16dd6ded338f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00297-of-00512.json.gz": {"num_bytes": 30078472, "checksum": "25e694485171ba1347ccbd7916c1b87a0d46acfd13795a8aabb1cb57b5eb1221"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00298-of-00512.json.gz": {"num_bytes": 30327122, "checksum": "6d6832cb3b1c86b6392bc9ca52f69a0bb16bf71c3c7664d9fe668ee259a40a30"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00299-of-00512.json.gz": {"num_bytes": 30214180, "checksum": "9f3c3d87a525874ea117e36e0b30d7f5cc6c64564506808058a0788d74943634"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00300-of-00512.json.gz": {"num_bytes": 29895171, "checksum": "e99d296965da2f731ea660889ce834cd1d21edf427298bab3a059ff3ebc64a2d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00301-of-00512.json.gz": {"num_bytes": 30131063, "checksum": "e5eeb0f237cf986134c946bb3c2a4b5483fb9c88b3c2b16b9db26135043036d6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00302-of-00512.json.gz": {"num_bytes": 30184609, "checksum": "4ac9bf5ca6fac7f7293238852424340326347ceaa6f5dfa6fddef8003421bebd"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00303-of-00512.json.gz": {"num_bytes": 29956412, "checksum": "559019fe1ef1f7e77ac53ad98b3556965ebc524ecb80bbc3f26255d5ae6e3609"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00304-of-00512.json.gz": {"num_bytes": 29974071, "checksum": "3c54edc4b6a7e34048cbbadb55cb3b16496a4e6e7334b4ede4e1368daf4c5301"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00305-of-00512.json.gz": {"num_bytes": 30338106, "checksum": "1c91c0c5bcc2bec0a698318ad6f576a06db7885c20ed7f36782427b80580a75a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00306-of-00512.json.gz": {"num_bytes": 30178986, "checksum": "fff99f2758c2de57ccbfbfc6388f67e624d00d4a6cccb5820a7a8f5fcf02d386"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00307-of-00512.json.gz": {"num_bytes": 29493455, "checksum": "5d08c6e3909e21bed456ff9d06c983f14d3a277cb399a91047a692184f87c4c3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00308-of-00512.json.gz": {"num_bytes": 30228844, "checksum": "04bffac195e24383d06b0ab9ebf019959a4e7abe8e8e6a0cdfbf0a8e7c23c899"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00309-of-00512.json.gz": {"num_bytes": 30351688, "checksum": "3ce14d5104d1318c6a16d042735f0a71f4452897de60d17408181ec5b135bbb2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00310-of-00512.json.gz": {"num_bytes": 29993012, "checksum": "afad2f39bf4cb932e50d9a0be93940b423e7abcc3d67dac15b1939e4e40f4ce4"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00311-of-00512.json.gz": {"num_bytes": 30448951, "checksum": "a049c31ef6304084d33cb7bdd2e21ada0c60b40b1002b2369e60d36a5098c4b0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00312-of-00512.json.gz": {"num_bytes": 30034189, "checksum": "557d1e88400a6d1d8ee4d717a959239edacbdd3e18d8cd20c5c85b77174dc302"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00313-of-00512.json.gz": {"num_bytes": 30066486, "checksum": "e4823ea1e9a59d5db84564a5b90c28fd8058450f238c60ad689ffd6b673d65f8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00314-of-00512.json.gz": {"num_bytes": 30397706, "checksum": "1b4c0653e7ccf7fda0a53d8cbd5ddd57322ac83822e9d05bbdb9eb8ac979cf50"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00315-of-00512.json.gz": {"num_bytes": 30219107, "checksum": "9c364c9cab4ff7acdd1818b13de2f36713df8fa6c504ba15cdf47fe8e3c30206"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00316-of-00512.json.gz": {"num_bytes": 30098661, "checksum": "84dd8a8739b5abc39d8180f0894b1fbf2930d6d333d7c86b646f40763327397c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00317-of-00512.json.gz": {"num_bytes": 30178992, "checksum": "16e4791b4e5ab3719dacf79fedb0b88ed54346372874c37ccb71d86bc419edc3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00318-of-00512.json.gz": {"num_bytes": 30022982, "checksum": "98345a826aab12bdaf5e639205d5dcdc1da8fecd7cafc1982df89ac8d4df7ebf"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00319-of-00512.json.gz": {"num_bytes": 30360409, "checksum": "d53a39019a1627b42ae6bff68e283d37d0bb5f48b328c2c5cdcc1a3897f4e992"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00320-of-00512.json.gz": {"num_bytes": 30347267, "checksum": "c343a0eedf58484055e58762802ae8cc05f2cdb0b923785c493d056a2cbdb015"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00321-of-00512.json.gz": {"num_bytes": 29967877, "checksum": "cc5795d254ad749ccfe613034927bdf95529545ae1f277b694dd24a5996aca83"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00322-of-00512.json.gz": {"num_bytes": 29885538, "checksum": "d5eaaa1eea983bd37ed34651e6c16b746ff7c92e48038b234149fa6d04d3d866"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00323-of-00512.json.gz": {"num_bytes": 30308848, "checksum": "a42cfaef5e088fd6b24dfc121084a6cd038f5b0bfaecb9f33997ab22a97fb155"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00324-of-00512.json.gz": {"num_bytes": 30351634, "checksum": "0e2e6933f93466e9c8fe966f7770fe4c34caf182c713dad3206f4132eed1d41d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00325-of-00512.json.gz": {"num_bytes": 30077168, "checksum": "77cdbf7040ce7f38d735fef41813ce63aaa16fcd87fce80e6ca6bd56d350c369"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00326-of-00512.json.gz": {"num_bytes": 30031750, "checksum": "8d994c2dc1b766e3270dce3f0b8f6f8fe22d5c1e0e9780e1bfed52c1292b8641"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00327-of-00512.json.gz": {"num_bytes": 29845765, "checksum": "f6279e351d016769d6fb5482d01a15ba054d5fe6f9f1c4e92c0663cef0083002"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00328-of-00512.json.gz": {"num_bytes": 30253188, "checksum": "2ea84aafd94d1843a2cc4428279dbb079c6ae0aae6c00f90ee4b5ace3c827afd"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00329-of-00512.json.gz": {"num_bytes": 30124922, "checksum": "49e3d91126d53eada7bbd87bfe9eaae74f059c69cd70a3a3b8101f49c1aca154"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00330-of-00512.json.gz": {"num_bytes": 30026414, "checksum": "07442fc4f7fb1732362293bc15a6754d70ecf4743392cf89c4497b3cd96269fd"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00331-of-00512.json.gz": {"num_bytes": 29961847, "checksum": "f437c6f5f758a5d32c8fc949037060259162864c29aeaabf37032e79f5a1cf0b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00332-of-00512.json.gz": {"num_bytes": 30167166, "checksum": "96018497eb6dec020436c1333ff81980a64fb615997855fdd8cf35fe3f658db6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00333-of-00512.json.gz": {"num_bytes": 30192963, "checksum": "1c12ea6b9031049dbc84e4da6b5fdedf480e989385d758c88322c415a1cabbb0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00334-of-00512.json.gz": {"num_bytes": 29847008, "checksum": "c269285f15f626b4b15a7d1705ffa08e3f4d49ce13de8174b72f9f6276a1c6af"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00335-of-00512.json.gz": {"num_bytes": 30262244, "checksum": "179ee564e6fc644d9ee139bdb02d470a1172221b0f6e510ee5935683500f8257"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00336-of-00512.json.gz": {"num_bytes": 30262910, "checksum": "317933afdd8dc8a3a355e44ee3d84bbab12a2f30c98ea1172dde7074ed4c0557"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00337-of-00512.json.gz": {"num_bytes": 30155329, "checksum": "c5b850399252ec41b0fd9cb2da87ce25e5a44df9f44c6ed9d8c559a5729e5a0f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00338-of-00512.json.gz": {"num_bytes": 29952961, "checksum": "48083123ba97a6212e0501799bd01936f0795bdd4d9c2710b9aa67d54b29037e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00339-of-00512.json.gz": {"num_bytes": 30403399, "checksum": "313b60f985dcf591f34d351b758eedace655b6c6d3946dd2ddc55f34a9a97ae9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00340-of-00512.json.gz": {"num_bytes": 29917484, "checksum": "2c72290f3bd51dea2a2877d68a968dc2b75dadf99ab3cc2230e41be45f3515d3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00341-of-00512.json.gz": {"num_bytes": 29905522, "checksum": "1acd83a0da4a7a4912b589dbeb68b37396d0454371b2b71af4ae18b854d482ce"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00342-of-00512.json.gz": {"num_bytes": 30022369, "checksum": "8756be42335bba12d06de63e247659f8d603a092ff342360dfed645aec135c47"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00343-of-00512.json.gz": {"num_bytes": 30229313, "checksum": "863e29987a3ccfa08e14ae987c81367a53b9fe08795184db086117a9555e058b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00344-of-00512.json.gz": {"num_bytes": 29924335, "checksum": "aa9003a7cc3527fb658fd807c78890587a8b35634a1f0838bc221a6374205d20"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00345-of-00512.json.gz": {"num_bytes": 30229482, "checksum": "a7e88b015bcf7761217e9b3ffd413f13cac48f6afe083353436de6cbd0d0018d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00346-of-00512.json.gz": {"num_bytes": 30029147, "checksum": "b862ea62ac032c203c0038c061a44edabe4644be03b876ec7322e96762374940"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00347-of-00512.json.gz": {"num_bytes": 29808182, "checksum": "62915b86cbbf61a76f73d05509a8e839aae0b965134ef79022377625df7ef741"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00348-of-00512.json.gz": {"num_bytes": 30091116, "checksum": "6c384c2c6bc8340b88e085f8bbc2616be68c96fa7b8b88306b4500367d053a49"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00349-of-00512.json.gz": {"num_bytes": 29867618, "checksum": "bfb19508ecf8bd4d9a8847f0edab5acde6896182c27da706a6f2863bec43c152"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00350-of-00512.json.gz": {"num_bytes": 29723106, "checksum": "a645c62c94de9018175f15a0b38aa8bd2484601ee189b7c27d589288eb5af97e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00351-of-00512.json.gz": {"num_bytes": 30047620, "checksum": "991061a23834e6bb3dc0595cf0e8328e07746d10fbf7a7ba397c1410cb66175a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00352-of-00512.json.gz": {"num_bytes": 29808328, "checksum": "6c8e377a6cc82e81d66e2be3d23c1cdd42480015a68a1db458d542b7ff64ab7d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00353-of-00512.json.gz": {"num_bytes": 30040117, "checksum": "ead6f32d98a91c47fb9c21334143f02181efb0b831705baeebb9820d069598fe"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00354-of-00512.json.gz": {"num_bytes": 29953984, "checksum": "ba349e503d017abbc1c83da2314c0a4892a9f3e5e480173812578f44d9b5904c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00355-of-00512.json.gz": {"num_bytes": 30179912, "checksum": "2bfeab794bbe0432db52cc595d25864b17fdb0744a80d6d907f6f2ffc5c56b81"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00356-of-00512.json.gz": {"num_bytes": 30312163, "checksum": "d0dec696d28c601d3a1f75b0b6e6e711e00809f0d5ea915f63cb6d9b7adcc597"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00357-of-00512.json.gz": {"num_bytes": 29931515, "checksum": "d43c75371e32d0c1e65f43acc00aac3ca43762d4c6eb6bb61759ac5fca593a99"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00358-of-00512.json.gz": {"num_bytes": 29739788, "checksum": "96fef1b4a5d6a080ff5d4a10bc90911dcb2ddecb4be91d0c9620e6d2484e3ee3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00359-of-00512.json.gz": {"num_bytes": 29913841, "checksum": "05b065d2d13b787ddee4707be7e2be46173c23794b9e8c773d0da743f435db17"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00360-of-00512.json.gz": {"num_bytes": 29805295, "checksum": "826104b9f4c2634d128f15564bd4990057dfbbb4066f2a082039d243bab56935"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00361-of-00512.json.gz": {"num_bytes": 29839676, "checksum": "ee5ba4cb14ecee0c857828a866615c6bfe45f67b158173dcac44146a02d97738"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00362-of-00512.json.gz": {"num_bytes": 30154783, "checksum": "d67b49e6fa5dc293fbd3057b7ca0beb7e0bd1ff692cdad7f2dfb7abadc1f4599"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00363-of-00512.json.gz": {"num_bytes": 30126118, "checksum": "6940704da6cde5822d48dc806280b8d57e0593ba299731e68ca9c2a4f7cf65bd"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00364-of-00512.json.gz": {"num_bytes": 30184894, "checksum": "e740b4a0240e691f16a423fd658aa3c7539986695418af3b5a171a48524db74f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00365-of-00512.json.gz": {"num_bytes": 30386766, "checksum": "5a6a9461ef9ca579a849f6bef4d6225504a885aa797d3b2236ed8df6f5ea72ee"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00366-of-00512.json.gz": {"num_bytes": 30208411, "checksum": "8e0ce2447dfadaa4d41b991a2ce1be63b409e58e88944594dc8591bf9ab41403"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00367-of-00512.json.gz": {"num_bytes": 30266003, "checksum": "04ea00b46a583edea7740d74d719ef7f303b7f3873365b9ff4e94f08ef80832a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00368-of-00512.json.gz": {"num_bytes": 29993752, "checksum": "38b1a55dd4ff1b504d2dbc0b2ad54fe43ab16c8bdba55bd97f4a55dafa8c83dd"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00369-of-00512.json.gz": {"num_bytes": 29833222, "checksum": "a25c405918920ed00edf5f3007cb8895b59fb67618dfea266b048273303b9592"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00370-of-00512.json.gz": {"num_bytes": 29988999, "checksum": "2812e6d9865d77ca8ac2d1499ba86be1ceed868a1da2bd13fbd0967058a3516c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00371-of-00512.json.gz": {"num_bytes": 29866636, "checksum": "ecd1d3bdc41c3f41f8c9d3a63c75766c173f70ff117af748a08c221ca4273b18"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00372-of-00512.json.gz": {"num_bytes": 30296883, "checksum": "723d2c5ebbdd95ab84c53e458d81944b6907d08c7aec67300f012880624d0010"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00373-of-00512.json.gz": {"num_bytes": 30310322, "checksum": "ae45d088521f2faf9852cb169962176e84bbb81d5ba157d4228d348f7fcf60f4"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00374-of-00512.json.gz": {"num_bytes": 30340527, "checksum": "9b09c9e1b424fd05540b720c5a85f71eea43d743dc4ebb318e839125ccac9383"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00375-of-00512.json.gz": {"num_bytes": 30193692, "checksum": "c3ca4bb179cadf872f25f1cdb5c3667933bb8dfb7af21068a24b1b09c961dfa8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00376-of-00512.json.gz": {"num_bytes": 30184130, "checksum": "5d801f4bc20c4c6d8821ccfff06cb5dfe4214e571734feacbea3325462afa280"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00377-of-00512.json.gz": {"num_bytes": 30259301, "checksum": "ebf08508c24e29a8a14b72248f090d765b02ee7a31296811d0391f2a2e73c046"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00378-of-00512.json.gz": {"num_bytes": 29650049, "checksum": "c13e994e68b938ca069d2d412e7891cbaf2ee205d65b1c17c6acfea01adce157"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00379-of-00512.json.gz": {"num_bytes": 30265211, "checksum": "667da6f0650dd684aa50bc691b5783968ae8cab847dea14fc8d8bfe203e351f4"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00380-of-00512.json.gz": {"num_bytes": 30429631, "checksum": "7cf0e9ae00bec72f571d152730107efdd944176818600517fb2d0412a859d366"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00381-of-00512.json.gz": {"num_bytes": 29889471, "checksum": "f781b3128e92c54365be7771695555378067a65fb922e04062ab6f3f092ec827"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00382-of-00512.json.gz": {"num_bytes": 30029894, "checksum": "2d133def2bc4b840312ebe5c466c9f22729b67aa4c2a41dda2e6a9a55ddcddbb"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00383-of-00512.json.gz": {"num_bytes": 30249255, "checksum": "e8610abf7e2bd70b1067a1b2dbf392ac32be156945502629228969974d3899b2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00384-of-00512.json.gz": {"num_bytes": 30362665, "checksum": "f217071bd0c1b1bddb3342c85064d7ebb54bcde2512997636f0638a0b3641588"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00385-of-00512.json.gz": {"num_bytes": 30080234, "checksum": "2db4b15c7391b6e6d3791721ee574d09101df597110feebc59e4f0aff4df6c26"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00386-of-00512.json.gz": {"num_bytes": 29897704, "checksum": "035daed74487c5262b8cfbefdfaefd17f2834c7b4a1d293934d755e059b58f5b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00387-of-00512.json.gz": {"num_bytes": 30072139, "checksum": "73013fbd06eaf94a7c8a0f0de420f83bed56655fb2d4e5d93972e8ca1847d130"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00388-of-00512.json.gz": {"num_bytes": 30123843, "checksum": "5db846c3d0b36774ce771ddfa8c53a915767926a2ad48222256d839326336f19"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00389-of-00512.json.gz": {"num_bytes": 30278955, "checksum": "9e4c590e67b2fbd357af955e39864ffe73dda201d76759935fda80b10b463500"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00390-of-00512.json.gz": {"num_bytes": 30013591, "checksum": "90974ba6eff489e0f4f52187b6241120740c782945e86525cb5d1e551a54e322"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00391-of-00512.json.gz": {"num_bytes": 29925212, "checksum": "10fcd62813434e2557b5861fd8604f534952561065bee9dc525b1cd3f5b2730f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00392-of-00512.json.gz": {"num_bytes": 30016498, "checksum": "da88b36bd3f15551d8fad115a86f111cc5c3d9a3c6fa9497214aabec7bcd6aad"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00393-of-00512.json.gz": {"num_bytes": 30061083, "checksum": "1ed9881020f240e1277e6513bc2abf24ea48e9cb0046d7e87a6d3669c8b42a0f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00394-of-00512.json.gz": {"num_bytes": 30043459, "checksum": "a35c3de1b0c982df8471705574e6eb7cc730fff122ff17d1381f2c7b9f20d6bd"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00395-of-00512.json.gz": {"num_bytes": 29921106, "checksum": "f4cf52f8d6a1288773cc366469df140f885b233fb6aa1cb75387a450d88ec94f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00396-of-00512.json.gz": {"num_bytes": 30024980, "checksum": "5ebe04e54e4242d52aacb4c2e107dd10e609d5a7a6ff0425d9952bed98ef4921"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00397-of-00512.json.gz": {"num_bytes": 30096825, "checksum": "3ac381004d8257aa50fb28f0fd2171abbb93ad825c3f43422b9dbec6e1c6f31b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00398-of-00512.json.gz": {"num_bytes": 30059739, "checksum": "40c38af325f4d01ae7c74aa9cd8f8d1c96c6af851175f80d3c50d85c5f5d3585"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00399-of-00512.json.gz": {"num_bytes": 30049826, "checksum": "2ba0109b2d5b88422250bcbd2494cc6e11528710f38fa6e83a1f699b840b68a7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00400-of-00512.json.gz": {"num_bytes": 29953506, "checksum": "010610ba3af3dbfbcf2fac93136b7066fc58eb914dce9ae999722d0cfec4d331"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00401-of-00512.json.gz": {"num_bytes": 30271141, "checksum": "29587bb4be2c367f6479705b5c3c28716affeefc857ac1f77e4c33e55264def0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00402-of-00512.json.gz": {"num_bytes": 29861236, "checksum": "8e399149c335ec599f881fada448c9b4be22326357153c74b0de627078f1d43c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00403-of-00512.json.gz": {"num_bytes": 30175831, "checksum": "0d2800836914a1e2ef4a1aaea6e70d19699fc2555582ec670223177cac05a4fa"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00404-of-00512.json.gz": {"num_bytes": 30097682, "checksum": "f9665e9199978b123feb962ce347b30cc1520626c32dfef0ca3cd8895a45e445"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00405-of-00512.json.gz": {"num_bytes": 29810961, "checksum": "8ea29cf9f7774a16a4c2aaeff1b6353de2951073676a9c411f19b0a5fb755b07"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00406-of-00512.json.gz": {"num_bytes": 29963498, "checksum": "90b10c91f6e0006576ec9b426c424e50fc1726c25ae8eb91bf91bb9001ade2e8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00407-of-00512.json.gz": {"num_bytes": 30089554, "checksum": "cfa905514e4f19c4eb82e438f5eb987731004476f026f4bebbeeafbe519ec85f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00408-of-00512.json.gz": {"num_bytes": 30148002, "checksum": "dddada59e2ef306cdf83b7c9ce3c912792237852053a4ea683224438a242c5ff"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00409-of-00512.json.gz": {"num_bytes": 29989174, "checksum": "907667ac304b6cca7100a9606e915c003fee43f1640d5b01405beb16eac4c379"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00410-of-00512.json.gz": {"num_bytes": 30519580, "checksum": "acd5cd2ecc46927046c81c9bb3459dd72a98e346ebb59c13c0db08fbb60961a0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00411-of-00512.json.gz": {"num_bytes": 30408107, "checksum": "6a9c2d42717f853cd4a76fc5275e95e2a584b7465c6059f586f6a06417048a42"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00412-of-00512.json.gz": {"num_bytes": 29699198, "checksum": "29e76bdab47496ed61a102edd3c61c20e60ab52abeb8e6068f7aa4ad1868f4fc"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00413-of-00512.json.gz": {"num_bytes": 30065457, "checksum": "b4a33941d0b994b82e3be351542cb4a832742e050ebbd71481e7ba34c8dcbc3b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00414-of-00512.json.gz": {"num_bytes": 30342960, "checksum": "4ba7edb3c77a45f0e4cb7e969053db6f44ce8c0a8ef262582512814b1161d9ad"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00415-of-00512.json.gz": {"num_bytes": 30201576, "checksum": "25cb4eb4bdf3cd1b29289a23696be8bd41c5f577294e94607bea7b91252a04fd"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00416-of-00512.json.gz": {"num_bytes": 30021170, "checksum": "60472bd2a2896bfb57baabb583fc6cdd402a1d776f6a4c9bb58ed556e67cd76f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00417-of-00512.json.gz": {"num_bytes": 30237505, "checksum": "aea8fd33c2acf1cef890549b1f88b18a2eeb37f6d4dd22b552f735811ad0b8a1"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00418-of-00512.json.gz": {"num_bytes": 29999334, "checksum": "93583d771ce7f0e1d044de2919a3ffdd48b7b7dab0cd3b6dc459200dd53d8762"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00419-of-00512.json.gz": {"num_bytes": 30194801, "checksum": "cd36e129487272742f3e60ab6512dd79b3d1ce3c22490d2e47c00c2ae595cfc6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00420-of-00512.json.gz": {"num_bytes": 29903898, "checksum": "6f18a5ffc7efe5f555b02d3a31ed43714e09e73f7462206220d70450f47cd6f6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00421-of-00512.json.gz": {"num_bytes": 30015573, "checksum": "cfacef2cffd953425eaf4d7b2b6cf5d2637bf5d58c6ed2bd0002442795c7d36c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00422-of-00512.json.gz": {"num_bytes": 29966521, "checksum": "14f646b15948cf586ec1abd4bf4bf45bf180913e4d09049fa779bc7a196e455e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00423-of-00512.json.gz": {"num_bytes": 29972805, "checksum": "ad7d4ab443c7a8122976570891a225a44ff86d2299d70706066633a6204eb0de"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00424-of-00512.json.gz": {"num_bytes": 30317886, "checksum": "37c8bf3b535ea4053aa2424c846e3449f9eb27d5ff999e1e93b6cee0aa975333"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00425-of-00512.json.gz": {"num_bytes": 30059310, "checksum": "674ca5eaf6a88f76881c8a1c48e1e0f93794785ee5ea17fb70f49228d7f39614"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00426-of-00512.json.gz": {"num_bytes": 30182498, "checksum": "988d08cd18162d9a309155d2e75cd4980f76ab4c73ef8286edae94ca4628ebcf"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00427-of-00512.json.gz": {"num_bytes": 30253874, "checksum": "aa8c08a684ea0bbfda9297aea07429172a2fa4a161268b964421796173275b35"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00428-of-00512.json.gz": {"num_bytes": 30055421, "checksum": "b1ed26e826bee7fcbc31cf1c368c9a63eeedbea1c2fd0fb07370b461a03d1a7f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00429-of-00512.json.gz": {"num_bytes": 29830674, "checksum": "3efdc67ad7a108416dae47886e542da5c2ab1cd7e1aedd25c1c5d4e0607572f6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00430-of-00512.json.gz": {"num_bytes": 29938000, "checksum": "3221ef5e4c28d44c1da4fa04689f318217991c07aff4fdee5e1091fe8e1162ac"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00431-of-00512.json.gz": {"num_bytes": 29829687, "checksum": "225f4e22df1b45a7dc9fef2f5a44da8f8ee25608cbe34195e21b49c8cd10f3ed"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00432-of-00512.json.gz": {"num_bytes": 30006209, "checksum": "9fc53637db7b16c8cf6f824adf21d4602efab715ad78eab62c4be7981a8bbc1d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00433-of-00512.json.gz": {"num_bytes": 30656456, "checksum": "6bf7b701dc18f68d0facd7cdea49a26cdcfdd7829d5346eefe555485cfa7f336"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00434-of-00512.json.gz": {"num_bytes": 30138891, "checksum": "793532f72aa41c1dd7c549e9597fe8e73796c53eb5fe410a73de418ec446d686"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00435-of-00512.json.gz": {"num_bytes": 30430276, "checksum": "0d13d345ad12999fb4e7a9675e08bb1c90980fd193ed8530e4258e07bd6ea754"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00436-of-00512.json.gz": {"num_bytes": 30173309, "checksum": "fbce5fadb4b49bf833f77337929d873b2b25c3b564f7622f3672dde7a044e5d0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00437-of-00512.json.gz": {"num_bytes": 30142240, "checksum": "76c34800a3223f5fe0f1960f3d3c9dd9ecdc2e652493d71ef245415b5027c902"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00438-of-00512.json.gz": {"num_bytes": 29979673, "checksum": "4784c3787d24b9d46ad7c835683c6506c2e55c84835391e2aca0355f032a1888"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00439-of-00512.json.gz": {"num_bytes": 30169105, "checksum": "5012d03e637769d7494bd3cef0a8dfc8b38c995e0d5780089c15d6b1495b3a8e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00440-of-00512.json.gz": {"num_bytes": 30107004, "checksum": "529beaf4ad0251e35be574b1f623571526ec91a588ebd7df43e9d1cb99445f53"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00441-of-00512.json.gz": {"num_bytes": 30324563, "checksum": "f5e5fbf5e329f5bb0e83f758b8fc76516d65c3f91ad97e328187eaea83e4b667"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00442-of-00512.json.gz": {"num_bytes": 30335681, "checksum": "b8a26ed60f87a87347886b4467aa576ec5e8c106931589a1aa821b99fdabdb54"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00443-of-00512.json.gz": {"num_bytes": 30155655, "checksum": "e27bfb813fd6aba96ada81b095a559f0b7847cd25f7f8973663b19cdc5b8985a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00444-of-00512.json.gz": {"num_bytes": 30340540, "checksum": "705dec13ba2824d45e801bc2cf3e709d6492b1ff6de2f9ddefb5a57dbdada4ca"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00445-of-00512.json.gz": {"num_bytes": 30248960, "checksum": "09a6b83910369cf269c4f095607fb2f0ac0ec7e25b501f577fe13920a8573ee0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00446-of-00512.json.gz": {"num_bytes": 30316703, "checksum": "8f88b794c08bb492f50073337a30aafac0d05819505b507ab283dba0cf17d125"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00447-of-00512.json.gz": {"num_bytes": 30184407, "checksum": "38c819df823197bea6d647c3f78bcc15024aabba814cae322c1663c45fa8382e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00448-of-00512.json.gz": {"num_bytes": 30238484, "checksum": "8c0abfb8dca37a179b01dadd2227206cbe6e5b916d0111c0b00d2edc3951c7f6"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00449-of-00512.json.gz": {"num_bytes": 30143151, "checksum": "9731e9644e5615d5d5ebdbacc6efa6382df856c8763b7485c9a5838864c1332f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00450-of-00512.json.gz": {"num_bytes": 30122606, "checksum": "3b746f616f21c91277cde8e6d0d7f792ead7874de7ecdf11830a4a56db3dc799"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00451-of-00512.json.gz": {"num_bytes": 30128179, "checksum": "d6cadfc64ee39c9beb93f0bf8c169ca9d9053e0f76e1c9697841438e20dddef3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00452-of-00512.json.gz": {"num_bytes": 29979326, "checksum": "42de19ffc3ec821fbf5ff686d1b36d189ad9ee5c4553a2ff0d003ee1a754c9c8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00453-of-00512.json.gz": {"num_bytes": 30118272, "checksum": "22f9b2d3a9f089f1015f74d1ca0aca8f2a4970595326d964817177cbe6859271"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00454-of-00512.json.gz": {"num_bytes": 30018294, "checksum": "17c16895edccbb8b40fcc52cbafc0c15957020eb530e071dcce34544d5958bd1"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00455-of-00512.json.gz": {"num_bytes": 30155903, "checksum": "8b9d49837b309c3389d03dd3bbae92395bf7086134fbc69d28d9fff60a90d4a3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00456-of-00512.json.gz": {"num_bytes": 30282104, "checksum": "ab63fd2efb0cc883d303241b3488a8135a196db7edc844458cfc1483898ceb3b"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00457-of-00512.json.gz": {"num_bytes": 29920723, "checksum": "dbde2eeef90144b209ef5afa6d5165ad638ae57d919926a379a10fccf6850a61"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00458-of-00512.json.gz": {"num_bytes": 30163167, "checksum": "800307106f5861e0bc246bcaae214e6dadeee849905cac184ecfe6d0b560fa68"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00459-of-00512.json.gz": {"num_bytes": 30248893, "checksum": "3e78d327a9463929f33311e18116f5d1d2ae4926f7a600378875ba854cf5ee47"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00460-of-00512.json.gz": {"num_bytes": 29840067, "checksum": "047568a5dad00b04ca1ea4aa262c7a4af9b61e87bc4ea02ffd5c6c8c049bf8a5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00461-of-00512.json.gz": {"num_bytes": 30179062, "checksum": "ed8abe7b465bc19150b831632cb7afa298d6cb4beb9b6043a35a0f8afb5f730d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00462-of-00512.json.gz": {"num_bytes": 30266398, "checksum": "d7b74f5c1c1f7bb489700adcfb7e48400c4fcca7669e2d56396d9fabb5a63b91"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00463-of-00512.json.gz": {"num_bytes": 30158800, "checksum": "224815aee29f6d04ddbc7457c84338eef9b127a767e7b50ed77283ff166d4f93"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00464-of-00512.json.gz": {"num_bytes": 30393915, "checksum": "0dd019fd2c19936ce2e6410b65872f630131c5da7543c8e66fa87547fd1a2209"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00465-of-00512.json.gz": {"num_bytes": 30148939, "checksum": "6d74dc9d74d28c2b8ba8d43ba3d594af0cb176cfa7bf738f3933be2a9c37bb85"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00466-of-00512.json.gz": {"num_bytes": 30268228, "checksum": "0e201327066f28c19b082fe35e4fb3bd76c8fd2d32236d1d6e2309489152aa66"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00467-of-00512.json.gz": {"num_bytes": 30121937, "checksum": "7352e5a9ee66dcbeed2c9e1fbe6c9355f0e5dd1b30b592a9fd5690958945e5a9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00468-of-00512.json.gz": {"num_bytes": 30004669, "checksum": "53876848336ac57c082c9d5735bc1717f69ef38688b221d5e5ab9cd9cb4ec620"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00469-of-00512.json.gz": {"num_bytes": 30049860, "checksum": "a5a720b38f106dd5d2a2b7647748b52b4531ac12294e3b0d8dbc92062639c0c3"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00470-of-00512.json.gz": {"num_bytes": 29961380, "checksum": "9611764fc4f84b92e86fa6f9ea41464f6c26b07d1c51241b627a3d155e99d163"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00471-of-00512.json.gz": {"num_bytes": 30449164, "checksum": "db508df549d518c3e8b99b2f0098ea93fead1e632f53d8ae2cebff1d3476577c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00472-of-00512.json.gz": {"num_bytes": 30312620, "checksum": "1993b5e292c6c60a3373aabe896f1a57afaad73fdce0ec60e30696368f7c0afa"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00473-of-00512.json.gz": {"num_bytes": 30406764, "checksum": "913045c61fb5a145379d9fe08c91ea63092b197400c0c87bfa65af91720b563c"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00474-of-00512.json.gz": {"num_bytes": 30078563, "checksum": "c495119e150b083d709ca915abd760683793361ebf3e079b04efc9b7e1900379"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00475-of-00512.json.gz": {"num_bytes": 29860761, "checksum": "50bb5f40d2e91ab136aa63063fff860529c8961f2a38500a645b10339751589e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00476-of-00512.json.gz": {"num_bytes": 30199778, "checksum": "c969cfbb7ed7716f665b336b2ed9f7b10b532c7adc6d8a347964831a39cfef0e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00477-of-00512.json.gz": {"num_bytes": 30130742, "checksum": "54c8b89102cf882eda5208544a6c5d317c1defa8d997f9450ebd576e58f91830"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00478-of-00512.json.gz": {"num_bytes": 29901444, "checksum": "f669299d794ecc0523c64ad31af8fcce5cf3f880e87fd73f4c3f434425e9b238"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00479-of-00512.json.gz": {"num_bytes": 30587214, "checksum": "25d0fbd9027deaf140650f0b82a2316c37939f199fe7633b9f643684404f2029"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00480-of-00512.json.gz": {"num_bytes": 30145237, "checksum": "68a29728290e1199ce8d1ac060365bc443ea67c24292b2b04f1b4ca44ca7238d"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00481-of-00512.json.gz": {"num_bytes": 30204159, "checksum": "1605034b89e33f6794c901adac1eb200bb489f76b9bae6bc56b01e9f6ab4c254"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00482-of-00512.json.gz": {"num_bytes": 30430794, "checksum": "2dce9df095e89ea6645fb599f518612511a62b6c475808ad004c32968b19bae8"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00483-of-00512.json.gz": {"num_bytes": 30102412, "checksum": "c7c626977521b0d1f5bcc02c484b3eb4f517ba71006a4802df08a0f4cfb8ea9e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00484-of-00512.json.gz": {"num_bytes": 30171871, "checksum": "519ed997f1f1f1de7864b0bddf202b25e25bed349f63593a88337262d7705968"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00485-of-00512.json.gz": {"num_bytes": 30049539, "checksum": "8d2314fd3239ba3dfa99962c1d0a38e05edf9194e1faebae88f6b19ecab8fbf7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00486-of-00512.json.gz": {"num_bytes": 29949995, "checksum": "a7521e09cbe77098c23172427bfb931dd50f0c9d58b034fd1621687849a8d379"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00487-of-00512.json.gz": {"num_bytes": 30345072, "checksum": "ebc6254a4d241afb886b8df20819301121fcb234a32a1dd4ee8ae49571081f92"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00488-of-00512.json.gz": {"num_bytes": 30300622, "checksum": "509bba28ddf770d38554a2e846f2ce0d2af59e3662a6d6ec4dddb75fb509f8d5"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00489-of-00512.json.gz": {"num_bytes": 29949909, "checksum": "996e61f8e674b0a016a568630ee13a7473f99a919437c225a4198d232861e628"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00490-of-00512.json.gz": {"num_bytes": 29995429, "checksum": "9730024ad352eb12f74ac446ed32b9c57898658954be5dd639184fc5264527cb"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00491-of-00512.json.gz": {"num_bytes": 30293919, "checksum": "65b2a7de3284e892441b0fe8e850d89de842355d78fa9944358b1ee5912a948f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00492-of-00512.json.gz": {"num_bytes": 30115831, "checksum": "26b535c3175bb86ef721593f81d9cf006d4c3749f156c63ccd2a2c04e1201236"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00493-of-00512.json.gz": {"num_bytes": 30187809, "checksum": "a0918223c5523da20bd8230de1985b0a3cbb1e239af3d62a83d720a3a528c567"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00494-of-00512.json.gz": {"num_bytes": 30149878, "checksum": "6e9a5e329f834e41b4a8a9a6809df3243e5bffc580327912288ad7f790b43ab7"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00495-of-00512.json.gz": {"num_bytes": 29711944, "checksum": "3b9ba9d667e1241692ff9a654a68e98e8e94e32244a9419b2542137b63fb4705"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00496-of-00512.json.gz": {"num_bytes": 30114815, "checksum": "24b78cc36bb0abc67c998320e7029b6e7bbbee267a367eb538f23956c13f27a9"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00497-of-00512.json.gz": {"num_bytes": 30048480, "checksum": "29c3606acf298498fc3498bd769544e2879afbd0d5c46cee298cb25058694aac"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00498-of-00512.json.gz": {"num_bytes": 29934973, "checksum": "8afaffea92dfad745be8aa8cd3de0ee97cbcc26fbad6c71d56683aef6a27055f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00499-of-00512.json.gz": {"num_bytes": 29796509, "checksum": "9cbbd8f6d8fe92207c4cb2f0422284726deca1bde7f30cb01cce7fcd4665b380"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00500-of-00512.json.gz": {"num_bytes": 30221736, "checksum": "902904aa9fadaecbe698402a27b4e68b00813e67b79f84d4c696cd9c72f08f55"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00501-of-00512.json.gz": {"num_bytes": 30108320, "checksum": "76e848f8dbc082158fc5d3a2f7c10cd6e03585667c00efc639f2c6f47d44aeb2"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00502-of-00512.json.gz": {"num_bytes": 30381907, "checksum": "885bbc9788235abf33728737f72f267e60d1f5d4a77493cae76f161651d89579"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00503-of-00512.json.gz": {"num_bytes": 29983805, "checksum": "5134934392b13e3f84dd32dcb1c59f4d5416d6dfd925bf896f3eb61881d82136"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00504-of-00512.json.gz": {"num_bytes": 30041413, "checksum": "4978245a7f545d676bad6edfdfe60ffdad94de47af0fb10649fa39e9b068939e"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00505-of-00512.json.gz": {"num_bytes": 30021620, "checksum": "64933c28ea3f608326f1c6ef56170886767f1ab4f9ecbc4bf3263c7043901fce"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00506-of-00512.json.gz": {"num_bytes": 30260343, "checksum": "84667dbe68ecf1f9bbdaba0e73eca6fe0444f6594a1e9a4b46e9812ae7bce7d0"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00507-of-00512.json.gz": {"num_bytes": 30173739, "checksum": "dd6d44e4f344f3ab1cd61bacced7b5f1429cf6823fc9282452a539012bda028a"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00508-of-00512.json.gz": {"num_bytes": 29903443, "checksum": "4afc46096ac2697867c3a75896c5ceb36617c4c21a749dded58a1ea4565e41df"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00509-of-00512.json.gz": {"num_bytes": 29862664, "checksum": "74a720dc16b389e8122d61aa94bc12a5bc4253ca6f39679781c938e2eb556878"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00510-of-00512.json.gz": {"num_bytes": 29744368, "checksum": "6a302049e7a1668c5fb2e4b5afca518fa53ba1a9dc717015ecb5768e85ec4139"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-train.00511-of-00512.json.gz": {"num_bytes": 29896714, "checksum": "48b89e909c0e33fd59c9623f8517cdfa90fa35a4641f999c6f68e1cc9f2a309f"}, "https://huggingface.co/datasets/allenai/c4/resolve/main/realnewslike/c4-validation.00000-of-00001.json.gz": {"num_bytes": 15284943, "checksum": "42ac859dc1c4d48d165ec602909403e2066ce1d4854149ed70b9ec9cc96dc65f"}}, "download_size": 15435025687, "post_processing_size": null, "dataset_size": 76369191765, "size_in_bytes": 91804217452}} \ No newline at end of file +{"en": {"description": "A colossal, cleaned version of Common Crawl's web crawl corpus.\n\nBased on Common Crawl dataset: \"https://commoncrawl.org\".\n\nThis is the processed version of Google's C4 dataset by AllenAI.\n\n", "citation": "\n@article{2019t5,\n author = {Colin Raffel and Noam Shazeer and Adam Roberts and Katherine Lee and Sharan Narang and Michael Matena and Yanqi Zhou and Wei Li and Peter J. Liu},\n title = {Exploring the Limits of Transfer Learning with a Unified Text-to-Text Transformer},\n journal = {arXiv e-prints},\n year = {2019},\n archivePrefix = {arXiv},\n eprint = {1910.10683},\n}\n", "homepage": "https://github.com/allenai/allennlp/discussions/5056", "license": "", "features": {"text": {"dtype": "string", "id": null, "_type": "Value"}, "timestamp": {"dtype": "string", "id": null, "_type": "Value"}, "url": {"dtype": "string", "id": null, "_type": "Value"}}, "post_processed": null, "supervised_keys": null, "task_templates": null, "builder_name": "c4", "config_name": "en", "version": {"version_str": "0.0.0", "description": null, "major": 0, "minor": 0, "patch": 0}, "splits": {"train": {"name": "train", "num_bytes": 828589180707, "num_examples": 364868892, "dataset_name": "c4"}, "validation": {"name": "validation", "num_bytes": 825767266, "num_examples": 364608, "dataset_name": "c4"}}, "download_checksums": {"https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00000-of-01024.json.gz": {"num_bytes": 319308785, "checksum": "8ef8d75b0e045dec4aa5123a671b4564466b0707086a7ed1ba8721626dfffbc9"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00001-of-01024.json.gz": {"num_bytes": 318039285, "checksum": "b945059cd1a343cabe311881b7840a6f0363f570e745a0eff0e687e266f6b55d"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00002-of-01024.json.gz": {"num_bytes": 319748667, "checksum": "2967dc7e587ced6ecb9ba617ad2d4c44901467969de5bf5b0f5a9e5b70555d75"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00003-of-01024.json.gz": {"num_bytes": 318564193, "checksum": "b79d9abef5741578929be0d59db9ca652a8276207ef18a944b7a5f11fef5beb6"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00004-of-01024.json.gz": {"num_bytes": 318579884, "checksum": "cd9f98eac2bc6062f55d9a36bd744cc924a78ea2fd998830e0034e4456f5d014"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00005-of-01024.json.gz": {"num_bytes": 318003681, "checksum": "8ac5907a54dbc7ab9c14624448c7c3f6afed33af9d0a855f1eae955e62e255b9"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00006-of-01024.json.gz": {"num_bytes": 318495137, "checksum": "8fd9b9a4b74c9414466b245ebda7db041e7bd8603971de51b5db782bd758aac7"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00007-of-01024.json.gz": {"num_bytes": 318417273, "checksum": "41dd377a1ba6b72eab0260c39c626fe45ab6b649d42d57b311d3ba21a0337cd0"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00008-of-01024.json.gz": {"num_bytes": 318131845, "checksum": "64da652c235f089a0b52f6db5883ef5f1e9c31edc4c950332b34dd12439c99a5"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00009-of-01024.json.gz": {"num_bytes": 318185592, "checksum": "807a548efbb10153c9eff0df5733a97a1b51ab1743242530de1b02a8ea17ace7"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00010-of-01024.json.gz": {"num_bytes": 319045292, "checksum": "3bd0f6f664069c3bd964ce48ceae60ba47b55b54745a4b00c207bdb3a1926b17"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00011-of-01024.json.gz": {"num_bytes": 319686980, "checksum": "5baa0c010083459ba58e34b4e93bb758caa878f7db6fba0528921329fa1a6cc5"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00012-of-01024.json.gz": {"num_bytes": 320119088, "checksum": "fdee7442c06856e2c4b7665cc51978e9011b5e0a2112c30dd15bc9e53818842d"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00013-of-01024.json.gz": {"num_bytes": 319474856, "checksum": "a4ab3b24087781c3577945492525696e182ffd7ca5265b958f49803a02867ecf"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00014-of-01024.json.gz": {"num_bytes": 319693210, "checksum": "62215b2451e71b117018ef73570c944aff890624b384c538950b64c37f184c49"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00015-of-01024.json.gz": {"num_bytes": 318427305, "checksum": "9893c9f413a1223e7b535527829bcd6df3219929fb1abf8f2a114dd8f6ea0919"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00016-of-01024.json.gz": {"num_bytes": 318785714, "checksum": "bd0ade8b8a57348952ca31c39efdab538f54c852941a225ccd13d0a7170724e3"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00017-of-01024.json.gz": {"num_bytes": 320134331, "checksum": "4132cfff3f5126d9e783191a5ccc34e5d85938bebf0b8489657805277a227202"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00018-of-01024.json.gz": {"num_bytes": 318653930, "checksum": "4675ab1d77da3d676d9743dca15bfce8478498f7738f79816a25ed790d28fa46"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00019-of-01024.json.gz": {"num_bytes": 319468974, "checksum": "1d2f3a6aeb0f6c159295f283d302794cd3eb944cff3fe68691997bb2dc4c7780"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00020-of-01024.json.gz": {"num_bytes": 319109754, "checksum": "b5f26d832a0ec9b0489a27169d94496f5ea33c7fb046868c565c7b5a2407221b"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00021-of-01024.json.gz": {"num_bytes": 318514423, "checksum": "428da5a8d4585de16f6b3f30865a5ca7a8d1ddcd3b6002dcc1283368b0c3d60a"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00022-of-01024.json.gz": {"num_bytes": 318715623, "checksum": "9bc4812ba5e08c0b2d83cd3804129ba3d77cf84ba3d8828159788ee02e155a51"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00023-of-01024.json.gz": {"num_bytes": 319874293, "checksum": "38843ab4f5c60ed2b9ec0cdc65074eaca454014d5702edd809a266190689d2c3"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00024-of-01024.json.gz": {"num_bytes": 318105764, "checksum": "4fa0c7ec94445ea57dcecda7864b1346275e711c9820c2c39dbb9fdb95c97674"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00025-of-01024.json.gz": {"num_bytes": 319122521, "checksum": "0758514fa2e2c133c995c00d5f4abfc14b66582a4eedd0e721bdd95c4632a755"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00026-of-01024.json.gz": {"num_bytes": 318116783, "checksum": "56a73b9a556d6794d9c706e1b1c7e729fa13b711ddc25dd403b110eb5ed857f1"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00027-of-01024.json.gz": {"num_bytes": 320171191, "checksum": "fea1eabb734cda33d72f3d959234a240080b4fd42cc70494814a8429b087f9e1"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00028-of-01024.json.gz": {"num_bytes": 319047090, "checksum": "47d1c385952d6c18c431a7294339a030c213b8832f970ac987965b621c8181a1"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00029-of-01024.json.gz": {"num_bytes": 318705639, "checksum": "3c744d3dd915ceef3a93fd18c3ff5b117fb5118d1ced2089979b6cafc81c4525"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00030-of-01024.json.gz": {"num_bytes": 318327902, "checksum": "7f6959020242fdc841adfc10c102bbe79e2ef8502a09dac8451e0cec6f2add16"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00031-of-01024.json.gz": {"num_bytes": 318990600, "checksum": "e56f29011594c765192c34298558e7227a829313196748f9a16ec34ecdb76d23"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00032-of-01024.json.gz": {"num_bytes": 320451482, "checksum": "9ea843dfd85e449439f3106d657762daff8f326730fefb342455c43cb48144e3"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00033-of-01024.json.gz": {"num_bytes": 319878207, "checksum": "2633cdb7b058f126173608897f69add614659b0b21cf54ecc8a2f4a79bc16073"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00034-of-01024.json.gz": {"num_bytes": 318701510, "checksum": "853c4b9ff2d79621ed27a6be826dae198af609d9f9dbd1c2773b778241cf6137"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00035-of-01024.json.gz": {"num_bytes": 318529104, "checksum": "fb50dac3f35cb71472464f511e6b8aee72ded10b3b6896d0d1f74a18ded2b8d3"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00036-of-01024.json.gz": {"num_bytes": 318849657, "checksum": "5cef5cfd50cfafd58feb452b85324a3d8198fca48789f0ce69227755e72d8e53"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00037-of-01024.json.gz": {"num_bytes": 319621215, "checksum": "f0b67abf30e2d58d291aa9bcc9c8a03668afe819549802e4e591a261c171d970"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00038-of-01024.json.gz": {"num_bytes": 318135467, "checksum": "991bad578a83294d34a1b11649af07339aa8cb26d49330afa9fcbca0b87942c6"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00039-of-01024.json.gz": {"num_bytes": 320131759, "checksum": "abbbc21f81555e94484e6afe1975e13f67af19a820cd6f8d090c987a250bd4fd"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00040-of-01024.json.gz": {"num_bytes": 320214476, "checksum": "48020d2656709899abd2572b3424c0455df3c1089a69fe26b776aeb24f0da0ec"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00041-of-01024.json.gz": {"num_bytes": 319581259, "checksum": "db6fb8db7162ac87ea002c153ef0c54322f24c8f7ec263cfa290ac8c3683b194"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00042-of-01024.json.gz": {"num_bytes": 318100985, "checksum": "d499cba2383b16bb0f26b98416211eabf2599641ecd6708a5ef487692ca9e791"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00043-of-01024.json.gz": {"num_bytes": 317803029, "checksum": "dc6f1ccc3fcce79b16c5157f7125942e351d74744efc593f8372f8a408720340"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00044-of-01024.json.gz": {"num_bytes": 318837063, "checksum": "6170fced793461bd687640a658a085d02f971c2e609f6ff33b90df944fb56409"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00045-of-01024.json.gz": {"num_bytes": 319659188, "checksum": "b2f79e8600815578ec326cfc6c5242c2827cedbfac51772fdcf15ef5d027aa38"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00046-of-01024.json.gz": {"num_bytes": 318771753, "checksum": "e4b4a3e53ee66c280a5e7ee33602ea0e910903748db8c2adbbec4b48bab1580e"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00047-of-01024.json.gz": {"num_bytes": 318088661, "checksum": "bf8597fc359d8e9c721fd1d98b8ff3db5c011afd0fec9640670f31c7a7dddb79"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00048-of-01024.json.gz": {"num_bytes": 317777133, "checksum": "369db8e9646b8229a23044a7257c2face97b8e05738f0413b581892876f268e1"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00049-of-01024.json.gz": {"num_bytes": 319329891, "checksum": "5cb2aa0432984b355b0ec6aad92f926b2fb75aea2a0e08b97f4c6a62838e6cc8"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00050-of-01024.json.gz": {"num_bytes": 318172322, "checksum": "11a7cc48539ac97eaec87beacef9d9bbb71fc875a0bff0c9ff096044bff46a44"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00051-of-01024.json.gz": {"num_bytes": 318704544, "checksum": "ac2beee992c2b1ae8b1f162054e843e2b971bbd7cec45a0a7a7b7795fcdc7c26"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00052-of-01024.json.gz": {"num_bytes": 320806303, "checksum": "3a591fe9993c3d98a9e7949e98ca215ce164cd313fe53f3ce762c91b5fec7c53"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00053-of-01024.json.gz": {"num_bytes": 320565764, "checksum": "60e67c8e6f3bfdf8b490ecfe62c79a13c5d04d393fbac712a6cda49fd78e883b"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00054-of-01024.json.gz": {"num_bytes": 320425170, "checksum": "d69305c853e9e516f5fd4e2a9afb1939d829925f71102d8aa09387ded5d000df"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00055-of-01024.json.gz": {"num_bytes": 318713224, "checksum": "e01737df8097a1526d6c31d37d7aeb1b92c0a7253b39f6964fcc897bf0eba9fd"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00056-of-01024.json.gz": {"num_bytes": 319441227, "checksum": "fe516c8c0a9e59f9f035ac5fdd13e973d25dd6635eee05d648740d3e8c1fc742"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00057-of-01024.json.gz": {"num_bytes": 319821142, "checksum": "7e058ed9072e968e9c8b92f9b50dab318515873cca6c617b544dacab5a2f018e"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00058-of-01024.json.gz": {"num_bytes": 318643105, "checksum": "3479dc5a5b111b7f45f87e5a91c433907af97dbe15b9db1637bad666dcbdec40"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00059-of-01024.json.gz": {"num_bytes": 318053548, "checksum": "8208b0943f59b5914fa13d29108ede31a8d8d34bc6d603a2278ab8b80d28b1d0"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00060-of-01024.json.gz": {"num_bytes": 317935826, "checksum": "71324b62706aabd6faee682205cdedcd10dad289579b534d0e53f8d9b92bf2c0"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00061-of-01024.json.gz": {"num_bytes": 318870698, "checksum": "cdf0abc5804f0991871de48b249e30b666cb96f2254762a570c39904c5780f8e"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00062-of-01024.json.gz": {"num_bytes": 318945246, "checksum": "5ac676e16108446bd2980f9601c787eb754811a68e92ab6403c333820a6b9622"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00063-of-01024.json.gz": {"num_bytes": 318827790, "checksum": "a26f7cfe123cfdf3db7687996d0163212e70ff7635872b0754c03cbd5c31213a"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00064-of-01024.json.gz": {"num_bytes": 318914155, "checksum": "858a145617a5902ab02bc77e47ee2f036a6211384c4f2285767c7558eb93e245"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00065-of-01024.json.gz": {"num_bytes": 319794084, "checksum": "52742215df5aaca43bed5405a397571efe7c22107ee2caa8c05e3ed229796efa"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00066-of-01024.json.gz": {"num_bytes": 320294453, "checksum": "5b11cd54de0e95a75e53e4e32f72912cb01053d3fb609de6b7a45afafab414d0"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00067-of-01024.json.gz": {"num_bytes": 319468309, "checksum": "4c6c69b3eba9bcd6786d7dce893340f2d7093012ead04f3539352beccd2794ef"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00068-of-01024.json.gz": {"num_bytes": 318800742, "checksum": "ce94afc3c612e9de423a412147505ad7757216100becba2677bf5eaf443c4b6f"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00069-of-01024.json.gz": {"num_bytes": 319416585, "checksum": "ff3084a3e5a3960425a5c605274684c42fa638f99045527f77e74d165e52b6ea"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00070-of-01024.json.gz": {"num_bytes": 319165846, "checksum": "04c368b05f0ea42b3a51ed9bc0e817894f205c0ecd74084da015158d509ff2a3"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00071-of-01024.json.gz": {"num_bytes": 318017381, "checksum": "e8320e9982fa377b07c5b3e8a4451ac143b05ab7a4a03f748034b37fb998bfb0"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00072-of-01024.json.gz": {"num_bytes": 318874499, "checksum": "920f8d5ef2cae6bdbd52f724d0952e04146ff29f4aaec4dbf10bef7b66a98f40"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00073-of-01024.json.gz": {"num_bytes": 317890112, "checksum": "06a41bdb7bf0d52e2fe8e71f594de8d36d77880639ffdfb41e883237f76e8a0f"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00074-of-01024.json.gz": {"num_bytes": 319201956, "checksum": "e0267d6782d30f1619a82c49c20be1c8b5424e653c093e4652a5c8ed117c6533"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00075-of-01024.json.gz": {"num_bytes": 320575937, "checksum": "42108758abc3c3197e7dca8293eed3800f3e79ceae80d3208d90c7a9fd205594"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00076-of-01024.json.gz": {"num_bytes": 320070510, "checksum": "c904b6e6041e23edeb1d88b7b69f07a339b7ff9835d0c22e0b6c354519369842"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00077-of-01024.json.gz": {"num_bytes": 319042024, "checksum": "1eb2b70ad4d12b7587eeb1ce86477817ad992c08fecafe5ccafc26af6b5657f7"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00078-of-01024.json.gz": {"num_bytes": 319997520, "checksum": "070370654960e02f766c10321546b280e9933531b796c252a94999d645f360b2"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00079-of-01024.json.gz": {"num_bytes": 320736487, "checksum": "3aa4f007660706563030b590cef9be992c18ba7ec1876210bc92665ec42c4be2"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00080-of-01024.json.gz": {"num_bytes": 320082337, "checksum": "3b54eaf407bb593c2b16df99690446f26497530d21cf433a7d525e0eaebe9c3f"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00081-of-01024.json.gz": {"num_bytes": 318008114, "checksum": "d01975cdbd4360331b1a0f55e9b7e731d7d9fc70c7cdd0f33f1c772eff7aa03b"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00082-of-01024.json.gz": {"num_bytes": 317829809, "checksum": "2a65dd37027fae03819ea5a5f6c3b16d921706ad758442881dc1d15b08bc5048"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00083-of-01024.json.gz": {"num_bytes": 319265318, "checksum": "e14cf18c687f7eb304df6abef7235e263a5736c799d742524205dead2abfb043"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00084-of-01024.json.gz": {"num_bytes": 319166958, "checksum": "1dc3fa8702a4477e3a3128440b68d4cc17e6d2ce7f3c53da28d50a57b8332020"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00085-of-01024.json.gz": {"num_bytes": 320338078, "checksum": "0222db7b1ae14c9b10aacdb05d055d1432b6d035e3937df5640facd242c52aea"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00086-of-01024.json.gz": {"num_bytes": 318941314, "checksum": "55ddf7a27dc91bf8d932a5efec4aa458122ee337f2cb050e2c4b0ae8e770f3a9"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00087-of-01024.json.gz": {"num_bytes": 319218368, "checksum": "c61552d76bedbfa750c599a674d6732fb224c8a1e6c6583fca7ccabb20532920"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00088-of-01024.json.gz": {"num_bytes": 318974308, "checksum": "693fae3d50068ec39ad27a14335372c3e1530138cc65931edac5268dd62b7e96"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00089-of-01024.json.gz": {"num_bytes": 318781044, "checksum": "2d90b9318432a2313dfaec542c8b91431505035cca7416a63e3197ab26ad6e75"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00090-of-01024.json.gz": {"num_bytes": 318569651, "checksum": "ee674beda8ed39395e69c899f666990c5190dfad5494867e51fa727e4d38d86a"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00091-of-01024.json.gz": {"num_bytes": 319683433, "checksum": "add2489350310ce500dde6637518c747c156f95f079a34367842bf875a8fdf5b"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00092-of-01024.json.gz": {"num_bytes": 318734793, "checksum": "5cfd4f25e9effaa2f7381bfcf49f9263e10619811aeaa32a77d3fdfc13517006"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00093-of-01024.json.gz": {"num_bytes": 319161014, "checksum": "bed8774909bba5ac656ebaad6e5cacca9e5ea12c80a41fd5689e6798c74f3c89"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00094-of-01024.json.gz": {"num_bytes": 320143246, "checksum": "96abe370925f6962b4e75da530b5234eec21fab820d6cb02ae59b6070ab63859"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00095-of-01024.json.gz": {"num_bytes": 319707377, "checksum": "37b68cd632e8f86f364fd61c9581f48ad7602122b7f33c55103ac5bd727f015d"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00096-of-01024.json.gz": {"num_bytes": 320159279, "checksum": "fb93c7467f0361c1d4b186d5e25f4bce4f237adb33b4e0ef56f57831b4f97f81"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00097-of-01024.json.gz": {"num_bytes": 319841818, "checksum": "7f4d4a9536e37a0c2b9a1806fcb472784ff4d3840aa57e9603e74233b877fbac"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00098-of-01024.json.gz": {"num_bytes": 321001731, "checksum": "239b9fefebe3815c8d785bd48086013d1a6dcd76c142786502c674d2d874fb11"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00099-of-01024.json.gz": {"num_bytes": 319475885, "checksum": "0a610d25a547839b8b6dfc2fd964e3ca64b23f0edc52d311c89dcb5e8a44a2c5"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00100-of-01024.json.gz": {"num_bytes": 319515329, "checksum": "f24d17cbd27296a15f51b9edc713c74a6997bbe82267403fdb6282404c2f4e6d"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00101-of-01024.json.gz": {"num_bytes": 318803422, "checksum": "54b8b0c72ffa325abce3dd15bdcd0856b5594500c37f4bc6a6327721ba91e4bc"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00102-of-01024.json.gz": {"num_bytes": 320934688, "checksum": "24b99b4afa3b631a718a487d679026c91e2c936132df01df969e3173b49e091f"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00103-of-01024.json.gz": {"num_bytes": 319835920, "checksum": "a2c68654ba81fa55bc24beb4319c8905f7b532fcb6793a6a311344d4f98a82b9"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00104-of-01024.json.gz": {"num_bytes": 319402378, "checksum": "27764d82793e35b8a7be3a3fb0470d018243a89283b5501c0b76056de1879389"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00105-of-01024.json.gz": {"num_bytes": 320100928, "checksum": "3bb2499337ebe52b63a5f20ec6ca6283971937962439699bd5e483cf80fed02a"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00106-of-01024.json.gz": {"num_bytes": 318707110, "checksum": "83510312aa188431a8dda8746903d70cfc7ffdf5437e44c1f74b7670b78bd52b"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00107-of-01024.json.gz": {"num_bytes": 319904239, "checksum": "40d42c39dea8e4898efba1886aa3be67742501f7a51d5bc635b03a2c6c2bd63e"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00108-of-01024.json.gz": {"num_bytes": 320050265, "checksum": "88ce3ddae88e8024e76614a1b701c157f66fe39c6f0852a4869c5063876f6e87"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00109-of-01024.json.gz": {"num_bytes": 318053254, "checksum": "865a124b663037f36a5738f25c82f8bea2ab54d4bbf8255ca0d1d00d76f8b250"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00110-of-01024.json.gz": {"num_bytes": 319794699, "checksum": "b17e210c8ceef98219ee12eba5dddd2001ded0d417c93955743c238360d96e76"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00111-of-01024.json.gz": {"num_bytes": 318761540, "checksum": "05be318a057bb33bf9d7faca58569cdb0880fe8eeb0fc3f57f5999d5f2af55fd"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00112-of-01024.json.gz": {"num_bytes": 319121509, "checksum": "858dce8e43b06a0c1e26ab3e4f109814b6cc50c6b0e4d146ec79fda001ad471d"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00113-of-01024.json.gz": {"num_bytes": 317916736, "checksum": "2e3968e48cb15a3326457d5a6ad49838d20d38c8138c529eee51f94e6bf269e4"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00114-of-01024.json.gz": {"num_bytes": 319319540, "checksum": "b72dc8207d93848f4fcb265b3e618d0eb8649445f7b9187c5165f4adec3e0708"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00115-of-01024.json.gz": {"num_bytes": 318863372, "checksum": "85ef0bf3cb12bc2fede4158853ed2259dff5d25adf99b43e8c35d7e0b9d4fdd3"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00116-of-01024.json.gz": {"num_bytes": 318898370, "checksum": "a0c82c8b48e086be7396338cdda0fed52e8c4753f04fd086b9472c1bedfb150c"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00117-of-01024.json.gz": {"num_bytes": 318153138, "checksum": "531d5d03fd8099806d92fbff2a48a0d68dcf46325e732e698e9c142902d152f5"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00118-of-01024.json.gz": {"num_bytes": 318966511, "checksum": "24b1c5ebbd07d50043be0d5d5c5427e042bdc53280825260226a2823e9b7546b"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00119-of-01024.json.gz": {"num_bytes": 318733748, "checksum": "ce1fb1192b770e625430798aee94c93bd748ed474ff815a7f95cadebb826161a"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00120-of-01024.json.gz": {"num_bytes": 319672996, "checksum": "4c2a6874921ac4a626a9c8ac4c6e91dae58f1f5b52e79124b3abf254b7433119"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00121-of-01024.json.gz": {"num_bytes": 318779046, "checksum": "029d3ab92f3e1724e3708790148e63b4c211d2ddfd04e3d194b24145e97c922a"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00122-of-01024.json.gz": {"num_bytes": 320861175, "checksum": "4bb595140e5cf92147f99b58d236634ddfafbc0b160b4c88b337255482611ced"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00123-of-01024.json.gz": {"num_bytes": 318338141, "checksum": "d508261be287fa3d27e5f44524e22870269054213b61011ee8a6728a77910cc0"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00124-of-01024.json.gz": {"num_bytes": 317655056, "checksum": "7612cb9fdd9f4b3a4f8958087ace120d4a73cf26bd16289bb20fc871f5744f2c"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00125-of-01024.json.gz": {"num_bytes": 317524610, "checksum": "049ebe4971811bb1fdcfd10cc264b2074b3ace18536340644e718dcc3cf3affb"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00126-of-01024.json.gz": {"num_bytes": 317902192, "checksum": "d97bddf003b8f647c587fe9a9a9aed75ea604478e0b550d501ad7f07b6061b86"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00127-of-01024.json.gz": {"num_bytes": 319243191, "checksum": "6da4c882f88816a452af54ed217f84d6e4601c11a8e33bd47c49c0a1ea04f49a"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00128-of-01024.json.gz": {"num_bytes": 318045852, "checksum": "ea43f63e6ef3bb5723ce75bb51f7183a525d8ccb00c93f49aaf2d9b560f7bdbb"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00129-of-01024.json.gz": {"num_bytes": 318436174, "checksum": "72ceb525367d6e8d1c0fca94d99d4fe5353ead08a5d52bf00e30e3b596fa90a2"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00130-of-01024.json.gz": {"num_bytes": 319017217, "checksum": "92f1b2687bee78441eeb4e05bbec2a491469b23c3aad0d951fbbe35a3c27998a"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00131-of-01024.json.gz": {"num_bytes": 319237739, "checksum": "0fd07585a82b7d71ddabbc315195c84e2fa78a8319de7dea971cfcc9b38707b7"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00132-of-01024.json.gz": {"num_bytes": 318123742, "checksum": "c9f5604ca28ea2a9ae5267db50f6e3d1e576841abe840134b3817f370c057073"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00133-of-01024.json.gz": {"num_bytes": 319009751, "checksum": "7ec982de577e0eeff57dc60346ce35a7b35b3c4f037987316cfc071b0ed58a87"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00134-of-01024.json.gz": {"num_bytes": 319750057, "checksum": "2619d265d76d82f6b84e2686371e5b6d6c08058cbd5765dd2906af9f549af092"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00135-of-01024.json.gz": {"num_bytes": 319068231, "checksum": "5e1bf5b09f2cd132a7747116442d6f26ce0002eaeb9f56fb02bc00e3abee8716"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00136-of-01024.json.gz": {"num_bytes": 317800994, "checksum": "80ebbf64fbd91215da553e3a8d9442380cee6c3b09fbbf8353a0817993d15862"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00137-of-01024.json.gz": {"num_bytes": 318954070, "checksum": "3b5d2ccafe526a19c52ac0fee50109b6a95ac3c8f7f2272a9a0302c4219e82f7"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00138-of-01024.json.gz": {"num_bytes": 318452853, "checksum": "2dd88569a62003383a3bf70d68143f16f234535469bdc8ab01a8764f6babb5fb"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00139-of-01024.json.gz": {"num_bytes": 320013821, "checksum": "f32ca62f6a9d2c8a72901e6f2c08880c2d1907f52beb4e8fdc30f4c02c7ad10b"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00140-of-01024.json.gz": {"num_bytes": 319510423, "checksum": "7799838d8019d7cd71a505951f155bdfb862b4a3b3b77e182c706a624617169d"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00141-of-01024.json.gz": {"num_bytes": 318339814, "checksum": "1601f6dbcbf4e7f1db119b232e862f3c9fe29e9abe5827177458079299ed511e"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00142-of-01024.json.gz": {"num_bytes": 318438444, "checksum": "71d891be156e1b608733a3abe8f8dab7a6213c02931117b99889bc3fe8329d38"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00143-of-01024.json.gz": {"num_bytes": 319413540, "checksum": "88fb2e7c3d426a6bb5775041658c07005a469306af0d97df7d68f148b64cbfe8"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00144-of-01024.json.gz": {"num_bytes": 319901095, "checksum": "2734ff57f4265653b0b1f292f513017ba791c3091cf8ac0bbf6d75d0074e3386"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00145-of-01024.json.gz": {"num_bytes": 318500183, "checksum": "da2e6747f7230af5941c6bee262a606b4f7792da359dbf7516d82d8301cdf90f"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00146-of-01024.json.gz": {"num_bytes": 319315120, "checksum": "6daac97153d51addc8b1e43b686e3d641666df3a106270a141d734079db2ad35"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00147-of-01024.json.gz": {"num_bytes": 320621434, "checksum": "fb2584e0ce366ad30c8110591484b84798e9f06e8a27cd864e7800b8d5e2d225"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00148-of-01024.json.gz": {"num_bytes": 318269045, "checksum": "1c963c0ceb6cd776822352b186ae7e3d829ef334efcba0fbdd9182dde4deed05"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00149-of-01024.json.gz": {"num_bytes": 318576426, "checksum": "6a21397e0104c7fe0fcd9f1d43a8e546000596d896a95eb9b6c4ab92235e6a49"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00150-of-01024.json.gz": {"num_bytes": 318447048, "checksum": "075b113a73e6e21d7cac49391ee559ee8aaa2bb3338f709017077a4007a7bbb5"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00151-of-01024.json.gz": {"num_bytes": 315388730, "checksum": "bd47e3ac0209676d8a32490eb20ca8c07ca3c45c2beb88dae18b5c8d925f349a"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00152-of-01024.json.gz": {"num_bytes": 319701880, "checksum": "241d9cf003f49d95168ebdeccd8209230507d4dfd0d170fa1b57d2355240a95d"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00153-of-01024.json.gz": {"num_bytes": 318370254, "checksum": "3aa86900a749224dfed8a67960c166e43c3b9ef3ac7b49d28129b496c7193e30"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00154-of-01024.json.gz": {"num_bytes": 320064875, "checksum": "3160c723cea6717fa9f5a9eb627d76107040d084a64106973099fa0e8de48758"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00155-of-01024.json.gz": {"num_bytes": 318089754, "checksum": "5b6e76a85bb1093eaba698864a54a938329b04494f9f72c3c3bbb155174da5e4"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00156-of-01024.json.gz": {"num_bytes": 320049467, "checksum": "cc013e8aa7c1cf7fc28ebecc64d893d03b092a09d725b5e626851de0b311c814"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00157-of-01024.json.gz": {"num_bytes": 319931950, "checksum": "2a27b4c29455bcd813a84aa3a54100d16cb6bfed25171aa3c552ea452ae569e2"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00158-of-01024.json.gz": {"num_bytes": 319963615, "checksum": "e477f769ea1513cf607932a29d793fdf1722cdea757e00c814dad594329cfac7"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00159-of-01024.json.gz": {"num_bytes": 319000491, "checksum": "ff5d09415753c2aa4b51196e8f4bd6c77ba100ab281314aede118f501565cea2"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00160-of-01024.json.gz": {"num_bytes": 319069618, "checksum": "e08c35aef8a20dccad80f6bb1579d6d2ce80113c8bf8459730c69fb7048c3cc9"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00161-of-01024.json.gz": {"num_bytes": 318750642, "checksum": "13eef84873b58e29894f9bf68a4de72a530c1bfc80a5654262fe71420292b8ad"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00162-of-01024.json.gz": {"num_bytes": 319847814, "checksum": "a8579c6bcc906fe018881a8474724576c3d0f7f1787f1568b79e5accbd9f962c"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00163-of-01024.json.gz": {"num_bytes": 320370365, "checksum": "b97a74837ab9f659c13dcb4deb53c600584beb9e5ceed29e99974c4953f644c9"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00164-of-01024.json.gz": {"num_bytes": 319894618, "checksum": "9b63afffa2b84c91b749991ddb384399f1d408bd7b6b643e7329e49531ce9a53"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00165-of-01024.json.gz": {"num_bytes": 320166197, "checksum": "5b2414477dc4e2b080b34f3b98672bfe3de6028e7ad83c323a7dd1ee08c05a0b"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00166-of-01024.json.gz": {"num_bytes": 319612575, "checksum": "2cda682db53000c14fcb5d251bae4f50c8c4159348f8594c3ef020260f277a99"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00167-of-01024.json.gz": {"num_bytes": 319183884, "checksum": "5c406d7a8a404436039fde7c2019f0174ff8855caff319fa62bb7960d341b41a"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00168-of-01024.json.gz": {"num_bytes": 319396348, "checksum": "df6a422d57a2e1443d10d61b13ab2c5227734195c82b43e1ead2db723cdea293"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00169-of-01024.json.gz": {"num_bytes": 319452933, "checksum": "81c81138e7163072e3779dd10ea8af7dff12b705fa008665298e08cfc2699f03"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00170-of-01024.json.gz": {"num_bytes": 317748609, "checksum": "6586ae8862b8ac925f424afb6ba779e95a147323fb83fc8c4bb0813877b17718"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00171-of-01024.json.gz": {"num_bytes": 319052376, "checksum": "8b3cd21d8ffbe963ce935ef9e0b6efc45f4d5abab703fdfed19a1309b700dca8"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00172-of-01024.json.gz": {"num_bytes": 319068859, "checksum": "a42f5f5a10bfc84d51dd0855166959462faccd6a182af4c5d2115ff9995f5324"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00173-of-01024.json.gz": {"num_bytes": 319142377, "checksum": "e26514c5d6cea27c0cf7fcc1daadfa6f218ef9e62039c6d6fccfc31660c0c96f"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00174-of-01024.json.gz": {"num_bytes": 319134484, "checksum": "75349aa8c734ed894965500eab2fdf59657a63e40e5a53e822ef1e5a12838a02"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00175-of-01024.json.gz": {"num_bytes": 318330467, "checksum": "a3d0d14b28a5a3cc559d6d89e2ec09e49e92aa189e44e68dbb4ea47978e1eca1"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00176-of-01024.json.gz": {"num_bytes": 318584643, "checksum": "dd68b42e5bfc656b71fe5701bacb929edae84055131f1dd65bbf3f3ad734e57d"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00177-of-01024.json.gz": {"num_bytes": 319275087, "checksum": "05a8ff159006241cf938ef27b292f65906158ac25ac28919aa6761eaa634052f"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00178-of-01024.json.gz": {"num_bytes": 318490550, "checksum": "a3aa38083c85baada29b207240bcca1a0d562a93971b420428d039092e58bd31"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00179-of-01024.json.gz": {"num_bytes": 319083249, "checksum": "12858fecd1dec728eba2c8c4311b17e4f2ac1fdb27c23e9adcd9258c5c4fc777"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00180-of-01024.json.gz": {"num_bytes": 319752094, "checksum": "67e968cb8d3ebec2f68eddfc539ea7402aa72c9274034494a43ea7d207b69a88"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00181-of-01024.json.gz": {"num_bytes": 320476195, "checksum": "c1bd59eb7ca799e31bf037dc7c087c1ad94e4f88a4f12427c454510d97e1c803"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00182-of-01024.json.gz": {"num_bytes": 318538551, "checksum": "dbe7205a1919dca9d6936158d5653a20d239f2e547ec73280956da4f8c609220"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00183-of-01024.json.gz": {"num_bytes": 319620265, "checksum": "46f9e603e04040b59df8da6ee01d1c30588aa7233a00526d6f0fd84c4172ba93"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00184-of-01024.json.gz": {"num_bytes": 318301621, "checksum": "880a02eabae231da388a5782a7194eef0d0211c2d1314db0c56d740647a114c9"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00185-of-01024.json.gz": {"num_bytes": 320515340, "checksum": "f522147aed30ebb3ab352c92a9dd24cd2e8b93df1d4c4a6284d89ceaa2858509"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00186-of-01024.json.gz": {"num_bytes": 318374733, "checksum": "5005f1c42038769e225a626a88c10bd4f6af98dcc14deed475954b00c088bc53"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00187-of-01024.json.gz": {"num_bytes": 319116182, "checksum": "cbd7e0f486c6dac13090cd344337da1c336973e7ec75e32b0bd5b18b98f24bf8"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00188-of-01024.json.gz": {"num_bytes": 318981305, "checksum": "064ce8c30b7a960b20720c133c3dd3281d27752a66def44d5133ff8f1b8279e9"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00189-of-01024.json.gz": {"num_bytes": 317036462, "checksum": "acc052da4501691fdd28f269c633ed826840f2634be49b5e2c5e1273de0cb4a8"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00190-of-01024.json.gz": {"num_bytes": 318061662, "checksum": "5a436e97c59b8636ca5081b71ca6fe8f8a3a99dd3f426c79edb2bf53345ee810"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00191-of-01024.json.gz": {"num_bytes": 318556228, "checksum": "2eebc89381ff78ae63f311c98b07853cefcc42fbcc210995095d568a6ff70ead"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00192-of-01024.json.gz": {"num_bytes": 317987733, "checksum": "99de46c4702c06a2303262b185b92fad82e12e189c923d5b76d9d8f96faabfa5"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00193-of-01024.json.gz": {"num_bytes": 320294532, "checksum": "bccb7d8fc34d6cd6eb41e2a1c6234596b00a5517fdca7c47562fdee0e675377c"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00194-of-01024.json.gz": {"num_bytes": 320852679, "checksum": "bb1e7768a57145fdbca7957ed964648d1deab5edc5dfad4722a81ad411c5e0f9"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00195-of-01024.json.gz": {"num_bytes": 319016077, "checksum": "ac520468a5bd933dbac1aa5f7f21ba276bdce15abf99963ef9d73af294e81e70"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00196-of-01024.json.gz": {"num_bytes": 319289881, "checksum": "9eec5740115ab52ce98ac9efbed4fa1c5c06787fe93b4b28f6a1e4df06272870"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00197-of-01024.json.gz": {"num_bytes": 320180232, "checksum": "07a03763b84b4a86b4f71d725927d62c40925823ee454122a00fdb625ddb3a22"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00198-of-01024.json.gz": {"num_bytes": 320004709, "checksum": "a1b250b01289fdaf6dcd997ef31c59c580f81f961aa0fd88ae0d175bd07c02ab"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00199-of-01024.json.gz": {"num_bytes": 321006991, "checksum": "650e57c3dbbf4ed929da8c6c5d78f35fbac4644722a84d98f93342a8d33b2140"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00200-of-01024.json.gz": {"num_bytes": 317913111, "checksum": "42caf6dee42bd73d9e4bf0c7bb16383caa936b2e0a913489b9f0aef57b6004cb"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00201-of-01024.json.gz": {"num_bytes": 317897148, "checksum": "990974a82de2b1c27465f6d097d7a5718c5ff334271e722ab3736e7aa5b89d4b"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00202-of-01024.json.gz": {"num_bytes": 319510250, "checksum": "8467066f2417af774363d4984a37968a0189adfe3a581723eab15004930e621a"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00203-of-01024.json.gz": {"num_bytes": 319762388, "checksum": "4e7e20980dea2d5e77f380b24580f0df9319a0d1d73ec319e17d8cbe044e53de"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00204-of-01024.json.gz": {"num_bytes": 317418128, "checksum": "2c027c5225ea7ce3c31f5f32dda12b7c892c6fdc9c52da6d0af749171cdce738"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00205-of-01024.json.gz": {"num_bytes": 320157174, "checksum": "d953e79c60be0e2c3b072c2186a845a351392ef395fa95135f47e6b8491c6f88"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00206-of-01024.json.gz": {"num_bytes": 320459080, "checksum": "bc70c34931942ca143f7eb555e86458afcc36110aa9559151f31d781969d4458"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00207-of-01024.json.gz": {"num_bytes": 317361718, "checksum": "fad5ebd7a81bb737e12e9d4c803aea1a9e905d43a3fa87cace32a64eef01e8e3"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00208-of-01024.json.gz": {"num_bytes": 319976693, "checksum": "21381c727d945d8d3b4a275e3622bce64b07ed87d7f2371ac28b5d2023359cae"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00209-of-01024.json.gz": {"num_bytes": 319550585, "checksum": "8b74e5f1780c4bf12936ac3a86be7a3d11287866522da8275aa4232c1e3d8898"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00210-of-01024.json.gz": {"num_bytes": 319574289, "checksum": "1594bd49cde9641b49a1ad9373a53e10d65440000363f7532a7d326d17c44236"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00211-of-01024.json.gz": {"num_bytes": 320615302, "checksum": "5b6f7eddfa3a9ffb0d6668d10f398b1d86482b64daa9817ca0af549433071244"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00212-of-01024.json.gz": {"num_bytes": 319395225, "checksum": "db58fa453269c794fedb595c6193dea5a85c72ff8b2d43e77c9bb371b8c86b78"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00213-of-01024.json.gz": {"num_bytes": 320131797, "checksum": "1d21d19b5e36820559590b339c049be29f27505ab4e88572edbdb84b649e0b66"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00214-of-01024.json.gz": {"num_bytes": 320153141, "checksum": "55c9b4ff1cd8cc88738196f867aba620dec3c8b27b9a485c7e75d3129d76e9c7"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00215-of-01024.json.gz": {"num_bytes": 320525443, "checksum": "dfe9f44676c1abf0e2875924c094c0d788f8a0172d641d5f810258e948e37feb"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00216-of-01024.json.gz": {"num_bytes": 320100146, "checksum": "57f19f5437b0428d9f40799af14f8bfba8f6c82ebacaea8f6fc7531524a6d4af"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00217-of-01024.json.gz": {"num_bytes": 320688377, "checksum": "fad4f3143aa303c9c35165a15c6d90087c204c586fe20b0c0f45cf4238311b70"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00218-of-01024.json.gz": {"num_bytes": 318896471, "checksum": "aabd471960d6db1e93e1129410d9138d9d9efa3292af7491b3b6844c2bd3f543"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00219-of-01024.json.gz": {"num_bytes": 319298204, "checksum": "f676701589e39802779a0947585638347bb4fe55376a33c6d0afcdc40c5f8938"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00220-of-01024.json.gz": {"num_bytes": 317757045, "checksum": "f3d0994379d244054c5e2db366a081caee28d301aa6b0d9431e7d9eb1cb38c30"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00221-of-01024.json.gz": {"num_bytes": 318568870, "checksum": "8026854c8a8cc1d16b52a898b9dd8a8df7901dd8cdf285f5d937c4d5d45919f3"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00222-of-01024.json.gz": {"num_bytes": 319096912, "checksum": "71f76f898864de3ae60f7c0cdbc68d53cbfa04b2f8493c40d55e1cb56727b275"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00223-of-01024.json.gz": {"num_bytes": 319350414, "checksum": "ba01faf3fe41a738c255b5da83daf53a5858144557af6c6f8d6208a049e4245f"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00224-of-01024.json.gz": {"num_bytes": 319007151, "checksum": "94200d12c61f7c73a9e3a2bb089a05b017a215348d52018a34e3224578c0da06"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00225-of-01024.json.gz": {"num_bytes": 319502985, "checksum": "0b7ce650e555baa546bb329d7f0567a3dc0a7ec9d49149792032a86321a73d6e"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00226-of-01024.json.gz": {"num_bytes": 317983607, "checksum": "40cf6d4b3deb05cd97ebed01405d08ae67be6e896736e4f371d15e5404567599"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00227-of-01024.json.gz": {"num_bytes": 320199564, "checksum": "e65ee475e3b6682b57bfa3f7b9c1cdabf36a7282fc793865df63dbe6a6a3d1fe"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00228-of-01024.json.gz": {"num_bytes": 318852183, "checksum": "8b27f2fbb0233802229fc776cfcb0b6b43af3149d217d0ab00cca0f1286482e4"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00229-of-01024.json.gz": {"num_bytes": 319407418, "checksum": "f2d5199a0022134ae127c88f0ac20d1b2b8a88014a774b5432b41085c83ecb5b"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00230-of-01024.json.gz": {"num_bytes": 320787790, "checksum": "e1b040895ac6068dd1aa892ec93d733096afc4adda698379006ef89926491255"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00231-of-01024.json.gz": {"num_bytes": 318220053, "checksum": "648a6349206c50c17d4e3562fd6fcb0a723b4cb40005890173d5de0c7ecc2ade"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00232-of-01024.json.gz": {"num_bytes": 319702777, "checksum": "0a44b7cb4f354e1eede683a697aba4051c1542fd030dd59767065f5f0204554e"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00233-of-01024.json.gz": {"num_bytes": 319154465, "checksum": "4070448b7844776db6754bd33791900bf9ac8dbd81e4cd774a3055ada67f6fac"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00234-of-01024.json.gz": {"num_bytes": 319846160, "checksum": "b1e8c73078c347fa062ed408e81bbdcb2f714675bab2c082016e822e91ef63a9"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00235-of-01024.json.gz": {"num_bytes": 317722912, "checksum": "d8aa694e870157b2b5411f496db46dc71dfeed01a42973a65499596921198abf"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00236-of-01024.json.gz": {"num_bytes": 318593592, "checksum": "e0c4ff6c8a12128da88777074d0b097664cf2f2395913c4d82b0eecd501946f1"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00237-of-01024.json.gz": {"num_bytes": 318902831, "checksum": "adce772ed699d7e908ae1fe1ddf1d9875305c7875c93cedf1b3ea0bbc21ff922"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00238-of-01024.json.gz": {"num_bytes": 318696723, "checksum": "926f9fc42cd248077afec1f4b88603c646fc5ae47c4ee3e9b8a5f6b8b6ff7f46"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00239-of-01024.json.gz": {"num_bytes": 318321822, "checksum": "439d756b0ffc97ebecc6c48a7dc90da77de7ada05a6eae929db98057ea15bef1"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00240-of-01024.json.gz": {"num_bytes": 318992553, "checksum": "1f57af6ff9477263806c0827c0dd8e494e103b6f54eec2cd5f8f8327b01ee39b"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00241-of-01024.json.gz": {"num_bytes": 319345185, "checksum": "493932a44e09f4b311ac5bdb519111fad0982708d4b467688f2b1105316544eb"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00242-of-01024.json.gz": {"num_bytes": 320108156, "checksum": "de5603f1b276f1373011c8884f06af017c71b03c5de3b3bb89cd6d550a0d5902"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00243-of-01024.json.gz": {"num_bytes": 319855563, "checksum": "7c1b74de8ae3699c567edaa6e2d1a1f1ae82f4810e769c710a23cd2dfc536c60"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00244-of-01024.json.gz": {"num_bytes": 318966332, "checksum": "d3ada80bad9fa776374878bc7504138e14c161bc9798ea8114b0d187d4c815f9"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00245-of-01024.json.gz": {"num_bytes": 319541864, "checksum": "3fe5f26e32795c49743d1b2497c333be57248c9db2ce12fb93e103d1a9595347"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00246-of-01024.json.gz": {"num_bytes": 318530369, "checksum": "a0bdeb2dcb5dfb46f843c4086230ba918f2d3ec125654cb924ea11e7c75cafbd"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00247-of-01024.json.gz": {"num_bytes": 319496627, "checksum": "0c4099f832ada6b24ef6c1d15267cd3c179f5b3d79e3d813d944e3ebea908c99"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00248-of-01024.json.gz": {"num_bytes": 319132981, "checksum": "608b1cd27ad345f6511fb677c00d56b6e827f288877d68aea1bcad3b02dd040e"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00249-of-01024.json.gz": {"num_bytes": 318529093, "checksum": "8fd580be09f913cc3809e3b0e467e2faf657a5db6f71b75aa931043267b9b0f3"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00250-of-01024.json.gz": {"num_bytes": 318248903, "checksum": "faeac675c3634b0834939046e60cdfad6a13558d7a6799c5bde25567898d86a0"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00251-of-01024.json.gz": {"num_bytes": 319184870, "checksum": "038972e03db75417fc4cb25e54c3aee01e4f022eb0fab202142f539e4d866e28"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00252-of-01024.json.gz": {"num_bytes": 319631399, "checksum": "2fda0c2cec4624c6068556e16630c3551ef3110759bed59628913a9debd547a3"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00253-of-01024.json.gz": {"num_bytes": 318275716, "checksum": "b5da4bfa564fcc6c49a573b90e679d60c4e222249858f4e58fdb3727a5f279ec"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00254-of-01024.json.gz": {"num_bytes": 318638865, "checksum": "279eb2978fe94e1570318a247b82487c04d7494ceed74dccb1d7a5734ea84e5c"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00255-of-01024.json.gz": {"num_bytes": 319640339, "checksum": "aa0a1ef845d0df7d81d2588d53f29205a4e3858a0888c1b7d9c83eb2fe1d32a7"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00256-of-01024.json.gz": {"num_bytes": 320353593, "checksum": "407133ea3b32a9e004b992a1bccade0440a39d0bfbd12993ea78c6526c0864a8"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00257-of-01024.json.gz": {"num_bytes": 318165587, "checksum": "72b7a72b8402b22cb51db44c9e7859460366c7c9d33e16a4c038ad07f7ad8f3f"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00258-of-01024.json.gz": {"num_bytes": 318003534, "checksum": "e5f9f2f74b7f9958dc9535f04a8965749ca4bd68005a6efa36f480fb487ca930"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00259-of-01024.json.gz": {"num_bytes": 318990454, "checksum": "7cb3c284613537fc6b1a85d7187dfca30b37a7a1a5708094f17486e3184e2d62"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00260-of-01024.json.gz": {"num_bytes": 319514850, "checksum": "0067e36b7156196e2451cdf78dc8832352f2481a4740afbef9046104b6810bdc"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00261-of-01024.json.gz": {"num_bytes": 318747661, "checksum": "b1e4597420035c355abe15efc576751169e2b5e4c38e073c178346a7202d5ab2"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00262-of-01024.json.gz": {"num_bytes": 319868329, "checksum": "374f4b951e545968da45b5055af2aa0b128c1d65d6c854f5b8f7e02d22c352e2"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00263-of-01024.json.gz": {"num_bytes": 319268788, "checksum": "7168e635a32859a85a152b29bcd1f699257ee4e340517e218ea9b8dac3922210"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00264-of-01024.json.gz": {"num_bytes": 319270640, "checksum": "1da08b65c83e79a0f5b7215e5a4ee58f21383b69f09dd9a3ba95381ba3d56d25"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00265-of-01024.json.gz": {"num_bytes": 318744354, "checksum": "0c908e81d59b2099eda038731b387a0ad86fa3d168eb2955413dde9cf29d947b"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00266-of-01024.json.gz": {"num_bytes": 318518406, "checksum": "115e375464931638de4af669b7301b6112d18b23835f2db2b092f47545b1a855"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00267-of-01024.json.gz": {"num_bytes": 318921711, "checksum": "6d66c715137885a46f2472489b21751284ec8ecfde6dca6be3ec1ee75f6cd5af"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00268-of-01024.json.gz": {"num_bytes": 317786222, "checksum": "588865d8f9d3da5a70c958997060ce4792e175c8fc5323f1887787070c8c160f"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00269-of-01024.json.gz": {"num_bytes": 319004956, "checksum": "163ec7497602931de2eaffad320704e508e491937a2965e39907a086f640d975"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00270-of-01024.json.gz": {"num_bytes": 319175186, "checksum": "794e0e7ceccf28457a8ed5b0724337545661da16feafd0a53e4823b2cb1c92ae"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00271-of-01024.json.gz": {"num_bytes": 319785821, "checksum": "9c9ec0348f7d4ffc61e5f19f1f60c8382b33ca2fe4b852567cbc3c16024a4627"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00272-of-01024.json.gz": {"num_bytes": 318933435, "checksum": "883d85985237948018b13c20f4d4ee567c6ee36a135b326e8117d73dad4fe37a"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00273-of-01024.json.gz": {"num_bytes": 318456664, "checksum": "fdca13067e8e118e538b8de538e164fb5397724045a5b1b02764510c8de90969"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00274-of-01024.json.gz": {"num_bytes": 318418161, "checksum": "27556558fe8a91a4aea4800ba9b7e844336a7638c5b96e652fcdb359f631b04f"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00275-of-01024.json.gz": {"num_bytes": 318437784, "checksum": "6ad4e6a3e1cee04aee3051a66531e3f4aa97f7bbb7602c6aa5f46a727b319f2b"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00276-of-01024.json.gz": {"num_bytes": 318470946, "checksum": "145a4d85ddf1e72fcdb8477dcd2f70a5554d9cd9349e02e058d3e7837204b6ff"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00277-of-01024.json.gz": {"num_bytes": 319580624, "checksum": "7116de0dbc5c7f6621f7c107dded9d85788937a87f2d56efca32ae9f25fc6865"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00278-of-01024.json.gz": {"num_bytes": 319619699, "checksum": "8dabdf2d26035d30c22204e6f46f292c58f4a4c3b0b77a1826a43341d4282df9"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00279-of-01024.json.gz": {"num_bytes": 319344020, "checksum": "c2b7d5bf62be1772c6bb80f597b28d948cf3cdefb10b6df6f777f0ab7d8fb015"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00280-of-01024.json.gz": {"num_bytes": 318997864, "checksum": "025457720b0045e7bf01f9b4b847f28ef94af9ca250675efeee73eeb340a3f36"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00281-of-01024.json.gz": {"num_bytes": 318718146, "checksum": "2979c0ac06570a9ee437521778c514bd8755193b9f1ae6a5a671ef885243f019"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00282-of-01024.json.gz": {"num_bytes": 318434530, "checksum": "a17bca50ec20c364adb899a9073bbe3a1505f81803a58190efc5d4f3f78b58be"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00283-of-01024.json.gz": {"num_bytes": 319317663, "checksum": "9034f524fc5c2e246b22e2dee00b47e0c4da0316bc60d0a11d966c28db917f9b"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00284-of-01024.json.gz": {"num_bytes": 318957832, "checksum": "f08b96047e711831dfb8a44d90cb712d3e78c98dd28ec6b937ee83949bbef5b0"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00285-of-01024.json.gz": {"num_bytes": 318643283, "checksum": "c5df1f2e2dad46d71f8aadf856a5139020da8afc2ee010d53c0372ea09b2362d"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00286-of-01024.json.gz": {"num_bytes": 318064839, "checksum": "16f7fd6abcbc69750b8131bca3e38ddc40bd7c86c48122ad2a9a77cb9cfd552e"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00287-of-01024.json.gz": {"num_bytes": 320328448, "checksum": "41e82bd357b47a28f28a4a203d5b54263aadb3c9a08899f78302c727c56d8b38"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00288-of-01024.json.gz": {"num_bytes": 319559271, "checksum": "970b9df224b58ca50b3023d92f6be0c37dbda479155c29c535e457ef6f2bca0e"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00289-of-01024.json.gz": {"num_bytes": 318786822, "checksum": "36a6515e7f516335d3fe057bb6ed9890a2aea033e08edd8588b3168b3445b2f1"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00290-of-01024.json.gz": {"num_bytes": 320634782, "checksum": "7d19fc82b9a5aa0e0046cd17cd2c46f356f8a4a7d203d5e03e1f319156f05cb8"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00291-of-01024.json.gz": {"num_bytes": 318746713, "checksum": "86d610d4590bca69281348dbfaaec9e704fd6194141c50c71e84aad51ce26b91"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00292-of-01024.json.gz": {"num_bytes": 320049630, "checksum": "d045df646213e29d4e7de4ec8915eb3b65bb962f35b0d74abf00889bd5aae8ab"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00293-of-01024.json.gz": {"num_bytes": 319966146, "checksum": "c66fff1a64b495211bfdcea650ff76115f8c857b9154c1b869062e702714b9ec"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00294-of-01024.json.gz": {"num_bytes": 318805332, "checksum": "ef3d9204ec85a1e65ae48af7924f614403d297a15f232ba41eb0e4fe223e507f"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00295-of-01024.json.gz": {"num_bytes": 318898465, "checksum": "2a071fc28b1216f2dc0579528d9b04e597b5cdac9fd14719e312092242da190a"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00296-of-01024.json.gz": {"num_bytes": 319406630, "checksum": "ea71e9fd444860d70d3728f7e2213a4bccf3aa31a164c9acfa8df7a0b6619786"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00297-of-01024.json.gz": {"num_bytes": 320312971, "checksum": "ddaeba8aad38b7e9727c579cc44f15b3c82d292e2901b47b785e9c8d3d5cdb9d"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00298-of-01024.json.gz": {"num_bytes": 320660744, "checksum": "814460ccfda29b45edaee5f44e3c980889aee2ee52e4e5323931ea489fbe938e"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00299-of-01024.json.gz": {"num_bytes": 319848186, "checksum": "3b91fe32d3a731a5be3bf778eedfe13e8a7e26ba9eda51c278c5212aa7925681"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00300-of-01024.json.gz": {"num_bytes": 319647278, "checksum": "1e0424631f7f354bc63b3e71c5c6516c85343dafd3896acb9560eaf93b672799"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00301-of-01024.json.gz": {"num_bytes": 319080252, "checksum": "46c21af013f611729cc06ec033dbae80151987f9098e57fb98e2631f6fe76c8f"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00302-of-01024.json.gz": {"num_bytes": 320028246, "checksum": "d1ca8ad6e5bd6cb18db1f1be9154dbc8ba9df7ca02db4c1f8a7df9d40820d8ff"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00303-of-01024.json.gz": {"num_bytes": 319388787, "checksum": "bce87161f77464adfb1fc04fc2993211bcec502d7172b86f726daf7096b04f82"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00304-of-01024.json.gz": {"num_bytes": 318627831, "checksum": "235b8085cbeb7b13f8e1a5f6d2225a9461b7bcd76e21466a189c2411ff4c4107"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00305-of-01024.json.gz": {"num_bytes": 318148428, "checksum": "f13f124e0ea150da13ebeb3390c311b3db54018de0d640579307bbcf2c46068d"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00306-of-01024.json.gz": {"num_bytes": 319451712, "checksum": "de5c3fa2cd6a47551ab43268484d017602e2c3e1f66f43f1a1d8f95bac52cad5"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00307-of-01024.json.gz": {"num_bytes": 319026244, "checksum": "88769fbf393671db352227a64cb8ba6b4ba60c5bddb4a14294b1ad9a65a750cd"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00308-of-01024.json.gz": {"num_bytes": 318447454, "checksum": "555bcfc0ba4db0551ce5ffb18057027ee695af166856125aeb79f7ce013851cc"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00309-of-01024.json.gz": {"num_bytes": 318147676, "checksum": "bf28e60a7970c548190cf0f4fe56f27ea55a1ad8313fa353a8013f0a0e7919f1"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00310-of-01024.json.gz": {"num_bytes": 318930650, "checksum": "45a68c0ef70ecd10838d604d51fecd26e5199f5372022b9c2af461a71c24c6ef"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00311-of-01024.json.gz": {"num_bytes": 319955339, "checksum": "fb3c4e93166f1cb2ccc8a7b68da0246f0827d3a81bb5614c8c84f1c01c6d53c7"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00312-of-01024.json.gz": {"num_bytes": 318554567, "checksum": "0dce2ac88ba7ac5340d551add9fe7b1a30772a6cc082347c536427b48daca598"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00313-of-01024.json.gz": {"num_bytes": 318978931, "checksum": "c5f99dab085fb705769a514626c9af8a26cf846fdaee4b403a3d6f84c892cb66"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00314-of-01024.json.gz": {"num_bytes": 318158197, "checksum": "79de4fa2aed5e3efa71e75d13f08d7c1869aa59f42a819f4429430b3db6c1b27"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00315-of-01024.json.gz": {"num_bytes": 319744521, "checksum": "5a47a89a1537662a91853bbe2a5b3e243f5de74489f820621192cacef192593f"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00316-of-01024.json.gz": {"num_bytes": 319861527, "checksum": "1cd34f17f3ae3c8bf8e1636714a9ff600a26799d5ec02ba42abefa5db9d00e5e"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00317-of-01024.json.gz": {"num_bytes": 319286030, "checksum": "a3e34af81264a72b523b63fdc0268f450675f7993fa0885eb2b4c747b0d6703c"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00318-of-01024.json.gz": {"num_bytes": 319054871, "checksum": "02fa8cf278578108083bc9a3c5cf07b0a9d243f2162397091ede6c85a1df31e7"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00319-of-01024.json.gz": {"num_bytes": 319943810, "checksum": "93ef0d7f1610043a6f7634af73e89ee9f3d7e87828ad34558a4d688e6fa6b6dc"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00320-of-01024.json.gz": {"num_bytes": 320037211, "checksum": "06fbd99a3d64df293db2655f321117f1afcf1cda51e421edef9335a25cb1a902"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00321-of-01024.json.gz": {"num_bytes": 318584237, "checksum": "a224e4d902f7368f91d6a72fc9f5730996dc37de576bc2211eb632e3690f1b38"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00322-of-01024.json.gz": {"num_bytes": 319686632, "checksum": "57fba28c7104ff659f8a0f330ae89c68d3a392dd14a78247fa357a3bcc8b94dc"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00323-of-01024.json.gz": {"num_bytes": 319834993, "checksum": "e61c760cd3c42f71a1a7bb6adc4e0bc970bbf864b69e2a4a5d56bf0a14d4e0be"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00324-of-01024.json.gz": {"num_bytes": 319243057, "checksum": "61d21ab1e7729f172ade5ab6c0dcaf07eaeaee6e047ca1c24722c06ddd919678"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00325-of-01024.json.gz": {"num_bytes": 318569583, "checksum": "2192a891ecc2a6aa9f6ea64f1d76ce763e0a3963ae03c95275ccd626171835ce"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00326-of-01024.json.gz": {"num_bytes": 319175980, "checksum": "d35e4d5f8e924ad97520db51a2c361bbc02097721195932b6768e7460df092a6"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00327-of-01024.json.gz": {"num_bytes": 319892298, "checksum": "ce967065d3915d466982b5258e07ad2c46b02d7637057e0547586657ea0f53a4"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00328-of-01024.json.gz": {"num_bytes": 318004026, "checksum": "0676d556f46b1f057669d3378c6fc335db6e3ac67a02e11dce3823658730f4c5"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00329-of-01024.json.gz": {"num_bytes": 319066225, "checksum": "b00bb4bda957e1287b98c432165448b3899f9155363f7b61bfd0f0181181acfc"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00330-of-01024.json.gz": {"num_bytes": 319268288, "checksum": "d14d1883941966ef3b35203d06e6fa1bb485dd77118bd7b6c811b0d06fa72fae"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00331-of-01024.json.gz": {"num_bytes": 319131311, "checksum": "4d5d41c2b2242b299fb67fa8c9327db8b4f612bdf4ee9af4d4e45aba8cd1e409"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00332-of-01024.json.gz": {"num_bytes": 318827508, "checksum": "68cea08d4805b392bf4c2894a4501ee3fbbe9aac4b1b6533e686ea749ced2dcd"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00333-of-01024.json.gz": {"num_bytes": 320572240, "checksum": "06f211ae2fe1c4eef5e41caceda8ebbc289261057911fcf2583a59c730b7951a"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00334-of-01024.json.gz": {"num_bytes": 318121862, "checksum": "46c62769e04ce8acde4562ba24d72e245babacdfb50600da4e6217948ad71d24"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00335-of-01024.json.gz": {"num_bytes": 318692168, "checksum": "dca69a6976e7387a12c8da16b696ed4f604254693a3280be0f90fa694700b595"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00336-of-01024.json.gz": {"num_bytes": 319479902, "checksum": "c52969fad97f1dc0e1e115428e7dad1ac6cb6d804db0cd34f0fc7846b1b50c7f"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00337-of-01024.json.gz": {"num_bytes": 319987407, "checksum": "2c570f02aa6a6bac96be1e02663996c87f9a94c160f22101ce8ae1d549ae1de2"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00338-of-01024.json.gz": {"num_bytes": 319051086, "checksum": "77132df95b147c471ead74bef16ed4fa11e15209f518dd460110132358816834"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00339-of-01024.json.gz": {"num_bytes": 319473192, "checksum": "7f3ac20a72d395c02ed3cb50052821521dc2d8d97303d00e0d0982e2c29e7659"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00340-of-01024.json.gz": {"num_bytes": 318423485, "checksum": "d1127da89e960d939cfc06cf1985df415b60d4bf02b12b7fab02b796100feaee"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00341-of-01024.json.gz": {"num_bytes": 320087690, "checksum": "f753423f82157e95506566d3653d32af6a181e69ea0e10b4d4eb24b626d3ca49"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00342-of-01024.json.gz": {"num_bytes": 319767100, "checksum": "db7410e6a6ca74163098681038f497faa373e1d81434b45c1a2f273d467c0a2d"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00343-of-01024.json.gz": {"num_bytes": 318389429, "checksum": "7ea1e432a1ffbed8f4ad6cb985c5cf1b2584d8eb7d2fa091a2db3f104a3f7210"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00344-of-01024.json.gz": {"num_bytes": 319117212, "checksum": "c7317a81a6224dec9be07b41134ac7a7db4039b7c98b2061b20bb59b82ed0a1e"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00345-of-01024.json.gz": {"num_bytes": 318504232, "checksum": "1498efe8280609d9d66c324e332c9433c6351bb7b99c5891a8f27d6841410407"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00346-of-01024.json.gz": {"num_bytes": 316721169, "checksum": "0cbc6b494d653878c9d52a37572064b88356058ed291aa773e5f47259fbfc722"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00347-of-01024.json.gz": {"num_bytes": 319007736, "checksum": "6265505e19a42a01a159297d33b1a91cd0e042a31ba6a1a867404a143ae565a4"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00348-of-01024.json.gz": {"num_bytes": 320167918, "checksum": "cc8b29deb44c8348aa4d05836f89cbae995c946f38d9cb8e7fedbd4762168ba0"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00349-of-01024.json.gz": {"num_bytes": 319901226, "checksum": "2a0f2188b43ffedc8b95a8276c7647147587c5e544c9e6475e790f4b5e362992"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00350-of-01024.json.gz": {"num_bytes": 318999223, "checksum": "1fde48c503998872aa71fc524c7408dc84cbc1faa0d885895d5c57708a15fced"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00351-of-01024.json.gz": {"num_bytes": 318935410, "checksum": "72d577eabcd814a7ff61b894b3fe9089f483a793e692d3ab20ce4ee59921f975"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00352-of-01024.json.gz": {"num_bytes": 318655907, "checksum": "8686dc0e4ff7b35cbc4fa6f3abce50c06f8b95378031c132a117e1d458cb4616"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00353-of-01024.json.gz": {"num_bytes": 320619683, "checksum": "cd5816469ef54bfeb0db6b55a78e0d34eb2e1f82448a41f67dfb70061c3ea91e"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00354-of-01024.json.gz": {"num_bytes": 319352400, "checksum": "bf082c093423d562da4984b1f0428225d853a05b5f8fb3696273f36ebb5a235d"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00355-of-01024.json.gz": {"num_bytes": 318868462, "checksum": "3b8baeca48e55a2cd268d6aef75f7eed96ef10fceca593a5179d52a2b0121f8b"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00356-of-01024.json.gz": {"num_bytes": 318903295, "checksum": "4c9a9926a4bad6721807d99cc02a9b6bd28bb0a6254aa1c15527b745c56a06a2"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00357-of-01024.json.gz": {"num_bytes": 318881446, "checksum": "84b4c2e05bc162fef4824e97ba7a03b1cecb41eda08a3e0aedd264b66e859a30"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00358-of-01024.json.gz": {"num_bytes": 318521100, "checksum": "aee99528ffd0323fe81e4ed26ed1b9295baa2a3910771dd2a42f4f378fd82569"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00359-of-01024.json.gz": {"num_bytes": 317796778, "checksum": "7b01f2d5ae54f60c2aeb7b96bd366d21e558e2dac48c83a78df9850f37e02f1e"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00360-of-01024.json.gz": {"num_bytes": 319502919, "checksum": "5b54f9a050e6f9008a1806101ea553d90eead56c949a5f3f46c8ccb88812081b"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00361-of-01024.json.gz": {"num_bytes": 318595505, "checksum": "49f4164d66187d46adff7f9bbac97b232ab7906d812e571c2e0bf028895e7f47"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00362-of-01024.json.gz": {"num_bytes": 318851572, "checksum": "17accad3c0706c54530f128260cacbf986cbbb20427d4ba8d3444a3702a22c55"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00363-of-01024.json.gz": {"num_bytes": 318555337, "checksum": "2327866e541aa6aa73f7289c3ad82a19ff154d39657d98cb78a2f481a8765920"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00364-of-01024.json.gz": {"num_bytes": 318641145, "checksum": "6f52354d804e8d4a1af1f6c2c6b759ae115c4f23a63f1206a73e7e25acfbdd02"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00365-of-01024.json.gz": {"num_bytes": 319212614, "checksum": "8f1834eeacc9bbdee95b1f0a4078eb9488bd1a7c5693489bff7943869674cad3"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00366-of-01024.json.gz": {"num_bytes": 319336585, "checksum": "a9cf01b76104eebb4ef8462a924f61c262fa197a7c68a50e48d925cb81586e3f"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00367-of-01024.json.gz": {"num_bytes": 319161263, "checksum": "5ac822027d50c3196026fbaffc7d968e1ca702b947688a6f4d268b942b5067b5"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00368-of-01024.json.gz": {"num_bytes": 317911640, "checksum": "f9acffbe3c6617e85911ff9dcecec2378b3469ab4546a6973cceb460f9003cea"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00369-of-01024.json.gz": {"num_bytes": 319585031, "checksum": "9234553649cfa5265c5a9ccc88486402f88eb81275067c51d9deef16bbe7211f"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00370-of-01024.json.gz": {"num_bytes": 318345879, "checksum": "2fbb410346d31a33e8532602f4e3340fcc75c96be803250e9f0f1a6894ca0052"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00371-of-01024.json.gz": {"num_bytes": 318996184, "checksum": "b069b0c8a830ea841e82077548706f286308ef0420e163ff6d8312c8853af172"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00372-of-01024.json.gz": {"num_bytes": 317989343, "checksum": "bfd62e448d4d9f89353abaa384007b0b72bd860402ade3a9d938051a6446530b"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00373-of-01024.json.gz": {"num_bytes": 319770759, "checksum": "e4e176250aceb7362ce38d496556a46409e9872e69f45166afe71aa750de8fcb"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00374-of-01024.json.gz": {"num_bytes": 319212902, "checksum": "28aa4510c3ddb9ee0ac56aab3792bfe5e899531919ccc0214a4b68bbf2ba18a9"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00375-of-01024.json.gz": {"num_bytes": 318968029, "checksum": "35326b1f2280e07dd754e89dfa29989d0dfa5c78995d393b36a752d8364bfcd7"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00376-of-01024.json.gz": {"num_bytes": 318685188, "checksum": "0060dbaccf7f2f956fb8b57891cb176914ddac1bc485dd86c2fd110c46d174b9"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00377-of-01024.json.gz": {"num_bytes": 319291982, "checksum": "99fc38654197e506868e099c15b2cb15b93238dafd33f81a7d069b3e01c3b085"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00378-of-01024.json.gz": {"num_bytes": 319259094, "checksum": "9b8d97f9d57dd97373c4f57eae2b9c01a58e49017ee41d3969e94fb4dbabc260"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00379-of-01024.json.gz": {"num_bytes": 320228224, "checksum": "82913f2d182d2a57f6c93e9b229862cb72feaa6331d04cd4419113e1eb9d52cb"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00380-of-01024.json.gz": {"num_bytes": 319738339, "checksum": "e0de43f754ab97d103a02c708d1cd7e771ba079bd9e1f7c532a80a30bd5182ea"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00381-of-01024.json.gz": {"num_bytes": 319210620, "checksum": "df74823f78564b544677410508e675e2811905c56afe2a60d19d3e049dd65394"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00382-of-01024.json.gz": {"num_bytes": 319810275, "checksum": "f5d5291a695fe2cd228213fa2bf090bf6513c49c6911826aa43ecaefec0622ad"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00383-of-01024.json.gz": {"num_bytes": 319190426, "checksum": "a861ae79a66b72d6cd5e0a030daae52cffb85ba1272c36ae2be04a9b7c0287c4"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00384-of-01024.json.gz": {"num_bytes": 318501845, "checksum": "b8d0f5078ae82980f0f64120530bbeb20f627be0a8629d68885acb867091417f"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00385-of-01024.json.gz": {"num_bytes": 319530458, "checksum": "7da119f3f63e25ff63cacd8ba0d77987b2d576be1f4b86e7e45aa3f2d194624b"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00386-of-01024.json.gz": {"num_bytes": 318938980, "checksum": "c21f3de56fab26d7fb60bdb47c216b22793f67b8fa6d382520c79b88d1896f05"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00387-of-01024.json.gz": {"num_bytes": 319207426, "checksum": "e28b0884092f75836eed4d73ed24b7403d7b0530fc389386a68887420b0c2603"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00388-of-01024.json.gz": {"num_bytes": 319835376, "checksum": "b4f0db632cc9af66e8aea109c80d73a6281207e29ece131d5bf8b57ff8f81262"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00389-of-01024.json.gz": {"num_bytes": 319346837, "checksum": "413a8d8df1f6cf3094839b57231da5323f33f7115768c65d83f0af1574f71b6c"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00390-of-01024.json.gz": {"num_bytes": 318632301, "checksum": "a3e8664fbb3ec2af5a217225dbb7fcf3e93b427e5da1a88e35c04c319d61e4c3"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00391-of-01024.json.gz": {"num_bytes": 319066082, "checksum": "e22eed3415c90510e97768be5a685e0a8035e2635ef773c56e9ce2718c278658"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00392-of-01024.json.gz": {"num_bytes": 318356286, "checksum": "ddbf325390648d9d86f1e7901b75c99fe8db538d203de8dfb4c304282f82cd74"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00393-of-01024.json.gz": {"num_bytes": 318048288, "checksum": "974fd05f356c86be2f9109b0272eee69c5b2eaf0b16104cc573846c925d13b4b"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00394-of-01024.json.gz": {"num_bytes": 319444683, "checksum": "0d27d6f8c3b935cef23ea60abfa82bd6a4f5e2e061080419dc9c6bc455b9f868"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00395-of-01024.json.gz": {"num_bytes": 318353166, "checksum": "24d9956bd857484ffbabb3ba6f6ac688f48a94b50228238c7c9153a5c6878a7c"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00396-of-01024.json.gz": {"num_bytes": 319960396, "checksum": "9425f4f18e1690ded866c4b5313cbac8a6210092dc42f720200b7143b69eabe5"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00397-of-01024.json.gz": {"num_bytes": 319030577, "checksum": "dee166674b835b9849d281a87238aa136e14d26edaa72d0ecb6b7e82d556a72e"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00398-of-01024.json.gz": {"num_bytes": 317664320, "checksum": "f85e08272f73ce4aa602719d59205db54d230a6b7247830d78f91eac63d753be"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00399-of-01024.json.gz": {"num_bytes": 319623875, "checksum": "85dea0672a0362a08503b70623907c8c92bd105f788fbd7f3816212a9181e7c5"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00400-of-01024.json.gz": {"num_bytes": 318840274, "checksum": "a104345698500611cd1a71a6647555300d315490918740a8c6e3b8dcff315407"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00401-of-01024.json.gz": {"num_bytes": 318336377, "checksum": "808327d156e183e102fd75cfbdb7b5a1fbde3740168f59b767ea380608305b67"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00402-of-01024.json.gz": {"num_bytes": 319270185, "checksum": "b6a5f7c1ade628091fe86744a6011147ec32795ad694ccbc82929791b93aa307"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00403-of-01024.json.gz": {"num_bytes": 318038520, "checksum": "108904ab05b3ad23318f8aa0f7ddd00d97aae1872fb157eea73273e011cbec04"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00404-of-01024.json.gz": {"num_bytes": 320933185, "checksum": "cd0c068c0831218849149eaab8f8a98748823911c745ca0ea33ae839bd625e04"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00405-of-01024.json.gz": {"num_bytes": 317694827, "checksum": "d99909ccd59e2ec183b41a7c6d1bd5677798bd7fd784ab681546a7bf8292f353"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00406-of-01024.json.gz": {"num_bytes": 317937468, "checksum": "c7f2bd7a366b8c389e41fdfad4891068c86039e1a5fc3b8a0b993253badf33d2"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00407-of-01024.json.gz": {"num_bytes": 320226074, "checksum": "765db6f9f0c8c3d9bbb0499f0010928fe4f90d5915dfdd3b6d09d3dc78ad07a9"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00408-of-01024.json.gz": {"num_bytes": 318613788, "checksum": "165e78c858dfaf010307392474d4917846c9d21658558912e5ffc915803bd2fb"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00409-of-01024.json.gz": {"num_bytes": 319212414, "checksum": "5f7d5952aad1ae31413962983971b2b422d77c262ededd2ce1c1e186aeb6d87d"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00410-of-01024.json.gz": {"num_bytes": 319023647, "checksum": "24588d41f40e3fe389575b97d41ef761be46bc9a9b3965c5e3f994760f7a4070"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00411-of-01024.json.gz": {"num_bytes": 318408922, "checksum": "b35d4ada5a000f51169557b00e508706d51a7becd33370014ff07c8b8dac1af5"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00412-of-01024.json.gz": {"num_bytes": 317166932, "checksum": "d3ed1cae269ebefe4716843bd7954bf7e44ee889f72066afbdcd95f4e1f06703"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00413-of-01024.json.gz": {"num_bytes": 318519121, "checksum": "07fc61a7e164301113201e78c99d40289d88e0b463048e14aa5fe69c7490ccac"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00414-of-01024.json.gz": {"num_bytes": 317417235, "checksum": "c5a7222b2eb8e8fe690f29a0fff7e214ba94e4d9dae62f67281fe25dd385b721"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00415-of-01024.json.gz": {"num_bytes": 319690993, "checksum": "37052fff729bdff124577d5ba041906b2ea7420c5cb28195e6cfca0e41d560c8"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00416-of-01024.json.gz": {"num_bytes": 319466518, "checksum": "6e8ce2b9e6e8208ad7e43ce709454cb0b96572d793e0b11c15892f5df18f6137"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00417-of-01024.json.gz": {"num_bytes": 319694381, "checksum": "20892d7a33c31d7967ae0cf595a2108de96a61c0bbd773aebc5d3d083f6ed93b"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00418-of-01024.json.gz": {"num_bytes": 319048918, "checksum": "fd795ae8d53e632bb3e89a2becc5b801e10db781b14f2c0ed50b12def5376c8e"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00419-of-01024.json.gz": {"num_bytes": 319791424, "checksum": "5a8e56faaa0892249e5694ae01e2e4dcd22d9750a9aeea5ca390117c77b8de2d"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00420-of-01024.json.gz": {"num_bytes": 318060925, "checksum": "795ee64f4c9e2e35d9dc0c91ea593c9e41a3924162901fbf782dc7112f8094a8"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00421-of-01024.json.gz": {"num_bytes": 319328927, "checksum": "2670b7b6b53e9082c90e4a4e915f72673831ff15e9f55918a1244e0c19c8f963"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00422-of-01024.json.gz": {"num_bytes": 320065363, "checksum": "34df2d1afac2ae4699524492d6b93e4a2a1e551cb4a4ae35fc19353930afab8b"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00423-of-01024.json.gz": {"num_bytes": 319349887, "checksum": "a2b19afafb45cf30493ac2a3eb013e136e7213f63bd633374ca0d9fe2780efe9"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00424-of-01024.json.gz": {"num_bytes": 317515288, "checksum": "ec2a84fb16dd16f9547f0c3314a91968324f2c537118ca36e982b235e23527ee"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00425-of-01024.json.gz": {"num_bytes": 319092219, "checksum": "1ac0b93c0faae7d446add3af3173637a4b0d638dbd5285b0f4e1bf3abd0d1542"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00426-of-01024.json.gz": {"num_bytes": 318421245, "checksum": "bade501dc71c0b4968a9a7c833751cee5d8f7067a45dabd53aa03534df48886e"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00427-of-01024.json.gz": {"num_bytes": 317847935, "checksum": "7aef554aa2b120c4d787395e28aceba743e309f2540fab283e077a1429a2f7ef"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00428-of-01024.json.gz": {"num_bytes": 318822008, "checksum": "cd94547fe1953a1cc074d97558a70d1e55834606379a8f5e6e60e1b15b56fd35"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00429-of-01024.json.gz": {"num_bytes": 318507684, "checksum": "4d3c9245565a808058293558603c657d6e9a0c87b6d2d4b871b856cea2eb3a19"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00430-of-01024.json.gz": {"num_bytes": 319042136, "checksum": "9c5a4fe50db5d0822923fe29a5aa8ca6cb09e3629472b1bf61f670388b6c2076"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00431-of-01024.json.gz": {"num_bytes": 318925124, "checksum": "8f18b35bb952da090ade742753e30861ba39c6c54c8ff2d76b358ca7be475ed6"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00432-of-01024.json.gz": {"num_bytes": 318680251, "checksum": "7968c370d0efa4601ab8b5ee68e480b211fb969593608bf7e00a0153f00f99b3"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00433-of-01024.json.gz": {"num_bytes": 317822797, "checksum": "f62d7e74434d52c36b22f6a8cd56ed3937ed6aa03f140d0fbdf5e360632d51fe"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00434-of-01024.json.gz": {"num_bytes": 320094364, "checksum": "55d7678c7e197e165b4e09bf3f8ac159853120acbe5801ed6ab3ab0f801c11bb"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00435-of-01024.json.gz": {"num_bytes": 319008936, "checksum": "09b451c8ee06bc06507b3e75a60c544a6b70f27e3d07daa29c59803f785faaf5"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00436-of-01024.json.gz": {"num_bytes": 319023456, "checksum": "6fbcb93f9dfe65e12b7efeecc8af7823471787438b1ce90e5f48b68b2dcb1d14"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00437-of-01024.json.gz": {"num_bytes": 319484997, "checksum": "9e70c8c1ccbfe93ec9296811ae496a518dcafbf38c81b7972f885e297da9e726"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00438-of-01024.json.gz": {"num_bytes": 320319141, "checksum": "eaab759d8c603e8a2ad3ebacd99e30338fb904ba307aeaba0d2e0e63679cfadc"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00439-of-01024.json.gz": {"num_bytes": 318410397, "checksum": "7a03a92bf97b6750941c1070f933c68f1b2a3e13fb68b3a21a4726676ea75d34"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00440-of-01024.json.gz": {"num_bytes": 319447470, "checksum": "bc899e436da7b3bf13c1bfa2fd2bbf9d90b42a0c00f2971259a14d858ca3e5ef"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00441-of-01024.json.gz": {"num_bytes": 317582955, "checksum": "4d777860c2750e43038ef709d77bdc403b3b3bcf0f08e3c4562952c9ac70b113"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00442-of-01024.json.gz": {"num_bytes": 319592118, "checksum": "d9e5dc244bb6f0b629b2a929aedf506dadaf5eacc80f0997816b95279552fe8d"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00443-of-01024.json.gz": {"num_bytes": 318104403, "checksum": "56133bbd7cf96dbe87d48898b886a024af69ca405d7cea1799bbd30f185e9c1f"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00444-of-01024.json.gz": {"num_bytes": 318547808, "checksum": "8be0270c3cc96dd7f7b3aad08bde81ea245feff4a09923277fb0d38a7c095604"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00445-of-01024.json.gz": {"num_bytes": 320463920, "checksum": "e02316fcd355914e4d08ecf37036d4727ae9ebe45bdc5c98279aa3437c2c1eb0"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00446-of-01024.json.gz": {"num_bytes": 319583221, "checksum": "80c9b8c47665b2cef6c291b0eefdac5b14be1d7cd4a4c06c2e14cf48b42da92d"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00447-of-01024.json.gz": {"num_bytes": 319546881, "checksum": "a18d5aaca1717ec33fb1822a633268003bf88093dd7b48db080503c3d01b6ffb"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00448-of-01024.json.gz": {"num_bytes": 320234711, "checksum": "c41595d2b9cbf0e23fd65df1cb51499ee262d345d79d2625388cf149c3c39f8c"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00449-of-01024.json.gz": {"num_bytes": 320043698, "checksum": "3bef99334be9d39f41296f8f134c88f04fe66502da2d2639f0d6d2485338e607"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00450-of-01024.json.gz": {"num_bytes": 318033740, "checksum": "9cd05b1b70ffc3c004b4b4a2f21f91abee1395f3a485efd1aafda550193df9fc"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00451-of-01024.json.gz": {"num_bytes": 318549622, "checksum": "b2ef6cc4ac7c4c69fb1661d7ed9b2ce4da261c72f9e49dc3c934180501ef3a24"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00452-of-01024.json.gz": {"num_bytes": 319317230, "checksum": "89927f1fd79a5b1439988fd37e0377175176d9ed22d14611f67a81e185a336b3"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00453-of-01024.json.gz": {"num_bytes": 318952561, "checksum": "427f55bbcfb6c1a0ef12f96cb122f362b975169770ce1d392b763c4b4408cb34"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00454-of-01024.json.gz": {"num_bytes": 317545286, "checksum": "2fc3b172ea721bc92b0f7614e8fea61b0781e6f4f3e6b7263cf0190beef3ec52"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00455-of-01024.json.gz": {"num_bytes": 318975631, "checksum": "c96f688ecb19bdb1592b0124021fb80d48965303442de76751d82fa03ab8f6d5"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00456-of-01024.json.gz": {"num_bytes": 320016575, "checksum": "61d2be7a4b9e34cfb994ae2c120ed5a51a6669564046637445a46b9872812416"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00457-of-01024.json.gz": {"num_bytes": 318236935, "checksum": "a74dd51c3c490458ea0e61196d7e0085aff80d50cd149a673f54f661b364a671"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00458-of-01024.json.gz": {"num_bytes": 318495925, "checksum": "adf9cd717f2c79504dace22b5929d4c4064353e869457c20cc81a0b2db390c89"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00459-of-01024.json.gz": {"num_bytes": 318956821, "checksum": "d7be5bcb738a75586125e56a25aa234618528accda620eaac421beab6288b992"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00460-of-01024.json.gz": {"num_bytes": 318968681, "checksum": "6181280df5418fd9ebb52aa26a631100b6c3da0750dc5fbae152a6a44fccb942"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00461-of-01024.json.gz": {"num_bytes": 320810761, "checksum": "5e943c458674371dffb2466274b8f2a9df9902a370901ef97992bdf920cdae0a"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00462-of-01024.json.gz": {"num_bytes": 320154899, "checksum": "76b3d1b120cbb7cd71d004440e0c6bd9f9c4395424c568e8362973038017a90c"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00463-of-01024.json.gz": {"num_bytes": 319247449, "checksum": "9de2c86d85289113b24c2f7eb4771ec1391511930f5f26a12133d41faf0ce908"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00464-of-01024.json.gz": {"num_bytes": 318150152, "checksum": "85fce3104ef0b247798c1de8d9d616d3de754841fb6c49a01cca5b9da5efa94e"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00465-of-01024.json.gz": {"num_bytes": 320342803, "checksum": "ddf312f0b8de8f53ed556483fd998ae308d4829d18195a48869db6bf1866c332"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00466-of-01024.json.gz": {"num_bytes": 318619029, "checksum": "01239a1ff6ffe9032da320c5a7d1a93125d0724851e3e10746821c9452070887"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00467-of-01024.json.gz": {"num_bytes": 317677227, "checksum": "41783d20189a4bcfc33f543597a5473900e692ea13fa522f2724e27e810b4e9c"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00468-of-01024.json.gz": {"num_bytes": 320038217, "checksum": "7131b6f4dd423f2efe55c3f598893676300b31651cce7eed32ce633a015f8ca8"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00469-of-01024.json.gz": {"num_bytes": 318359701, "checksum": "925bc76c045f25532414f29820adb0cf1a56c54b406333a6f348c29e5efda9fe"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00470-of-01024.json.gz": {"num_bytes": 319329235, "checksum": "9be740483aa7bbaf94dce550f2c20404c89326f6ec4ebe1b7070f85f93507038"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00471-of-01024.json.gz": {"num_bytes": 318792779, "checksum": "0e3d9492f15dc9867bb0dc803bdf45608fbe67255014b4488902d7bf2e2554cc"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00472-of-01024.json.gz": {"num_bytes": 319552622, "checksum": "00484bbc10bace3dfd93b57fc53d6f5fac26b7dd54fd5b5428d75eb9e6dbb0e2"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00473-of-01024.json.gz": {"num_bytes": 319466828, "checksum": "5db5d585798e8ed8e4a3bc540871f1185f67125f397a12942d21b24e6b374519"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00474-of-01024.json.gz": {"num_bytes": 320014669, "checksum": "db07fd0e972c1a474806c1b4464ad4cefdd2e8fc15806ba0d259d4f9e594c3f1"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00475-of-01024.json.gz": {"num_bytes": 320379280, "checksum": "e6e36a9eed8be84c928980fffd8177b177182726c9e13b41a47343d431f76a7b"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00476-of-01024.json.gz": {"num_bytes": 318820301, "checksum": "0543ed2d0b3aaba0b0fccbf0311836143bd19175c5eed9bf0f024ffb9ce3c50a"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00477-of-01024.json.gz": {"num_bytes": 320577830, "checksum": "a62fd62ad771dbcfb7af73841e15a49e9d7239c53dbbbd84de2282131bca9c99"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00478-of-01024.json.gz": {"num_bytes": 319593908, "checksum": "beae9334a8e93e4b036c4a9b3c5b3a75fff17264177184d243d9e6da286dbe2b"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00479-of-01024.json.gz": {"num_bytes": 319728825, "checksum": "ae5b475c7be35d98b77d6c4aed5d61cbd1c98544c9a6e73a53ef2911757ab7f0"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00480-of-01024.json.gz": {"num_bytes": 319903674, "checksum": "51e0611378455d909e8b0f292eb62038848aa7afaa4f93c9c83061258b211a95"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00481-of-01024.json.gz": {"num_bytes": 319998409, "checksum": "68c640304ac952f544ea88c88d7c994c8d2955b95036f8352a67b57a836fa1bf"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00482-of-01024.json.gz": {"num_bytes": 319047238, "checksum": "74cefa57158d0008a06ae85b2a7a1c04d57a79b7ae3f7b4b3426dbe9918b36ca"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00483-of-01024.json.gz": {"num_bytes": 318775875, "checksum": "e99faa71222017521f1fc9999bbb0832df5c91f8b9f6e2ef501d3f827d3a1e85"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00484-of-01024.json.gz": {"num_bytes": 319190491, "checksum": "4518faae7c9d51a51f0b02cd895cf27e7c87a623b787346c844a8d9f0b52d6ce"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00485-of-01024.json.gz": {"num_bytes": 318974502, "checksum": "1bc8b207583b9f36169e0e9facd258de8eb73dee8bf831051dd1ab04b7726c6f"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00486-of-01024.json.gz": {"num_bytes": 318599424, "checksum": "0b1d9900e1921483b85305491f914b6b78fabcd0686a20695e61b89b7380a894"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00487-of-01024.json.gz": {"num_bytes": 318958015, "checksum": "c0c789c5f3b34d170d2aeb72642c70d2fa5eca567e7850d0c89b3d170f3bbf64"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00488-of-01024.json.gz": {"num_bytes": 320205671, "checksum": "6eef7a1ea80be43e84cb0c974215a477c909844899ac694afe1af2e8f4ac171c"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00489-of-01024.json.gz": {"num_bytes": 319193967, "checksum": "eccf5d7f682a76e11332f07e7d54a080f76c0be58a98a853a9fe90c815a22087"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00490-of-01024.json.gz": {"num_bytes": 319833603, "checksum": "afe99e32ba36134f23b59a2ee43965bf185432de947740fc19e26eef41027aef"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00491-of-01024.json.gz": {"num_bytes": 318912982, "checksum": "e981151b23b233bd3e5798f78658b5f52a73f69db39c30615f615069cf0c4984"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00492-of-01024.json.gz": {"num_bytes": 320057824, "checksum": "0cc5f7df318e0718fef93d24e7ff904b3e8e2728c4fc0b1d13893c81d8e6e2c7"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00493-of-01024.json.gz": {"num_bytes": 317967559, "checksum": "93749543b04a5a7093177d2a03acfc0bf6f26d5b53864ae35839a9421fb48169"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00494-of-01024.json.gz": {"num_bytes": 320426917, "checksum": "e461f56b461a4d5ce353c60889dcb99e10818985d3788440c6119bb145876277"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00495-of-01024.json.gz": {"num_bytes": 319528392, "checksum": "e530f3030ddbf7191bc4082e8209f63eb48733d7085d79a8469ce3611ccb79b9"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00496-of-01024.json.gz": {"num_bytes": 317570766, "checksum": "ddec34b528bd5314019d12089e600df27e781d78f43b6722b9c0202ccf385755"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00497-of-01024.json.gz": {"num_bytes": 319154838, "checksum": "e7438a08000fc7a158f887755cc496edcf51c8bdf2bc4a888ddd2c829bf8fa3b"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00498-of-01024.json.gz": {"num_bytes": 317955368, "checksum": "ad133d808ca5b6181bae1921ab1261d79630c09bf9d6c904db036f22e6f32e6c"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00499-of-01024.json.gz": {"num_bytes": 318286671, "checksum": "cb40879ea08db5a9eb6f2c23756574bda34deb9acf039b992f0ab90fdbb01594"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00500-of-01024.json.gz": {"num_bytes": 318510936, "checksum": "21e5f7468a907f38c3dc0a5c19f09921476f9186beff967e829329f191dad6b0"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00501-of-01024.json.gz": {"num_bytes": 319611074, "checksum": "38829434c8539bb9fa9ea32bfba3c6732c5021ffb60c16fc502fe61de83906ce"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00502-of-01024.json.gz": {"num_bytes": 318630954, "checksum": "22d1ca1edae179d2587495fcdf1d3e515c6f547cebafc54996c93a121731fd8d"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00503-of-01024.json.gz": {"num_bytes": 318253198, "checksum": "e95689993390086880e630ec4540e0629551076c0cad2c70f5aedd3aebfec181"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00504-of-01024.json.gz": {"num_bytes": 319497151, "checksum": "0cd7b986d247e010fd76fa2ab2b62d5f9eec292b28c1e7bd3e4c577042b598af"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00505-of-01024.json.gz": {"num_bytes": 317498965, "checksum": "f1504912fc53cc3690e26ec3babf736ddbeb8f7d9196dac83f757699310b30ad"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00506-of-01024.json.gz": {"num_bytes": 319684193, "checksum": "9f6defbac132e097cbf7cb7d181cb154bace6af48964fe09d111bc610fdcd2bc"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00507-of-01024.json.gz": {"num_bytes": 318394726, "checksum": "a58f39d0bef19abefc089342d8bb6d75dbb2c663f67127673ec395404bcf15ae"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00508-of-01024.json.gz": {"num_bytes": 319013108, "checksum": "176443b39840826bfb1db2cef2541449a6fd0c465ff9bbf0cb2479f07fb8baa8"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00509-of-01024.json.gz": {"num_bytes": 319832758, "checksum": "cce5a142cd7a121eba8c182d499442f4b0a397ea1484c33ccd79b1acbae832fb"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00510-of-01024.json.gz": {"num_bytes": 318762241, "checksum": "bfc910625f0fd6074955906bb86e789b0d0adcd1f8956cb8da276933dceac256"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00511-of-01024.json.gz": {"num_bytes": 319240643, "checksum": "ce53021b90d1c86e2d46293e7053aa174387d7408bf0cf907898be69b1a7befc"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00512-of-01024.json.gz": {"num_bytes": 318353376, "checksum": "e9333c6f73c30c9cb7f31794025eb9129455fac2edd64f8b3f22f879124c6a85"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00513-of-01024.json.gz": {"num_bytes": 317653011, "checksum": "d9450c6f541e82922b37d3b7cc25611707b44884f27825db4dbd65466b59e8b5"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00514-of-01024.json.gz": {"num_bytes": 319391160, "checksum": "20b77f5fc2a939fc291f901e8774acfbf04ffaacb08192b724673eadc9f83c12"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00515-of-01024.json.gz": {"num_bytes": 317994258, "checksum": "32ca1f60d0deb395538a93ce5044a48fde05864f2c26af42dc53405b6dc05031"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00516-of-01024.json.gz": {"num_bytes": 318786801, "checksum": "eba4f34749eef4da2b0729abbdfa2ada77bd65383c01213d4f86625670430a65"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00517-of-01024.json.gz": {"num_bytes": 320010732, "checksum": "617765f971b879182db7debf879025f8dad4fd8846b11728ee1230767c031c04"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00518-of-01024.json.gz": {"num_bytes": 318681019, "checksum": "6987893764c56b84fca014532824a05d4187db5c313be4f7bdcb363b7e8cc8db"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00519-of-01024.json.gz": {"num_bytes": 319951543, "checksum": "ba151c4734db52e7c220dbefe380825ac6d66a9c6abb901b8096a87d97a2deb5"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00520-of-01024.json.gz": {"num_bytes": 317948056, "checksum": "7e53ed26c3c068b0dedd026219b7cdab79775545ebbf31b5dadadb45364c9985"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00521-of-01024.json.gz": {"num_bytes": 317993802, "checksum": "4d1d4a5583430e373bd2cfd191e59cd8911953fbd73fa924e0c15be76499b54b"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00522-of-01024.json.gz": {"num_bytes": 320189449, "checksum": "71d851498785e312acf93861a43169794d4d576f5fe8b960303419316c8c898a"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00523-of-01024.json.gz": {"num_bytes": 320443871, "checksum": "587867d619115c2accb69322b197239b79f12de41ae80427fd369813ad8d81af"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00524-of-01024.json.gz": {"num_bytes": 318192840, "checksum": "7324c02db00b06d0f41d6e5ebfa4e4dd6554f5f4849d6de187ebb84162d0446d"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00525-of-01024.json.gz": {"num_bytes": 319294602, "checksum": "24ae3495e5b59883967c62b8fb3a4fa7525d33c40957fd5fa3be413d66c24eb5"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00526-of-01024.json.gz": {"num_bytes": 319783465, "checksum": "27cd95e7bc6a3f156f1f8f26dc5e490818fc4810562e3964a19fad401cceacd2"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00527-of-01024.json.gz": {"num_bytes": 317240081, "checksum": "6b84920fe7e28c01a03800512915c7a9e47816267ac652f9ee0314e3428bca72"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00528-of-01024.json.gz": {"num_bytes": 318320694, "checksum": "fec06589f714ffe1343cb6781898e29e5d0cb789deba3aa4a4ccf86514d3f690"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00529-of-01024.json.gz": {"num_bytes": 318391515, "checksum": "a98c34c04c1b6f0ca3acc9e10fdf4bd0ead2ea7271832ce4972df8677590918b"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00530-of-01024.json.gz": {"num_bytes": 318473966, "checksum": "1677d541c7bc10971c711f1eb030faa2e85e0967112ba57d7f04712908e4f040"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00531-of-01024.json.gz": {"num_bytes": 319463272, "checksum": "92b5d82a058554d3396a2b54504f45fa88581cb2951140c0f0bde67ed11bed0c"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00532-of-01024.json.gz": {"num_bytes": 318228175, "checksum": "291bb3d7613f7f00b6910a0de78dbab0d87602243c9c83014de341c131200853"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00533-of-01024.json.gz": {"num_bytes": 318966937, "checksum": "a0ce39eac6d6ecad3478373c264e88b2ea20b77fb2049537c229ad3da2769c85"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00534-of-01024.json.gz": {"num_bytes": 318968162, "checksum": "387db79d4aacf8fa4c512fb78023ff94a43d5d597d5a8c2ec6198e62e4b8c98b"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00535-of-01024.json.gz": {"num_bytes": 319253588, "checksum": "3ff8f4a926fdfb6201a94d75c17ec5afe662a339a65019eb5e1193c1238bd388"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00536-of-01024.json.gz": {"num_bytes": 319662526, "checksum": "0c805e83d8cfd979701df5714713d062e14853d7e2b0f77c0b414a626686cd33"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00537-of-01024.json.gz": {"num_bytes": 319177095, "checksum": "f9a0ac216e316075e5c2219449a954f989eb160ead2ca07ac9f3813274e18f2e"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00538-of-01024.json.gz": {"num_bytes": 320109104, "checksum": "a425ef4dddefb40bac5a8cd3191161a41737aea5088a614410d10d83bbab5e37"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00539-of-01024.json.gz": {"num_bytes": 320600564, "checksum": "3580ea8da9c4aff1296e89136c5d7f1a37d021e0b10f3ebd1e05612c092faebb"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00540-of-01024.json.gz": {"num_bytes": 319993281, "checksum": "ad8dc83bfbe7c8976f08708c5f0229cd4e1a2d80e272b225a8d208133b129dfc"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00541-of-01024.json.gz": {"num_bytes": 318256020, "checksum": "c7452669237323fdd09ce97624791a0261f3ec07d8a5f98e71a4b1252a2805e1"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00542-of-01024.json.gz": {"num_bytes": 318843744, "checksum": "1e5a11c25f82ce717302dbcd9acc1f8b916d83eca88d345d8434b1f88768137b"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00543-of-01024.json.gz": {"num_bytes": 320482002, "checksum": "bbf96edf50c913d5162ee154423242e7c8faf490ba229f325bac98a5e3eb9477"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00544-of-01024.json.gz": {"num_bytes": 319059260, "checksum": "22c04506b5744df8c71727fc6527fa2bc495a10a237c71762c66d09625d34097"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00545-of-01024.json.gz": {"num_bytes": 317874034, "checksum": "84a78bb62eb6f72de7a75325870d9ecd419f77c4f6728d29609b2f7ab1b8bcf7"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00546-of-01024.json.gz": {"num_bytes": 319891407, "checksum": "28631c527dc398c9626fc60b39ad94ed880b41c71f55b9c7c670f6a1837f98d8"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00547-of-01024.json.gz": {"num_bytes": 319361268, "checksum": "273b8598405def0165ceaf9723d1425c9b74368fc22a414616c7ac9327930225"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00548-of-01024.json.gz": {"num_bytes": 318360761, "checksum": "59990568c0ea055fab27f2b9cd028e1c7177df0479712d1e2d8372e9b017ccad"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00549-of-01024.json.gz": {"num_bytes": 317320452, "checksum": "fd1e361f28cf099df6088e26d06d79f7f62bd8bd89b4524b9baa80ea49a1a4a6"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00550-of-01024.json.gz": {"num_bytes": 319017444, "checksum": "4424833afcb143f6fdbfc2f5fa2508d6226a4a1df391969b2a751d2d0070158d"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00551-of-01024.json.gz": {"num_bytes": 319118159, "checksum": "77b78f94a8bc8f905cf8b1997df1fc3b8c6d77ce65fc28bef68c6083275a832b"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00552-of-01024.json.gz": {"num_bytes": 320058125, "checksum": "e7b71167c4ad947232b6acba26e4d3cc9214c25b50b853b5745333bba942f50f"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00553-of-01024.json.gz": {"num_bytes": 319220671, "checksum": "ce7891f3820ce065e3bd7afa006e90889428c80bd8e771d66fbbf023bb2a9eba"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00554-of-01024.json.gz": {"num_bytes": 318858928, "checksum": "015a707235f46f179a08d3f6674b6d368dc9612841e2bf39f700f11fef8e64c7"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00555-of-01024.json.gz": {"num_bytes": 320490725, "checksum": "041dd2e902ed04dfa143476da03d5fd00c30ce1259c0658150af5b77a5a092c0"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00556-of-01024.json.gz": {"num_bytes": 319863694, "checksum": "22e3d9e4dbdf2b1b822a7bc8c889f4747aa16c71f4c91436d028a228bffe4b87"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00557-of-01024.json.gz": {"num_bytes": 318940362, "checksum": "4cb8b113ad9687b7dee590242c5f50fb3ea3a8775c67492a8ce0cb5c15fc26d7"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00558-of-01024.json.gz": {"num_bytes": 319797786, "checksum": "ad157a34c6a8d496859f55b00c79fcedf7305d8502ca86a511026f39cdcaca59"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00559-of-01024.json.gz": {"num_bytes": 320156705, "checksum": "816d84753b71fae446428587f41de5b3490e88321f1fa0cfa2ef1fd5eef851e5"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00560-of-01024.json.gz": {"num_bytes": 318346216, "checksum": "0b1b3d26316f2c0e973ff19820793bcfffa957c3869f74f62fb40cb6839227e4"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00561-of-01024.json.gz": {"num_bytes": 319571572, "checksum": "4f92594382c897bf94211f1446dbb38c2cc1fff3647acba731dfe0ad89ba4061"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00562-of-01024.json.gz": {"num_bytes": 319453711, "checksum": "2a6ba0c64806add776081f417c8d1afdb324dd8b9aebb603372afd7fc2c4cd6e"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00563-of-01024.json.gz": {"num_bytes": 318990092, "checksum": "e3032365b9b86883c24bfe387d810c2d9fd1d0a55ff88acd1f5b5357246b13ba"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00564-of-01024.json.gz": {"num_bytes": 319491917, "checksum": "da6196ab8650fc9f8fa391b821ff070070946412277bd423c40d9fa1de325f93"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00565-of-01024.json.gz": {"num_bytes": 318756269, "checksum": "edeb5b13aa0d65354d78a5ca5d1698732e95f1fcba249c42825a0351d4a34f79"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00566-of-01024.json.gz": {"num_bytes": 318461036, "checksum": "f179addbca50d8612612b0e09138d7ecc89ba7ef2d6e857d7ef0b10223dc71d4"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00567-of-01024.json.gz": {"num_bytes": 319625728, "checksum": "eaa1d0ee28eb17c6ebe3d85c8af8b7adac28a720b2975f86ac83f3f4d2bffbcd"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00568-of-01024.json.gz": {"num_bytes": 318428567, "checksum": "3677e88545f2d76b601995cc3e2b6b12fcf65e350ed7eb4137ab4beef3d475c4"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00569-of-01024.json.gz": {"num_bytes": 320114923, "checksum": "2d8810d8bcfc0fc19d82313be6516b2fef4cf68f56b0448af48b512c98e1ae8c"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00570-of-01024.json.gz": {"num_bytes": 319148416, "checksum": "8e5356dc0fa2b4e5fa16b36a1586f16920306af1227c765e5d2f0818e74d30d2"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00571-of-01024.json.gz": {"num_bytes": 318223973, "checksum": "c87cf8b88e8e4fc0a664f4b3a381b78b317680253a83a672cb86e02adb43f2aa"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00572-of-01024.json.gz": {"num_bytes": 318322508, "checksum": "2bdc857dfeab99c8f83f0267ed5ed7529bca8ee086fce268534bc0264ff738f6"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00573-of-01024.json.gz": {"num_bytes": 319203246, "checksum": "564fc77dec25ce0d47f4e3d8d04bf114dc06119b28b3ab00d6092a799d496e51"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00574-of-01024.json.gz": {"num_bytes": 318397937, "checksum": "dc3f206e1b5da963184da72e47959844bb164335c76e3261f3a189a4b7b022cb"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00575-of-01024.json.gz": {"num_bytes": 319183651, "checksum": "7f0c46955e37d5d52b305f71b4ce4fca5368d72e8698e8b832ac0177f868e145"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00576-of-01024.json.gz": {"num_bytes": 318690625, "checksum": "b37d0fbd439bdc05021a71c192ce5e61ebce27448a17819bb53156d9d5f27e17"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00577-of-01024.json.gz": {"num_bytes": 317926085, "checksum": "3092d1ad70fb2d262ecb33f3fb6ea554af3ddd26498ba42b644c383f6d4bd1a4"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00578-of-01024.json.gz": {"num_bytes": 319190472, "checksum": "d9833fd591a618a167b31b7aaca420f3e719ded98987dbc0f46fd4bfd12564c5"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00579-of-01024.json.gz": {"num_bytes": 318958744, "checksum": "a11217af10c85ad828de38847eeddcde6af6899563585d581c20adaed3c9e7dd"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00580-of-01024.json.gz": {"num_bytes": 319893900, "checksum": "71e8be705bfa8563e33392d1c14decd84f52d6a0139b98344f1a0ed9bdc94198"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00581-of-01024.json.gz": {"num_bytes": 320109861, "checksum": "c5f13ba973803ef069762d22bc37ee02a4348af379c75848d93b2685fc4280cf"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00582-of-01024.json.gz": {"num_bytes": 319238177, "checksum": "da815527ca68b5c2ed604d00ccbcc7c631c60f33e3132f79212634a82c266844"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00583-of-01024.json.gz": {"num_bytes": 319375634, "checksum": "a332b791df0801f0b7227117f0ea3971563e8e420ae24dd94b38d532c1ab0573"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00584-of-01024.json.gz": {"num_bytes": 318596018, "checksum": "e6496d31f42921eaf9f85047e7c2eeb5fef46e01e99760fa676da96481d7d5bd"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00585-of-01024.json.gz": {"num_bytes": 320156294, "checksum": "08b978ec05d65edd22c301ddc6ab44174eeb7bef5c5997a84342b6faaa47a79b"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00586-of-01024.json.gz": {"num_bytes": 318716838, "checksum": "567ce600ad99e543507fdf27b9009fe1782bc867f44f3dabbeb93fab1208f337"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00587-of-01024.json.gz": {"num_bytes": 320247814, "checksum": "8f5c82f5eaac4a315d8615c9700cd81f3b9c2e1a17376d3b2482f8694dfe2492"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00588-of-01024.json.gz": {"num_bytes": 319546079, "checksum": "bae91422f87091b3974ca92781a14fae8f10c5c41de9c9132f745b3dcb8bc468"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00589-of-01024.json.gz": {"num_bytes": 319771959, "checksum": "babb615d77f80e5ef99aeed3889a26cef5c9918a7fe68b70a503815e69b0b189"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00590-of-01024.json.gz": {"num_bytes": 318926571, "checksum": "61f2ed732f3b2b5e24882f47b4eb84fea28bf89d112f6f173cbb50523a43c4b8"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00591-of-01024.json.gz": {"num_bytes": 319669791, "checksum": "3aa2e792ec775a52ee78447b81204867e58b0a46727bab4b7974977aaec2889d"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00592-of-01024.json.gz": {"num_bytes": 320393142, "checksum": "1419c263fb74409cb0e39ebd87b1c020ee6863a3a6f2f427be27d3c76b84043a"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00593-of-01024.json.gz": {"num_bytes": 320977171, "checksum": "4f16f33217c35a2b155d5b6fe8014c2e52014e63c419e7d3aaf71a35246c1323"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00594-of-01024.json.gz": {"num_bytes": 318211092, "checksum": "c9301ddcafea22d085ae48f551f486e73089a76c7990871f787064c61e4e60b4"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00595-of-01024.json.gz": {"num_bytes": 318978629, "checksum": "349e104763320eaae96ac3bc53c5fa7a73e7dec93b8cc3afaad108a97e7c170d"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00596-of-01024.json.gz": {"num_bytes": 318573003, "checksum": "0eb6c25cf57764ec3aa7f74d6d967c52003f872f2f3b140fe6d5ac6360241a8a"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00597-of-01024.json.gz": {"num_bytes": 318931514, "checksum": "b42b7b984aad729185ca9b3a6ffa856b2a79165ce2feebe519b10f8ff42c4ab9"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00598-of-01024.json.gz": {"num_bytes": 319002677, "checksum": "8306c5971408767b3735288fd0ee7ee7d01d9af4ef4cbec2e57c97b1f78e6d63"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00599-of-01024.json.gz": {"num_bytes": 319637870, "checksum": "844df34f2a263011f9d1d85eaad5a1d95243769e9cec5a104807dd55e1fe431c"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00600-of-01024.json.gz": {"num_bytes": 318099852, "checksum": "b05e66568a4472feee31f20918e9813aeae2d881f47b5281ff29fbcfedf4d5b2"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00601-of-01024.json.gz": {"num_bytes": 319136069, "checksum": "8dff2d56c9915d73e6154533e5de0ca9d867c5fdedcfeceb3e0ab22f3ba509cb"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00602-of-01024.json.gz": {"num_bytes": 319369121, "checksum": "45b2c1757260395afeb168b545892b315fa0bf14b3d144bfcab1fdaa6d79086f"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00603-of-01024.json.gz": {"num_bytes": 319499076, "checksum": "46edc9f556ccae692900b222b8e4843360dd5dbe0798a8ad9cb51c07a451dbb2"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00604-of-01024.json.gz": {"num_bytes": 319132921, "checksum": "0cba8c8738ea7ff9a08bd1bab215010b03c6c83fe35206d83344d78005bdee6b"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00605-of-01024.json.gz": {"num_bytes": 319315562, "checksum": "0dc0d37658fd672c8d72775bd8855dce9037cf9715feda35a76afb1f0e87bebb"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00606-of-01024.json.gz": {"num_bytes": 319223528, "checksum": "f679e437a3acda1a81013dc0f3fa93fde6c3309905e8142f8699a76bc04b7114"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00607-of-01024.json.gz": {"num_bytes": 319326218, "checksum": "7fe91f86f751b9aa3abf1c5ed0fdab89a76c7fa4eb7ab8b809ef29b0cf4a78d9"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00608-of-01024.json.gz": {"num_bytes": 319393715, "checksum": "a5daf706100eb797b5b0770fe0c790856637b22dc849aeda5b445ae5fa63cb3b"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00609-of-01024.json.gz": {"num_bytes": 319554192, "checksum": "4434338fe97d398d9565ae940c62539e868fa261be361ede1b5b0feb004160f8"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00610-of-01024.json.gz": {"num_bytes": 319786301, "checksum": "6b0d0e0457a721af6c67a31f5016432011e717302cfdc7ee39feb253fbae4754"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00611-of-01024.json.gz": {"num_bytes": 319356910, "checksum": "bfe201b1775270afef3a09fcfc074920cbb01093eef90d46f26b6b813d603994"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00612-of-01024.json.gz": {"num_bytes": 318780229, "checksum": "29248c4732fdfda2ba97ed38192ab391457e20fd70f713ef4a7cf084f9865846"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00613-of-01024.json.gz": {"num_bytes": 320190496, "checksum": "f5cb9be2442797d967b9041e48771196a6c0595933ef2102840b704e355f4d62"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00614-of-01024.json.gz": {"num_bytes": 320245862, "checksum": "89b74d0daea02fb69289ad259bbd0ddb1a64c5d6380848f7d51669be952f8a0b"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00615-of-01024.json.gz": {"num_bytes": 316874605, "checksum": "78600c8703d5ebf80c99c089bb7a7c1cde843a66d706fd219eeac304f80e8525"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00616-of-01024.json.gz": {"num_bytes": 320237707, "checksum": "630ee29d4dc4cd5062eeca7877e5c1b204b36eb0b3aeacadf036cdb75c1ce840"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00617-of-01024.json.gz": {"num_bytes": 319739365, "checksum": "d418fd284d06b1d2d9daebea3047ed06286640ac75d23893f1effc2ee9d7aa14"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00618-of-01024.json.gz": {"num_bytes": 318634299, "checksum": "f5d75d129ab6c0f052028cf0139c3cf20eed3a9c5cdb151cd88ae42d5d1a32d2"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00619-of-01024.json.gz": {"num_bytes": 319086471, "checksum": "c558908f6e08b0d02f377c9aed1655d80106f4cfe26e955774bb420d19b2f74f"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00620-of-01024.json.gz": {"num_bytes": 320665446, "checksum": "977f959e5b5eaa24081ce025d137647fffd65f1a54d2c45db9805a232e0c0364"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00621-of-01024.json.gz": {"num_bytes": 318576410, "checksum": "d07f3c31d7ec1c71b5ab9539a2ed49f6d5f46b48ee2e51800b9e28cee588a163"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00622-of-01024.json.gz": {"num_bytes": 320053075, "checksum": "58b897603eb83f789a1cfc6bf40a091093cbd8a0c20702018c411adc7b07a437"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00623-of-01024.json.gz": {"num_bytes": 320045187, "checksum": "3665d7579b3c57eb21ec9e55850e39307cc6f4ef8aa8b9937076ad6f142063a3"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00624-of-01024.json.gz": {"num_bytes": 320136842, "checksum": "35db069ae090e95c5a4d3db44eae73bcb29463c120584d7f6ccbe235983c5fef"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00625-of-01024.json.gz": {"num_bytes": 317314201, "checksum": "7f6ddbbc8815e8bd10c99361fd8113cbbd84ebd92799eb6958cf98af825d2aa3"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00626-of-01024.json.gz": {"num_bytes": 320219970, "checksum": "4e2c46d1e3a94957717bbbf1e1e4300bd27ac17e588d426e0ba688983e83f4e6"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00627-of-01024.json.gz": {"num_bytes": 320083102, "checksum": "851ce6dfa6a4d1a4e3b8bf439e36db9ceb59eefc60558d429e2fec80655e1775"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00628-of-01024.json.gz": {"num_bytes": 320386844, "checksum": "86d8927f16d0790a07d6c68e745501188d13887df4a137e937ae00497d07c055"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00629-of-01024.json.gz": {"num_bytes": 319476643, "checksum": "c48cff721137b641fe9d5bcf30462c7e4e3a3ae631b7b4e39979c8c77f0890ae"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00630-of-01024.json.gz": {"num_bytes": 317961579, "checksum": "cde626b34c6c8455227fbb18a577877b518f529b6c8e16881cfdf334f2875cd9"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00631-of-01024.json.gz": {"num_bytes": 318952266, "checksum": "0401582821f7b15f0b406f7ce00c56351b8e86a3c3282bdf4dd45b2f6146ea22"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00632-of-01024.json.gz": {"num_bytes": 318261820, "checksum": "be48396ef18ce0f3650eca86eb36039f90b51737f9848086494f34fa28d60e70"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00633-of-01024.json.gz": {"num_bytes": 319748854, "checksum": "9d5c342d82fcace21de2900202c3f2af47229aeae9d487a8b77b7f5b86c05f74"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00634-of-01024.json.gz": {"num_bytes": 317806530, "checksum": "00a70705afb91f6570d17257057c15b45386597b917061686f131bd41ddce421"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00635-of-01024.json.gz": {"num_bytes": 320313573, "checksum": "22a1286582d65975ed94f0ba25bf87e94d52a55214d0a51979a3e0fd9f95e3cb"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00636-of-01024.json.gz": {"num_bytes": 318151690, "checksum": "026c699ac6fa30f9e156a957026d8fa8df72daee3407c8fdc5e0bd7d6a3b50fe"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00637-of-01024.json.gz": {"num_bytes": 318665365, "checksum": "9bd931dfc074bc99df31d7fd31a5ac1dc8c8bc75f8e87b763545cd824edcdcbe"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00638-of-01024.json.gz": {"num_bytes": 318521250, "checksum": "4b30ad531f7502ef7bc6398ab286e5c6c63d340c22792da9258ea95b496d1c0d"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00639-of-01024.json.gz": {"num_bytes": 319997068, "checksum": "2bfdf36396e49ff625138d29925f54eb12b18d35f6d0bf5ca9e79194977cfb43"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00640-of-01024.json.gz": {"num_bytes": 319355927, "checksum": "d0d0ed7304b5d79318b5230a1ab48d3ed03183f1eb11d96070604a7008cd7b30"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00641-of-01024.json.gz": {"num_bytes": 319002081, "checksum": "1461ecb6b92819bfdc12808a5442d70f94538931f856c91dea602a23ba86ab98"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00642-of-01024.json.gz": {"num_bytes": 317689465, "checksum": "aa0af0169cf13db1f8133e8d76afeeae5f71d63d179794377a55b6c2eb938dc8"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00643-of-01024.json.gz": {"num_bytes": 317523344, "checksum": "5c060166e776f8efda48882c118dc0fd5e058d9ef40be578bad31e477114a16e"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00644-of-01024.json.gz": {"num_bytes": 318876813, "checksum": "ad98ee119742cb8a6efa1be46e9670969397c7bde10049886d7d6fceb82387ca"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00645-of-01024.json.gz": {"num_bytes": 319981258, "checksum": "8930ae8e14c124218793d2fd1bbfb1b624e918cb092b21c6ca74347abd9dea4c"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00646-of-01024.json.gz": {"num_bytes": 319624889, "checksum": "a40705c4f9a4db4d2d698cf96e43b99fa0790b886506300eb4986a26de7063e2"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00647-of-01024.json.gz": {"num_bytes": 319240920, "checksum": "7129182faeac82b47127458e92903a209acf8272166024e8313c167d6f358456"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00648-of-01024.json.gz": {"num_bytes": 317305623, "checksum": "3124091a6c438fecbfc948b1a35ffb1462287ae06866b02a6dbb1a6651ccf1e4"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00649-of-01024.json.gz": {"num_bytes": 318998755, "checksum": "fdb286cfe9e9091a57b31be61a56a425fae07d6b44f0b45f8743d7aab0e980dc"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00650-of-01024.json.gz": {"num_bytes": 319612451, "checksum": "ff88c4310f049344b8a3f701bce12d08ef5f9b037e82fef7f1f670b3d51e59c2"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00651-of-01024.json.gz": {"num_bytes": 319098081, "checksum": "9c3b1843082aae39b057bbc7364e69cbc39bbdf91d5bff4f52b12cf1a264adf2"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00652-of-01024.json.gz": {"num_bytes": 317107981, "checksum": "e6199d12a893ae5d05c5388ae7a679df419ef6a050c8e3ce3c15fe534943a774"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00653-of-01024.json.gz": {"num_bytes": 319623884, "checksum": "333ac93cf1f1f4da0f72c5e57b675052453b42dffe1e4d45ec680f4e3e075d97"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00654-of-01024.json.gz": {"num_bytes": 319055728, "checksum": "1efe352f2f2eba826231a5bff6c79390630b44039b226a5041a087e116b60f5e"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00655-of-01024.json.gz": {"num_bytes": 318539829, "checksum": "613c741cfb738017b3fa233512296d9127d661738721d3fccd806aad54d19d84"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00656-of-01024.json.gz": {"num_bytes": 319970377, "checksum": "51fa9b217b6bcf664c472cc2b258813e1f1d7a0f501c29b822221bccafa4e201"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00657-of-01024.json.gz": {"num_bytes": 318548629, "checksum": "c542c6fd2f3284d64f8d53b71ab8308bbba59f7f13e9d9eb20bbbaf13ad4782b"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00658-of-01024.json.gz": {"num_bytes": 319845984, "checksum": "b3d8fb6ed2258c463367108e2942742e88eac657c859cc8d128035110fc87e7e"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00659-of-01024.json.gz": {"num_bytes": 318887872, "checksum": "02feb4e03020d767a4468251786d4857d5dc833969626bee616c7882bfda9ce5"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00660-of-01024.json.gz": {"num_bytes": 319854892, "checksum": "a997d9187a185a29fb3bbeb1e696d32898efba8f5e9d6ed816493669f0c5ec02"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00661-of-01024.json.gz": {"num_bytes": 317599289, "checksum": "86d9189ebc534c99da5a4407624a623561b159f758fb04373a270887d0b45709"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00662-of-01024.json.gz": {"num_bytes": 318138720, "checksum": "9c626f7aebcc4fc9afd533b6c8a372d884d01f508ce49c01ddd830e4e9e8b2d0"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00663-of-01024.json.gz": {"num_bytes": 318110835, "checksum": "441d4dd0d5d2ea7b6098a3fe006b9d7afd526188824a3325d44538fc5655942c"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00664-of-01024.json.gz": {"num_bytes": 318996945, "checksum": "08ab0739c3565643b6a83d7091936f5d75a4d8418c956146114aa0315f205dd0"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00665-of-01024.json.gz": {"num_bytes": 320612903, "checksum": "1ab7bc2d0f7c6704c97848a9325015f06228339bc52cc1fb593d9c56145e7c48"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00666-of-01024.json.gz": {"num_bytes": 319241006, "checksum": "8b1213325ceb2a2c89dffb891a31317e903d08fff911e4ba1ae66fc3bcce9973"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00667-of-01024.json.gz": {"num_bytes": 319650665, "checksum": "14676f97937eb3d0734e5f121c5f63002ba2d2c62b6c41b4b46d2fcab9ea9614"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00668-of-01024.json.gz": {"num_bytes": 319198651, "checksum": "a406fceed5b7d17ff6d5773679c3df50e747215e39926228ddc9a60c6bf9d152"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00669-of-01024.json.gz": {"num_bytes": 319363200, "checksum": "1d3267d77f43d3d720dcd79c40bc3e8c0cd777d421b1b7d0e69e140199e34552"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00670-of-01024.json.gz": {"num_bytes": 320079826, "checksum": "85111c229b8fcc8428b3c13676bde8268f027fe06e1f576a3adcd82bce1603bb"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00671-of-01024.json.gz": {"num_bytes": 319494773, "checksum": "eeeed8d9f63a5c16ab9d62454fae5bef1896973cfa69cedfcfaac4565a793b27"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00672-of-01024.json.gz": {"num_bytes": 318304853, "checksum": "6793ec3ffbc147c36e471e1c06a664ac2143408c9ee46305694708eee0fb38cb"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00673-of-01024.json.gz": {"num_bytes": 319031236, "checksum": "3c886ff71973805a59312d8d43ee9e616bcfafd76c03a64d53ab548036b1fa90"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00674-of-01024.json.gz": {"num_bytes": 318647345, "checksum": "fd7f4efc0c8af611e7e137680342843d0471ca072421ab3c172a169ba2f5d217"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00675-of-01024.json.gz": {"num_bytes": 318313871, "checksum": "3b797b2ad717749a24866a97acb95aace0dd4e91ee7d51dcf1fdd46a9232b794"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00676-of-01024.json.gz": {"num_bytes": 318858652, "checksum": "2ccdf652fd413dc624643d35a76223e8a44e6241997841ec2d13ae11b56400fe"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00677-of-01024.json.gz": {"num_bytes": 319236091, "checksum": "bbf069c696f09e5467b17ba98479948a85101efa776094084e37581e72c01123"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00678-of-01024.json.gz": {"num_bytes": 318996096, "checksum": "3e3dd21861c713bd38d1803c32da1c0bc2496899648b4cffe1fa2e61b35ca056"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00679-of-01024.json.gz": {"num_bytes": 319915466, "checksum": "6ed56468a31564cb25668ceb5df325ff7138dd231afa85f676ac7af5e81e0642"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00680-of-01024.json.gz": {"num_bytes": 318537417, "checksum": "959ce407e7a892495c477b9e0071dff496fd20db9cfb04dd035ac59dd5b2f309"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00681-of-01024.json.gz": {"num_bytes": 320181225, "checksum": "0aa77d778f24bfdc8566b390a7a1ef1d7880a42b98b3e82e9b37ee3ed821a8e5"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00682-of-01024.json.gz": {"num_bytes": 319087756, "checksum": "a4da802570ee7bc27e752069612b633edf226078f48d5f55280f73a6dc934127"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00683-of-01024.json.gz": {"num_bytes": 320019766, "checksum": "587497efb7bcd4ca85ec0559e372ea285c1b95e3889d406f142cfe454d8e0e2f"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00684-of-01024.json.gz": {"num_bytes": 318814245, "checksum": "6e904f73976ca18aed3375d1c1b308d749b9a4405a333dd0a2cf85360822e205"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00685-of-01024.json.gz": {"num_bytes": 318586686, "checksum": "c51012772c5bae73821b67f72c035f22a40725d42bcf51e439bbdfcd84393ef2"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00686-of-01024.json.gz": {"num_bytes": 319648436, "checksum": "890b7408abd0cc04a84be3a3992d05714dbd30a9d33a8a9b05316a980fe51313"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00687-of-01024.json.gz": {"num_bytes": 318909835, "checksum": "b54b20c21ae9834b630a8aac057d47069cf137577d30b91fd1475f5824b61561"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00688-of-01024.json.gz": {"num_bytes": 319381735, "checksum": "422091d5ba0d44c64bb0c84ab4757318414bc01455a97f53190eddda89c2f3f4"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00689-of-01024.json.gz": {"num_bytes": 318995026, "checksum": "ad5080fbddc914c649027d5e2214f1d75e0cf0617eb3ca0b1fdb8ed9129f99cb"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00690-of-01024.json.gz": {"num_bytes": 320745318, "checksum": "d45492346bb4bf519e657356ecf1805b6b592683b98c20c93da2f07c50b06092"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00691-of-01024.json.gz": {"num_bytes": 318575084, "checksum": "43a07e8a98bc99f381558c938fc83acd4a37d565459c0f3f83aaadda816f66c8"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00692-of-01024.json.gz": {"num_bytes": 320651368, "checksum": "21a790ef1dcc9c6ffa071d1a2e21e330d6afcb45368dde9cfae8933c6d029742"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00693-of-01024.json.gz": {"num_bytes": 318429145, "checksum": "85558018ee61e33c4f3e05acc2029e69447a5717be880e9a0aa8fa715dbd0c05"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00694-of-01024.json.gz": {"num_bytes": 319562061, "checksum": "894f4c906a33c644ea80c3a00155ced807a62e1bcd9f6e254cb6c88efeedd142"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00695-of-01024.json.gz": {"num_bytes": 318298964, "checksum": "06eb05f651f1d2fff495c48475894420334070df10c051c7253b7afb0bc38291"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00696-of-01024.json.gz": {"num_bytes": 317473664, "checksum": "59ea4f951335553945a644f7628403ba1a99a27e0d93fcfe5db18cbc3dd48ce9"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00697-of-01024.json.gz": {"num_bytes": 318839008, "checksum": "f0203b0f2caa3287b8f7a64288af52bafbf033bcdf31dae54e501e4da47b9935"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00698-of-01024.json.gz": {"num_bytes": 318288032, "checksum": "fe2a581cd174429a81424e407aceb1d81b61d9796d74db4590327778fbd5016b"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00699-of-01024.json.gz": {"num_bytes": 318696527, "checksum": "edf3aabcdb28fa2feb532b3bd55cd167c2200a6d8e19f05152be194e48acf87b"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00700-of-01024.json.gz": {"num_bytes": 318900366, "checksum": "67d89417d1440afeeefd59a0993e4d12fb5731e917ec7f4e65d9319541b4b9e9"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00701-of-01024.json.gz": {"num_bytes": 318901212, "checksum": "64d302459e6871325282fd890d2922cb1fb25b47d677ce793bc065acc8d1bd07"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00702-of-01024.json.gz": {"num_bytes": 318913325, "checksum": "f0bb360189166a0bd717bad85edf06943333b1854687839864aef3ee02814795"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00703-of-01024.json.gz": {"num_bytes": 318730274, "checksum": "c4e027079b9cf9b1adae3e285c5cc5dafeee5c74cf3621c424b6df9801d508f5"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00704-of-01024.json.gz": {"num_bytes": 320112232, "checksum": "37540f6a00523cbf429764893aa15aae6a57e53c89cf51d82a815feef02b1210"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00705-of-01024.json.gz": {"num_bytes": 319643559, "checksum": "9dae018569fa4bf33674f67ba03732a2f85cfceb53ec2cbb9457eaea607b8dfa"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00706-of-01024.json.gz": {"num_bytes": 319941519, "checksum": "03926405dc629f0664a3d27c700a4fa2f606496f0b52a9bbf2fd2d75faae2f46"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00707-of-01024.json.gz": {"num_bytes": 317628508, "checksum": "fac92295e4c85f087d27e0a6f231d782be7b2448e99cfc42c09c0e1e20964c3f"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00708-of-01024.json.gz": {"num_bytes": 318863059, "checksum": "39d4880d3e47e65ab6351e94b015810d66295a86a9f08534260ccbef41fdaf04"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00709-of-01024.json.gz": {"num_bytes": 318412651, "checksum": "044fc99a1307737bc8d6d8a9b67997010309fc695eda6e8dd42e5b6bab2256d1"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00710-of-01024.json.gz": {"num_bytes": 318631334, "checksum": "0b2c93cf298051864b8660e57182b38408ad738cf930afc09afdde26d952f819"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00711-of-01024.json.gz": {"num_bytes": 320587866, "checksum": "f1f6bb9770b76742d0131495879fa38ed8aebe8a0b38463e7834f0697f174ede"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00712-of-01024.json.gz": {"num_bytes": 318191204, "checksum": "b6873a7d375aa29ff39ca17c3bbc7e328292b1671b59a35e7b01c0e992da90f6"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00713-of-01024.json.gz": {"num_bytes": 319472539, "checksum": "3bb12a0a806ecb8a5eeaa00188c655f399460609b8a19005a7141bbcb3a7a694"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00714-of-01024.json.gz": {"num_bytes": 320196397, "checksum": "ca6e1fa6f27c9dbadbbaa767fd21dddee7c84ca96bbb6735640ba2631668ad0e"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00715-of-01024.json.gz": {"num_bytes": 320075706, "checksum": "1a773eec7d738c0e1e253bfd4533f0c43c0d133e564c3458159e0c47d767689c"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00716-of-01024.json.gz": {"num_bytes": 318736413, "checksum": "c17a6b2115e56cc3d6bbbd94e8565fb14287057f80199528e6cba20adf557bf7"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00717-of-01024.json.gz": {"num_bytes": 317351537, "checksum": "cdba391e16c3bcb5569d978a8d11518103e7687714710ef4eba4f7c0821d67d5"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00718-of-01024.json.gz": {"num_bytes": 318017965, "checksum": "a25c494e4baead0af0afe6eabaa054bc15f80b6ca0ac8dadb1b354d72ffbe63b"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00719-of-01024.json.gz": {"num_bytes": 318124432, "checksum": "94f5dfbec85a8c5b22ff1368a16ec2eb7fb4be25c0c8f004096156ae40bfa2bd"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00720-of-01024.json.gz": {"num_bytes": 318235852, "checksum": "c0248326e698599dcad01eca25d747c138881c61b5636ba765b21f9cd0df996a"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00721-of-01024.json.gz": {"num_bytes": 318817834, "checksum": "c11df487a966e748cec522fae4ed76abf3e8cc9bcd28c301117fa52ddb83dc6d"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00722-of-01024.json.gz": {"num_bytes": 318553851, "checksum": "63d3d0c3f5dcdff29a0a6ef41e3a9df3fb505c73c8554839e3032293a78bae2e"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00723-of-01024.json.gz": {"num_bytes": 320174720, "checksum": "29c97bb8ff301080547255af29bb5019a2c1fbc74f0a2711e626461d5a5f0b54"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00724-of-01024.json.gz": {"num_bytes": 317805413, "checksum": "65f8932f3c77b0fee5f2224643a71ff95246720368fe66d45c22df25ea4b9c2d"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00725-of-01024.json.gz": {"num_bytes": 319460597, "checksum": "dc785a8aa3a1f4ed77512d51a9139dfb24b356b5499ae67dd5b860101b1e0e4b"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00726-of-01024.json.gz": {"num_bytes": 320934004, "checksum": "45d857536d3535d08cddb6cf50d08d89cc28138a5be082465c3a8c27c02ae2bd"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00727-of-01024.json.gz": {"num_bytes": 318393879, "checksum": "e4a02e43eeabbecb81b971f4201212104b6214078cafd9500d5b5f323595f060"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00728-of-01024.json.gz": {"num_bytes": 318826577, "checksum": "cfaa0d0c8dfb333899c73e0c2aa00dfdadd00e5b4a3d477e7518c4141899c8a7"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00729-of-01024.json.gz": {"num_bytes": 320390067, "checksum": "528fe99b0c8dc917ac0f02a555603f9ae81e690b4ce1040f65ebbad3390c0426"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00730-of-01024.json.gz": {"num_bytes": 318156386, "checksum": "786e6913b4417a87cd4cb1882e181d8b2e1eb4b4db5b4b9ad2120b5efdf3e2ba"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00731-of-01024.json.gz": {"num_bytes": 320013543, "checksum": "f28fc2794c280fc1de263b9b2a81e42423f8dac3af7c4fbd3b3aff888821ca9f"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00732-of-01024.json.gz": {"num_bytes": 318753697, "checksum": "69491eb25dbaef78235f769422e773de7a2578e678ecde29dcaa663f4ebfa78d"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00733-of-01024.json.gz": {"num_bytes": 318640706, "checksum": "dfde8960d738b873bcb75abe1661fcaa096d70c76aef21846b173b8adf049bbc"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00734-of-01024.json.gz": {"num_bytes": 319447398, "checksum": "145add76dcd73916b548e7e3b161757c1bdc1f22a0f127019f24827afd6f85e2"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00735-of-01024.json.gz": {"num_bytes": 319868149, "checksum": "dcd4ba95672630f89e75b70dc08cb918bbe896f5d32ffeba7d3e4921b27c1f4d"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00736-of-01024.json.gz": {"num_bytes": 318404586, "checksum": "4710b1569342b7aa7ca610d8b8cbb2248a1c5fcd8c6ab3b7f875657dff4779cd"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00737-of-01024.json.gz": {"num_bytes": 319915151, "checksum": "7091dc758fd14c206514663eed0ae446178ff38e76c4cb7e711c63d419506e49"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00738-of-01024.json.gz": {"num_bytes": 319709793, "checksum": "afe1a96ced49662b14bc60b4ff8fc1f610bbc6f3c515bb73f2fade7a0ba67678"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00739-of-01024.json.gz": {"num_bytes": 319789716, "checksum": "9e2332cfc994483d4b913c6556ca9c1698b95e81033b7bbc5a4f5271e5cce708"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00740-of-01024.json.gz": {"num_bytes": 319102226, "checksum": "61ddcc3af919b753638dd46f18f790d7783cdc3090dfddbbeb40faa93bed340e"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00741-of-01024.json.gz": {"num_bytes": 318717589, "checksum": "aa3038c23a37561f2ba92e95ffeaa3e3641c1a69f8688b724116edd128e9ba52"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00742-of-01024.json.gz": {"num_bytes": 319456536, "checksum": "ea9d23abfed6e3e8ab900291a3bc1faa27751ff94e35378f8c4eb07207036a9c"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00743-of-01024.json.gz": {"num_bytes": 318641730, "checksum": "6efcec6cd087be4eaa98491e463d0fb9c1253aca275971de08c56a20be9aa579"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00744-of-01024.json.gz": {"num_bytes": 320264992, "checksum": "71653351253c8f7fa18673a3f956bddebd158978708c5a4c9e9b5318f598e1f4"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00745-of-01024.json.gz": {"num_bytes": 318665967, "checksum": "347dfd824d6f4afe58c6f418ab5d332909038c880f4dcda7f774d3d7a588c3f3"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00746-of-01024.json.gz": {"num_bytes": 320005833, "checksum": "812bc3c082e3a65c8c77fc7767bb435f9be9a999961d84eadc9e0c602e5ce168"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00747-of-01024.json.gz": {"num_bytes": 318575441, "checksum": "a4414d376c69ae8dd5e60b206315cf920d5a797c6ef7c08fe0c4b4e28b4eb4ef"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00748-of-01024.json.gz": {"num_bytes": 319266882, "checksum": "f08aee694b85d5e7120652350bfafaa05495e609aa6d2fb0b913ed8a718d7dcf"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00749-of-01024.json.gz": {"num_bytes": 320205042, "checksum": "b3402b16a5cc817d89a19fd3456a50b5b6d5f3f555eea725167558cc85366d12"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00750-of-01024.json.gz": {"num_bytes": 319198252, "checksum": "6b95232f6d53cff8045bd5ebaa87d6e6c511a74dc646d2a960eb87e801ff4f2a"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00751-of-01024.json.gz": {"num_bytes": 317855407, "checksum": "badc9d82efdbc8db5dc328e8aa5e80155c52f00b105b136d8c5c948fe237d61d"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00752-of-01024.json.gz": {"num_bytes": 320283992, "checksum": "67c32eb497533d6fd20b206c38483d171275029ff525bba3da13b0c62e1ef073"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00753-of-01024.json.gz": {"num_bytes": 321030653, "checksum": "5e95b1cb54d7d7f12bec1559ababcab0c364a0af99e10a42a08357647ef5d3cc"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00754-of-01024.json.gz": {"num_bytes": 319059779, "checksum": "32cb59ad16dfda8a5b52615498fe2e6d85753fa44ab667af2f525a2467508da5"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00755-of-01024.json.gz": {"num_bytes": 317737268, "checksum": "0ad2fef2fe37d59b163e29c2287938a768ee87acc34752394809295d0710c602"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00756-of-01024.json.gz": {"num_bytes": 317293218, "checksum": "db737ceace329fb1f8fe1aca38db048a1dedcb5226a4132485f26afecdc6c3c8"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00757-of-01024.json.gz": {"num_bytes": 319529375, "checksum": "8b823e97964894189a13df393e1b3978342fb24bd81f07af6e54b7bfa2992796"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00758-of-01024.json.gz": {"num_bytes": 319297548, "checksum": "3f31d7ad99d88dde757a651b12db909a30cfcae5796fe3f85722598d92344ba5"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00759-of-01024.json.gz": {"num_bytes": 318154496, "checksum": "a4b780127d6f22aed49d155e234e21a847a60626143a8e7dc6e31a5f204e79f8"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00760-of-01024.json.gz": {"num_bytes": 319386997, "checksum": "020e68dc60004d0661de8a22fe2b9fa7f481fcecaef8fb06efa43093a2a9cc52"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00761-of-01024.json.gz": {"num_bytes": 320035555, "checksum": "8d7b5a97770a062276ca909a3bd20365cbaf3931fcbeb8b7e479f5ee03b47053"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00762-of-01024.json.gz": {"num_bytes": 318099583, "checksum": "b8fcbbf9b55cde2ff66ca046884870e1e5f2d2a729a8eedb253c16fe0d7658e0"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00763-of-01024.json.gz": {"num_bytes": 318354409, "checksum": "ce2d9e44161b13f6226cfb9f93ad42fa0edd18eeaee923c8ab31c25aec1fc976"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00764-of-01024.json.gz": {"num_bytes": 319181291, "checksum": "53ed1ef77f24bdd7c189aae0905d63be97f48aa3233fda139e59af53baab242a"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00765-of-01024.json.gz": {"num_bytes": 318147738, "checksum": "26b9b9ea2f94b322c03d1b83b25ab4e9a1a203fe9923728c5dd91f22d5f8fef5"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00766-of-01024.json.gz": {"num_bytes": 317964368, "checksum": "e59fec52abde3fb4cea58a5a4e511f4cc61e21062bfdd1e3ffd60131a847e0ea"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00767-of-01024.json.gz": {"num_bytes": 318750919, "checksum": "0e5eff983e793a3d7cdd1ec85a45d58e5e6ecf7a12cf83a01888e148ab08acf9"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00768-of-01024.json.gz": {"num_bytes": 318978892, "checksum": "171509b0bed8854b6de92fe146993be80ab31e0aa56953c7b0a66eeb738ff70a"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00769-of-01024.json.gz": {"num_bytes": 319386097, "checksum": "704e7daa85c0e3ac974d51a6e2cf6df2ee053613fd2b77b5fe16d10b29a50a4c"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00770-of-01024.json.gz": {"num_bytes": 319623528, "checksum": "e787064473427fe17ba95d9326d009e9723148fb314a7a9605dcb6698854dad5"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00771-of-01024.json.gz": {"num_bytes": 318911381, "checksum": "c54aaffd8162b30280e974e81e9d0669357b74394e0da2d1ca2ce613f5715e4a"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00772-of-01024.json.gz": {"num_bytes": 319386949, "checksum": "2f9c83681632482df6c65e4c70718c83f500305ee1d061626cdef35bd794a412"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00773-of-01024.json.gz": {"num_bytes": 319962599, "checksum": "f47c487ba09051c9a4bf320d69db9546e98948e3de68050ae2ba025c71e09146"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00774-of-01024.json.gz": {"num_bytes": 320370991, "checksum": "69a1eacfdb6f6fd49ea2b729a7ab291b96fd5bd42f993e2306d044871b069aa7"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00775-of-01024.json.gz": {"num_bytes": 320433220, "checksum": "d35934fb537d1283d40897d05c1486f629776fe9e4ef127694ecfd0221f860c5"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00776-of-01024.json.gz": {"num_bytes": 318809986, "checksum": "9079970aa1618b6be51caeab7a2cab26e61c30aa53af361a6184ef6249bf65a1"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00777-of-01024.json.gz": {"num_bytes": 319617796, "checksum": "5e200e354ece1713a32a3e1ebcea33412de814dd5843df3523afa1ec9a4d5275"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00778-of-01024.json.gz": {"num_bytes": 318039278, "checksum": "b79309eb335c0c860c85d2b724df52c3613f61b92ab6cd6276c2be8c25a7b01e"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00779-of-01024.json.gz": {"num_bytes": 319078058, "checksum": "fc6053d53255e4d4a4c22c42049ce3eabc224320a51c94c1116f3201f87b377b"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00780-of-01024.json.gz": {"num_bytes": 317637428, "checksum": "e38c933003910b02beef64af2d330f32af6e6f3b7346fa121e89045c136c13af"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00781-of-01024.json.gz": {"num_bytes": 318792407, "checksum": "b6795b4db199f7a7a92ef195aee3753e5e00df05fad2d8401b2b9feb56d71a76"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00782-of-01024.json.gz": {"num_bytes": 319081289, "checksum": "dc20640bded03596eeec689f1293be55e72d138cf0c576df9768c7631931ceb9"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00783-of-01024.json.gz": {"num_bytes": 318663257, "checksum": "ac2b4ee9ab8f25ec010a17358d2f3f1fb9d8d50c9f4b73357429277710e6564f"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00784-of-01024.json.gz": {"num_bytes": 319687102, "checksum": "fb93dee8a974f2ea204c240ed4c24e1b64f91ccb421070be305487e4e53ca083"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00785-of-01024.json.gz": {"num_bytes": 318909034, "checksum": "2f298b358cc619fa72097e3dbd9ac91e7dc3f7c5f9c4f2ff6881c988921d2a6c"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00786-of-01024.json.gz": {"num_bytes": 319213094, "checksum": "60ebe35e0f23ccc61fc0eedc891ea9deb43001beb8205d31360a05b5d58e31f0"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00787-of-01024.json.gz": {"num_bytes": 318335621, "checksum": "a7b0aa4dafdda2f3dc3c1832b71d4a92af08f99a70a315b4cf9f60c1768bf2c8"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00788-of-01024.json.gz": {"num_bytes": 319444037, "checksum": "874dda510a01a2f78e51d917d309bcf1a0f21e7e1ca46661f93931a6200b3d01"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00789-of-01024.json.gz": {"num_bytes": 317955670, "checksum": "ec949a05ec7750dacfdf692c1ba118a33454097fdcaa56626fb042eb93933811"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00790-of-01024.json.gz": {"num_bytes": 319033823, "checksum": "0939164a602d7c7140c619130977b6814639122d0038aff7bb840093def5172d"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00791-of-01024.json.gz": {"num_bytes": 319366402, "checksum": "fd6ea942b3402b5da4acb1a03bf59b17df402e90c47dbb66fb198ca2f4b5e1cc"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00792-of-01024.json.gz": {"num_bytes": 319218667, "checksum": "9e8af5aaa6d5ed915eae334c6101948fbcc7bcf6c8c6beaf80fd1adecd67b078"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00793-of-01024.json.gz": {"num_bytes": 318865241, "checksum": "675330d6736a677760d854dcdd9a174eb7c1d426f94e34836a048c2139befac0"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00794-of-01024.json.gz": {"num_bytes": 319384084, "checksum": "fd4c2623d9cbaed3fefd6bb88c2d88b58fe8f08e9e8ef0cea6bb22cac68dabd2"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00795-of-01024.json.gz": {"num_bytes": 317654308, "checksum": "157533ddb56290662e25cb60842327daec23e377e116496338c9313cbf6991b3"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00796-of-01024.json.gz": {"num_bytes": 319298258, "checksum": "fd90f055499095efa9cb848dee62406d25820f929554b0e07674d4c95db574b3"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00797-of-01024.json.gz": {"num_bytes": 320048871, "checksum": "e089a95e96a081dd76e38acf9506bfc7b86c682892d3a8774e9784019db39306"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00798-of-01024.json.gz": {"num_bytes": 319291246, "checksum": "e29133ab6f83c84a69752a451053dfe20887ea884e09cc373afd89bba7458664"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00799-of-01024.json.gz": {"num_bytes": 319175282, "checksum": "8f3f3a67946615bdf499d64341d200477280947e5be8538748e28db768115947"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00800-of-01024.json.gz": {"num_bytes": 316687275, "checksum": "c9a17dc92658ce5d062af25e5c8610a7fbae501627cfc7324ace7ca6a8d75d8d"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00801-of-01024.json.gz": {"num_bytes": 318710698, "checksum": "4b7d1e130fd8ba536da073069221f68d567492b2bff27d8769fb4ef124cec3a1"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00802-of-01024.json.gz": {"num_bytes": 318914381, "checksum": "9f186b8d08f5d3090b7c9eb8a6954cf3202caec7cbf5c308221333cd115af561"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00803-of-01024.json.gz": {"num_bytes": 319111424, "checksum": "117b0590a976805001a879c49c42db55579e5bb9a5d4db9ce20e42746f59d574"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00804-of-01024.json.gz": {"num_bytes": 318186018, "checksum": "ea376d6cc1043dee9a00e1eca1c431aa59755d8966162701817f9cf274a758c2"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00805-of-01024.json.gz": {"num_bytes": 320382848, "checksum": "1e69e7896202206f9f804b2497c4d99cca5c1d139efc782b8ede2cb88f68b48b"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00806-of-01024.json.gz": {"num_bytes": 319508172, "checksum": "9da7e230c7abed9beaed9d6090efa8ae1029a418dbbf6d04bb4386aafde3dbce"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00807-of-01024.json.gz": {"num_bytes": 319995091, "checksum": "2e3ba0dbe85c004c6a23b4caf340282e0d0004ab574a14bedc9c83c67cc2c0c9"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00808-of-01024.json.gz": {"num_bytes": 319880961, "checksum": "f53fd08fea0f874d727422357521176c6810a54abf4fcc7019357b50f1928daa"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00809-of-01024.json.gz": {"num_bytes": 317100774, "checksum": "dbeed220f330b489cc262fbd7cbe84f04ba8a5118ebbd8f48bc7a4f5f63ae7b8"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00810-of-01024.json.gz": {"num_bytes": 319625750, "checksum": "fe5dced88ccd54b258c6740d8988e10b128a869ecf28e7096e689c59fa147d4b"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00811-of-01024.json.gz": {"num_bytes": 318375975, "checksum": "e4bcc5571fdc4f51b733d975e78ff02939d3463264a02d7e651271ab91c81df8"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00812-of-01024.json.gz": {"num_bytes": 319663092, "checksum": "b1e41c198bc69d026ab997fdeaa4e687f7a8ddfca751add9bc85f00481708a63"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00813-of-01024.json.gz": {"num_bytes": 319094357, "checksum": "c07287aedf6854f581aaf83b75c4939aa4b10181977d4c4be97c20989ab8f992"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00814-of-01024.json.gz": {"num_bytes": 319521327, "checksum": "c96203ba5461ef92a7a2b0d4e598efda943b5b3adf42a7268c26f1c224410c01"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00815-of-01024.json.gz": {"num_bytes": 319098749, "checksum": "72f2e65c5b482be0d9e3a3d8f5cdb703cec7a515e927bc4411e2f6ff5085ed5d"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00816-of-01024.json.gz": {"num_bytes": 320377295, "checksum": "df95ac17a25cebb854088cca345f60c2634d07f088e45e251d7f9afdb334c0c7"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00817-of-01024.json.gz": {"num_bytes": 319007451, "checksum": "bad1cc25de4f66ff36c69284e6b615f68bdc25e45f08e04e33ee463a0c6ef0b5"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00818-of-01024.json.gz": {"num_bytes": 319609737, "checksum": "acf1b390f1c492d97bf027f06898f1dd5cf8cc6def41f4d43b38a0c99f4a85e7"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00819-of-01024.json.gz": {"num_bytes": 319164157, "checksum": "3d973eb401876c57e9cd1420fc938da9dd7b08f97d4596c66a8c159e2b56b1b3"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00820-of-01024.json.gz": {"num_bytes": 320181073, "checksum": "101d5f0079caa840b934c14800ba5cbb7fca22e9e6915b98b4dc5f37c57f5b4d"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00821-of-01024.json.gz": {"num_bytes": 320949305, "checksum": "34ba423c93c4262234e6e2005aba0436daa99b05570cff0a58e9d27b65d76896"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00822-of-01024.json.gz": {"num_bytes": 318392521, "checksum": "4a586e220fe34f544dd068f4e1c310459cabd5dbea9a991c21c09f70079eb4c9"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00823-of-01024.json.gz": {"num_bytes": 318526893, "checksum": "3b10a8e32a3a8f6541400d697516fcd3fffba3554e8d8a96451f01fc6b729d8b"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00824-of-01024.json.gz": {"num_bytes": 318640792, "checksum": "c921270db8004d309f91e3209340c476191793d47b3cfa9d19fdc602d43dfe65"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00825-of-01024.json.gz": {"num_bytes": 319524026, "checksum": "a6eb347db464976ba5d1aaa4fa64e103ba36520dd1e9c103644caf187be471a5"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00826-of-01024.json.gz": {"num_bytes": 318469810, "checksum": "dc5f88e6161ac06165f3cd4cb91a00cdff75d2f900e8f53d62bacfd833e352b0"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00827-of-01024.json.gz": {"num_bytes": 319391185, "checksum": "66a240be851d6622adf7801d9634a456e83e9edfd135601c0dc1aab48902d7cf"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00828-of-01024.json.gz": {"num_bytes": 319625277, "checksum": "2e989beeeb2a63bfb87a5a401619a8e4155a961b44441cb5f627c29f25962dd4"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00829-of-01024.json.gz": {"num_bytes": 320001237, "checksum": "0653e4052fb7a4ef503bdfbbee332d650492e99c130a85c04250e18d91cfd30c"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00830-of-01024.json.gz": {"num_bytes": 319240468, "checksum": "bd56e55e75a8237b5292fa65e5ecb0dfbabef6ef0dec6695b13522803210f40c"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00831-of-01024.json.gz": {"num_bytes": 319174603, "checksum": "ca9d6c643127a390823655256a45462ee6e75aa2485141f6530a3bdf6ce4f572"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00832-of-01024.json.gz": {"num_bytes": 318909883, "checksum": "e91c35d94e183515e660cd8c874c12bbf22e1fd683312446f02287b0d032fb68"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00833-of-01024.json.gz": {"num_bytes": 319095835, "checksum": "971d9a4f8bfce564d42dc0a80009acfa7d2f47557ac19836ab426defe1877714"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00834-of-01024.json.gz": {"num_bytes": 318319786, "checksum": "159412a58fb8deb59e039fa0102bdb746065cbc6b4d1d3da892930fbf8b0f178"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00835-of-01024.json.gz": {"num_bytes": 319959334, "checksum": "814518d53b3023e3b8ac22dad9d65dd50d455a4c7db1490022f447f793f4d24f"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00836-of-01024.json.gz": {"num_bytes": 317642779, "checksum": "19ad4fbaa3ff5c638b77980300b8c162c21a8237b87d054a30c46aee67d0ad94"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00837-of-01024.json.gz": {"num_bytes": 320687986, "checksum": "190de7948a4b163047ecdfc856e5f78bbff52ca883edfad26b32fbc0b57ffe36"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00838-of-01024.json.gz": {"num_bytes": 319802866, "checksum": "ccb4d342791a187f3bde225e008ff8cf70465f7fd3eacaa8bbce1ec4e52c2622"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00839-of-01024.json.gz": {"num_bytes": 318621894, "checksum": "3ff5cf5b33996a663df5783f3f41a5b5b2f6e08a2cf91e74cad3bf82291192fa"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00840-of-01024.json.gz": {"num_bytes": 319757379, "checksum": "8292e0854c01ca79ef03dcc1752ddc1f0df747ad67551b7c0fa5208b6aa3f822"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00841-of-01024.json.gz": {"num_bytes": 318779722, "checksum": "9eee9e089bd396adf5a276eddca9f6352e07f8c33877f85c1f65968aa0c06128"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00842-of-01024.json.gz": {"num_bytes": 318692591, "checksum": "caf3f40a144b43af08687e41a1eb7d08da1b78cd1600574566e11f29fde9cd34"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00843-of-01024.json.gz": {"num_bytes": 318944616, "checksum": "e74d624534091173546755ca236e5912cc8acf8cfef5f9c197b541ebe76f0818"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00844-of-01024.json.gz": {"num_bytes": 319392887, "checksum": "e47d3f44f996398b54f18729f4e81d88d04b19bc529847e86277a6a91ae74e6c"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00845-of-01024.json.gz": {"num_bytes": 319215311, "checksum": "de7cffe64f422b02668137272943537946c15539954b564345d6722c4eb06345"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00846-of-01024.json.gz": {"num_bytes": 318129297, "checksum": "1d5ea0ab8fcb3975735aa421d646cea4544087f60a79ec209b63c93b6318523f"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00847-of-01024.json.gz": {"num_bytes": 318134095, "checksum": "6fa4c50808df2aa8efebae3bbf832ba2b0be2f7113633fef720cffb3c50143a0"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00848-of-01024.json.gz": {"num_bytes": 318521356, "checksum": "3aeb657aa448af82551c653802c669c985c00b7daa593de07f80733ae5dee84d"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00849-of-01024.json.gz": {"num_bytes": 319541694, "checksum": "1cc016f58a4a2c54625214f028df05247ed319b8c1868c96c2efe8147a73d08a"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00850-of-01024.json.gz": {"num_bytes": 318861613, "checksum": "eb5fbe6eeb4b0281604df264a5b04a3a0db96ff0d04f252375a788a0d3345c67"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00851-of-01024.json.gz": {"num_bytes": 319356648, "checksum": "ffe1397f1d412979cc66820555ef27345f3a2a48b8bcfe682d48301135e8c12a"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00852-of-01024.json.gz": {"num_bytes": 319662372, "checksum": "fa78ed98d602276520e823e17adc7f796320d95e27e08d84d06e66e415b79161"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00853-of-01024.json.gz": {"num_bytes": 317625507, "checksum": "b10cff62fac5191b9cb5e2025227adb838088773e79bfec0937a34bb857e1b1f"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00854-of-01024.json.gz": {"num_bytes": 319665550, "checksum": "15441b2a7c09a477389a8fbd7401c549dc8281f2bd44251b1546077301e24624"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00855-of-01024.json.gz": {"num_bytes": 319059897, "checksum": "f6127845b162181dd7157dd316021a4e6b5d41393c66d3e577491cdb74657f2e"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00856-of-01024.json.gz": {"num_bytes": 319243991, "checksum": "ec9f0884c5ddf82550105f969222d3ee8b0d4907a0a2540ea6c8c67c2d2e9179"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00857-of-01024.json.gz": {"num_bytes": 318546680, "checksum": "840205fa73336ff51d75008ce8c530164ebcef3b50f1ad8deab879a67acf8d5e"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00858-of-01024.json.gz": {"num_bytes": 318306547, "checksum": "e9b3819e9dc98d66a61f8f4e8f6ecb03099c79ae87a175fe1ae484174b173b44"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00859-of-01024.json.gz": {"num_bytes": 319088302, "checksum": "eced8de72f8755fa0dfb690c626cefcacf5fbbce97029d4589058913c31b9339"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00860-of-01024.json.gz": {"num_bytes": 319704792, "checksum": "90a169718609f16abe120c4b63a20adc0bbedba51de14b004d34dabe530339f0"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00861-of-01024.json.gz": {"num_bytes": 318444445, "checksum": "d020840f09fa426ee15d19f05e5afd9cf674048e0dc4438dae0b6f02c7227d9f"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00862-of-01024.json.gz": {"num_bytes": 318606300, "checksum": "e02bf9d3f1a398972f7d78b9b1aaff9a92146554a1358ea1b16ce7873a9f8fd8"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00863-of-01024.json.gz": {"num_bytes": 319273730, "checksum": "c977f143cbb5e61160ce76f1cabf7bea6c158abb7e159ec3362aad1cc7af0ade"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00864-of-01024.json.gz": {"num_bytes": 318143165, "checksum": "bdf20dbde61f0663feb70be419c39c60acdc7ecbbe1430d47bf79ae2e114f168"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00865-of-01024.json.gz": {"num_bytes": 319041356, "checksum": "11c9c068ec5c1b612494c1473b7cace67a55ee66155559b19035df180ee260a1"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00866-of-01024.json.gz": {"num_bytes": 319758401, "checksum": "ab4436f283af0ef2d33b93cf026907cf68255beee9d9dc1d6c542dee9c3f48a3"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00867-of-01024.json.gz": {"num_bytes": 318991336, "checksum": "56beb5edbca3b66981f5f8e65f2a13a0f6e99e68ff50cc263cc529a4d8ebf371"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00868-of-01024.json.gz": {"num_bytes": 319984390, "checksum": "b9368d2ae0eff869c70c1a1214126c1d084f56887102d3d46e450b2c934102be"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00869-of-01024.json.gz": {"num_bytes": 319462888, "checksum": "68ab404e0ca2247686eb264a0d7feeb9d2460162434f5babb2b1da82d865343e"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00870-of-01024.json.gz": {"num_bytes": 318426018, "checksum": "2d60208a558f6ba92d6c6307e1ab626acd7ff3b7bc25963b09e87e464751c42b"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00871-of-01024.json.gz": {"num_bytes": 320233396, "checksum": "ee2517922079c713605dafffe6bc0db0a947abf64ff92c409aa1015b92cdb099"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00872-of-01024.json.gz": {"num_bytes": 319570251, "checksum": "83ca4f125bd628cb28210fb874db717635009e36c60b42237bda48fcb611a53f"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00873-of-01024.json.gz": {"num_bytes": 318755978, "checksum": "d94ce49fd17da5f70d1a89bc9e5323daa54f0b8417e1ee5d991467c80c068ec7"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00874-of-01024.json.gz": {"num_bytes": 318986904, "checksum": "f634915d1b529d9d728fd96993bb151dc07016767cd44ceeedddec73eaf37074"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00875-of-01024.json.gz": {"num_bytes": 319116193, "checksum": "6367b1216e1c6ab18af66471d866f39caeb9a538209134a9e6bbbcb81bc51db7"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00876-of-01024.json.gz": {"num_bytes": 320829257, "checksum": "c9ad4ab8c6e5995aaacd72ebc6654b43b4756804bf3cea808610f9b618f98fac"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00877-of-01024.json.gz": {"num_bytes": 320082625, "checksum": "835ae7d54732c309bc9aff231268474af66653b06ad6ca17b54dab6f4a7d30c5"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00878-of-01024.json.gz": {"num_bytes": 318964554, "checksum": "49c761449d5052dd6c408268c77196bffc5125eb5189390f73ba0ce8550f0175"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00879-of-01024.json.gz": {"num_bytes": 318699617, "checksum": "521e1c5fa967a6f29641e7c4c2b210acda0736b32f318e24aef0e587895ed492"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00880-of-01024.json.gz": {"num_bytes": 318723630, "checksum": "dee1814b24f9bbc3aa3430cd80302b08b863eb1b92698158960b6be216845843"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00881-of-01024.json.gz": {"num_bytes": 319839271, "checksum": "9e57ea6a0e3d8a7798a0cb3e6344e1711e8fd879e2e396294718ff360fc7c4df"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00882-of-01024.json.gz": {"num_bytes": 317773196, "checksum": "2e5e5749618e53668222c7d310929e2177772dd7c14592e61dc86f163e353c8a"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00883-of-01024.json.gz": {"num_bytes": 320262049, "checksum": "f80afaa4495a2d41ad4d7380b79040569179b24ef5c2df17f75ce8e135d786b1"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00884-of-01024.json.gz": {"num_bytes": 319146213, "checksum": "77338479b420dab9316a4737fc243de84b5e88392cbbb46fa0619045a42432cc"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00885-of-01024.json.gz": {"num_bytes": 319022605, "checksum": "3a67fee2fb77e64aa13fd595d7786b432203f36712ff723ec5999a341834b38c"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00886-of-01024.json.gz": {"num_bytes": 318624429, "checksum": "2afe387f2500c57294acf1403a8c27f27f6c7c2d228dee0f1ed70a02c438f838"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00887-of-01024.json.gz": {"num_bytes": 318733911, "checksum": "3fe087b3441f74730ab137ba9486650cfedfe2d724573c3d166565d7d1e40938"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00888-of-01024.json.gz": {"num_bytes": 319926754, "checksum": "dd2df1977458cac34ef1e52059bbc28738e541761d7ad11c0ffc8ef3ca061190"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00889-of-01024.json.gz": {"num_bytes": 319085344, "checksum": "4172244cc3fc4a4e9e09f04f8097cbc678aebaedb9d1fb97b1daae16b0b8ef45"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00890-of-01024.json.gz": {"num_bytes": 319838671, "checksum": "8ffaf34eb8209e7ec250303298f9eebd2833fedcf80414c20331e8dbed42251c"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00891-of-01024.json.gz": {"num_bytes": 318169092, "checksum": "daaf74ba5d12a7415da94be0f4454336aa3d86ad5cd300dbe30cef596835ac8e"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00892-of-01024.json.gz": {"num_bytes": 319662776, "checksum": "6d99c0419a6c9633620fb0aa7b7610cc5d06696e839a1a52953fd7db7a18e053"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00893-of-01024.json.gz": {"num_bytes": 319541919, "checksum": "5f246aeacef0dc8d40a036bb1eeecf278f66d7215a134fb746d30f3420d18c18"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00894-of-01024.json.gz": {"num_bytes": 319528897, "checksum": "9975fd5d23d25938f00de3fc9240d77c27b4784c2f443b1914652a06d3b59fcf"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00895-of-01024.json.gz": {"num_bytes": 317548307, "checksum": "7af9e2abfaebd4afe05a0e28d3e6e3126800a8b9b7ad49de360e42f2eb2c8506"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00896-of-01024.json.gz": {"num_bytes": 320278601, "checksum": "1941689d6a0e449423faad6e41714f33d5b23cdb1bb73961a888a87678fc74b0"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00897-of-01024.json.gz": {"num_bytes": 320161831, "checksum": "3d951cb1ae4a9b3c6ff70555139435febda83d24bb04ea27b229a05424b470c2"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00898-of-01024.json.gz": {"num_bytes": 319341305, "checksum": "3227b97aa9ff57b62be2a26fd8131e9ea45f7731673acb43432e529ea4978a25"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00899-of-01024.json.gz": {"num_bytes": 319658969, "checksum": "c746f8bd5fffac933640ff39db0b9d7b022edb28d7a4b3237d8c69fd919b7b48"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00900-of-01024.json.gz": {"num_bytes": 317494627, "checksum": "0327f0c57a668b2b34e72f4c53d4cfaeed787d879843d0bba27b5be58d1ee5fe"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00901-of-01024.json.gz": {"num_bytes": 319683481, "checksum": "886449092779ee26fccd11e0c89c36e449346dc6b1f0a7cb15b6b53c897790a3"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00902-of-01024.json.gz": {"num_bytes": 320228529, "checksum": "6960d8539df78e98858ba8cebb2e637b6c2ef20890b5f2af1cbf4621b52c364e"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00903-of-01024.json.gz": {"num_bytes": 318961279, "checksum": "4ddb3c9e9276d220f1d4dfc32bb61a090e895e9e3c9f53c169db99a024e7cd95"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00904-of-01024.json.gz": {"num_bytes": 319926290, "checksum": "69a941cbbcb673efdb254c162854fcfff6fe1132182210235b91d1d21ed4d2ed"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00905-of-01024.json.gz": {"num_bytes": 317982280, "checksum": "1d9613f366b91102d018e57894df520aaf1910aa98e06cf369d9676e498610c5"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00906-of-01024.json.gz": {"num_bytes": 319012210, "checksum": "4855989c814582f5cc0a5e9b8f9d1f642ae33de81625d4bbafaafb709c1cd260"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00907-of-01024.json.gz": {"num_bytes": 318515420, "checksum": "8f34dbaa454215922a29fea975357e4e705381a65e4dcaf8b0d8c200f9a277bd"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00908-of-01024.json.gz": {"num_bytes": 319286320, "checksum": "536bf0610a2c14d1d59aea0b52fdc29cec19cd7eaa4c3a5e5fec04dee103b29e"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00909-of-01024.json.gz": {"num_bytes": 319938295, "checksum": "3bb3943183f579c15d0d30440f6c82d0c9c64d6ded398dfc7c67502d73868781"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00910-of-01024.json.gz": {"num_bytes": 318423425, "checksum": "adbdcf170531c725b54c1e5713676b789589b2fb77310f3e64a0cc30b83602ee"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00911-of-01024.json.gz": {"num_bytes": 319578185, "checksum": "a1342a95ce77013820c36e7d038ed47ca4d40cdf3584a66abc310132435b25fd"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00912-of-01024.json.gz": {"num_bytes": 319154715, "checksum": "4973afcb1d7b4816e3a3df1b9ce1e48a0eea4fe8ead5f83ea753e46a934e5ddc"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00913-of-01024.json.gz": {"num_bytes": 319011218, "checksum": "c9a158f69a123859569e1cdd475355afda32d7e5c48001591f0b6c20dc17d572"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00914-of-01024.json.gz": {"num_bytes": 320027387, "checksum": "61f6c0f839908e7d3105a6926c501bcacd293d1ba50c3b8639ee227c9a8270b1"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00915-of-01024.json.gz": {"num_bytes": 320280632, "checksum": "a74fb91d8f7d79b09017a7f996b6ca5d59e4ecad9fec354ac977c0076d53fc66"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00916-of-01024.json.gz": {"num_bytes": 319278877, "checksum": "cbbb8dc274fabb4435db5fef5da1d91671e1a4c7f3f652742324f9632b01c5dd"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00917-of-01024.json.gz": {"num_bytes": 319616831, "checksum": "31e62cbd6209fb7831078e4a262d1b25c0590f9425c62b2b208d4030ed5722d4"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00918-of-01024.json.gz": {"num_bytes": 318635363, "checksum": "95e5c2f51abc9ef4c0422e91b77f79ff83c8cc38e585df621fbc0dfef48a84c7"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00919-of-01024.json.gz": {"num_bytes": 318885096, "checksum": "ea5960d4fbc7d5e7097edbf2c9c706e6b7c7e9d3e36633be9bd68c4038955f10"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00920-of-01024.json.gz": {"num_bytes": 319228627, "checksum": "73b721ae576dcfa83bd963e49530f73d76b788a669e3abc1c02189900c80cf02"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00921-of-01024.json.gz": {"num_bytes": 319557114, "checksum": "710c65cd504e87b5019c01f658e669d1e023473d879913a9522760d33546cf24"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00922-of-01024.json.gz": {"num_bytes": 319356053, "checksum": "f0b54b3c6b51a356debc9414df0438ee525ae5114cbb7c8176634b7493095022"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00923-of-01024.json.gz": {"num_bytes": 319766600, "checksum": "d5b80091c8113c283d91ff5826b46068b96c423c0dc74a646e2c8d1c5d815cea"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00924-of-01024.json.gz": {"num_bytes": 319733540, "checksum": "56a54c7d4114c21c1657df0d295839c2bd4904cd1b651104e2a155c2bf1b5aca"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00925-of-01024.json.gz": {"num_bytes": 318944357, "checksum": "4d396c29cd1d9ba16016fac37c333c0a872f6cb0e9faae7966e53f6e5c879d67"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00926-of-01024.json.gz": {"num_bytes": 320276135, "checksum": "39a64c261a76d5e13f187f12c886b22e2db08fba968bc9d0c1cb0d3c241abda7"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00927-of-01024.json.gz": {"num_bytes": 319181837, "checksum": "86db529dd52fb67173588fcbc9f0e52c99ad6dd34e44865150bc6c962de5b3c1"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00928-of-01024.json.gz": {"num_bytes": 318966114, "checksum": "d232df8033ddaa7397dbcfa8ba4ded9421ee9bfc091c725b311fd963b29f13eb"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00929-of-01024.json.gz": {"num_bytes": 320087917, "checksum": "fca6bfe8fe17c867681c58df081f2186dcc6bf22e46ce3783f85b918644c0b6a"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00930-of-01024.json.gz": {"num_bytes": 318921677, "checksum": "b8031359e758cd835c44e81303e04ef7b2137d2e1a9472d7e04552c353d883c7"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00931-of-01024.json.gz": {"num_bytes": 318978028, "checksum": "bb5f2ea8a2e56c69813bdc08cb243c0763126e7b5f6c5cb57e7f4767d2126f89"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00932-of-01024.json.gz": {"num_bytes": 318627424, "checksum": "f6fd2065ce202d5347243a2b396707bb606be20c1829989bd7dff6d9fb7adec9"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00933-of-01024.json.gz": {"num_bytes": 320226802, "checksum": "b303d2ece81c1f7b882703b915765212796518010aea6a108a441dd0a84a6128"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00934-of-01024.json.gz": {"num_bytes": 319908526, "checksum": "e5b05714922d132073122e83933853f52f0046c9f51f985cfbdbd310e8d677de"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00935-of-01024.json.gz": {"num_bytes": 318941663, "checksum": "4296055a31409a778c516afe25a8108f23dfffaf13cac33e5ed834a37c46b37c"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00936-of-01024.json.gz": {"num_bytes": 318430860, "checksum": "4634630c012ed184b264ea01c97f7bb3f1af030f2466f1d99d20bb0472f74511"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00937-of-01024.json.gz": {"num_bytes": 318008229, "checksum": "131cc9a2fef4ebe81749f1844b7c4b194b97de7db4f5253ce59207e68d8b4df8"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00938-of-01024.json.gz": {"num_bytes": 319099506, "checksum": "fff55e3b2ff8b53e56ab99def626a7334ce67d2414351b2e83d84298052dd9b6"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00939-of-01024.json.gz": {"num_bytes": 320457851, "checksum": "8431e38c86516ed88d5c028f4a1dad32b02bcccdc03f9687d18f8312e493bcb7"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00940-of-01024.json.gz": {"num_bytes": 320607829, "checksum": "a68c577555781adc777c09c68f623431469d67e9b66af7b0813f09a512b7d777"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00941-of-01024.json.gz": {"num_bytes": 318923471, "checksum": "807ffde4034b6b95a5eacb71f093686586ca11e417517894cca99dfe7b12563d"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00942-of-01024.json.gz": {"num_bytes": 319880902, "checksum": "d03d04f619a8f3afbefa6d67986f50d5ee264c45de36c0ba67b069e343e002ad"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00943-of-01024.json.gz": {"num_bytes": 319079341, "checksum": "e482c4dee03a34a1a5756e6def26134c9a3f18ee386f5569d6cbf16d3875a429"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00944-of-01024.json.gz": {"num_bytes": 319436318, "checksum": "6241f9f35640598c05bc5cd00d8cc024dde59c0065c8935da229a8a583de32fd"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00945-of-01024.json.gz": {"num_bytes": 318998098, "checksum": "85f192c1ee9734da0f1dcad31c2b8111076977582e139ecc1ba959bf2df6b262"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00946-of-01024.json.gz": {"num_bytes": 321951470, "checksum": "44bccedf6a8db115bb6563d6775ff03c67511ce4e23a2de77e79edcb568c9fa1"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00947-of-01024.json.gz": {"num_bytes": 318689631, "checksum": "36f0bfa191ad7d51452d51249c724150f8c3774142df3720f176f2772f42f3fc"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00948-of-01024.json.gz": {"num_bytes": 320347661, "checksum": "f4a7afa90b6d81a4cdc99100b75b4d3174c4d5d670042766c3e0418b7a97ef80"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00949-of-01024.json.gz": {"num_bytes": 318054841, "checksum": "f39d0c9bfc0a562ede67b8cfc57e6974a8a999e2bbc1b6940f107169b4f06e4a"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00950-of-01024.json.gz": {"num_bytes": 319722042, "checksum": "bf376260e5a838b3b901ceb22f922829619be710718446ee95c24400cbc73495"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00951-of-01024.json.gz": {"num_bytes": 318315382, "checksum": "987cd895f63bb74c9d4ce229ee853c7bce53c75c324366a0d06377c36030e39f"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00952-of-01024.json.gz": {"num_bytes": 319247792, "checksum": "d218dda02748a22821c2ecccf1cbb136dc8772a25ddfacc7ab354fc089470e87"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00953-of-01024.json.gz": {"num_bytes": 318411551, "checksum": "698768f3d7959b33fa74a3827e995b0c184bb3b4c46eba667d7dc3365fdd07f3"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00954-of-01024.json.gz": {"num_bytes": 318809810, "checksum": "651d9ff43d5a3f7f5945ccf26b9410018248bf64956f3485c50b0df9034fb2ee"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00955-of-01024.json.gz": {"num_bytes": 319761211, "checksum": "29fa5c68fb8d3719e5f5f17568ce888522de64499554b5f0f4dafafb4ee5b40b"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00956-of-01024.json.gz": {"num_bytes": 319255736, "checksum": "333a90a9c13f71e41a7cdd4784684bc142c79ef99155b9d62d062db318798b93"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00957-of-01024.json.gz": {"num_bytes": 319504417, "checksum": "730c90615fca09c81d9644cfae40d325851bb9bbc1af696caaadd67d8282ab5b"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00958-of-01024.json.gz": {"num_bytes": 319066016, "checksum": "bb565af6529720ba2a3e989769b33d978ef49cb2aae49c60f2ff98a981414280"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00959-of-01024.json.gz": {"num_bytes": 319887940, "checksum": "8992783693dd0ad5ce07427f6b5739c818f13952d90bb61312ec98f9c813f313"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00960-of-01024.json.gz": {"num_bytes": 318051437, "checksum": "4773edbc822ff8d51ec13af6c371214aea7545047d9babeeac0b29180d52fa0b"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00961-of-01024.json.gz": {"num_bytes": 318373291, "checksum": "ff33854746566f7d3b4ba9eadd1329ece48c034345fda000d9af73cb26d197af"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00962-of-01024.json.gz": {"num_bytes": 318572513, "checksum": "a6d07f7caf55fda0df74a22b454d196fb2e29312d433bc5506b00448c22b579c"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00963-of-01024.json.gz": {"num_bytes": 319488084, "checksum": "453f666c6578376508b1fe8bd3fb8ea5bf030aca5cfedf383cd23b27de15228f"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00964-of-01024.json.gz": {"num_bytes": 318905670, "checksum": "74f64ed6583e6a4df4b3c3f8a76263a2d63905d51d5680d9683d86f5039d5b56"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00965-of-01024.json.gz": {"num_bytes": 319452844, "checksum": "88016c1a0663b89dc3d76689c827c82a6d128401ae05f7b70c8727d75302cd47"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00966-of-01024.json.gz": {"num_bytes": 319334588, "checksum": "dd9300bdc27513dd62578e1cf3c8302647b49c61185c282a684011d788c43d17"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00967-of-01024.json.gz": {"num_bytes": 317872396, "checksum": "90747ee63ac7d8176fde1f2afce8deb7e39bf19e682e17d0fcc1711d09d5f1d8"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00968-of-01024.json.gz": {"num_bytes": 318988069, "checksum": "2cc785d650013d35d5d31b1e85c5530b197687c69117881362bf6b98f47c22fa"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00969-of-01024.json.gz": {"num_bytes": 318324244, "checksum": "83750d93c788ad32a256862b8173db3549eedf52ac131f09f662f1fe0f46bd13"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00970-of-01024.json.gz": {"num_bytes": 319494164, "checksum": "e0e46e185851ec569dc13a18519988ad926bdcd9bf448eff00aebf6df141f5cf"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00971-of-01024.json.gz": {"num_bytes": 318714665, "checksum": "941c9bf116353230417950d292c38b12b00935184162227eaec01870ab7f4510"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00972-of-01024.json.gz": {"num_bytes": 319518275, "checksum": "de30e19a155a6f4303afb0311416aa84cc3baf5a09cef55b8e2adc2a4f478f6e"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00973-of-01024.json.gz": {"num_bytes": 318092574, "checksum": "f70bf6727f1f308d93684ca41e9c2c68dfbd737a90da6375b58f162e8470fdea"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00974-of-01024.json.gz": {"num_bytes": 318555677, "checksum": "109fe184ac9498ac571cd9c6cb38ae5ed566b0e98e8b7718984656a70cc6b224"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00975-of-01024.json.gz": {"num_bytes": 319045215, "checksum": "03c4257851857450f7397ac3d627a60ffc98708ad5aac6e1f73e6ce818fe7be8"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00976-of-01024.json.gz": {"num_bytes": 319172031, "checksum": "7d98fa662aa9d0ff7ed50cc72195bdda2147212b34a3d22f0f757a4eb158d5b7"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00977-of-01024.json.gz": {"num_bytes": 318650530, "checksum": "bb8ccc07ecc6fd39ae97136418efc543efe5541e85910a7f333ee5cebaa3b595"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00978-of-01024.json.gz": {"num_bytes": 318609909, "checksum": "40b49f3fbb2fce73bb1851304b290fc7fb400d13c2448ac7e5e559dccfda7ce5"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00979-of-01024.json.gz": {"num_bytes": 318881197, "checksum": "b29f96cfba574428cb66f54b20c4a848bc83438256167afdaed576a3931117a0"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00980-of-01024.json.gz": {"num_bytes": 318506081, "checksum": "a15996adaaf41e5615cb5c7fa2ef1b4e3003836542d0851d1c6907522f534fee"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00981-of-01024.json.gz": {"num_bytes": 320000305, "checksum": "38e282b433c4e3dcc9fc2b056f6ddbe4eb857c5137f7c51301d53ca259d6bdc2"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00982-of-01024.json.gz": {"num_bytes": 319959158, "checksum": "97d5e58088a87a15b71db975d5e09b69daf497b7dff3ef809e1b8292caa27905"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00983-of-01024.json.gz": {"num_bytes": 318921242, "checksum": "f062e04f89132576ac1969fdaa43db761a0ff7e4269a6f173d87fa011a4c289b"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00984-of-01024.json.gz": {"num_bytes": 319577980, "checksum": "e52a6c08d5243717f21120b4c3ebc8fcf77168928945adf68bc665392a6e8d11"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00985-of-01024.json.gz": {"num_bytes": 319812101, "checksum": "8b4f5645ae0e0b190af4ca5335c57735ae919d3c6402438af506c7907f1d1494"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00986-of-01024.json.gz": {"num_bytes": 319582409, "checksum": "3654109968d918aa4d8db17cb7057111c42894cfc7eee093df13036cfb3ac6fa"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00987-of-01024.json.gz": {"num_bytes": 319957581, "checksum": "4b9e6febb461940b993c50945a2ed06736c6786aa8f758565ff545814ebfddcd"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00988-of-01024.json.gz": {"num_bytes": 320346479, "checksum": "2891565dd75fd4354777b4f4f393983180584ee9c64b5d9b4557dbf26a3c4cfd"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00989-of-01024.json.gz": {"num_bytes": 318546717, "checksum": "929d0236c9fb77d638e0a18aa97b00004316bbb0ef3c4323e39f61aaf7c0af53"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00990-of-01024.json.gz": {"num_bytes": 319606761, "checksum": "6ebd2552ecdcce7b194d4f6d5b5e66ede9d65da4e4999ee8ec4705d847e473ac"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00991-of-01024.json.gz": {"num_bytes": 319117521, "checksum": "1b3496964d0a895b347529ddb7b712d211c9419317fb41cdd6e20bba43f39f05"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00992-of-01024.json.gz": {"num_bytes": 317781551, "checksum": "9f9cfb5f9152b9a60121b03c24d944129c1ee43e862112fe3896e2772fef99a2"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00993-of-01024.json.gz": {"num_bytes": 319341839, "checksum": "fb329b7470ae127efe1be4adc960b06eec4f55bbcbe1f3f0f0b794d70a8aca14"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00994-of-01024.json.gz": {"num_bytes": 320357337, "checksum": "bbe9a60c3c2b3b5b11a5d531d1d85f0a90ebe3dbc79189b3825e169ae302932f"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00995-of-01024.json.gz": {"num_bytes": 317824612, "checksum": "26643091ae3425b63036453ffca7ed82c85c24b6a24264197e6516b68a39a4c4"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00996-of-01024.json.gz": {"num_bytes": 320453890, "checksum": "db33809437e62bf1f086f40e4d66ad0133db7c7d406b2ce52ce5d9c9b0809961"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00997-of-01024.json.gz": {"num_bytes": 319469732, "checksum": "3447b74f09dc4d63dd04d6bbd4382147071504338e6ea428b37c3a5174877537"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00998-of-01024.json.gz": {"num_bytes": 319562604, "checksum": "270a1c19e6321541398836d3d982c2e396db99abf94317912714251d1f68e8ac"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.00999-of-01024.json.gz": {"num_bytes": 318895764, "checksum": "d68f8f4d85d91679c20e972b2b1955d41a8f6601873bb311a2621f4b3f3152a2"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.01000-of-01024.json.gz": {"num_bytes": 317697031, "checksum": "68b47464ca3e97e9d3f4075b656f804c1bab667f231701db9cce1f0b0a921088"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.01001-of-01024.json.gz": {"num_bytes": 318915840, "checksum": "582216879b058ccd4d0ca2edccaa2db49b64459371f8798a1d9c66c06a0cf908"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.01002-of-01024.json.gz": {"num_bytes": 317811256, "checksum": "6864299a7d0174f92abc696dc293524291623891b86cd69132348fdf78760a4e"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.01003-of-01024.json.gz": {"num_bytes": 318605529, "checksum": "4ef35b7546266f99eae5f332cbe3e284801c5d7b39f840297d67e71c036edf62"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.01004-of-01024.json.gz": {"num_bytes": 319379897, "checksum": "040dfa80eaf8355370d8a50692bc3ad03a1d57272af340d70031a4398f37b9ee"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.01005-of-01024.json.gz": {"num_bytes": 319515177, "checksum": "012ac70ef2715181ec1fb578a2366d68e786d3a9ea41c59c08d7c494b89b429c"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.01006-of-01024.json.gz": {"num_bytes": 320078217, "checksum": "46030d85d8333ae224320fa54e487f3770de7de280cd0001344136b0bd87c431"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.01007-of-01024.json.gz": {"num_bytes": 318526753, "checksum": "dd432d865ef3dba4b5af30e42b11ace96900bd7b97af053ea892292e75bd142c"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.01008-of-01024.json.gz": {"num_bytes": 319407137, "checksum": "165cd3a688be6f9f5a4cedde198a9dda4f9d3dbc1d275d1e99411f3ee96a0d62"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.01009-of-01024.json.gz": {"num_bytes": 319763066, "checksum": "e44e86d497f8471e53531374b0e6ee61aac54996b6af64a4af0f5620673f9f7d"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.01010-of-01024.json.gz": {"num_bytes": 318653930, "checksum": "61115f16e718d3a2b66574cc17841aa5d02739762138abe3c9a7f325cf9f2e31"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.01011-of-01024.json.gz": {"num_bytes": 320037079, "checksum": "65e18df845f1e6cce1bb92a45f71274dca94d3f0ece1d556116085b5c0e6338f"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.01012-of-01024.json.gz": {"num_bytes": 319753418, "checksum": "cd5a8ee1bc7d9ad58e98aa6fe56d60501115592519a19efcf9fa370668c6327b"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.01013-of-01024.json.gz": {"num_bytes": 318657671, "checksum": "986ead2c1b37f4094aa6f7a7882824ff013e6393323d5290d7f3e9215589d07b"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.01014-of-01024.json.gz": {"num_bytes": 318028602, "checksum": "3c82c0611fb1fb0f635eaedd2bbe7cfc9d53d1ae967a9cbd0416def046e4b104"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.01015-of-01024.json.gz": {"num_bytes": 319164504, "checksum": "5eb5cf76022b12d8751a2fce5c4d4831066785a68edd7b3cd3dfc10017f91621"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.01016-of-01024.json.gz": {"num_bytes": 318474894, "checksum": "a99d827be814e27d948264d6ae55c6a032a664f3ff0ef6ae94bda90f7faf29bc"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.01017-of-01024.json.gz": {"num_bytes": 319516762, "checksum": "7eac25ebb9383a4592023634b852d88a128604c494972a8fd9e2b183fbb303a2"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.01018-of-01024.json.gz": {"num_bytes": 319433935, "checksum": "35adb751748043a36f22b412d3ea0e01166037cd96216f516abc547e9d2609ea"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.01019-of-01024.json.gz": {"num_bytes": 320305440, "checksum": "54c4d52564221e48dc5354cb51d447658707ab8edaa3d6d8fec5ec379a29d462"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.01020-of-01024.json.gz": {"num_bytes": 317445661, "checksum": "edf1c6ab9900d75b91738fc7e9e3db8cdde3f9ef2234ff249833b5cdb04c65a2"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.01021-of-01024.json.gz": {"num_bytes": 318134525, "checksum": "1c5e670ec9d815637e9bdbd75289c7ef7f3ecf384e32f403ae8a9fe2595cc983"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.01022-of-01024.json.gz": {"num_bytes": 319809162, "checksum": "9def881764ca614c88ceabb41032d3e145f06c843a7ceebd87dba6b93c974a6e"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-train.01023-of-01024.json.gz": {"num_bytes": 318155801, "checksum": "552a6a2be423c0ecbb767611074200c5b85c1cf76c8640c79e3be5e967b293b5"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-validation.00000-of-00008.json.gz": {"num_bytes": 40471190, "checksum": "1f25b6af12da84115301d4ee93ea5246c8fea5bb4a2008472794d95b917cc97f"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-validation.00001-of-00008.json.gz": {"num_bytes": 40675053, "checksum": "db4c23d7a336032de37dfe2f3ed39653c8afd94004d4e8d9c73c03222299292c"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-validation.00002-of-00008.json.gz": {"num_bytes": 41175078, "checksum": "4bf6b248b0f910dcde2cdf2118d6369d8208c8f9515ec29ab73e531f380b18e2"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-validation.00003-of-00008.json.gz": {"num_bytes": 40728516, "checksum": "082b72c1ec600502df2e4403df6884390c85627ffdf37a5b700397c9a1ac6b8e"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-validation.00004-of-00008.json.gz": {"num_bytes": 40920200, "checksum": "37c2ce46864db0b6f1fe89220ebf4ef811ea10485c8336f1712227bbbdb530e1"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-validation.00005-of-00008.json.gz": {"num_bytes": 40921460, "checksum": "00b164e59df49df5dc1df170db99bb0d9207a6329cb9272ed8b6ef7a55058359"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-validation.00006-of-00008.json.gz": {"num_bytes": 40549809, "checksum": "86896a9baffe0ab9df39a2901f0e515009989ca1fec9a42583d718ce16166b5a"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en/c4-validation.00007-of-00008.json.gz": {"num_bytes": 40446172, "checksum": "0bf87534c7050091c60466df50f174c3147d052ec7dc645da9574c902445beaf"}}, "download_size": 327104523018, "post_processing_size": null, "dataset_size": 1658004128680, "size_in_bytes": 1985108651698}, "en.noblocklist": {"description": "A colossal, cleaned version of Common Crawl's web crawl corpus.\n\nBased on Common Crawl dataset: \"https://commoncrawl.org\".\n\nThis is the processed version of Google's C4 dataset by AllenAI.\n\n", "citation": "\n@article{2019t5,\n author = {Colin Raffel and Noam Shazeer and Adam Roberts and Katherine Lee and Sharan Narang and Michael Matena and Yanqi Zhou and Wei Li and Peter J. Liu},\n title = {Exploring the Limits of Transfer Learning with a Unified Text-to-Text Transformer},\n journal = {arXiv e-prints},\n year = {2019},\n archivePrefix = {arXiv},\n eprint = {1910.10683},\n}\n", "homepage": "https://github.com/allenai/allennlp/discussions/5056", "license": "", "features": {"text": {"dtype": "string", "id": null, "_type": "Value"}, "timestamp": {"dtype": "string", "id": null, "_type": "Value"}, "url": {"dtype": "string", "id": null, "_type": "Value"}}, "post_processed": null, "supervised_keys": null, "task_templates": null, "builder_name": "c4", "config_name": "en.noblocklist", "version": {"version_str": "0.0.0", "description": null, "major": 0, "minor": 0, "patch": 0}, "splits": {"train": {"name": "train", "num_bytes": 1029628201361, "num_examples": 393391519, "dataset_name": "c4"}, "validation": {"name": "validation", "num_bytes": 1025606012, "num_examples": 393226, "dataset_name": "c4"}}, "download_checksums": {"https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00000-of-01024.json.gz": {"num_bytes": 396728190, "checksum": "06fcf4d9bf6ae45fac94245952f000c924d2a0b5cc8841c916b3ee949333410d"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00001-of-01024.json.gz": {"num_bytes": 395686133, "checksum": "8a0b64c5efb1db1ebcc0a664c801221049f5812652dc1a727a0e9f8d0df0cd0e"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00002-of-01024.json.gz": {"num_bytes": 397762165, "checksum": "087fabf9563297a6eab8bc39b68c0c6d15169032001d3a17c9bd964080759f2c"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00003-of-01024.json.gz": {"num_bytes": 395307518, "checksum": "1e5b89200528320e354f60be0868a3ab6dbbe667a6b16b48e4739b988a6360e8"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00004-of-01024.json.gz": {"num_bytes": 396280504, "checksum": "8291badbe84854960c0ddac3d6c226cb519268d1b3fd267bd72cfb4f10800de1"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00005-of-01024.json.gz": {"num_bytes": 396636600, "checksum": "c74226ceada7d78e3e7a2ad931d0a99df93f4cc4377ec69d4f1fab4164c3d845"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00006-of-01024.json.gz": {"num_bytes": 395364336, "checksum": "4e52e99dfc4e55c41226978b4dbf48fac2f886b9b0446bc3bd576f32bdd7cfea"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00007-of-01024.json.gz": {"num_bytes": 396428805, "checksum": "283ae93ecc3f8daefa9c47651ded763dc5f339ddc619c8cb5e32dce9cb9cfe4c"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00008-of-01024.json.gz": {"num_bytes": 395030041, "checksum": "d3fc7fffdf9c2172d233bea3bb7dc485d753319e6196672d0186b8ba04a1d903"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00009-of-01024.json.gz": {"num_bytes": 398255693, "checksum": "61e10cef5c2cab162fb1d26f97fd9d76b30c9ee989c01ef8597d2a4e35b303da"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00010-of-01024.json.gz": {"num_bytes": 397825333, "checksum": "f72040887c2a2c17564c2c6a9a4b5ff95fce6a0eed4f0800cdeff8277af651ff"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00011-of-01024.json.gz": {"num_bytes": 397877458, "checksum": "ee34ff11164e10a86f76593205cb13986c70ea3d3a8849174a6dfb5b4ec91262"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00012-of-01024.json.gz": {"num_bytes": 398317059, "checksum": "7a3ef558efaca3e5d19e9ad02b47dd61f9639dd806130b62d66e9c3341c0edce"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00013-of-01024.json.gz": {"num_bytes": 398518794, "checksum": "f5a6c18992ab2b59a9c02469d20768bf5757624e03bcaf92957ce736a3a9edb5"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00014-of-01024.json.gz": {"num_bytes": 397026214, "checksum": "c174b625c1534c69814f8e4879169b58af96f801dbb433113740af0d78535abd"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00015-of-01024.json.gz": {"num_bytes": 395621683, "checksum": "4e8e52a602d4eb4b27104780f4a36617505505fb66a82f36e90631a4e668f5b9"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00016-of-01024.json.gz": {"num_bytes": 398138551, "checksum": "a3e7a95b16f09e09e45f1c3bed3524415581e21b065d8efcc66cece705dee4d2"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00017-of-01024.json.gz": {"num_bytes": 398720813, "checksum": "79cdb89052e8dcecd1f1319e47f4c4ae1d350ab81777a9ba8077cebdb558e795"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00018-of-01024.json.gz": {"num_bytes": 398538940, "checksum": "8da6aac3a794ce326b5a3971fb75a2ee848f008940d4f1bedd724ce7c5874278"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00019-of-01024.json.gz": {"num_bytes": 396834319, "checksum": "b57c93502949dad9001e89847947f6c65943927eb519e16de4eaf5590b235faa"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00020-of-01024.json.gz": {"num_bytes": 396402861, "checksum": "05e14c7e21df3d4af7be7a597fa22463868464d6475282376536e12e82367401"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00021-of-01024.json.gz": {"num_bytes": 397560852, "checksum": "756d15d8b07414dffd7cff3efde606aa62cf8f73b85d8e1cd17408d6a339414b"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00022-of-01024.json.gz": {"num_bytes": 397210987, "checksum": "60aa08d9c5d813d5f2448d910bc23a705cdd0828a9403c18ec223e53623889cb"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00023-of-01024.json.gz": {"num_bytes": 397563062, "checksum": "bd865213ffb2b40c2cd3eb16724b68c0f37e29f68215990dc84d91852c7c0d72"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00024-of-01024.json.gz": {"num_bytes": 395799120, "checksum": "08ff3615ecea3eb5b55703e123475c95afbecfe7107eedf05750147c9ffd12ef"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00025-of-01024.json.gz": {"num_bytes": 398336372, "checksum": "e3e30b97e585fd881b3a1b006775854a11a2b967d992e7eea886338d8beefb13"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00026-of-01024.json.gz": {"num_bytes": 396819084, "checksum": "fddc9e1a8405c5e05e63ce98b19c7833c0fd46392b4b55532b317e7f81426590"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00027-of-01024.json.gz": {"num_bytes": 397912380, "checksum": "d3e597b3a96b993840e47adb761cce2f2ae1c96aefcbd6c250198dedaecde15a"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00028-of-01024.json.gz": {"num_bytes": 399078461, "checksum": "abd6d2341b6c61cdb89b80a8b9bfd938bb6d8a423a89e6a9f997c22c6479d537"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00029-of-01024.json.gz": {"num_bytes": 397303107, "checksum": "ee35a3af1056cdab79b644f6352150aeb6fb19a630cd6bc893a072e35fbfbad2"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00030-of-01024.json.gz": {"num_bytes": 396602401, "checksum": "1d04d4bc295aee2ab80b24f587f8c483599db7d5a8157acc99a1d8b001f8353e"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00031-of-01024.json.gz": {"num_bytes": 395941329, "checksum": "cf1dd244555511245c0e6a5b1dc9c24f747b8377674aa3690677ce08ebb8c26f"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00032-of-01024.json.gz": {"num_bytes": 398049663, "checksum": "c83e5572647eba5ab14fdc4dcba8efb6981740b99b8f634e2c6b1942a051c249"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00033-of-01024.json.gz": {"num_bytes": 398044404, "checksum": "b76815aadcf4ad802071428864ce0b406cabd73dfc2be5e20b44885ec6a85419"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00034-of-01024.json.gz": {"num_bytes": 396885224, "checksum": "da00d92418fbdb9799d8f16977b3a33f67cb98a31808544cb68cf3b42ea9adf1"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00035-of-01024.json.gz": {"num_bytes": 396185021, "checksum": "265ad43ce00666c83fd441d35ff29ba1ebf7d62442cc3e3c176091b4c725ea9d"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00036-of-01024.json.gz": {"num_bytes": 396702503, "checksum": "4733156df48f2dd0f2e859fef28f56d12a84e8012085ca9318073ae647b0fcdc"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00037-of-01024.json.gz": {"num_bytes": 397582277, "checksum": "7d62d03c3496ee2e17ab6b9635710efef9e4cefb88ddccdc16ed720a414c38c2"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00038-of-01024.json.gz": {"num_bytes": 396186761, "checksum": "670affddf8fcca6933af3f5b30efd1bf490c3e38c3e90f2e8e9a464994d613f1"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00039-of-01024.json.gz": {"num_bytes": 397056953, "checksum": "4acbd97f9c8fd9a930a6f4284a11cfe37f6cca3b5858ae3c2cde747dae35e0d2"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00040-of-01024.json.gz": {"num_bytes": 397809786, "checksum": "d350e48a36bb1ba3125f72a07ed8024d26eae6d89ecac686ac0bdf3d5d89e1a7"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00041-of-01024.json.gz": {"num_bytes": 396944358, "checksum": "817a58dc40440b8b1f54d129db08ae9124e0293e5a0e45f034fbffb2140d90c0"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00042-of-01024.json.gz": {"num_bytes": 394327995, "checksum": "6bd6bc1269c2dd81db466ae9c41f76b8b8cf71cc7bd6e131452fa1a1318ff459"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00043-of-01024.json.gz": {"num_bytes": 396476043, "checksum": "f3525d9c861d984ea0cdacba7fddffaef058d8f95aa99ef1f09f9f0792fde5e3"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00044-of-01024.json.gz": {"num_bytes": 396893614, "checksum": "292ca2b6b9ba41567fe7cc60e5424aa1f3e431ac874d06ae8eb98794563a7d35"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00045-of-01024.json.gz": {"num_bytes": 395885483, "checksum": "ea2c8fac41ededba7da8bf2bb48463d83f148e5c0970a689876d4932ab18a3c7"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00046-of-01024.json.gz": {"num_bytes": 396963386, "checksum": "97672d9bca357cd2721f51301aa37d37a271dd3ca7487244c057570b995da66d"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00047-of-01024.json.gz": {"num_bytes": 395856712, "checksum": "52c517670ba4eefb262cb71373d6370f86ddeb0aea7391a47a22d52a55bff7a8"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00048-of-01024.json.gz": {"num_bytes": 396091027, "checksum": "49f5b68e29c55eb50da941eab1cf446c7d8c9d0b30290318977edb39ef0b887f"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00049-of-01024.json.gz": {"num_bytes": 396892998, "checksum": "82a51eb6f301c00d927ca7920338247038cf4e9e0072d74c02bac897701f5859"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00050-of-01024.json.gz": {"num_bytes": 396308050, "checksum": "d72f92ecd27b716cd90cc4abe562d25fe6d49740b4a3d1fb9beac2526a61988e"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00051-of-01024.json.gz": {"num_bytes": 396137777, "checksum": "a956e4d086077f7ab309ff10b0eaf4833e4d3ed74435293e96588f4361e1536d"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00052-of-01024.json.gz": {"num_bytes": 398302544, "checksum": "5a54f7faa07661ea6a5f0585ca49ad66c8f7025fd9627b3af832dc886d50f78e"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00053-of-01024.json.gz": {"num_bytes": 399616791, "checksum": "7f8fa496d50a0b7c399faff4c1864e24717b3f9c86b2552536c8f91e3e0cf9d6"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00054-of-01024.json.gz": {"num_bytes": 397332881, "checksum": "ab862f26b4fa38b6c16d8cfd0d63a9f0973827e45915e85aefb95d4e182b7b9c"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00055-of-01024.json.gz": {"num_bytes": 397075146, "checksum": "cb67aa9229bec8b88e496829aa0a60ca1c3ff4a2293632cf7782b69aa71aebfd"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00056-of-01024.json.gz": {"num_bytes": 397827600, "checksum": "2f63e3ec40d32237d4a50c873b966d7fc2c16ef5c04a2bcfc33328b128654e7c"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00057-of-01024.json.gz": {"num_bytes": 397533583, "checksum": "7c90bf39bddf8ad0c6a8bb3dff02caea8bbc2abbd76047c5d523930d2a00dbc9"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00058-of-01024.json.gz": {"num_bytes": 396411363, "checksum": "ee6059f3c8a2df34858a0110a06ec4e9673555fa56c1a2b40930337ba5b1b39c"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00059-of-01024.json.gz": {"num_bytes": 396735510, "checksum": "d9dbe2421edba1820294e757d88aa25455db42ce8992f8933b51cd84cfc35a36"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00060-of-01024.json.gz": {"num_bytes": 395694553, "checksum": "b05d6502fc95587fa7047fac64978d6be13761dcc6954629332812e5937c2731"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00061-of-01024.json.gz": {"num_bytes": 397740757, "checksum": "39303faa5dc33995dfec683b44fc24066ecccdf6b5001b9c0644d8e9899d45f5"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00062-of-01024.json.gz": {"num_bytes": 397358263, "checksum": "fe27dd467cc2c34abe5b0bb34473ee68859f2198eeb78304e1d2e54460a67383"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00063-of-01024.json.gz": {"num_bytes": 396826654, "checksum": "1da2c414bd03e5547d8c9c7447e42b8dcff5f6ca8ba35c53076f2895e8ea63f6"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00064-of-01024.json.gz": {"num_bytes": 395781869, "checksum": "af96de4d6b5bc1ab0527efa33a73d7eb788dca15829acbb7291ce72ad05e6c66"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00065-of-01024.json.gz": {"num_bytes": 398192274, "checksum": "7f46ccfc1703fee106e932bc9a1bc5dedf7de944172cfa34ec9b31413bf0bbda"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00066-of-01024.json.gz": {"num_bytes": 397133438, "checksum": "dd3b67d8578927d7474dae76bdca35f35a2aa125fc50873e4a9f6e73d7a81831"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00067-of-01024.json.gz": {"num_bytes": 397204214, "checksum": "4cdc87a7c9fea33e15d638e5c921f45149212769bfba5f59f0a5943398ca0d55"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00068-of-01024.json.gz": {"num_bytes": 396489592, "checksum": "64d175c23574998f8c5d28ce3d3f3934144b1fd4f6527ede1aa3420c28bb90d0"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00069-of-01024.json.gz": {"num_bytes": 397697351, "checksum": "3329857f531c9fa22d98bd567638f0564f73062da1478ca84385246f71baabff"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00070-of-01024.json.gz": {"num_bytes": 398449973, "checksum": "bd13494aa03a95d943a01f3436f62c46ee3390b30f6ff0fec0636f3c0b09fa1b"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00071-of-01024.json.gz": {"num_bytes": 395498960, "checksum": "5e69529ae82c305acbf1f58a7021b4e3fc67285a871dcbcaaff0781d0e721070"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00072-of-01024.json.gz": {"num_bytes": 396170387, "checksum": "9b9c7e11b9bb2cf6ea0fcdfd58754f522a95070feae74c29559522e12e1b41f4"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00073-of-01024.json.gz": {"num_bytes": 395915819, "checksum": "87a2069589fee8de23730b8b994ba59d63d5128175b5326ba0a8c8ac9e01a3dd"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00074-of-01024.json.gz": {"num_bytes": 396986018, "checksum": "e073efb3f00db65c1ee14e8bfa6e8c807f7827d0f3dd4d4026f823bc6f61b1cc"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00075-of-01024.json.gz": {"num_bytes": 398555103, "checksum": "a1793748c7979e241ca34291c843ca3cc90dd7643f04810b6cd324220efbd6e7"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00076-of-01024.json.gz": {"num_bytes": 396357420, "checksum": "7b1cd69788ca9a7e614de70a8b908183f41f316eaadf3b0236a7c4e126db9844"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00077-of-01024.json.gz": {"num_bytes": 396666167, "checksum": "aec828d3c2a1f7fa970de328a8fd1a85a90493dbcbec4f50816ccbc2275a1fac"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00078-of-01024.json.gz": {"num_bytes": 398167446, "checksum": "e14bdf5af810574aca7c6f3daa67e503f24ab1705435a62129c66c248667ee97"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00079-of-01024.json.gz": {"num_bytes": 399696096, "checksum": "b63756f81b8b19ecdc9bf227045df10840cbf973b60bd8ffdf28f58a53cdb028"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00080-of-01024.json.gz": {"num_bytes": 398755610, "checksum": "dfc118f680b79260e7ece75f27c0459484eb8458f2422df9f1918f726b54ccb6"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00081-of-01024.json.gz": {"num_bytes": 396606787, "checksum": "17d6a503947f5132728f53ea62fd093f55bf2dc6a32316a5c0413353cf13eff3"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00082-of-01024.json.gz": {"num_bytes": 395714484, "checksum": "8ca41818ee6a0ffd5b00714779289c18cd97d620258c5d3d741c482b72344300"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00083-of-01024.json.gz": {"num_bytes": 396807173, "checksum": "12d87c0a948f32f788497858751c3ef22f289136e6ae58518a97a2e976f5cdc8"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00084-of-01024.json.gz": {"num_bytes": 397241529, "checksum": "7c3da4ca4d2b2077f0ab7be511038255732fc88d954f2f17cb0f3ab144216206"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00085-of-01024.json.gz": {"num_bytes": 398357369, "checksum": "26df55183e78f8d69fb16e21d07edf98659b69bcb3c48f340da6a5bc44007f4d"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00086-of-01024.json.gz": {"num_bytes": 396997317, "checksum": "09f0641e9075cb88800d0eaae3f7b99b047552edbc71d1fd2d8594f645d22c2a"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00087-of-01024.json.gz": {"num_bytes": 397978000, "checksum": "c9437ef5f58a46b8a6d8efcae37fa658da3f2c4f1cad0f9cf47fbcd09bb82f8c"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00088-of-01024.json.gz": {"num_bytes": 398468913, "checksum": "be187fc14017f666b84ed7049c169c1a28654441c2f523eee8b655b3b9d9ba8e"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00089-of-01024.json.gz": {"num_bytes": 397071121, "checksum": "637c3f964ee2c750a0a175f2e5d24b786a37d37701f10616b448804d68b72f4e"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00090-of-01024.json.gz": {"num_bytes": 395753807, "checksum": "8eef7ff1a8080aebe5226cc3539baac46ab64d93f8e3ffb6e8b7ab3346e151dc"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00091-of-01024.json.gz": {"num_bytes": 397039764, "checksum": "a2904ae5bf69b393a697afd62ae9b8a560c1f076e8a141e6f3feef29cb5d1352"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00092-of-01024.json.gz": {"num_bytes": 397058578, "checksum": "eb4d7e2712a9983bc1581133fa8eaa2e1d28b314861833bd8d810d615ec1ed81"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00093-of-01024.json.gz": {"num_bytes": 395855981, "checksum": "5c9a7573a5644d89d46666306d333ff1e4af3213f287cb9adb48ef87a023d479"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00094-of-01024.json.gz": {"num_bytes": 399516118, "checksum": "de7ae1508815e48ba031762c084cf6946b084871463821407090d23c197c6474"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00095-of-01024.json.gz": {"num_bytes": 398236235, "checksum": "616cef1f21ef078ffb9fc2b4148735668debdd15a8bc1be281183ba3659e9fcd"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00096-of-01024.json.gz": {"num_bytes": 399526010, "checksum": "eb754381b8a6f3c74dda5ee5852958f7b69c707a3908cbaa9410c972e002a0cb"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00097-of-01024.json.gz": {"num_bytes": 397935028, "checksum": "6d6d2ca80708b7c6ad4240a042dddc2170060e8976c2e7b4ace446d2f2395076"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00098-of-01024.json.gz": {"num_bytes": 398645934, "checksum": "568db6971230fb42df8973ecb5a2a6d77204aa8cf0bdf47b386c04370da8dfd1"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00099-of-01024.json.gz": {"num_bytes": 398110916, "checksum": "9bacb381e3b06976619e816e40ac2ccd3bcf3cb9ecd30c294b388cfb75c8bf77"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00100-of-01024.json.gz": {"num_bytes": 397631228, "checksum": "7d515ac0f767736600a216ebe7280b9751f16e70df969ba601d1aaae15f201e5"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00101-of-01024.json.gz": {"num_bytes": 395102356, "checksum": "87c5c81e154e136f3e090ba91682ad54fe678653f86f6f32002ae5ec3c9aa743"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00102-of-01024.json.gz": {"num_bytes": 398926159, "checksum": "2df85a9ac13812c3870180901dbba99b52e53fc045da019160a3f06d0dfa5e95"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00103-of-01024.json.gz": {"num_bytes": 398383820, "checksum": "8134d12e84ed4a58a5f8f6eff8a4349f7d6ded6a1d7539b5c23193571569d6c7"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00104-of-01024.json.gz": {"num_bytes": 396628542, "checksum": "208f0cb3365b0243d70e7b4e52ff977e9b11d8e451adea521a5bf6e10cd40ee0"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00105-of-01024.json.gz": {"num_bytes": 398737797, "checksum": "855ac7b8cb621a240319ef00197d2f20338d17db71a1aec68fb66930bc17c59c"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00106-of-01024.json.gz": {"num_bytes": 397281064, "checksum": "544d5d91d066f2450bfe622ce55bdfe16a300aee9c05aaffae8a645966bc695e"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00107-of-01024.json.gz": {"num_bytes": 397919761, "checksum": "f4af405c0f19c9139d93b3073f3fe328be998c9dc6f74afc7e21ad068964b92c"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00108-of-01024.json.gz": {"num_bytes": 398810219, "checksum": "bdfce29353c6caa33b178bdebbf7e48526c391bc6c71180e3fa378b723879563"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00109-of-01024.json.gz": {"num_bytes": 396605124, "checksum": "ed6acc172bc9af0e31170f5533001a8fcd344e6732a4b3a714b7ad43740f25f4"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00110-of-01024.json.gz": {"num_bytes": 397491755, "checksum": "428b6c91f12c4f7032fa692bbe887f1a4c02635eb88b91d876da4c71f3da5e4e"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00111-of-01024.json.gz": {"num_bytes": 395754897, "checksum": "a723863559edf291fd8a6c2736cc1cefed70dd3c8625b967df049ce0d373f68a"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00112-of-01024.json.gz": {"num_bytes": 398567649, "checksum": "a90ddc9ccfbca20b9c75bd2b7d63ee6abd03236a0f0dd2827eb9f7350d9c3931"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00113-of-01024.json.gz": {"num_bytes": 396706569, "checksum": "479052b6b9edcc2bbda40b982976e7e28d84fad7b2dce46b017f4e3d1f61e0d2"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00114-of-01024.json.gz": {"num_bytes": 397384355, "checksum": "a95984e4c261a3057d1bc51939aefd9413853111e19030b19c5d26f778be00ba"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00115-of-01024.json.gz": {"num_bytes": 397702826, "checksum": "5eaf7fc2c9d4b2ee3e216c215da7f4fc7558e89d6993033b95a940a78061ab05"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00116-of-01024.json.gz": {"num_bytes": 397252590, "checksum": "268033cbbdf3be9790cb6010791693f1b490af06f9fef91b0b307420a4e30a08"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00117-of-01024.json.gz": {"num_bytes": 395506730, "checksum": "cb80908eee1054ddaf7e2e5d66c9a41505025c2b6dc7fe6aa287db0a9f3829ff"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00118-of-01024.json.gz": {"num_bytes": 396452136, "checksum": "d75bf895c88ff2e9c4031c1f65b067222cfbb1a937d685ab4dd33369f5f5ff7b"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00119-of-01024.json.gz": {"num_bytes": 396777389, "checksum": "2c00362f4d99cef2bae2f13f17b79ec56a5ef8aca18ffd56a12fea2308e5017b"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00120-of-01024.json.gz": {"num_bytes": 397730478, "checksum": "e31296949f7ce2e2a74fd2443552cb64b9f3cddcca691097a56992f51033fd11"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00121-of-01024.json.gz": {"num_bytes": 396593647, "checksum": "c2f0f81e3c835848a47532d8fd1c215a624f47740196a7bb45b5099916853014"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00122-of-01024.json.gz": {"num_bytes": 396576172, "checksum": "72edb7581a623e20f26cae4885f3b9d7f329581921253ca4d7ceedfbca17b7b9"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00123-of-01024.json.gz": {"num_bytes": 397378329, "checksum": "4f045ce7bd077b7f878012aead8c51073022448de66d2e35a755d4c8c4a6f59d"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00124-of-01024.json.gz": {"num_bytes": 396545003, "checksum": "dc7949657328520d31a27d8e267c2ab07cd4e8639036d4b1bb59454c309f862d"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00125-of-01024.json.gz": {"num_bytes": 397630505, "checksum": "530bd95e5ef9a1d5989c595e60e0ab11583e0f42d16b2bd37c49ed09a67af207"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00126-of-01024.json.gz": {"num_bytes": 395483747, "checksum": "d9df071edec6959ba842509f72ad43be3ea3f529b60d48f3dfbf390908887a5f"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00127-of-01024.json.gz": {"num_bytes": 397295159, "checksum": "02b61f5bc7d1d241484c4f04fd517960ae755a69f35192bdd5bb471baeba5614"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00128-of-01024.json.gz": {"num_bytes": 396276865, "checksum": "0c7d618df232c36ba018269ddf3b2863cd6d63bb7fabeaae33fd508715bd8ce2"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00129-of-01024.json.gz": {"num_bytes": 395314703, "checksum": "03443afda032187d2dc2e696ce6eaecbf2219e6dabbdd593379e97c0e00e3112"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00130-of-01024.json.gz": {"num_bytes": 397411481, "checksum": "8969873d5efd3df0cef1742e4bc67f2df7a5b5d9e641f7a12e77c7e8e96a1bf1"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00131-of-01024.json.gz": {"num_bytes": 396925311, "checksum": "31adc39ea4eda8667662608bdad6bb32bbc82b1ee1ad53ceb4df50924a933bdf"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00132-of-01024.json.gz": {"num_bytes": 395826124, "checksum": "d2f035ba2c388fec2d847bd43449c885eadd0bcab5fb8afdf031a53e72c4ec32"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00133-of-01024.json.gz": {"num_bytes": 398892794, "checksum": "b7ed60983058a5f9f0ef72602789f50359f415ecbe60dc967e7a869866d833b6"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00134-of-01024.json.gz": {"num_bytes": 398206890, "checksum": "9ba78624879aabb72bae0b4119fa2625793915382031ed897a0b4c3f2863b8aa"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00135-of-01024.json.gz": {"num_bytes": 397161888, "checksum": "9fa6fee55f5e8f887dcc64d94cc65ada6f283a580edc7926cb159b80d0084ea8"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00136-of-01024.json.gz": {"num_bytes": 396185585, "checksum": "81a1fcafcedfdd9bcb32d2467d9c963cc7d8b2f32e13e52ee04db41b0d3f5483"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00137-of-01024.json.gz": {"num_bytes": 396933735, "checksum": "c7558304b614e1cff13b0f6e967fc5ef77e4953a1eea1f39ed925c33076d7723"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00138-of-01024.json.gz": {"num_bytes": 396371698, "checksum": "3e896da8bf296403f7b4061ba0b24d3c3978993de4854fabd688cfce9fbf7bba"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00139-of-01024.json.gz": {"num_bytes": 397289537, "checksum": "1a5ffa3aaf565ccf4db7444983643ad06e386938a0a2d313aecdb972c36111e4"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00140-of-01024.json.gz": {"num_bytes": 396983259, "checksum": "4047916916fd9dd7b76a8cbc595d52803344467135f744b23bd10296004a47d7"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00141-of-01024.json.gz": {"num_bytes": 394947050, "checksum": "7edfc9e5870d80d470e3797e8bef5183e9d170eab410ab50957e946dde2e8199"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00142-of-01024.json.gz": {"num_bytes": 396852755, "checksum": "4affc3a24616858fab84211e3825e90a1ea7d9c8f2cfabbe9a5c9b24c21a116b"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00143-of-01024.json.gz": {"num_bytes": 397579248, "checksum": "d5aa9ba68e9b30576bd640f647d4069b6c56db276cc5229573440e4a38a7f1e9"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00144-of-01024.json.gz": {"num_bytes": 398800367, "checksum": "fa104e63eb7a8a6b066a5f00bf05b3ea095bad35a902bc728251f096173f1417"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00145-of-01024.json.gz": {"num_bytes": 396709510, "checksum": "b615ecd58821b1697c82094cb3435375924263827c342ab1b87e53907d4aa63b"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00146-of-01024.json.gz": {"num_bytes": 396042389, "checksum": "6004c782f3235490865b6634b2c4840a989745b70ef2da674e75c62aeedf8a6f"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00147-of-01024.json.gz": {"num_bytes": 399840661, "checksum": "5e8b46726f7ff2c3dfd381fb252f1b4bddf9436fd9ffd10fa300cb0fbe76998c"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00148-of-01024.json.gz": {"num_bytes": 397098215, "checksum": "0851cb274aff2ec4f781c82af11c94f8938a797aca5097fb0089299cb4c75aff"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00149-of-01024.json.gz": {"num_bytes": 397540697, "checksum": "7cadf4ef9b0e29d9e8f68474464dc072b78e909a0f03c74e61b67912ff9b551d"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00150-of-01024.json.gz": {"num_bytes": 396347701, "checksum": "521e4f67d12ae47b8f2a02b6f77e0c85cdf9a0efbcb45602d09ae116110ebe66"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00151-of-01024.json.gz": {"num_bytes": 394890490, "checksum": "2255bf3e1940ea28da9656028dee26865a9ee682cbaab4d5aeb34c081062f8fe"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00152-of-01024.json.gz": {"num_bytes": 399584675, "checksum": "f8ca4aaf5706ffb0f5518c7461d9045d18c645df068aa436137299e5ca77df82"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00153-of-01024.json.gz": {"num_bytes": 395606567, "checksum": "24f0e81dc3140f063ac89173fc262b01f2420133025b114f29632262cdd2e7fa"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00154-of-01024.json.gz": {"num_bytes": 397925578, "checksum": "5f40a87b15b0acebbd324e7c5cd2c0f31f911558d57f774f278634db94f2d5f7"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00155-of-01024.json.gz": {"num_bytes": 395428741, "checksum": "36281c154f187a09a83822878da815cd9b7f659a41cd90ac64653b437e798c72"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00156-of-01024.json.gz": {"num_bytes": 396799274, "checksum": "0fb66965107e54c9fed0013962763e874b940b0e174d775b21fa5e688fa53b33"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00157-of-01024.json.gz": {"num_bytes": 397321211, "checksum": "014d1443a4940fe95089bf87e245817d3a90c50e3e371a703098f5b9c3f6c759"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00158-of-01024.json.gz": {"num_bytes": 398736992, "checksum": "f912d27d68318fc0089fbaf8e0481ebe8dc5d2963cb89ed315f3bec637460bfc"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00159-of-01024.json.gz": {"num_bytes": 397250687, "checksum": "1bfd02a301b09bfd53058522d0613e1fbecb788d3173eb30b58115cd1cbdb477"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00160-of-01024.json.gz": {"num_bytes": 397492158, "checksum": "149a7bd76e9ea41185d99d21df870ddd4f32857fdd628cee927d6bee7d6a527d"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00161-of-01024.json.gz": {"num_bytes": 398383574, "checksum": "0c385b4c9b33574cdc75070309a0aed46aa7b2e3b8754a7692035a3c5a04f916"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00162-of-01024.json.gz": {"num_bytes": 397126197, "checksum": "5c012b2a6bbc9413914ed1420b6150a5549cd74185bf2788d8809005034d433f"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00163-of-01024.json.gz": {"num_bytes": 398201223, "checksum": "79448c338e86cea2609399705268fc6011cb21c4f0aff82e3fb7660391ce85c4"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00164-of-01024.json.gz": {"num_bytes": 397914908, "checksum": "dfb89631dce146ab4713a03f184e864472eb133b2cd04db8b4bccab688e9e287"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00165-of-01024.json.gz": {"num_bytes": 398142696, "checksum": "74acc88d6612aae7bdf5187d3b9eddcdb04cf60f1cc350661ffa50219a747f9f"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00166-of-01024.json.gz": {"num_bytes": 397533050, "checksum": "757d23402b3a155cfcb6b30bdc305c8014c9b64ba4e067753664670c2c5e9534"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00167-of-01024.json.gz": {"num_bytes": 396241119, "checksum": "521bd7a9dcfa0390c35e50a3d0cde3ea627ca538dfc419a97ed83b251d8a3005"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00168-of-01024.json.gz": {"num_bytes": 396041761, "checksum": "dc540ec27d5999f6a4c71f075ae1ec64ea84415c720cd2b6ef3fdac925e576da"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00169-of-01024.json.gz": {"num_bytes": 396350882, "checksum": "36d5d35075a82038dfdd5abd29a839f4e9ab79d51f0bbc635d3dcf3f5f1e2732"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00170-of-01024.json.gz": {"num_bytes": 396885157, "checksum": "db9a3f6a7e085007eee381357ea9e4d5d6f702580d38220860967ec441ba3525"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00171-of-01024.json.gz": {"num_bytes": 397266368, "checksum": "7f8098cb6532bc888d3c1f0ea5072cf8419ce1689b9ffe1c370ca20071e7e1c2"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00172-of-01024.json.gz": {"num_bytes": 397140430, "checksum": "90ae7e2551b1f3bf2e5ccf4fb3fac8fa3512add5e299ba7c90319611baf8c840"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00173-of-01024.json.gz": {"num_bytes": 397069631, "checksum": "a86f5ab72e1a9b1d491988154fd6400e6ee8c74378a9e64276df438a3c4edf9f"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00174-of-01024.json.gz": {"num_bytes": 396743897, "checksum": "451cfe8e14c17113a2f6673ece27e01f8d54bed1b57d1b20cb84f125879939ec"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00175-of-01024.json.gz": {"num_bytes": 395780705, "checksum": "3252e9781545bc3f9f19ac6e8fdb87d81cdc5a94838798daf6037c9f4f473db4"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00176-of-01024.json.gz": {"num_bytes": 396205053, "checksum": "49d1648d37150b90632a6459828eedd82deb2fce7f108bf4e1b050f2f9ad1668"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00177-of-01024.json.gz": {"num_bytes": 396248718, "checksum": "99346ccda762ae85038a10baba937ef8ef668a0beab483c4005dce77e331768b"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00178-of-01024.json.gz": {"num_bytes": 396634813, "checksum": "8d3bb1610ce79cf359d75f32e7624b6203140ed3eb276362b040615e9ffd4b54"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00179-of-01024.json.gz": {"num_bytes": 396524113, "checksum": "971e5c9499425294cf5945436b2ee419379a75bdd72d4cd6a33b1d17c17de298"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00180-of-01024.json.gz": {"num_bytes": 397938782, "checksum": "dd6b3e60219788b82ab3fc63a9e65f38f64aa2f7b294135ec2d16b36350f1f40"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00181-of-01024.json.gz": {"num_bytes": 399155769, "checksum": "c6a806d627a9d197789bfc6257a92b0223ca51e724c3c2ad10fe2397dbe30848"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00182-of-01024.json.gz": {"num_bytes": 396136228, "checksum": "2c48e3237253eaad9afc121e6946a9e1856bbe82c5a7cb287b05cff3e6ea8e8d"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00183-of-01024.json.gz": {"num_bytes": 397083292, "checksum": "52645e03ab47da01bb40226eb90042be914f1170688ae940314871e16cbb1037"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00184-of-01024.json.gz": {"num_bytes": 397402964, "checksum": "1edbdb41edeabc108f0147e18b439a75e390e0a843ed915f1cbf73a7c7f7867d"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00185-of-01024.json.gz": {"num_bytes": 398411052, "checksum": "ef071e52174a19597e567696262470906275c2cd1cbbb0b1e98864999ea2d463"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00186-of-01024.json.gz": {"num_bytes": 397122443, "checksum": "0d87080bc08f7f8a1952a7df57ce2bdbf61e40c05b61937c8c19ae0ecd952b1b"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00187-of-01024.json.gz": {"num_bytes": 397244868, "checksum": "4aed75ea9f885fc3dab599c19c7bb98f7d57ce2b2ec11ac8ab3258fa479fc0db"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00188-of-01024.json.gz": {"num_bytes": 395677432, "checksum": "342882e436ea826cda9fd38c0caca68bb35444a2a07596f8de0e53a3e2169f59"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00189-of-01024.json.gz": {"num_bytes": 393653750, "checksum": "22ed9e389f6c8410c9bde898d97ad798c236c2da4d0b2c76b86d013f8686da03"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00190-of-01024.json.gz": {"num_bytes": 395437920, "checksum": "b3f9ba5834d4f0280d6defd3bd50fdf961bee6be4c71ed47046cf4e115acab01"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00191-of-01024.json.gz": {"num_bytes": 396944861, "checksum": "4e7ed636a60edc44b5ba709dcd83bf4263ad8d5a06a02827d3d27191bf3731a3"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00192-of-01024.json.gz": {"num_bytes": 396611165, "checksum": "4fea34466d9b470bf0bc44455183b2c61994c4e71e4bfb684dff3b5e3870d1e4"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00193-of-01024.json.gz": {"num_bytes": 398283211, "checksum": "4c4e6d31f455831330971ed1e0c33221203401b817adbda5b53de16f8299a9ba"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00194-of-01024.json.gz": {"num_bytes": 398915952, "checksum": "dfd0b1ceb2a437da8cd38c9c791af809e94f2e36ab4399b2a45a5b916f4ccaa9"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00195-of-01024.json.gz": {"num_bytes": 396352694, "checksum": "0ccd90ced34b3ff28c21d015a87eca3f31eae2bf31f11f25ac073139f9d50c22"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00196-of-01024.json.gz": {"num_bytes": 398582922, "checksum": "f22e59765cec074a0c687c500f4e6348250d0e418d12dcba211e39c133aaf290"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00197-of-01024.json.gz": {"num_bytes": 398839554, "checksum": "95fa68cd75d77a1b5bb526dd5ef16a2f04a3520604f734baeb6e2d95608b5973"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00198-of-01024.json.gz": {"num_bytes": 396202192, "checksum": "f0e6343e8105178b38f75eade6774aa6e85b62a271622fcfcbe2745f1cae11ec"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00199-of-01024.json.gz": {"num_bytes": 398029364, "checksum": "4c58736410c8d3c7174ce011e2f281cb16e4949d756ff4ace86b4a9d4795c04e"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00200-of-01024.json.gz": {"num_bytes": 395867629, "checksum": "1cb798ee6609e670053987d881d130d5b73db19d9f37fecff7a6da41152aba05"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00201-of-01024.json.gz": {"num_bytes": 396858169, "checksum": "7357eb22b2aa75c55885252c62d12e08cf8f7ef285c0052cf1d706c3f0f74fef"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00202-of-01024.json.gz": {"num_bytes": 397955766, "checksum": "8901d0f27c4c11916cda7cf806cd00000771b6351954c8503bc312cca5ad3a10"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00203-of-01024.json.gz": {"num_bytes": 397737882, "checksum": "ed51917fc8936701b681cfc49ef95b2dab451ca597e76b34ba90be9405a1a0b8"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00204-of-01024.json.gz": {"num_bytes": 396094006, "checksum": "88692bb8da78347cb97c0e0849d1a10a97b1686cde1f75626236b89bd507e2b0"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00205-of-01024.json.gz": {"num_bytes": 399027636, "checksum": "fb17fe19d1f0fcaa43fb31a3ad9b105b3d93fa287351c7f93fb599edb7f40bc3"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00206-of-01024.json.gz": {"num_bytes": 399406254, "checksum": "668d2a9927080b686a4d728236e4cfc780b262f9045dfe9575cfc48cb69d6adb"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00207-of-01024.json.gz": {"num_bytes": 396291803, "checksum": "928f451dddfe42bb2ca791dbc61c36ddc618006ef709eaccbc2beb665c8427e4"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00208-of-01024.json.gz": {"num_bytes": 397807368, "checksum": "11e8627b758588056b61d31de07c50092222013a38ba802b7a9ae34b6b8b84a6"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00209-of-01024.json.gz": {"num_bytes": 398085408, "checksum": "d49d31d1719698ab7a2b9ee91d887f3192c8fc1b6108152a75b39de2a0ad25a6"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00210-of-01024.json.gz": {"num_bytes": 397670254, "checksum": "049b3294c3e22e6db6c115979a4a55f0650966c600ca17250e91b241cc97bbd4"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00211-of-01024.json.gz": {"num_bytes": 399643598, "checksum": "7772f26fd90f47033670e7f1d3f6fe092116486bb9a991577f9560b54ed3832c"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00212-of-01024.json.gz": {"num_bytes": 397390768, "checksum": "7a24e4a70f43f6227fe6491fcc7bb6b2a19cae203521c803bedf8882c995d7e6"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00213-of-01024.json.gz": {"num_bytes": 398657925, "checksum": "21d0ee8d1a01957b56ac503aa88c6f3269b4e4692762a3f929fe0e7069be8c0a"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00214-of-01024.json.gz": {"num_bytes": 398282324, "checksum": "ede2d9824d8f99dd578a36ea82caae942ebcafd99f308cf5d0ff8aa4a56f0a05"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00215-of-01024.json.gz": {"num_bytes": 399178235, "checksum": "82516fa361dec02c7ed59ea2d0510d9ee4187609b449dca649a04141b12bc037"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00216-of-01024.json.gz": {"num_bytes": 397630870, "checksum": "4a6d5e60354b7b93f005010c6fc55c0a81596e98a116cdeec99e1ab4e58fd03e"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00217-of-01024.json.gz": {"num_bytes": 398628848, "checksum": "02dffb623b628a3a3ea38084fe6bb840aafab8419feed3d1f2bd3598cfa80aab"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00218-of-01024.json.gz": {"num_bytes": 395087998, "checksum": "e1e9a7ac7a922d6a9bb90f82cb48dff11ab7208dac08511e9613cd2726ca67ec"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00219-of-01024.json.gz": {"num_bytes": 397622792, "checksum": "955afc7d45a080ae137e9dc25ba3d85629a6a14c3d9bbe4065aa37d710345b7a"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00220-of-01024.json.gz": {"num_bytes": 395112655, "checksum": "a3560918bec20087e9908009a362957ecb06401924789e20b36c26e363db5ae7"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00221-of-01024.json.gz": {"num_bytes": 397132000, "checksum": "d8459bb5b6fb6b341b24fe517cfc5dc099765ad70c3383bae913229e06cf99e0"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00222-of-01024.json.gz": {"num_bytes": 397138513, "checksum": "20d3c6219921dc9c2928d637000e488635fd9a12b5636de5a6a7e52c1b67d781"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00223-of-01024.json.gz": {"num_bytes": 397167661, "checksum": "43a18accd194646893324537991e0162f6f98a9cec5ff59fe8fb510d81d707bc"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00224-of-01024.json.gz": {"num_bytes": 397905941, "checksum": "a516485cbefdef2e31a493cd8827a5f936f10674ff3525b71d414e17f48241c3"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00225-of-01024.json.gz": {"num_bytes": 397218123, "checksum": "791c85c78c5e7f3557855a1fc71acd860521710515b89f92e54e02960549f46e"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00226-of-01024.json.gz": {"num_bytes": 396619135, "checksum": "52a36037696e6245efad80e00d1f123c36dbd79e7ff52b1fb99f579e712d2b30"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00227-of-01024.json.gz": {"num_bytes": 396654998, "checksum": "e31123ab579fe95bd50afa10d52a51e9c15a4af28c06583fb5aeac4e3418f129"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00228-of-01024.json.gz": {"num_bytes": 396899165, "checksum": "86481361fff334dee3183fac8ab3f346e44ab3e6e7b35bbd7e6e062b2d2fa0d7"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00229-of-01024.json.gz": {"num_bytes": 397489378, "checksum": "bbb717711fb4c78ebe8a0476296a21a50285ec41d9fb9f08d5d66d899577e04a"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00230-of-01024.json.gz": {"num_bytes": 397462301, "checksum": "054414aac29b5c8faee71a918f2586ad3fce8ee44c71e7a2e2af4b91e0169523"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00231-of-01024.json.gz": {"num_bytes": 396097584, "checksum": "8136e320fccba75a493954fefbb560f92532be44a6e0990404edae659d48ce1e"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00232-of-01024.json.gz": {"num_bytes": 398984795, "checksum": "3d9362aab157beef3b5fcd4a0a0236d59de635a565b1c86423f45b26e8b437b5"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00233-of-01024.json.gz": {"num_bytes": 397258012, "checksum": "e1a532922477d17f7cbea7db72c2391d26b4db580e526ebd5a90be23607a8d31"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00234-of-01024.json.gz": {"num_bytes": 398350453, "checksum": "c464829565bcaafdba165b2d886be4580f3c0a516b5417853ffc4fe30049cffe"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00235-of-01024.json.gz": {"num_bytes": 397147353, "checksum": "573a6a1d33ccc6c5b605d381f04d73989504bb6d24514b938e92c3d4f61501e8"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00236-of-01024.json.gz": {"num_bytes": 396963006, "checksum": "21318462014bc185d0da7cbd342fddd07521401ca2b73e47eb5cb4bd42a82bbe"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00237-of-01024.json.gz": {"num_bytes": 397087111, "checksum": "49459c97b078726bf8377748d4bb2066bdfa47e2717315a9b3c8075cfc4b9b10"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00238-of-01024.json.gz": {"num_bytes": 396984031, "checksum": "befb46e9f928876edc580c60ea4242f63cf6df77c6c107fec6e4280d279e348d"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00239-of-01024.json.gz": {"num_bytes": 395915197, "checksum": "dc5ab17e04e4f2678771094af67909dcaa8be36a6cb047cfa66e75f986c91312"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00240-of-01024.json.gz": {"num_bytes": 398321096, "checksum": "25b92f7a499e9aaf0496a57f6292a7f65941b34dd6c78f14b08358d180070029"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00241-of-01024.json.gz": {"num_bytes": 396626980, "checksum": "1ae21ee5585ec718763a3c7bd70d9338aaf77d0e02f92a41f6ed213d1eefa5b4"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00242-of-01024.json.gz": {"num_bytes": 398220596, "checksum": "c29f98174a0c02a817d5cfa3ebb2a92d5f49df8a34fa40abd360f1b39b4bde05"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00243-of-01024.json.gz": {"num_bytes": 398250083, "checksum": "819387c95ea7183b1f9e1e78d077de65023c4809198ef3a0c946f46f8b6c19b4"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00244-of-01024.json.gz": {"num_bytes": 396943969, "checksum": "7a0b0b984d7afc4181827705212f917cf4ac12412f640a2c8120513763cdb390"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00245-of-01024.json.gz": {"num_bytes": 398365865, "checksum": "a424157137a5eeca89819d600deea2a1619ea8f5ae1ed395c88ac600a85e3afa"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00246-of-01024.json.gz": {"num_bytes": 397285385, "checksum": "73029f721bdaccd9d126e871973e70a551f48f077f5903656b305ea9885c4798"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00247-of-01024.json.gz": {"num_bytes": 397132841, "checksum": "b223cf1270d2c728592ec65b09599bbdef8d64f7df2eb525e114f86268500daa"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00248-of-01024.json.gz": {"num_bytes": 396316645, "checksum": "94102d9bcc086ed5b203bc0c6b830dd245c9bf6c695b23b19922b2a98eeb6a52"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00249-of-01024.json.gz": {"num_bytes": 396644237, "checksum": "36be793f4d76070ba1c696b3274e6dbab43f415c8fbaf752145cc99af6558680"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00250-of-01024.json.gz": {"num_bytes": 395860541, "checksum": "313febcf026d2cd1495fdd3d5ba3b492ce5d5749153e189672b6d9dff3e26a61"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00251-of-01024.json.gz": {"num_bytes": 396709140, "checksum": "7e2480b3d5869ba35007c40e18585f3fa208cdf8e004078cc8de4fac36773507"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00252-of-01024.json.gz": {"num_bytes": 396508847, "checksum": "25df46ae56c0d4a6f945922e31fc697d12e0b7c525be9bc2b8eced802641488d"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00253-of-01024.json.gz": {"num_bytes": 396364816, "checksum": "6b2125b9eab9bf893e7f8913a6beedbeeef5de53893fbd6172f706e33bab5177"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00254-of-01024.json.gz": {"num_bytes": 396122930, "checksum": "7947e5152c5305863e2d664622e3de49f9386b4384eb09630c5bfcad21fb458e"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00255-of-01024.json.gz": {"num_bytes": 396929803, "checksum": "a1ec8c609ac969c24e2524f0f3dc31ef43ca0147ffe66569d3135e4f28394325"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00256-of-01024.json.gz": {"num_bytes": 398432943, "checksum": "3fd0373f5a8974a3499c436d96ea73be95f5619b8388dc316f51aff01e9ecad7"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00257-of-01024.json.gz": {"num_bytes": 396003748, "checksum": "516cf3626076f083962983b2d6c596ef355609492f2e81c6c3cdec01acf8c5d7"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00258-of-01024.json.gz": {"num_bytes": 393890690, "checksum": "700760a7764f890c8aae337e7ee458c8467eb9048347edd237e341dd2bd5d236"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00259-of-01024.json.gz": {"num_bytes": 398130606, "checksum": "d868f8ef5e1cc971ffd00908bdc7eace32ec151d7405d7cac5fac22df9ea10c0"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00260-of-01024.json.gz": {"num_bytes": 399765969, "checksum": "7d5eb3b88eb8a0291ae70c1997458cf5aecac645397e50a67fab3d1193064353"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00261-of-01024.json.gz": {"num_bytes": 397418895, "checksum": "ca607c9e13d7cfb73a29ee3131f77e6bef3130d8627037cef9f57ed459185f0a"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00262-of-01024.json.gz": {"num_bytes": 397925991, "checksum": "ca789394ab4398c41490ec6147a41ffc8847155ea9ff74d7ff8b3402ed0634e8"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00263-of-01024.json.gz": {"num_bytes": 397082336, "checksum": "aac81d1bf0ade80758c14d01842b9b06c89ebf2fcdb9a06b1472bf2f70bbc348"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00264-of-01024.json.gz": {"num_bytes": 398101079, "checksum": "3cf56a2989b5c3f26ba94124cc534f5c9ae9770bdc6a3431dd745603b480ab19"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00265-of-01024.json.gz": {"num_bytes": 396949669, "checksum": "d4f252a6c2f43833d6d89bf69337449b4cae5dc88fd08fb20b35fe7194a50ddb"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00266-of-01024.json.gz": {"num_bytes": 396242007, "checksum": "71c745968d8ee4a0d64f38930a76e65d68ea094ba3e0b963d5d6878f65f51b34"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00267-of-01024.json.gz": {"num_bytes": 398342031, "checksum": "706a560c862979594265925c3200d4bd0981a9eaa279841f2cba673634f7074b"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00268-of-01024.json.gz": {"num_bytes": 396399468, "checksum": "eb3dea553c37f220b3b9b5f377d5a4ef94243b3c0b6b46981e3e5b7ba5b4a935"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00269-of-01024.json.gz": {"num_bytes": 397181296, "checksum": "4f0feae035dacaeb720ca3b6ea17685144895a0d78cfa358e30983f8d6c4ec76"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00270-of-01024.json.gz": {"num_bytes": 395712883, "checksum": "6e0f6de1e5a5c6d4bf23d0539ee72ecc2b4285da2b0f1ec2cdcc443d2e22aa88"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00271-of-01024.json.gz": {"num_bytes": 398066980, "checksum": "4c5cd1ef1917ed762d7d8c5c54e1da05db74e45721697df8b0626e0aeac96966"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00272-of-01024.json.gz": {"num_bytes": 396667308, "checksum": "77a33c37a5d88e419e2b31cf560d53f129a38e5bc2306b5baccc187b7e94e589"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00273-of-01024.json.gz": {"num_bytes": 396020214, "checksum": "b18e40c00b8e0e02dfac40ea0519964e231c8a2f28bc1294b044fb090f41a9fb"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00274-of-01024.json.gz": {"num_bytes": 396300833, "checksum": "34c8945a6ebac564fe87881d6968d05363a89985f297692a3df7104128b9c26c"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00275-of-01024.json.gz": {"num_bytes": 395206463, "checksum": "1e41d7e2a6117224dc23fbaae8e9d20df9d7744adb4687d2b0e570bf8d9e47f2"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00276-of-01024.json.gz": {"num_bytes": 396667995, "checksum": "45973b91c2f1140f79265a24f484fc6d6653f43f83d5bd2d18954892dfa4dfae"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00277-of-01024.json.gz": {"num_bytes": 398134029, "checksum": "b7da91889b6695cf01bceddfc139b23f9465bda5cad54088b84a1f5a4d7a4f9a"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00278-of-01024.json.gz": {"num_bytes": 397422615, "checksum": "e794a2903bda1f3c082e8f590383c714a518c202ecb99eda5513d6b320f70e86"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00279-of-01024.json.gz": {"num_bytes": 398776175, "checksum": "a5528d3e33151138ef9bdc2433744f1797de2b20673a570de5bd4d81b306354a"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00280-of-01024.json.gz": {"num_bytes": 396208086, "checksum": "1be2d8c3d0eca510fac7b06a5401b2b8873bc6dfbf85a3c736301756f9681309"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00281-of-01024.json.gz": {"num_bytes": 396893734, "checksum": "1db3e9017561d38a91c417ffef875b7a948c4f64c51b90b0983c71bc9d950903"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00282-of-01024.json.gz": {"num_bytes": 397411883, "checksum": "4e23d39fcec2c310cbde3fdc5d9c185046086877ac03bbf9d772b092614f93da"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00283-of-01024.json.gz": {"num_bytes": 397906911, "checksum": "850eb5e60b84bca4d2f10b2e511fdb2661e3d08444a07db1782ad85c754fe808"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00284-of-01024.json.gz": {"num_bytes": 396043261, "checksum": "fea24050c6aec13eb706a6f3854b4debde62b1b842f2992fc027820c66218b0f"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00285-of-01024.json.gz": {"num_bytes": 396961329, "checksum": "6052f82887cd2362320f72f6545d2e5b5a775e9bef95783c9b9995ecb7a5ecc4"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00286-of-01024.json.gz": {"num_bytes": 395697481, "checksum": "f4361838b5b679c8306447364166c1c3083af392b4c8793399c122af09c7312a"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00287-of-01024.json.gz": {"num_bytes": 398773520, "checksum": "9add91f23f31ff8c5d8d84e6a0af75fc6fa08ceef8ccd9b633d8c49aa1d0104d"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00288-of-01024.json.gz": {"num_bytes": 397684645, "checksum": "64dc94555a122353c3a3c9999e67d17b0e4b682096ba80be2258c791ce1c2b9d"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00289-of-01024.json.gz": {"num_bytes": 396655864, "checksum": "2472c76b1cbcfc3cb82126795673126e8f532119a03722a304396ceee9b7db3a"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00290-of-01024.json.gz": {"num_bytes": 397415313, "checksum": "960b71edbdc6a6a62a0d3cc1069bbbfb11893cc017aba543e10c9a23cb759d1b"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00291-of-01024.json.gz": {"num_bytes": 395617977, "checksum": "96e582d7a750bee597331f373ec2e16d3a9686f48a49d39765d39550c8cbbad8"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00292-of-01024.json.gz": {"num_bytes": 399332500, "checksum": "cd6ec4941aa5babbe274684945bf899447ec2459b8f7076ec8c74d2b3fe794c5"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00293-of-01024.json.gz": {"num_bytes": 397021546, "checksum": "d0d0c4d80e75c5d02103b49027d9e2e6f7db74c12f8b53f600d7fe420b2d0a7a"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00294-of-01024.json.gz": {"num_bytes": 396272726, "checksum": "caf5708a6989f867ec6c4c56f338aca9f3a43a1806a27ef473d9b0f219001cb4"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00295-of-01024.json.gz": {"num_bytes": 395233811, "checksum": "a7b5f904e34c0b370238e6beb19149d4bb96d0cce43a1eca3bfaf181952ede53"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00296-of-01024.json.gz": {"num_bytes": 396480926, "checksum": "4fcf284d98c2f7b63e47573e9d084eeec2516fbfa62be42c3ff94e1cf518e313"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00297-of-01024.json.gz": {"num_bytes": 398883718, "checksum": "c1cb458076497e7dee645f50281d1af2fe5dad556d28a2cbbd73abe6537c8a9d"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00298-of-01024.json.gz": {"num_bytes": 398733629, "checksum": "4a612c715025292e62860fb0018e9fa2d3fade692342746d044be6297e25a034"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00299-of-01024.json.gz": {"num_bytes": 398155026, "checksum": "d33f4043fad9551f92084a45b7f54d920ded9d6fec271cbbf85f71b021f9ee4f"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00300-of-01024.json.gz": {"num_bytes": 398612975, "checksum": "61b1181b796a2f40db3cb6954f2890397c3722c486dccd4075d74679cf61a70c"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00301-of-01024.json.gz": {"num_bytes": 395385748, "checksum": "95a78e9d3cece0620430c85822fedf4021ebd88ece57d6714933c268d3b6af6c"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00302-of-01024.json.gz": {"num_bytes": 397620059, "checksum": "321aed402a5e779febe9766294ad040a3f8dcf57bae68648c03d3c59023aafa3"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00303-of-01024.json.gz": {"num_bytes": 396549027, "checksum": "4198f6a2b5bdaf90ac4251f013908123a5964429870ccd6b245a9069278c4e17"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00304-of-01024.json.gz": {"num_bytes": 396596460, "checksum": "74a6440e93d18d0d6d0622ab7d8832d7ccc91c03297faf20c8090d16f7c042d6"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00305-of-01024.json.gz": {"num_bytes": 394881271, "checksum": "654deec494bba4eece19c27140426049574cf529c93ccb422fcc09fe4496af15"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00306-of-01024.json.gz": {"num_bytes": 397760377, "checksum": "e0840cbc94db6cfc35df66d413a11261756392dd59b0fdf89d9ff166ec76f3e5"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00307-of-01024.json.gz": {"num_bytes": 396671816, "checksum": "31ceb8cfcd09fda621a9a483b09dfb43f5436e867363f6736ea3f710a6af10fa"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00308-of-01024.json.gz": {"num_bytes": 395961013, "checksum": "8c1e5acc3f964eaa5aff300731a74dde84ed0671cd764b121ea638fb08c3dd0b"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00309-of-01024.json.gz": {"num_bytes": 396035179, "checksum": "7d555942b1bcb2518aa5ff9c0549d98fabe7bb563cdc6c73d3f11e6a0bc502b4"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00310-of-01024.json.gz": {"num_bytes": 397140669, "checksum": "859eeb7a9d2ed03d5299bbf7f1c3e719236477950d7601112a458ea5a2adf7c9"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00311-of-01024.json.gz": {"num_bytes": 398170419, "checksum": "1e7661637b0a4445119ba403e4f8ede129c829fb7d1907ca7660870b536b8b29"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00312-of-01024.json.gz": {"num_bytes": 395605627, "checksum": "87a3ccd2ac9deff1ac4a5dd02bba269a48692d4598c5899630e8d2e4136dbb99"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00313-of-01024.json.gz": {"num_bytes": 397081206, "checksum": "c6952116cf573a6e20c849cf1b7d8d0edf3b9d00fc7e717e7bacde915c4c52a8"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00314-of-01024.json.gz": {"num_bytes": 395555727, "checksum": "762066fd85c596ee01b3b8070708517cc5759bb1e3c4bb65f4645fd62b550d13"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00315-of-01024.json.gz": {"num_bytes": 397871218, "checksum": "814f19cc5e81144f5bfd7037f5f522dd5c44faf150c10337c675174a5965a5b9"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00316-of-01024.json.gz": {"num_bytes": 398577523, "checksum": "27643c7c3c0a1a78c9003b936ea27785709a2df80d09817278a179eecaedc352"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00317-of-01024.json.gz": {"num_bytes": 396388623, "checksum": "5f840180e2017c41c6b1c865784788dc3b002478a9ecb43c3859174af788ba5b"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00318-of-01024.json.gz": {"num_bytes": 396173471, "checksum": "2aeab99fbc84a2640a05081e2c7438451e75f76cbece3cbe5d82e85463a61966"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00319-of-01024.json.gz": {"num_bytes": 397912127, "checksum": "fda805ed19f4b996b048386f4bd73924dc965a069e85b8b4452a54a1372375fb"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00320-of-01024.json.gz": {"num_bytes": 398765416, "checksum": "bce244d024c076911c1c6dbd35609be5442c8b0440690e2cbb342ac64bdc494b"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00321-of-01024.json.gz": {"num_bytes": 396005962, "checksum": "763584ee096223b8aeffb1576ec6e4f3bea674ec4de40fa163c2f2221b3701d9"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00322-of-01024.json.gz": {"num_bytes": 398615672, "checksum": "5c12ec1d0c450fb7515c586f24311bad145050dfc64180d65bacbd346c2ce9c4"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00323-of-01024.json.gz": {"num_bytes": 397861187, "checksum": "93326f43273fb963593e0b1caab1e9588387291c23d5c14b5ae40b46b199998c"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00324-of-01024.json.gz": {"num_bytes": 396679008, "checksum": "6ebfe6e28851e6d79cfdbf370602373fc2136e88936eece302ecaa8ef8251827"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00325-of-01024.json.gz": {"num_bytes": 396358086, "checksum": "51190fbfd48479842ec3c7d910b5519e01ff797ca0143c39be142c1650c5e893"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00326-of-01024.json.gz": {"num_bytes": 396490692, "checksum": "f4d9bbfd1bbc6e939fce9a2df26e45c79be73dbe2650fe79af395bdaa39cd121"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00327-of-01024.json.gz": {"num_bytes": 398354656, "checksum": "c70c824b6c16e5fad922ec9b8d363d97bed90501522b641b0eb0f66b8c086325"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00328-of-01024.json.gz": {"num_bytes": 397326336, "checksum": "7e6008433a0e5bc6eed28a13b9dba17246e7d65ca96c31092086c3546a3a397b"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00329-of-01024.json.gz": {"num_bytes": 396390524, "checksum": "f379d844a35172424554bb82a65c790c354b76c0e7abfd868225d1968017d1a5"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00330-of-01024.json.gz": {"num_bytes": 398259199, "checksum": "ea15be4a83c3de66c42410e13e5ef9c93baf86099a8eded1c1d10b0cd5ad0f29"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00331-of-01024.json.gz": {"num_bytes": 397618860, "checksum": "7b6aad6224ead9ee3a0c860cfd991301ef5e97093b23c76d713e73f4911d0e44"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00332-of-01024.json.gz": {"num_bytes": 396743573, "checksum": "bc5333d383020d2296aa0f6ec940ab586a367efe50d1c597f9db55ca72fa66e0"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00333-of-01024.json.gz": {"num_bytes": 397460128, "checksum": "095b3a85a9598009638622ca21cb00142efa0d68196c8c3a8bb922cccb465e8c"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00334-of-01024.json.gz": {"num_bytes": 396900262, "checksum": "6f005575f4843b84f4512e1b7c1b748edf497e4e9f55eaae47f9b4637161ccab"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00335-of-01024.json.gz": {"num_bytes": 396106895, "checksum": "66bfe399d0859f71c20db01de53ca7bf997b33afcd3d181f181d9f265a2c2fa2"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00336-of-01024.json.gz": {"num_bytes": 397732616, "checksum": "1f1e0435de870b98b119e91edd4a0d32d078dbb810f919a70b85360cd860f0cc"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00337-of-01024.json.gz": {"num_bytes": 397834763, "checksum": "1db4bcdaa6fca612c3f1b38dad6d5402679ca21aa6a545850d61bcda10103697"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00338-of-01024.json.gz": {"num_bytes": 396712179, "checksum": "810c104a8862699c490fc8625a7be4115872fe2de4d8c061e095dc5a81eb4d19"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00339-of-01024.json.gz": {"num_bytes": 396838831, "checksum": "9bbc616d5c4aba46475957a22544dbdb0557f8de31cdf919718fbfe55bc70ac8"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00340-of-01024.json.gz": {"num_bytes": 395587861, "checksum": "48c8411ee2b5fc8cffe1589ed204d0ac8a12b5b3bb1857373f84bae984d49e8b"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00341-of-01024.json.gz": {"num_bytes": 398093153, "checksum": "4ff8ba83e489580da2401aaa23ca3329befe8fc08b6f299b612950c358688604"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00342-of-01024.json.gz": {"num_bytes": 397248009, "checksum": "c72e063f95d10ce661b4bc97538eccf6da6ad493b7e54da555a46e4a47aabbed"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00343-of-01024.json.gz": {"num_bytes": 395939409, "checksum": "249eb2080c55402aab34a31a442b06bcaa25d2df3f4319ea1a5f50dc6bb709b0"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00344-of-01024.json.gz": {"num_bytes": 397608807, "checksum": "8cc57604fcc5fa920b0d16df6e8d8b7f4ca88c0c76c86f9ac81f42a615b330e7"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00345-of-01024.json.gz": {"num_bytes": 395751274, "checksum": "13fbc76e49a8b856f7563b945bef10d786a86caff63b4cebea50416ca34932ad"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00346-of-01024.json.gz": {"num_bytes": 395516794, "checksum": "61d43da2e3e7770016ba7235eaa74a1e6a180e64cd2cfacefed5c34e8b72eca7"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00347-of-01024.json.gz": {"num_bytes": 396180000, "checksum": "4a0ca2103de168d05d0090c8800d47f216cc167a9cfe9e736403aedf040c5e46"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00348-of-01024.json.gz": {"num_bytes": 398461180, "checksum": "a56396961496499ac289a85d126b916132e787d0dc4fbd9961aca7dbbc7cfcff"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00349-of-01024.json.gz": {"num_bytes": 398049366, "checksum": "ca012572c575f6a8e6ad6453296ff93f22118995c17928e76b655da44ce5810b"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00350-of-01024.json.gz": {"num_bytes": 396532962, "checksum": "bb35d17862201063b46d8745dc182756d1bb09e809c4c355452ab1967e655491"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00351-of-01024.json.gz": {"num_bytes": 396576223, "checksum": "19ea45ab2fe5487d2a69cca7c9a1db7a09c8d5dfdf130412bbcd241cc60a61c5"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00352-of-01024.json.gz": {"num_bytes": 395956381, "checksum": "bb5869b8649fffadd5f1945ca9a79588e84081a8fc45b7e4cb5507149b5be2d9"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00353-of-01024.json.gz": {"num_bytes": 398903623, "checksum": "cb16a7ecadd28a8b5622c4e581f463f0ae2fe20a3e6582fa6885d76e7523715a"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00354-of-01024.json.gz": {"num_bytes": 397316693, "checksum": "42aea18548695c458ddc229d8c837356845609aca3bb64ce6e07b185443b9468"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00355-of-01024.json.gz": {"num_bytes": 396240550, "checksum": "1577d76807548d83427293b9f534a3261fb72a345569f0491a1fd2691047bd92"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00356-of-01024.json.gz": {"num_bytes": 396132315, "checksum": "b6e17a39292e082e517082b23b381305ebe889c2530fb5eb74a2683d36d07a86"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00357-of-01024.json.gz": {"num_bytes": 395948117, "checksum": "524ebed10c881f52f155db5d6690806f5a97aa8f811deadae916323b50427ed5"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00358-of-01024.json.gz": {"num_bytes": 397397242, "checksum": "8e23d852bc3a0dda4684d5fd511003ad6f18232e5f54e32638c8db62e9d18c6b"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00359-of-01024.json.gz": {"num_bytes": 396141321, "checksum": "345c34dafbc59f5e93355c8b2e6fcde6bf59bc9e1ebbf5cb962d54228e6d3204"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00360-of-01024.json.gz": {"num_bytes": 397258644, "checksum": "51db06055d95e2b43fddebf8c2b7d76b7572745f129d89fe005f8e5d3f12b758"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00361-of-01024.json.gz": {"num_bytes": 397913411, "checksum": "2c0f6054fef084d3e7cd10e2de0b1d3a48dc716af1e9146548195df128bdaba9"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00362-of-01024.json.gz": {"num_bytes": 397722576, "checksum": "664b390b20498eb6e78fc09604b3a947fc1847a01e3eaae4c7861d1dde3b90fb"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00363-of-01024.json.gz": {"num_bytes": 395416894, "checksum": "c57529884c6d4977a279a097c0dfbcc31d52048cdcf64950182c743583d7989a"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00364-of-01024.json.gz": {"num_bytes": 397028679, "checksum": "ed4f252d63c679f6e3f35847e0871c3360e072b0d6963f662d7e808b6615457f"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00365-of-01024.json.gz": {"num_bytes": 397574891, "checksum": "68e8e44a531d98897245fee90ad349f4fdee891b2f68dfda78a1dedcc9474326"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00366-of-01024.json.gz": {"num_bytes": 396905692, "checksum": "9e88b888d85633671e009ed7093763b934a42054ed6a1252222dc64781a20e22"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00367-of-01024.json.gz": {"num_bytes": 396802011, "checksum": "2abaf3f3946788258b8543fa2ccccc0c20e6980b9d26a38decd356e67f575fa1"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00368-of-01024.json.gz": {"num_bytes": 395630737, "checksum": "b4960e3395d8a1bf8350f57e5f6280b00443a4c6b85e6fd47478fbbfc1733caf"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00369-of-01024.json.gz": {"num_bytes": 396228047, "checksum": "08e8210426e6c6ef9746675592a3eea4a92eff9aa4bb7ffc6bf6ba54bc411f72"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00370-of-01024.json.gz": {"num_bytes": 396548482, "checksum": "10e0305ac4d1e410d749637e0c03386d969563f8eb73bbbc376fc1d21025e4ee"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00371-of-01024.json.gz": {"num_bytes": 397344482, "checksum": "03df0f4aa5c377f6b45db3c3b863240bfb1211ddb226bc055433fbcd9ee8e873"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00372-of-01024.json.gz": {"num_bytes": 395872223, "checksum": "9b70549213cb01595179928cdb020daaf7bcd2085c5e947d111f3cc66e406d2c"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00373-of-01024.json.gz": {"num_bytes": 397399096, "checksum": "945c204cdb107669a8d1252a91323eb300c902bdd6c6a8167a90805ec02cba9b"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00374-of-01024.json.gz": {"num_bytes": 397755002, "checksum": "8353d4383f73caceb5d112f260b37d1349dc7898af2d05b98ffe17d22aea97ca"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00375-of-01024.json.gz": {"num_bytes": 396534763, "checksum": "a3de41388a6d8ce3b605c6586e47b74a565dd2f54175551987bda0a0ff95036f"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00376-of-01024.json.gz": {"num_bytes": 395594630, "checksum": "7cadf813f2b31a1bfe44fdfc84aef4eb65e889c2616c56b189890734c22b731f"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00377-of-01024.json.gz": {"num_bytes": 398241040, "checksum": "15df154b52cb4d9314dbc4ac26ca4b4df7125b12131d538fd480f8a6b3fbdfc8"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00378-of-01024.json.gz": {"num_bytes": 397217224, "checksum": "208ce680427f62d78dad857bee91122a79f968589b4e44f2f89919e91f4dea30"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00379-of-01024.json.gz": {"num_bytes": 398504097, "checksum": "0052fe7f27e720423b6143f401b8618428d913b22fc2af2950874785e2ef7528"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00380-of-01024.json.gz": {"num_bytes": 397494149, "checksum": "15c4f07a2629c7bd79b243c97367e3e18de02b5ab09eccc0f85b1eba0e0b071a"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00381-of-01024.json.gz": {"num_bytes": 397190859, "checksum": "77c71b4a79ac2f462040ea0e8408fdb8f719fac0f09fadb760ed00b709e9dea5"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00382-of-01024.json.gz": {"num_bytes": 398126420, "checksum": "aa44d029398c33f733065c489ab3ded9395f6e53263407173b6e9c27b6fb9c45"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00383-of-01024.json.gz": {"num_bytes": 399108296, "checksum": "f507161fbe96f8abe9dedccba2458448719e6b153bcc1256ecee6b4b9c82256e"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00384-of-01024.json.gz": {"num_bytes": 396156787, "checksum": "83c236bbc8508fb81992c837751a4d8ad4b9bc138dd1f4bb5c1fcc68203e12da"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00385-of-01024.json.gz": {"num_bytes": 396878483, "checksum": "df45b4749951a46695f88789fc536617ee3470083e55562292f606e09185e4a6"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00386-of-01024.json.gz": {"num_bytes": 397495799, "checksum": "a8240c9e7266e47bda8880e38ac8a5afa8541aed4b989d6642b31497716a51ac"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00387-of-01024.json.gz": {"num_bytes": 397062301, "checksum": "e6fd54ea6f17d5570fa4cc97554813a7a33bd4e44cbc456b27b0c87c1af22c60"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00388-of-01024.json.gz": {"num_bytes": 397074091, "checksum": "fdc2a134df4a669deb839f26947c86b7e7a4bc7596a6a1c25562cb97fbb6b089"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00389-of-01024.json.gz": {"num_bytes": 397056868, "checksum": "e7390f0007582a3460fa67375b2628c85a1aa85954796d8e6584fadcb35761cc"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00390-of-01024.json.gz": {"num_bytes": 396404332, "checksum": "820a97060abd3172852f38e1636706c8389adad8495de56f4c3a2c3ba6008235"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00391-of-01024.json.gz": {"num_bytes": 397125489, "checksum": "68732c5ab9f4b6945e79ce2a1b45b97a97822d6a107aa79aa9135f29d91173ab"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00392-of-01024.json.gz": {"num_bytes": 394992472, "checksum": "c9d1e8cfd481631a76544e5880ceee9990e7553c88c5978a91b48ec8aa47717d"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00393-of-01024.json.gz": {"num_bytes": 394778146, "checksum": "7a5ec4f0878f676a3ac2c417f512186066d793f28d611f97135c3626b3b60fdd"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00394-of-01024.json.gz": {"num_bytes": 397024190, "checksum": "44e32db5a39684ab1789cfe97b6e9cbd3c539390e7a4c8ec9298e7177945452b"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00395-of-01024.json.gz": {"num_bytes": 396537190, "checksum": "601ec281240753ac5793ec7cb83802a788c4d88e56dfd83e6c875cf2ef9bd8f1"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00396-of-01024.json.gz": {"num_bytes": 398049705, "checksum": "b1024b69e191b2c7073f5f4f3ea51e8710be54db8603ce8aaabbfb919ea6694d"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00397-of-01024.json.gz": {"num_bytes": 396670567, "checksum": "11357bc600f9b0c443f124c7fa4046d10cf03e19016e5ba8cdde884d2ff76c9b"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00398-of-01024.json.gz": {"num_bytes": 394706629, "checksum": "778eca6d845b9a7d49e22941b959a95e5e4d2d9714720f27b810230d136acfde"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00399-of-01024.json.gz": {"num_bytes": 398257272, "checksum": "27c2a30af83975d32469e85fb2e27953a3aa9f97514f621063325cb9af1829fa"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00400-of-01024.json.gz": {"num_bytes": 398732278, "checksum": "aff9a39748526a03d3476288cdbce122c3683baf113362e9085895609d03c3c8"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00401-of-01024.json.gz": {"num_bytes": 396372632, "checksum": "a6af262bb962eb1c45d2003ee1bb2be1a3a12cb3e53d4ffe58b4b68dd852957f"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00402-of-01024.json.gz": {"num_bytes": 396783625, "checksum": "db9aca12012da21fc5a0619a47e9c3075959786d6d6d74f6a244af1cb33c402d"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00403-of-01024.json.gz": {"num_bytes": 396950960, "checksum": "b3566f7b9251f6aea9343d1344151f10fc104464f92e8f10a97742defffc2244"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00404-of-01024.json.gz": {"num_bytes": 398481154, "checksum": "897904040b5887620b9996cf89656f5bff329a430a8c3dfd6802d0c879675376"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00405-of-01024.json.gz": {"num_bytes": 396065216, "checksum": "45e0108549ab06d9a8ad5c45dc53250798d0e58f7e940080a754106801250009"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00406-of-01024.json.gz": {"num_bytes": 395637879, "checksum": "bda70f3a19b19e2ffdd1c3a26b959945b447acd450cab49e72ce727d2218af5f"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00407-of-01024.json.gz": {"num_bytes": 398356109, "checksum": "1df9e8b4715d9a3f02a0b06aef6095f81d38acd1be0b4fa402acaac0258c3116"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00408-of-01024.json.gz": {"num_bytes": 396041456, "checksum": "e89ebf354280543204e78f4308a8f8751cc26094524628cd8e9cb691d9911b82"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00409-of-01024.json.gz": {"num_bytes": 396254329, "checksum": "15729474174d6a5adb5935f25afa6de2f03a8dd2f73b780e23795ede92f5762d"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00410-of-01024.json.gz": {"num_bytes": 397850848, "checksum": "98f1b8fc845e0005b76d7eac70a430ce98e6989569344ea92266f8391b1396fe"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00411-of-01024.json.gz": {"num_bytes": 395527322, "checksum": "52b2e31f2adb61c8e703c6758016cbfc650f8104dcd5f78867c81434be155ea6"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00412-of-01024.json.gz": {"num_bytes": 396155992, "checksum": "7b6b4192f9bec4fdeaf9d6dcabd9cbba6b4c8ebb42d26730fea21bad139823c0"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00413-of-01024.json.gz": {"num_bytes": 395766377, "checksum": "775d1fac6b1708ba0384d922640b2f372b3ee146fc79fbe692ff69a7c6c699b1"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00414-of-01024.json.gz": {"num_bytes": 394860848, "checksum": "0386d8a8e0cc9d5d613b1f84085791de57ad05751d94d25681d86dff5cec1afb"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00415-of-01024.json.gz": {"num_bytes": 397566065, "checksum": "1957b0d185943b1952dc66e78f0a7d449f49f8f55fc0978bf77e8dde10f4714d"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00416-of-01024.json.gz": {"num_bytes": 396297306, "checksum": "3f8796934edb79d172e682511a5ed7666aa09ff541ce55e2c66406bdb6eeda9d"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00417-of-01024.json.gz": {"num_bytes": 398314475, "checksum": "8da08075b966c04aa7859275eefd34c78cd2b9edc366684733d027ad6d619ba7"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00418-of-01024.json.gz": {"num_bytes": 396296110, "checksum": "efe43733ebfc7b65c646aee68b883cf40124c1446a28e70ff2bfa9e1bb1377cc"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00419-of-01024.json.gz": {"num_bytes": 397614415, "checksum": "c0f02d78715de9c3ea0c684dad36a506386081fed2011ec298ca0ee623c7792e"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00420-of-01024.json.gz": {"num_bytes": 395133656, "checksum": "6237f5797a35dcdd89a0b70cac4dedcfb3fe418560f8dbbf6cad685f11c870b2"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00421-of-01024.json.gz": {"num_bytes": 397061849, "checksum": "ee37899a6a49269026633ec79577491ff4b11e219e0236dcba68eb168279067b"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00422-of-01024.json.gz": {"num_bytes": 396539584, "checksum": "e5914a4b97c27da82eaee2f4f67a165de946bb38a00d6126b1527f5eb1200417"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00423-of-01024.json.gz": {"num_bytes": 397715346, "checksum": "b99e628f8790a7baa8ee7828e31f2ec72374f9a8390c1d64c9b8092b10d9c7fe"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00424-of-01024.json.gz": {"num_bytes": 396335469, "checksum": "9cb3b9eb00760bb68f3df4b66b96f1e5798c338231500472fd64c49cd87c6599"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00425-of-01024.json.gz": {"num_bytes": 396714466, "checksum": "f28d4901ccde8eb7afcede9732ab94fd18c49e0e3731659ef587058d6ea2ab28"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00426-of-01024.json.gz": {"num_bytes": 395566563, "checksum": "9ab75a89a425ce974fd36e936476a30db913c2d7c9ca6e5522b91ffbcbbe30cf"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00427-of-01024.json.gz": {"num_bytes": 395379035, "checksum": "5e1ca658bea5ba5506afbb9ae5a5da4d35cdc3a215478c68e11652a7d5d918f5"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00428-of-01024.json.gz": {"num_bytes": 396419259, "checksum": "d740b37b576bcde0e1c8eee27c3bfb3b58c1a0d3c5b471001804b2a37f277ac9"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00429-of-01024.json.gz": {"num_bytes": 397116774, "checksum": "d1c10b0ba72aa2d4cb4640d1263c32868190942b1e93b4bb4e9798e25f10ba67"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00430-of-01024.json.gz": {"num_bytes": 396634586, "checksum": "11dec038b4c1c35d32d000915812b6ec8da9abbbec2e15f7493551198b6a1ef3"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00431-of-01024.json.gz": {"num_bytes": 396704705, "checksum": "efdfdef444cf68fc05090107033ffe2ac906b6efe2fc138e90f47cd4bd0b6204"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00432-of-01024.json.gz": {"num_bytes": 396264701, "checksum": "fa649c2e2dbc992408c3a60327e5d5ace4697c84010446bb286e544eb6c604be"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00433-of-01024.json.gz": {"num_bytes": 396887722, "checksum": "3d5fd3fbf209dfff2057143a3dcf7eceeccb1e85967a9a85a992f465e3522335"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00434-of-01024.json.gz": {"num_bytes": 398856291, "checksum": "ab6dc5343b052da901f4671c1cb3173850fbc6bbfac2623ca14936b2b83d9667"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00435-of-01024.json.gz": {"num_bytes": 395888569, "checksum": "26abd1e2263af02f998705501bd02ead2edc3d7f68fadc7b198e7fcf4dffc454"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00436-of-01024.json.gz": {"num_bytes": 396976077, "checksum": "a5dadf6ec93e8dcd62b0e1de3cb03c866147bafe0da8e631341663ccc03bb801"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00437-of-01024.json.gz": {"num_bytes": 395809168, "checksum": "7f98e98270f9b88570b5e498511ee65d07428db604af349ef9107dbcf65ac4e5"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00438-of-01024.json.gz": {"num_bytes": 399136723, "checksum": "0e03ec507b90b38d5b6d7dfe27d40e127efdc9a0bae349bea2e743375ea29b9d"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00439-of-01024.json.gz": {"num_bytes": 396435416, "checksum": "5f868ba66ea32a23be4a926fda0a86d0d2ab4948326e1ebac615fa16a2a6864d"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00440-of-01024.json.gz": {"num_bytes": 397487165, "checksum": "d30005787e7472313982cf2860e0a0764900b82a7bf616da27e6c1c3298eb215"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00441-of-01024.json.gz": {"num_bytes": 395968030, "checksum": "181461b447d88040130c3348ae7d22f220e0f97ace030d6f54301a9a3d483fc7"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00442-of-01024.json.gz": {"num_bytes": 396909150, "checksum": "0854cd3454047e0c6a0746ef21e0cbbb22fbdf4349c2e668f4fa1e49add183c1"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00443-of-01024.json.gz": {"num_bytes": 396271897, "checksum": "2493db29dd3cadef3719576c34213496eff807df5ae8cf538f13e84d403fec77"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00444-of-01024.json.gz": {"num_bytes": 395540084, "checksum": "5e717d9e0c1b6f728df0f206e422a0958a537dddf31fffa4d699e5bf4b3c2b16"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00445-of-01024.json.gz": {"num_bytes": 398750991, "checksum": "b8af9d413da48fb5f9a9174b12ad253b2eb2c1ed7709cab710d66710841568e3"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00446-of-01024.json.gz": {"num_bytes": 397575547, "checksum": "2bad5a914cb9f2e5e99d76afbf85eef66c18e7c1cf2e11c5d455792ae86ab441"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00447-of-01024.json.gz": {"num_bytes": 398035036, "checksum": "d834925674a33ed5eb8fcb335fd81b95e4ab882010e434e3fb9323e0f23be2bc"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00448-of-01024.json.gz": {"num_bytes": 398658613, "checksum": "16f3ac40180e47b9b97998f5d1d7c0e9336e2fee5612a3397fd161937f7a2b07"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00449-of-01024.json.gz": {"num_bytes": 397934476, "checksum": "09dd3d5a529f62b10d1ec97f37ed142315190fb437be3f50987ee955b11f7672"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00450-of-01024.json.gz": {"num_bytes": 396444119, "checksum": "8a25c11e0adc5fdf50944767fbfbf01a9c35b3c0e07205c7c06288d1f68b4c10"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00451-of-01024.json.gz": {"num_bytes": 395963541, "checksum": "f3ac2e295ca4b3ca1f55c8b500ea2588f1519163cec381297ad4bef390fbbe1c"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00452-of-01024.json.gz": {"num_bytes": 396594911, "checksum": "25a57709e934077c2972f0f8a1a9db7afe9b7558ab023bd6ee5224b2f8cd770a"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00453-of-01024.json.gz": {"num_bytes": 396745507, "checksum": "75c1a4803bb58efe5df885bccd13596d46dd1f3ea30899a7e83812167b990bde"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00454-of-01024.json.gz": {"num_bytes": 396193342, "checksum": "c151679573ea5f5b52e26e8b50da7e14760d1ec15c63a5b864b648190efd48f4"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00455-of-01024.json.gz": {"num_bytes": 398096160, "checksum": "7f86270b13ee4133adaa06de809f26ef581229407813fca05db521d9d36880dd"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00456-of-01024.json.gz": {"num_bytes": 398965570, "checksum": "d5b292189c5d318e0ad622eec1e764993084d0477147f51f29acd637935fec5c"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00457-of-01024.json.gz": {"num_bytes": 396672892, "checksum": "8b490f615b3ed701390ed671d5645dec4aa3fc576a032da8f9d434087c1eb8c0"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00458-of-01024.json.gz": {"num_bytes": 396911580, "checksum": "8bcadc16baaa4e36fe17ffc0862c264230385e18bbd861671ad5fd8cbb86404d"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00459-of-01024.json.gz": {"num_bytes": 395969213, "checksum": "b8ff8371a01d7bd1782044058ee0f53d4d1275ebca0870ba16104c1c4b12f07c"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00460-of-01024.json.gz": {"num_bytes": 396928338, "checksum": "23dde1fe55277467d6d2385684b71e90e9066e6a3c349a1da30a1487e87c8539"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00461-of-01024.json.gz": {"num_bytes": 400009637, "checksum": "34b98d46d207c5b6ea7416fab6f3cfcb1444cdc19376464ae9abb9296fd14c3b"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00462-of-01024.json.gz": {"num_bytes": 398107677, "checksum": "2031735c0f38ce43e37a5bb1b9728fc37c758fc4af71758c3d3b9535716a3253"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00463-of-01024.json.gz": {"num_bytes": 395503017, "checksum": "7820184904183fad9a61b6c638df9de11d4624bb3aca08885b842255172cecee"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00464-of-01024.json.gz": {"num_bytes": 397493281, "checksum": "b39b1b1e6686014a3c62e74912ec3b915dfc161b62e2d1108410354e6dec760a"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00465-of-01024.json.gz": {"num_bytes": 397080149, "checksum": "a65cc7f590cc498da334d5a8653e818421e09e5e6ce2e8bc2a29ac67a02c3d43"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00466-of-01024.json.gz": {"num_bytes": 396633690, "checksum": "15d891873ba02923893cbc8c42adc0468bb39161f898a810037cc2e9f82e0796"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00467-of-01024.json.gz": {"num_bytes": 395045117, "checksum": "711686ff5478ec35ccaaf1549b7a33b941e322585f702257dfe2d31630245ba9"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00468-of-01024.json.gz": {"num_bytes": 399486439, "checksum": "59c4599c8610f4c54778daedbb358f5e26fa527f8f94c3364b70565ebc90571e"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00469-of-01024.json.gz": {"num_bytes": 396170105, "checksum": "4263dbb03135c2d8b16fb323208f98fe1a1ff1223e76a7ba085f881411a0ab95"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00470-of-01024.json.gz": {"num_bytes": 397479432, "checksum": "2db90de8f4d2bde9af453478ed4667166f636af701bb487095311f99b28e59bd"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00471-of-01024.json.gz": {"num_bytes": 396679096, "checksum": "caea3c4744adb89f006d9b0d9ef93241a55c1fc165cb0cd62b6d07fa3a40cdc0"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00472-of-01024.json.gz": {"num_bytes": 397080237, "checksum": "34995676d953f4c95f8bd4f54fba8f92b86189cd73298ab77ee2702611b86e5e"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00473-of-01024.json.gz": {"num_bytes": 397881706, "checksum": "c0fc6c68ae509d8273e7ca0efbe24f1452a57dcb000f44f550fe9600fd305e62"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00474-of-01024.json.gz": {"num_bytes": 397705270, "checksum": "50aeb620f8c03a2e4f2346a0c79a4509adfae084ffbeff0b86d8892b858a821d"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00475-of-01024.json.gz": {"num_bytes": 397201717, "checksum": "4fa508d23abd417bdb0b0e7a61f9aedfb770609214cd85b10b4bde7ced7f12b4"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00476-of-01024.json.gz": {"num_bytes": 397522775, "checksum": "27da6164865687041e4f53d9ecec2edc877b147da5b424acbac2c69480132a08"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00477-of-01024.json.gz": {"num_bytes": 397323156, "checksum": "e40115fc4901a3930494652ce9ee7abb0c3f41abc6d6c58c81fa75a0ee752db8"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00478-of-01024.json.gz": {"num_bytes": 397380721, "checksum": "79a16b7016aed0eec375ca383eb316765687f12421f786b2e133faa5690ef197"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00479-of-01024.json.gz": {"num_bytes": 396828680, "checksum": "08185ce3c3e5b01552be7d8f08ed5b27a6b1b121bb2d7d70a78b7074fee02fa3"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00480-of-01024.json.gz": {"num_bytes": 398678311, "checksum": "37a5804dafb2f4aff9e393af5b127c3577ab8a5dd23f1e41f2304b25a4c428a6"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00481-of-01024.json.gz": {"num_bytes": 397654112, "checksum": "47ce12535b753d8936ce3b569675e76cb6f638bfb74a93caf201f3ffc409d71a"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00482-of-01024.json.gz": {"num_bytes": 396387301, "checksum": "1d07828a199bb1e1c0c8342ba99e484093557188370d1ced90803c2615d24b7b"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00483-of-01024.json.gz": {"num_bytes": 397178863, "checksum": "b6499612fac654798010e11c27ee8a25fc05d1dbed8aaf2338fd0ea377dc4732"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00484-of-01024.json.gz": {"num_bytes": 395826769, "checksum": "ce197ad5a226249bbba53c34b9f3c83508b542853748c3094a5b98befb537f2d"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00485-of-01024.json.gz": {"num_bytes": 397100006, "checksum": "f483044a4a0418b695e0b989f0fd03bfa79df01b649991f2356443bcb29d0820"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00486-of-01024.json.gz": {"num_bytes": 397658615, "checksum": "297beef7b85dc128a6a58d834c5fd1b24bd7fe84c7a317500461720c742235f1"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00487-of-01024.json.gz": {"num_bytes": 396904673, "checksum": "06751938694fad1645ed575208e8e2c1efebb7165b4feb2d0ea871dc348741f8"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00488-of-01024.json.gz": {"num_bytes": 398019631, "checksum": "eb58bf8b011fedf15835841317e445e9e757c9939b4453a013233f020f98a697"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00489-of-01024.json.gz": {"num_bytes": 395822836, "checksum": "b339e33e7affbdaf691852d3668ff79adf8476a3c33eb86ad9f4ad4a6ebbf3dc"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00490-of-01024.json.gz": {"num_bytes": 398410737, "checksum": "4d8356cf804474538772c5520e77e75ac750dce3e6b103c9feab49ccd46a58ff"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00491-of-01024.json.gz": {"num_bytes": 396607853, "checksum": "1757097fb884d03aa288a05870016b1c2b9f1700ac5913d85c9821cf2e367702"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00492-of-01024.json.gz": {"num_bytes": 397612443, "checksum": "92e98e431a378e0402d81299c49209c66d39b0ba7ae63711f8d6ecf542f5fdf7"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00493-of-01024.json.gz": {"num_bytes": 395595466, "checksum": "d839e1763aa6ebc7cbcf1b870d947ba45b0b4ac95b0adbe4941a0b121690a311"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00494-of-01024.json.gz": {"num_bytes": 400397068, "checksum": "31caeb5f0ef694c06ce434df44c01f4a91fcd48e4acb4f1bf167eae6e59a02de"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00495-of-01024.json.gz": {"num_bytes": 396458630, "checksum": "26291dfcae5145cdc306317ecf95851a3f693b4a7c6e132e55384ec69d85ef3c"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00496-of-01024.json.gz": {"num_bytes": 395037560, "checksum": "b32344b92f81006ad9e2e471f5ef8133e87924c5150145b13d51c3d7a0f68c46"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00497-of-01024.json.gz": {"num_bytes": 396247929, "checksum": "0396f0bb16b06ff130e955f260233ec868ada1daef6e8cbd480ce388628d49b9"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00498-of-01024.json.gz": {"num_bytes": 394798084, "checksum": "28d43d4e7bbce4e20167741ea2bbc3f17981aa51f9c040cfc41c522e732c6d32"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00499-of-01024.json.gz": {"num_bytes": 396699883, "checksum": "c6f6deff919b375fb08c74e159c25aa66362e4cddb0700f9b1e0e2701293ae70"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00500-of-01024.json.gz": {"num_bytes": 397014521, "checksum": "7ee22957fdfad0880f132f47860612331afce7a48975b9312233ba8ddf537bed"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00501-of-01024.json.gz": {"num_bytes": 399063718, "checksum": "ec94186b620037002819cd40347e6aaf67cb847848483790cd687222c9addbbf"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00502-of-01024.json.gz": {"num_bytes": 396938850, "checksum": "a218de10cee75c4bb5a7102fbe208e6e65142ba5f960ecdc2b56b6f85fa30840"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00503-of-01024.json.gz": {"num_bytes": 394631309, "checksum": "8189de9454986f63253fa1ad44c63d5c2f692ff4bc3a848c7c2fd02e08f4e1b9"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00504-of-01024.json.gz": {"num_bytes": 397884411, "checksum": "b7b268545c27573840bf8a6abb7361c209f92f9b5f0f8028fffd49b0c773854b"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00505-of-01024.json.gz": {"num_bytes": 395784113, "checksum": "b9f1610be9f045c15e43a7343bd2918743a71585a7122a4e781533dd39a73132"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00506-of-01024.json.gz": {"num_bytes": 397939195, "checksum": "f07b77d1be71c5922321e8683140f9a63a90903f1fbd1515d908807e12fc4597"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00507-of-01024.json.gz": {"num_bytes": 395925741, "checksum": "23e9927e9e83fd03e9d99c3fac05f1bf63d6c296a2b02d1aa208798d27d8dc1c"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00508-of-01024.json.gz": {"num_bytes": 397426015, "checksum": "f4b8a74c610cea50a6b144337f65fcfed11fff21df6683503f25d4b82e29a4e4"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00509-of-01024.json.gz": {"num_bytes": 399072341, "checksum": "c3069ae9658273cbaeaed1730f171837c8d3042e31d1093cf0f519f601309a41"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00510-of-01024.json.gz": {"num_bytes": 395859781, "checksum": "e5863648f64423397ca1a7838df18aeddbb3d5d3a2551321fd99a480508fa86f"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00511-of-01024.json.gz": {"num_bytes": 396948832, "checksum": "a2209ec05a794f083cf163c102c6ddd8d5e5627674686950e17e586128a81e60"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00512-of-01024.json.gz": {"num_bytes": 396585426, "checksum": "1c6fdb002dab490e6ddd7fe6023b2124bb944b7ebe95ee3b7faca9a92f4b5de3"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00513-of-01024.json.gz": {"num_bytes": 396789970, "checksum": "83b02c0cf9ffea9d021adc102269c30a33ab3a803d331ba8d39aaa9b3b7acb43"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00514-of-01024.json.gz": {"num_bytes": 397131474, "checksum": "783f25460641cd3532c3bb3920c7d3f0c68b5e674d44cba33b1ed755608cf8ba"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00515-of-01024.json.gz": {"num_bytes": 396127068, "checksum": "61e5b9947f77d929442f23fe84465d88044631aa1eb6438a0b86372cba7286fa"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00516-of-01024.json.gz": {"num_bytes": 397526020, "checksum": "539b032f528d1ec3a8e8420514ef2118f05482297b052f6d28876a8bf776a080"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00517-of-01024.json.gz": {"num_bytes": 397748661, "checksum": "03b85a51aa7bcde672cc017fcbb0f11976cbd1447fc0ccb4f4bc822b2b04b27b"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00518-of-01024.json.gz": {"num_bytes": 397915751, "checksum": "80dec6dc7d15459c113c16f23978c38cdc1157ca18468d8a00e0d2192bb2ffd9"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00519-of-01024.json.gz": {"num_bytes": 397847480, "checksum": "7125e7915fd03c6312cfe448e4e7a8629249765c13d8558b17c240c2aef713b4"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00520-of-01024.json.gz": {"num_bytes": 396232144, "checksum": "27974f9766c18fd0b652c94eafa3493243c8e1b25b6e850e857ab6246b193b48"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00521-of-01024.json.gz": {"num_bytes": 395111538, "checksum": "61406e92a8f9a6ab800b3dd25cbac842e3487a4c7db7b1bb2070a41d627367a0"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00522-of-01024.json.gz": {"num_bytes": 397690206, "checksum": "b2e29801d120132a5fbbd3662a54290e46ff5e178b3146ebfc2169facf72e7e4"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00523-of-01024.json.gz": {"num_bytes": 398274007, "checksum": "79905dbc45756c9f1c225120709d39cbf3caf435e322a531a4add690a1d0440c"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00524-of-01024.json.gz": {"num_bytes": 395689218, "checksum": "1dc3086cb869abb13862970186f6a77cb29b687cd49518173f639c148d937f6b"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00525-of-01024.json.gz": {"num_bytes": 397979085, "checksum": "6958bbc6029c00229fb0059d016a6b7a2bd21cfdc69392893423d2657c35c7c5"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00526-of-01024.json.gz": {"num_bytes": 398473877, "checksum": "895f42c4e7569f0db3832af13e56499f65fff74e93fc0cdf60c1c4b4b08881c9"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00527-of-01024.json.gz": {"num_bytes": 395879939, "checksum": "e84e72048b56878b1ff904ee83d92c208e15b16663b99a9d763edc23c2e0e55f"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00528-of-01024.json.gz": {"num_bytes": 396472889, "checksum": "badcc3cda339c61936591e9333787ea032c42d7ff2288fdaff791bdc8504ce96"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00529-of-01024.json.gz": {"num_bytes": 396983038, "checksum": "ad20643f9d50c7c508fa136ceed0039ce39708e0e7a5e743c1981f1000bc3c4e"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00530-of-01024.json.gz": {"num_bytes": 395774249, "checksum": "9453fa3fd296150b436f0146171ea8317512c6735ee9434622a83765a5d9e310"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00531-of-01024.json.gz": {"num_bytes": 396171120, "checksum": "3e3c230ab6beda13e4dd4747c7c6291e57b1ccb4a96ac2edb46ffdb4c3cb05b5"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00532-of-01024.json.gz": {"num_bytes": 396200411, "checksum": "e9b52c3dad233fd1c4310cf5f76c2e6d0788ed084abcf931f99ab7002976d75b"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00533-of-01024.json.gz": {"num_bytes": 395580851, "checksum": "e135cc4420d9f4d17ab523f7db8c559021a46a9a6bcdd21a6c4075047465906e"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00534-of-01024.json.gz": {"num_bytes": 397459281, "checksum": "bb4f32ee1c1bedf4582b0f4f9ec7644be73fa25bf18cca7506e3c26e98818bad"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00535-of-01024.json.gz": {"num_bytes": 397344480, "checksum": "3766ddf8313c5cee08a575fa96bdde06a5b293f1964e58293ea583d72bd18e20"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00536-of-01024.json.gz": {"num_bytes": 396588089, "checksum": "56d236a4250f9488d80b93c0c005962d018da256ea5632c7e16ae26c54188749"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00537-of-01024.json.gz": {"num_bytes": 397606873, "checksum": "d7ec24ef99de2769937b89e0ca7e291eca2bd0438d501d9228d5ab035f49d83e"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00538-of-01024.json.gz": {"num_bytes": 397608864, "checksum": "1a60378a0f1a200b11f85577bbd0f373ae47022eab16fad53da492ca1ed35bfd"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00539-of-01024.json.gz": {"num_bytes": 398377669, "checksum": "787d263107eb09e852b015c17d1d0f54d8b93e78292c0c1e60cf99f27535c608"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00540-of-01024.json.gz": {"num_bytes": 398516980, "checksum": "dce03ef0813ef66e27df8730da7e341b49bf7e684bffd3a9cf700905501d1d72"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00541-of-01024.json.gz": {"num_bytes": 395557685, "checksum": "e4035222d65124bd3e33372b76b65c2dad9e696701607ceeb5968d483595645c"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00542-of-01024.json.gz": {"num_bytes": 395725875, "checksum": "4e7ae0b1c0c4d514e0208e21336d095fea5970475077d6690a917faadb2b72b4"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00543-of-01024.json.gz": {"num_bytes": 397625187, "checksum": "a96ac467b6ace74a08f7dbc4bb8e3fc57fae36abc8975d6b60a7b7353ca9ca88"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00544-of-01024.json.gz": {"num_bytes": 397078230, "checksum": "337470c84cde5d02bc6a89003a6796de9e63db269e7800637ef2d220d75bd3ae"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00545-of-01024.json.gz": {"num_bytes": 396145060, "checksum": "da65d66aa4cfff77c754f8017eedd92cb82494b9425c2d5c5491d64603b2231e"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00546-of-01024.json.gz": {"num_bytes": 396093007, "checksum": "399f7b70d1c1b45ce315f396d5fa0db2c69e41c522b0514e19bcc6802b953b1f"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00547-of-01024.json.gz": {"num_bytes": 397457696, "checksum": "47fc8fd82271e6b1fb074512da45dc005e22cb7f0aca3b7b621ea87613aeff9b"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00548-of-01024.json.gz": {"num_bytes": 396246097, "checksum": "3108770b39746852d7c048d9a8777722480505bbf4592732c7d1f231e2505c55"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00549-of-01024.json.gz": {"num_bytes": 393096516, "checksum": "9bb2b88775593afe4060349985ff4417a37f1ba9b4ef33399c58644c01a92b89"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00550-of-01024.json.gz": {"num_bytes": 396631619, "checksum": "cbb55d645d145ecc2ff9b96524463f82d5548c0bdf42381fc6faaad256e7ead7"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00551-of-01024.json.gz": {"num_bytes": 396806780, "checksum": "ece03d7f12daa39473b6b8d5faed08a3f751efb9b1ee99f69c5188633d4a0f43"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00552-of-01024.json.gz": {"num_bytes": 398608968, "checksum": "7fbbde9c39d67d8d7f9f16c0848188b743c6ff5bc44e6339d5fd88c32e1aafef"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00553-of-01024.json.gz": {"num_bytes": 397696672, "checksum": "85f9c5c5fbcfd06f715b520a1a3a63a014b1831d2f65de5f02cfea49a18ddf63"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00554-of-01024.json.gz": {"num_bytes": 397122204, "checksum": "78e3d43c3d2b71d8483788a085cd5706648767de7a2fc4aab707d6a05257ff00"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00555-of-01024.json.gz": {"num_bytes": 398704893, "checksum": "113e5fd99ada6ca96c086487b6e4012bad711d1d482d580e22d3af5b9d118572"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00556-of-01024.json.gz": {"num_bytes": 398099675, "checksum": "c7a816f8f2f74b4554ac17ffc41e67ebbcabb7c8b0c94292b4569bea372bea3d"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00557-of-01024.json.gz": {"num_bytes": 396538561, "checksum": "7af6d2c9886481a0d393e026739b5ad7d0fc358ecc216d2fc124160402d4b50a"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00558-of-01024.json.gz": {"num_bytes": 397660839, "checksum": "c1033428189671d4e1ba55c822040f307748c6ec31b80be3e4ed8e7a4325066b"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00559-of-01024.json.gz": {"num_bytes": 398754128, "checksum": "69c9f88840166363f2b7ddaef05ac9d10441fd184d8451abfde76eb105572342"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00560-of-01024.json.gz": {"num_bytes": 394988981, "checksum": "a2dc4fc315a0db8f1a868d631d2941ab2806f44c2ae698e94bb7e8308bd67c70"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00561-of-01024.json.gz": {"num_bytes": 395801300, "checksum": "dc1b2b4594e3fc7f8795f7649d1c524405edce56d617f1e214692565de8c8937"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00562-of-01024.json.gz": {"num_bytes": 398322250, "checksum": "c23404fef6a6b5b887cc2dddfe341e983939ae36078d62842919a3739c96b43a"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00563-of-01024.json.gz": {"num_bytes": 397584845, "checksum": "c909fe429772c8198f904496ea6cf239d669c6c787889cefcb7623e08a988db0"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00564-of-01024.json.gz": {"num_bytes": 396436964, "checksum": "8e7cb1863057a3b9929af4da29b4e1cca1f71c254f5eba91a657d9e8c1fd6dea"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00565-of-01024.json.gz": {"num_bytes": 396486039, "checksum": "23ba56e78c4edc4d58fd7fbfcf784b29037204a641e43a9894c95c68bdb982fc"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00566-of-01024.json.gz": {"num_bytes": 395358745, "checksum": "71259a300ff096b49e3461c91824a8185037ca85ef2018dff2617f335ab304b6"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00567-of-01024.json.gz": {"num_bytes": 396405726, "checksum": "d9b56ed523376681dd81cb9831727467461bdfb87c80d3932937338370093033"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00568-of-01024.json.gz": {"num_bytes": 397509797, "checksum": "c650aad13a48d5b0c51162ad19c9eb3135559d0a3318dba701a90e8138a8cd24"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00569-of-01024.json.gz": {"num_bytes": 396514261, "checksum": "d71e4126c2deffae8ee55077cee9dd2b70ce27adec767bce06e02afb23b42416"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00570-of-01024.json.gz": {"num_bytes": 397072833, "checksum": "519a32e1bdf7f5b97e1a438242a79218317e04e44021dc61aa65c526d35ce8ed"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00571-of-01024.json.gz": {"num_bytes": 397170114, "checksum": "919a9659156cafb26b87190fc00b9d33c4fd536dd35544cbef8e5ddc018ae365"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00572-of-01024.json.gz": {"num_bytes": 396475017, "checksum": "3d7e4e548f01c9ad5fc99b4342cbf9a9004737058dd93aae8b7d95b2c00856bf"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00573-of-01024.json.gz": {"num_bytes": 396749955, "checksum": "032f8e37328c9f0fc046e5a6ff5a79cbb744f3100c4cbea78e397c449471bb10"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00574-of-01024.json.gz": {"num_bytes": 396036505, "checksum": "8e795341527712be32a69307ce8cbd2d6195c6b2fea596d326a279734505198e"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00575-of-01024.json.gz": {"num_bytes": 396722381, "checksum": "45a43576cfc61842bde146eaa566b4f22a128c3c2eb8f30c59a6b6cae4bcd4e7"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00576-of-01024.json.gz": {"num_bytes": 396163377, "checksum": "38429d2d6176ee42ddd495e052c01735a9a7f0076cde107d24a0a9c7a26bf2a1"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00577-of-01024.json.gz": {"num_bytes": 396813305, "checksum": "eae77c319bba236feaffc9f74eaa38e911fa48eb06f4794c9b1a6d17edab91a7"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00578-of-01024.json.gz": {"num_bytes": 397797226, "checksum": "1dd2b3d7e99fde8903bc12625568ec4fc6fe653737b3af5e9c71432e311cf5f0"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00579-of-01024.json.gz": {"num_bytes": 396012631, "checksum": "d9322e66701b4ada3788b91a07e87b03af6c91eb4cfaaefee23c0330987a1840"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00580-of-01024.json.gz": {"num_bytes": 397943129, "checksum": "23deb32e1b0f07a55a5cf1572cb8e313ce716c748a07f58bd90cbae97290d0a0"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00581-of-01024.json.gz": {"num_bytes": 397614648, "checksum": "6193f8b848c7930fc04b9f2429dbccf36f1b291271b3eaf646c655433bf3ff9f"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00582-of-01024.json.gz": {"num_bytes": 396659280, "checksum": "40997ef02c7040356cd1c5acd8e6a5121e00b31253713cad4f529ab2922affc9"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00583-of-01024.json.gz": {"num_bytes": 397686445, "checksum": "5cd21271e4ae036f8d1e0c320330a6c93a8b1ffbb9293a80c56c2d7f123f9ee7"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00584-of-01024.json.gz": {"num_bytes": 395500815, "checksum": "c25befb7c735b2340b092a04375d2109c1b876d2b0057dd8d4ed4beac87118ad"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00585-of-01024.json.gz": {"num_bytes": 398413461, "checksum": "073f632e95c218fdf17274fc21915c94f56bdfbb58a6b1a0550de249ce4d2129"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00586-of-01024.json.gz": {"num_bytes": 396849745, "checksum": "647cbe9bd7709c0d8a01485096fd88ad0fc09b27de324eae141a8d841536b71b"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00587-of-01024.json.gz": {"num_bytes": 398567154, "checksum": "557af97a8d2b2656149bc25ee5b362116d173e6a48911b860ec10d512b4b763d"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00588-of-01024.json.gz": {"num_bytes": 398086388, "checksum": "9e9afa15ee3534e497c9fc7c8cd967388183193dade3d1ec82a8e2b0e82c5118"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00589-of-01024.json.gz": {"num_bytes": 397335823, "checksum": "ed8a1d0b9c55f465b5d4a4e5ea022f6d17aaa8b82569be7cfec55629c1bf26c6"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00590-of-01024.json.gz": {"num_bytes": 394931693, "checksum": "3fbe539fcf64f0d914c19b383de9953b0605d4a69f48801145f0db1972f9c6b6"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00591-of-01024.json.gz": {"num_bytes": 397828770, "checksum": "9165de8866384d3d03c3876c39c96706e33a24b9f95acc09999c2dbfb85cd9cf"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00592-of-01024.json.gz": {"num_bytes": 398782493, "checksum": "433a9cb730d7ab024b56ad662a3ea53633f7ff26c625051c4c02f252beeb87a6"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00593-of-01024.json.gz": {"num_bytes": 399264489, "checksum": "4a7e5f40aa8b692cfa0519d33a868e9a05e579ad430204bc13c48b533eadc5ce"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00594-of-01024.json.gz": {"num_bytes": 396629833, "checksum": "521d5e90550dbc97ab26a18a0b75da81e38ce2083ff5fd93340fded2e54e1ca1"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00595-of-01024.json.gz": {"num_bytes": 396916313, "checksum": "30c9be1d99ce0a41b214fdbd5115988c82ca317d4aceb30c19fbca05e0a409e0"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00596-of-01024.json.gz": {"num_bytes": 397013253, "checksum": "b16bd9d7d893b4a71056575fa0799bef96120c03cfc6e2a88c292469a67f2614"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00597-of-01024.json.gz": {"num_bytes": 395980036, "checksum": "3bd15089b6fff342df2b3109d7ebadca35cead4f44ca5b1b55e55d8892aab82f"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00598-of-01024.json.gz": {"num_bytes": 396295935, "checksum": "6252d951a9570baea9767cf3350a6d09ac5a5fc34ba80eae3b5c40adb8361ab9"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00599-of-01024.json.gz": {"num_bytes": 398608239, "checksum": "b265a385cdd5e64d1fb2ffce739e72f2fe2cc8944621f20e2084dc52b91cdd9d"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00600-of-01024.json.gz": {"num_bytes": 396563743, "checksum": "43d12028cbe738e8f450911f6a55dcb00f8742cefc2a2c4da5f9e9220b0572c1"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00601-of-01024.json.gz": {"num_bytes": 398256993, "checksum": "9368dcfc581e6d572d899ef25b129bc0268901a2fa009500174a0985bcf330df"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00602-of-01024.json.gz": {"num_bytes": 396202546, "checksum": "3cc57d7afd161fcd411f73da8369d98db4c6d8e30643ee01450adef21e8ea3ea"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00603-of-01024.json.gz": {"num_bytes": 396338425, "checksum": "cc21fc5b8ed6e5115bd8924954d685ed52cd5b773ab63d37188343443c95851a"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00604-of-01024.json.gz": {"num_bytes": 397597307, "checksum": "d24f6d807ae35037e695e19917ed446f74448166fa464c862e31fe7ba2bea196"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00605-of-01024.json.gz": {"num_bytes": 398278313, "checksum": "99166183c752aed8d0f2cc9c010f1ebdd4fb93d40e936fd6c082eb3542baa956"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00606-of-01024.json.gz": {"num_bytes": 396590468, "checksum": "657ce79340c15524a5897459a6cf712fa4127def2445f7eb3de21c9b46db3794"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00607-of-01024.json.gz": {"num_bytes": 396603228, "checksum": "3705441435f18d1e4aeea9e794e1216fcd29b48213763a554808e3d3697951a6"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00608-of-01024.json.gz": {"num_bytes": 397280580, "checksum": "be0bef2c16e9bdd0387276402dc99fe5a9a0a7a105a44e88bdb783139f2de474"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00609-of-01024.json.gz": {"num_bytes": 398284528, "checksum": "3a7c7a8cb01f6d7589152a1483682a5fa99e119490f3e70d8a02f582f2e2b19c"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00610-of-01024.json.gz": {"num_bytes": 398872039, "checksum": "c349aac5b64227397ec2870992ac9e4fac9fe39f1fd4e0a7b8c727e171655e14"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00611-of-01024.json.gz": {"num_bytes": 398736440, "checksum": "63ca5eb2d27632b3b4dde8e40f9925e71e21ef737262bcda7a99324a67e0fab5"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00612-of-01024.json.gz": {"num_bytes": 395170895, "checksum": "3b4bb3e14ee981a9edb9828ce40b86b5d83dfafcc1a5e0e02642cb40924bd6ed"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00613-of-01024.json.gz": {"num_bytes": 398443337, "checksum": "e95adbd7d55024b7e62145860f217a6f04f5fcef79ac23e92dd9e14f9a0b2a30"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00614-of-01024.json.gz": {"num_bytes": 398854661, "checksum": "def8cb789f8f79fa169e855816c5e4bc7d5c253e565502691a9abb826d7436d4"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00615-of-01024.json.gz": {"num_bytes": 395505189, "checksum": "6775ca6aa4f834289396a438906b90936ed0ff6390213dac2b0861f40d7761e7"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00616-of-01024.json.gz": {"num_bytes": 398999454, "checksum": "6cd5efddacb09cc80ec1eb79f93b562044787903b3cb1c879be2acec64a9dbdb"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00617-of-01024.json.gz": {"num_bytes": 398570431, "checksum": "26d1f587377446e8b1499be7a3b6776d437baa40353fb04c591203a420eb0cc2"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00618-of-01024.json.gz": {"num_bytes": 397064982, "checksum": "e59a87fd1cd3d87fff4b15c3a9331521d7587ac7f4a7fd51ec3906b484ef9ad0"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00619-of-01024.json.gz": {"num_bytes": 396676338, "checksum": "8077c3a15d93579d0fbf00bd9d117bf4f50092c5be3acf46c7d4433ef7be9dfc"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00620-of-01024.json.gz": {"num_bytes": 398186471, "checksum": "ee3fb91d7797ebf1daf8dcb81563b7dae7b161d97732efd35e3eb6ebea732ee2"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00621-of-01024.json.gz": {"num_bytes": 396467968, "checksum": "386adb83129a7306ef4da37c1cbedc39b3971e7633d516d406a982f307577e67"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00622-of-01024.json.gz": {"num_bytes": 398293882, "checksum": "b708cad0e04c56174d0feec84d7224a4490cb8db023d38e57398cad89b78568f"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00623-of-01024.json.gz": {"num_bytes": 397396780, "checksum": "c50c4568c6f103b3e6a3702cbd915ecb530df954df808156bc38a98f36a0b944"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00624-of-01024.json.gz": {"num_bytes": 396971282, "checksum": "11351ef83c9fb883d6c0f484af5c10f0d686b7ac4a2f08fae9ac3d9837df0a0b"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00625-of-01024.json.gz": {"num_bytes": 395882440, "checksum": "dfa97ea7949c9bbf7af43d43ac5c8d0034bdbd1ad572895159b7c7846ab89676"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00626-of-01024.json.gz": {"num_bytes": 398292846, "checksum": "fbc9c23dc286ad6fd7f01f344de97ef5789733af581de278488869bd36f3b246"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00627-of-01024.json.gz": {"num_bytes": 399890427, "checksum": "f43bbde36b8bd34ed9998b99b42c85434b8bbc8bbaa1cf5b38cec6393099c23f"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00628-of-01024.json.gz": {"num_bytes": 399589466, "checksum": "c50058a4937912b678d33d34ff91e2287e8701365f4f71fce61f9002652556cf"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00629-of-01024.json.gz": {"num_bytes": 397355095, "checksum": "051c4631d0587b6f65827410ad2f2121c05c849a009274415bc5e7f72db42d44"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00630-of-01024.json.gz": {"num_bytes": 397860559, "checksum": "07b48a86a8a3245fe5b78f6943c8970c839942b8d86abf173507225b0d1520d0"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00631-of-01024.json.gz": {"num_bytes": 396161304, "checksum": "70a03f0308105de5266c4a40803b51f99888b362b71409719b7f71f73761b590"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00632-of-01024.json.gz": {"num_bytes": 395620184, "checksum": "c6923984c419f08bb4e6effc27dd25dd986513034338debc9b238592dad9f607"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00633-of-01024.json.gz": {"num_bytes": 397572527, "checksum": "900fc701703234031e825a1eb2d11b364f1dda97eb0c7943e17ef278695f7bea"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00634-of-01024.json.gz": {"num_bytes": 396215174, "checksum": "0cc838e395581933123fc57c6690afbdd2be1b67d213336d9b8c08b3876f8458"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00635-of-01024.json.gz": {"num_bytes": 399176005, "checksum": "5a3daa1bd0be8c997da56257f063a7d1c7b2b271648a46615b26ca4beeb42863"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00636-of-01024.json.gz": {"num_bytes": 396035356, "checksum": "9d21ce1c8b5a7c1330cc95b1f45286fb8578d5dcec0686724ff6e25a97f38a7e"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00637-of-01024.json.gz": {"num_bytes": 397214839, "checksum": "83cd34e1ba09c268b515fda7699e12bfa2531fb7e60e2f861946ffdc01e54a04"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00638-of-01024.json.gz": {"num_bytes": 396292535, "checksum": "82a7bae9a7d35fa707bcb6d90f7b244f1509e112dfdbd604c9be1f8b8ce7150b"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00639-of-01024.json.gz": {"num_bytes": 398009954, "checksum": "b6d7ebd102c67960413caf5fcdc5b4aea728b6d3d6369ab8dd3cd6bee6c769de"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00640-of-01024.json.gz": {"num_bytes": 397558496, "checksum": "151c55d019fd84fdc0eab73d24984e5d88ac964c86f89a361a03dc776a22b5b4"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00641-of-01024.json.gz": {"num_bytes": 398031508, "checksum": "e0e87304a8ac408adca2badf2564ec52caf155295ea303a121c30f3b1ce797b7"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00642-of-01024.json.gz": {"num_bytes": 396594124, "checksum": "73d08c99b6b96d96b82d88267b2a392a7dda2084ba5142b8eefd0d23212702d5"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00643-of-01024.json.gz": {"num_bytes": 394552252, "checksum": "ebccf3b935d63c30f626d317af250b6bd0f04ef5e1cced829287ba64fbb0d25f"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00644-of-01024.json.gz": {"num_bytes": 397586341, "checksum": "674c0965a9a880c057b6f2dbb785a4a6ae048954d44ba4f5266dd5e65095d06e"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00645-of-01024.json.gz": {"num_bytes": 397950976, "checksum": "7ac8d4dacd682a2977818f01d860c3dfa5a5e5a78f7d2d95be0353a675452e93"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00646-of-01024.json.gz": {"num_bytes": 397511840, "checksum": "452a9cc03facf9151552f914f9a8a3507a96fd8ea40f7d04951a29ecbf6aa1e5"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00647-of-01024.json.gz": {"num_bytes": 396692070, "checksum": "5a795a238203444596c711bcedc634e653e5240c9a800a9884c51f878340b494"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00648-of-01024.json.gz": {"num_bytes": 392707626, "checksum": "9cc366c37950624df6af318ee52a97d32a40e278fcb519cbe8545b04bee3204e"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00649-of-01024.json.gz": {"num_bytes": 396283284, "checksum": "4ddeec31a30b5c563838b17e1115ad30041e08c70a94f299ea324ee4b71fd82b"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00650-of-01024.json.gz": {"num_bytes": 396349662, "checksum": "f5bc63114ec9d73d6cea7f8e38a95031ae2bcde849b27440afd840a3e72aac13"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00651-of-01024.json.gz": {"num_bytes": 397187042, "checksum": "7199c0242b2654509af187c9c8bbfc22cc5067aafa1ff69949b1f0e5b718425b"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00652-of-01024.json.gz": {"num_bytes": 396263026, "checksum": "c9e62b6df7213ea5b71913fbf736403f33c51e5a868bf1035cebcc39d80635bb"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00653-of-01024.json.gz": {"num_bytes": 398689010, "checksum": "f3bcc9eca4d71043e920db6399a032f916c23b1da329d2ef86434a74f8e7b318"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00654-of-01024.json.gz": {"num_bytes": 396938678, "checksum": "fb41df26e1f68e1e9d12ae8740535ca66e80910320be2270d680fec40d6fe9a7"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00655-of-01024.json.gz": {"num_bytes": 395995226, "checksum": "018b40ddf6d88c4c346c8018439d16f6ca66ee0720970e84ddc34b1010ae35d7"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00656-of-01024.json.gz": {"num_bytes": 397860049, "checksum": "8f3847e9bb5a8145e2959b340f86cc06f85e6646f32d5d785c5c90ec11a9f404"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00657-of-01024.json.gz": {"num_bytes": 397142407, "checksum": "a1ae8735a39bd099dac2e50c22e312f1a010f2644774ef53c995f3437c0a5524"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00658-of-01024.json.gz": {"num_bytes": 397827609, "checksum": "f6154377cfff2453392fb899f81514a7c0ffd40dbc35d8842d61a115d0aeef35"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00659-of-01024.json.gz": {"num_bytes": 396861858, "checksum": "4299633524667921549573c469a73e33abae89d107375d5ccc6a6d987c2a2a26"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00660-of-01024.json.gz": {"num_bytes": 397773823, "checksum": "44eaf6c1739d8a9c13c54750c473ac04aaf9d2223d8893cd8094f1769b1f6f8c"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00661-of-01024.json.gz": {"num_bytes": 396311257, "checksum": "18edb60444b660c7cc68dbe59ac71989be0e20ff13639725a5f05e4d4d512514"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00662-of-01024.json.gz": {"num_bytes": 396176936, "checksum": "7b60541181fbb92f361fbdf0bee80d086c75279610aab792a7b3877d49a3e1bb"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00663-of-01024.json.gz": {"num_bytes": 396274985, "checksum": "59e057ee5f5e8c7267138c18c5c88f3ca24d30f86c484e4bb0c0a4eb5169c4a4"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00664-of-01024.json.gz": {"num_bytes": 397483935, "checksum": "585f45d3ac3f88c3bf1c86e01daa46537f8f5c5165521412de0e67393cb6da33"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00665-of-01024.json.gz": {"num_bytes": 398831104, "checksum": "e403d2f4ff6e74abc9639749f93f77cc868453908c10821fea7fafdbcc981a06"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00666-of-01024.json.gz": {"num_bytes": 397668116, "checksum": "f9bbafa396a466b24630a259a01804b2857c1dde2fa3cec60b2967a88ad9f528"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00667-of-01024.json.gz": {"num_bytes": 398123165, "checksum": "ed693d5ecb9dfcaf545e831b5769b877e927125794cae61a0ec7821c3c85dfe6"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00668-of-01024.json.gz": {"num_bytes": 398152096, "checksum": "51c33c07d503743704f564bc6a372c2f6f8f13a1ddd00b0b9a2c44c94cc57444"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00669-of-01024.json.gz": {"num_bytes": 397927981, "checksum": "d356b5268ba39e38ffccd20e95803f3218407e0a1ca3b4d1165ff82796ec1bae"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00670-of-01024.json.gz": {"num_bytes": 399074605, "checksum": "bb96ea8154ae01275a9197709820e670c4e6212c740e92a7f1cfb7c618a49bea"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00671-of-01024.json.gz": {"num_bytes": 397864381, "checksum": "afca3dbcaefdc368e996259fd595b77fd98a885ec005a93069a01b83227c827b"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00672-of-01024.json.gz": {"num_bytes": 396077133, "checksum": "3da96ebd1b28b55b03bbab8e85f78295cffdad9020f869cb456da27058ffa090"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00673-of-01024.json.gz": {"num_bytes": 396943842, "checksum": "6a4c344a8af68a95e20d58b64fff8fe616c2a406cf26f642cdfea65fce5883d1"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00674-of-01024.json.gz": {"num_bytes": 396975969, "checksum": "e6b0f7727d78143fa180abb76e617b37660b35f6323f19bf1dcbc78fb9374508"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00675-of-01024.json.gz": {"num_bytes": 396692800, "checksum": "e4ed97b19c6d83e618a3fcaff75460d828ca419b1e62842a1493b0ec4c9703e5"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00676-of-01024.json.gz": {"num_bytes": 396514400, "checksum": "a5672f1561ab85f071395de43e702791aaacff77a9f67f6ec9e14b12aba675b2"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00677-of-01024.json.gz": {"num_bytes": 395939125, "checksum": "3dacd3bb90b5e645d1b9a962d8df87f571b0fcf227996068535bb98a68f9191d"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00678-of-01024.json.gz": {"num_bytes": 397022852, "checksum": "c1a0ef31342161369b7fb709be17e3c86191c1a52cb04b704fc58190818302c3"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00679-of-01024.json.gz": {"num_bytes": 398325372, "checksum": "47ddd1056ad977407f61b2eac3ff803d17b1aa8fa0719279bf911caf49bbb7c8"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00680-of-01024.json.gz": {"num_bytes": 395502228, "checksum": "cbb93f322d684ed558cbf8d92b9f83958ba772fe4177093a334b4596343f3cd4"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00681-of-01024.json.gz": {"num_bytes": 397981781, "checksum": "9ec2dec493733846a1ec9f68ff5130cd461d7ab9c07b22d4aae94463bcf03146"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00682-of-01024.json.gz": {"num_bytes": 395265758, "checksum": "7731cb9a2898c730a650e5d1b358886ed562228928aefe55d991cfaaa61a9a99"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00683-of-01024.json.gz": {"num_bytes": 398783283, "checksum": "6f2bb48070e809ac17fc90e1117d63bd8c7cd0079d9e44c9f262c4ce60f5d373"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00684-of-01024.json.gz": {"num_bytes": 396160769, "checksum": "fd07413637b97b68cb3a7a6cb86c4656017b7841728e806485ae196294e79f8c"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00685-of-01024.json.gz": {"num_bytes": 395594461, "checksum": "939925a9169da729891fbeef926f420b80bcc60e0f170bcf9a2095449a22d424"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00686-of-01024.json.gz": {"num_bytes": 398275260, "checksum": "13836c45719ba10f2d581cf17cdab1daa4cc207a49db2b4786b451605842ac4b"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00687-of-01024.json.gz": {"num_bytes": 395256765, "checksum": "0c0d0e6c1e3cb9a024c184a8510066a005c031a15af74d117d0e736a358a91d0"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00688-of-01024.json.gz": {"num_bytes": 396635904, "checksum": "2462e084563f8b8de68c6e826289949ff8ebf8cfaf323344c07ab93e56373539"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00689-of-01024.json.gz": {"num_bytes": 397749444, "checksum": "d03746220f3374c80102ed39d8f6ae0daec40fc1b23312c08ecdee82a65ac6df"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00690-of-01024.json.gz": {"num_bytes": 399380060, "checksum": "217d032ecce8d0b7e448befe83aa051a3bfab8cb0e167d043b6abc833f5e9b4a"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00691-of-01024.json.gz": {"num_bytes": 396975651, "checksum": "354fe9bc07aefc55cbbf8752f53ad69d45761da928bc8deb6fee1de9e244e93e"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00692-of-01024.json.gz": {"num_bytes": 399720848, "checksum": "21f88940b6cbceefd66ea5e8d466467806370ae24a5833ca308cd840daf5ff8d"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00693-of-01024.json.gz": {"num_bytes": 396787846, "checksum": "c8d28980ffa1eff4459d2fbf0043a1f8eeaf840a3b1d1ea4989b2192c7a82041"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00694-of-01024.json.gz": {"num_bytes": 397945967, "checksum": "1936570da24c4bab9fe0559826f1cc509c4ab6eb3679e26d697efa6e7e5c8a81"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00695-of-01024.json.gz": {"num_bytes": 396349049, "checksum": "8e497506f84513272a8a0694e7d4efb004b1e3b515887e3b5762f59b6c659dc3"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00696-of-01024.json.gz": {"num_bytes": 394901418, "checksum": "9e1d6cc187ff67ee734bbadc6cbd57eae05634a448edfde184fa8d6fc3259836"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00697-of-01024.json.gz": {"num_bytes": 399142528, "checksum": "9584496113a8612620748aaba35e185b8f47b7c96b4ff0dc7bfdd6024a3faa14"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00698-of-01024.json.gz": {"num_bytes": 395923784, "checksum": "83a3c57b3870ed9beeaf3ec8ab694e0be458106f3128b14b2a44a036e89d32b1"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00699-of-01024.json.gz": {"num_bytes": 397137494, "checksum": "0befea64fe749d79592e337bc359bcef70ca8816d0126ebf89d4b8fbfbdcbec6"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00700-of-01024.json.gz": {"num_bytes": 396554785, "checksum": "34739b543636aeadb6dcce3e7c97ca49026cc9897c13add6b592fe60e5c40338"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00701-of-01024.json.gz": {"num_bytes": 398091188, "checksum": "c9bcc7c9e91de707ee548e67452d6970af2e19bef91f966b19fa71504e5305fc"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00702-of-01024.json.gz": {"num_bytes": 396039798, "checksum": "fcda5f8ddc5ed163db84aa70c565f8181731af9a29918a2ece0436d3146d7125"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00703-of-01024.json.gz": {"num_bytes": 396889704, "checksum": "c80445d442a766d2e87ecf5804e87bf7f8b23c2238476fc2b51f657400739306"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00704-of-01024.json.gz": {"num_bytes": 399465260, "checksum": "0bb73674d579523fcbe079fbea7190138911711f023404ae46ea7b685fc09c73"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00705-of-01024.json.gz": {"num_bytes": 398579507, "checksum": "97d6fd9cea2a47913c6ee9d1e34c3440858f25f3d670cc81c8f83f2346fce6e2"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00706-of-01024.json.gz": {"num_bytes": 398761590, "checksum": "2f4836001b8b80066ae09b6e385ed0048770c13ba2410e0f0309ab4b9200e37d"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00707-of-01024.json.gz": {"num_bytes": 395576626, "checksum": "8e0c0c635a7a7c32d4fdb1a7906ee95a9f334a55b2ff3881cdc7d5e816a9c817"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00708-of-01024.json.gz": {"num_bytes": 395930921, "checksum": "e6978b92f333230972e2b4c31cb86b5286fb899948c7680c7a9cbe75a9d60296"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00709-of-01024.json.gz": {"num_bytes": 395734676, "checksum": "13071a3527071f06570c6cfa485073f2f3980c83cac782db6bf66a75dd865df3"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00710-of-01024.json.gz": {"num_bytes": 396501107, "checksum": "6562cb3675a42a58b8c8b2a232043adf532fe49420e30c3c237a6d8889a8de30"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00711-of-01024.json.gz": {"num_bytes": 398422179, "checksum": "f38b59c4739d3c15e5bf5dbc0965d1a5dcc0f49a3c89eb7a6822003aaa1ae7c3"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00712-of-01024.json.gz": {"num_bytes": 395905103, "checksum": "500b4914f3c42d5e24ced7d36dbd3143c49e4fd5dfc3d53a172d1a55ae738889"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00713-of-01024.json.gz": {"num_bytes": 396009909, "checksum": "4f50bfa762db1435a89195fd180615e9f569c1668e128d343c87c40ac5cf60ef"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00714-of-01024.json.gz": {"num_bytes": 396963447, "checksum": "fd9eea7dfb93916a3798a8b69d29fb5d4bf0fec448b8a24427f729e7a41205e8"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00715-of-01024.json.gz": {"num_bytes": 397474378, "checksum": "3c61bcf6f24e21d2584bb4ae008230540d9a375e35f3c4ba1668621b80d85c5d"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00716-of-01024.json.gz": {"num_bytes": 396285471, "checksum": "c554e562a369d9696219ea8b0e363907c50f626d7c410a26515e07de801da74a"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00717-of-01024.json.gz": {"num_bytes": 394827995, "checksum": "f8b4678c21d93c19d50cb576f0910050d24dfd606238bbf8013c45f98defda12"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00718-of-01024.json.gz": {"num_bytes": 395517823, "checksum": "1bf63affd6914d98e197b6e1ce526cae7754ecdc750184154d3cb8e3bdd21a9d"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00719-of-01024.json.gz": {"num_bytes": 395561934, "checksum": "c04b162d984ff2ada9f39aa6c0fac04a1531fbde05175f856d2e3ca2797a448a"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00720-of-01024.json.gz": {"num_bytes": 396227762, "checksum": "25da2ac7c1f3cbc361807f67e8826ffa95f4caa25f81f66832cbd0a08f1a51f5"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00721-of-01024.json.gz": {"num_bytes": 397716450, "checksum": "28180c6396deaf34e2a197f5cad1b53ba1c9532db8b5c21dd7d81332b2793181"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00722-of-01024.json.gz": {"num_bytes": 398022279, "checksum": "9c3a8038a7f9431b90f67ea0d3b77353d0508b09865f49af575b6aaf5e32d6b7"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00723-of-01024.json.gz": {"num_bytes": 398064523, "checksum": "4b18959f604bd5f379a73b52947261cb8d63f2243f5afeb5807a13669ef4a800"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00724-of-01024.json.gz": {"num_bytes": 394747045, "checksum": "615f13a1b2a6942931519b7a7f6aba286f6045aad65b041c2c6643ce906de1a6"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00725-of-01024.json.gz": {"num_bytes": 396726374, "checksum": "4099a416eccbb56818efda68bd027c993c1a5fa1a8e722bc268041fd3f804cfb"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00726-of-01024.json.gz": {"num_bytes": 397361407, "checksum": "152d5e2bad0de3b6b48fb26066891b160ea79c4c382ce6aec6047196e3b08ef6"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00727-of-01024.json.gz": {"num_bytes": 395542925, "checksum": "ce1d46b0cd7d9e4075db3feab71d2f72939817ebf45819e73ec277c9cc07307b"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00728-of-01024.json.gz": {"num_bytes": 396647931, "checksum": "c859626b14584c1bab396c867ad5eb11ff3af39628206b03612ee2d2b3058497"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00729-of-01024.json.gz": {"num_bytes": 398272080, "checksum": "758fbdc5bf6d66a36d69d31141742b2a917bf0341494b844f22ab82cd54e7ead"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00730-of-01024.json.gz": {"num_bytes": 395977662, "checksum": "56a7fcb59ece26d4b19be0bd5e6c2d0f05e4b1b23e8ce7b4fab064a29b229c02"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00731-of-01024.json.gz": {"num_bytes": 397530948, "checksum": "bf0f4dc8796a737daf80b977a6e3656cb1e244fc40d6df92852da45e53e6cfdd"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00732-of-01024.json.gz": {"num_bytes": 398314575, "checksum": "1862bcc85d48f59283eae56836e5598f20287ce36a185252abb24bcfbd1377cc"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00733-of-01024.json.gz": {"num_bytes": 398547748, "checksum": "476389cb582df3c214f3f5a45268bdb47b581a432c08723bd811daa5f5990083"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00734-of-01024.json.gz": {"num_bytes": 397380175, "checksum": "2b6fd36a8f8bc3edfcd8a486de44d2f3132f7b8f4bb2d4c93453dbf1a1b6667a"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00735-of-01024.json.gz": {"num_bytes": 399584382, "checksum": "3e0a067fef0b40edcd23ce6680efc07253660b8c00699630bb7629b9d803a198"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00736-of-01024.json.gz": {"num_bytes": 395312038, "checksum": "e4f92413c837d269481ecc0b5d0fc87548bd2ae718ef7f9bff18674ece289bc7"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00737-of-01024.json.gz": {"num_bytes": 396820243, "checksum": "e61680c57505f027ef8cbd28a45e706936befa2ab40a24a63e638019a1717b63"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00738-of-01024.json.gz": {"num_bytes": 397691872, "checksum": "d3acc0c9c76ef2df89f49896744dac53f488f830d3d42f0c481f2321ed60fa67"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00739-of-01024.json.gz": {"num_bytes": 397912166, "checksum": "18d281ed9831f28c4c54256a844ab2cff7a5b681da1b7c8eab2565b106381aa9"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00740-of-01024.json.gz": {"num_bytes": 397093867, "checksum": "6a65230910384587f5e7f34b52c2a6d9a86a8b1f7a23d26f890b6e810c051815"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00741-of-01024.json.gz": {"num_bytes": 396371058, "checksum": "26eb40e98075ab716b4edec76d1723a679e648258d6812119b46f7522dfa9b07"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00742-of-01024.json.gz": {"num_bytes": 398346941, "checksum": "466043ec98eb806916806cff7495f0bae89cfeb2835204ea34328030b92a27f2"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00743-of-01024.json.gz": {"num_bytes": 397366055, "checksum": "d98d31aaadf95dd0d1cf0548db515c8e77c95bbc4b611ae9ab5650429c171889"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00744-of-01024.json.gz": {"num_bytes": 398722902, "checksum": "a43c80ab3bd8d12d12b4ea41d9054b90214fd3ea2ef957f317d6ed6fa7b60e34"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00745-of-01024.json.gz": {"num_bytes": 397562514, "checksum": "1e6dad94e0f90bfa0fdc5557c58873aaa95fa9ce1c7b70a1fe76817289cff78b"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00746-of-01024.json.gz": {"num_bytes": 397731351, "checksum": "21fefd6cffa9032c9ca7cec91cd775c83bbd37419ae236eeec9589f8bc4be0dc"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00747-of-01024.json.gz": {"num_bytes": 397781450, "checksum": "b84c74bf1caecf92777fb85129bb009eb3a27fbab1b97af567f36a8bf100e704"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00748-of-01024.json.gz": {"num_bytes": 397425031, "checksum": "fe9bb225f6d03b44e552ec985c844e5012e90c4ad99f699ec4ed4297db91349d"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00749-of-01024.json.gz": {"num_bytes": 397925850, "checksum": "3913b2955fee02e2ba716d843559bc4bf4e85a2884ae4495446a379f857a30e1"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00750-of-01024.json.gz": {"num_bytes": 397089489, "checksum": "773486144d3008cb3207c3c8b65fe6081c9e64dda09728d3586bc82e6bb73fca"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00751-of-01024.json.gz": {"num_bytes": 394819424, "checksum": "d728b117a7b74150b03ed7d562514c2e45ccc03b0bceb120eddfa8333166a923"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00752-of-01024.json.gz": {"num_bytes": 397199683, "checksum": "6c10c3f4e3737db6a70375bd605139de61ae8b09a1aa91dd1cfdb82c183f0cb3"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00753-of-01024.json.gz": {"num_bytes": 399197199, "checksum": "101c4ed5426b586a4aeeb7dbd377306eae9eec2eaf934e79d25583abff70b15b"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00754-of-01024.json.gz": {"num_bytes": 396415619, "checksum": "732f4dedcf1266bcabf15a6a1cdead617ea37d428d8cfbccb5a9dd7521133075"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00755-of-01024.json.gz": {"num_bytes": 394564662, "checksum": "a23f1bb1de23554efff68e730d85802a6491936fb54e256744af641f97ec155b"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00756-of-01024.json.gz": {"num_bytes": 395577258, "checksum": "2f4275994a103dca517d4eb3656009c8138930079e00303c7b8746ab6094fd19"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00757-of-01024.json.gz": {"num_bytes": 397161772, "checksum": "ab16360173283b22a7e19d181fbf55a6a8d07f0d9007b51aa159c1e81661f5e1"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00758-of-01024.json.gz": {"num_bytes": 397545456, "checksum": "ff5a6292bc557aa9895de39697e8aea5843fa5a00c83c7983eaa36640d446ecf"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00759-of-01024.json.gz": {"num_bytes": 395470957, "checksum": "66a64accfa6c281d2bdfa7b6846397f56c2d4f8a22ae8925a07af853e42f5521"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00760-of-01024.json.gz": {"num_bytes": 397328304, "checksum": "46778c90bcc6da96cf02e66956a1bcabcb9a95bad538cfc0d5190db473a278a9"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00761-of-01024.json.gz": {"num_bytes": 397706141, "checksum": "4825f25d6e1d13c70e6e65ce13ccd7b1922344c48ee2806952f3ba1b6e26d3ae"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00762-of-01024.json.gz": {"num_bytes": 396983663, "checksum": "25e1645f05d342b5f872ca809b36d516c7336c22035bfa86cf295d0865e08789"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00763-of-01024.json.gz": {"num_bytes": 396355038, "checksum": "d4c3a92808f0bfb042423cd4166abc57d20603ef07a0f0912058a718a38f26d0"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00764-of-01024.json.gz": {"num_bytes": 395434042, "checksum": "aa4384f587fd64c24fad9a27defb0345eb44cc536b3d45c710017d225c191ded"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00765-of-01024.json.gz": {"num_bytes": 397204482, "checksum": "cf419554f6c4f6201ebe92e7a232013e5949910f3d54f5cf3d1d65845685c7ca"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00766-of-01024.json.gz": {"num_bytes": 396420917, "checksum": "32076dd8004ebe35f46d6e790fd6330ad1d7df2b7ae3c4ede325b0da73a673ad"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00767-of-01024.json.gz": {"num_bytes": 396840905, "checksum": "08e5fd0fc1578a337f3dafdb3c718ade437256119e1968e9f958a8ea9d052c81"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00768-of-01024.json.gz": {"num_bytes": 398085225, "checksum": "3579e0756bb6cbf1eddfca27de5cf067a212d683134bc6f8c26a79b7d802bfce"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00769-of-01024.json.gz": {"num_bytes": 396879117, "checksum": "0913c93203a084521212e473d08c1d11e8136a8e37f1891330fbce0397bd431b"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00770-of-01024.json.gz": {"num_bytes": 396386647, "checksum": "6c12ab51c92b9c92336a6142a1a4e2f7c3725beb7e61dcb004551d13e8d5488e"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00771-of-01024.json.gz": {"num_bytes": 396279989, "checksum": "752deaefbf22dd1b1adb36561e8524c1dc555fd105bf3acb78611be9bce72318"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00772-of-01024.json.gz": {"num_bytes": 397850815, "checksum": "4f1969284d1f448caf0bff5d05eeb995cf2339801f6a71e01286f4f7f387c564"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00773-of-01024.json.gz": {"num_bytes": 399466666, "checksum": "20ba552cd30349bc8a2c0b6a8701d4587a005e7ebdf6e3f2a3bf95462c304447"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00774-of-01024.json.gz": {"num_bytes": 398051538, "checksum": "1f66196e8fbf0ebef977f235d2aacb7245f4033b53ecf75ada2f8007465a629d"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00775-of-01024.json.gz": {"num_bytes": 399284061, "checksum": "97df92baa605c34ce857d380f1ca42f9e2a0de499ccaa9bab26a5c449451d1ef"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00776-of-01024.json.gz": {"num_bytes": 396710162, "checksum": "4b1ec54b82c8e5d969d3000ce547f4c20df16d9cc0b889b2b58c8839e9d8e27f"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00777-of-01024.json.gz": {"num_bytes": 397265441, "checksum": "03827ccc3c5bebbd12a04019e9797945c55becabf7f9c1f3fe5353513f5c5a38"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00778-of-01024.json.gz": {"num_bytes": 396050013, "checksum": "54aeadf4fe16949b2ee9438feabe979570e7587bb07b3c57e47422f662191936"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00779-of-01024.json.gz": {"num_bytes": 397124991, "checksum": "913e268b5474a8b4cf1426f5a0a06c7f437eeabbc35f0126481328b419f85bf6"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00780-of-01024.json.gz": {"num_bytes": 395196367, "checksum": "4c1a4f296916c30103a5dacacf8a167e43bb424d085ed3491b19f0ec1985d9f9"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00781-of-01024.json.gz": {"num_bytes": 396578403, "checksum": "a54f26c233662299ec8f0ae1bd266879e93cf4676707b0955114a1a80e2fcf61"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00782-of-01024.json.gz": {"num_bytes": 396142106, "checksum": "3713c6b725afd833063402e6577bc0ed003a87720f700f9272864c2360bfd260"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00783-of-01024.json.gz": {"num_bytes": 396470511, "checksum": "fe9d904a07ffb2581b6734c8dd847435b867d3043ce4b4840b1c54374919d757"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00784-of-01024.json.gz": {"num_bytes": 398156228, "checksum": "af762a9ff3eeb7ed4a56f54702911f0c190b97f8efaa02cb89b1626a1c44c9f4"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00785-of-01024.json.gz": {"num_bytes": 397185035, "checksum": "6629e1827aab88f55d53de24625f8362daccf910663db8584d959aa44f8043a8"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00786-of-01024.json.gz": {"num_bytes": 396556703, "checksum": "ce51603900ea0aad8981fbfa8d05d684bfef5360413dadc6933246c2dc81c413"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00787-of-01024.json.gz": {"num_bytes": 396214799, "checksum": "6eed5802b89d63eea115cbfd9e00f6d1b4970bb3600a887b904b548181a4acef"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00788-of-01024.json.gz": {"num_bytes": 397965162, "checksum": "eaa948fdaa744576f006bd70d54f129968772a479fb0bd8e946d7605857545d2"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00789-of-01024.json.gz": {"num_bytes": 396280999, "checksum": "e0b80ec73507f96310abf070e5cd17d5a67ffb4a337820a8b79a02afe81a0b99"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00790-of-01024.json.gz": {"num_bytes": 396224660, "checksum": "2b4a06fb6f68c773da34f8d4c33d7746b6a3206bb242042841e5e007fe3cb6ea"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00791-of-01024.json.gz": {"num_bytes": 397681975, "checksum": "1b167c20d0414d970cda74cd357cf07d69abd1d3fb0f57222028b369551d513b"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00792-of-01024.json.gz": {"num_bytes": 396210611, "checksum": "ab55128753a1e58d1032b8fd747c48158a721b12e85990627478f22b78e156ff"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00793-of-01024.json.gz": {"num_bytes": 397534599, "checksum": "e7476bde08e0065c523d09932cf2cf6ffe8ba023ae0ee435238efb5dd6f93d7c"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00794-of-01024.json.gz": {"num_bytes": 396536137, "checksum": "6228922504b2d3ebeef4735abdff06cc786d6533a6c150d50f34042aeeae1544"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00795-of-01024.json.gz": {"num_bytes": 395235406, "checksum": "9dae151c15898d7991417596a364e30f00e0ff6280f1505953e6de40c2e228e2"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00796-of-01024.json.gz": {"num_bytes": 396226178, "checksum": "1dc8decde490324087fcd06e4b1e17117606f2d61a80d506d89a12cce11ba291"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00797-of-01024.json.gz": {"num_bytes": 398556774, "checksum": "a454758e8cffccc88f83517a241f2457e683647949cde6aaf1e217de42f6a52b"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00798-of-01024.json.gz": {"num_bytes": 396109677, "checksum": "3daa6b8602517b9873db96522a2852d940d52cdf0fa86f259ac41a9cd688751f"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00799-of-01024.json.gz": {"num_bytes": 397930210, "checksum": "09dec669699a437d6fb78b3f2705028fb380b2eaa20ee73b77270216a48b8a95"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00800-of-01024.json.gz": {"num_bytes": 394545441, "checksum": "726f99301047519de253e3edbaef5f4a4f95e3850b1b98e01c7864499dad7833"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00801-of-01024.json.gz": {"num_bytes": 395867151, "checksum": "a97ef657bd8ea718427ffc686f55fc1786f0834755fce3ea3ae8402d9f75c11b"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00802-of-01024.json.gz": {"num_bytes": 398573429, "checksum": "20ee1f30272a0d5db74e8589be12c17173580cc9f14b039b3d33f3197816ef95"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00803-of-01024.json.gz": {"num_bytes": 398084513, "checksum": "31d1a8f6965d3a8cb7e28fa8bf2cb9a5609d4a129dbc630a8e2a939f475b2003"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00804-of-01024.json.gz": {"num_bytes": 397815811, "checksum": "edb758146d462848bdb113df90fa4b9f451eca6658cbd2cab147c8b0eaf88a70"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00805-of-01024.json.gz": {"num_bytes": 398641802, "checksum": "b916bafa7269ad4ed09c58c74dc3f098b529444609dafc57e6e4056aa6496ee9"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00806-of-01024.json.gz": {"num_bytes": 397993720, "checksum": "92fcc5881ca81b808c14f8c9960d873be70f857f95fd1e777b1ae1d4c62bbbaa"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00807-of-01024.json.gz": {"num_bytes": 397743279, "checksum": "79aca62194176964b66a90dda7631d01acc2a6abea1ba19a90076139e390170a"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00808-of-01024.json.gz": {"num_bytes": 397076817, "checksum": "a469391e432dac6967e841d46eaeabe9429849492a3df5e91431777fe9b9f164"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00809-of-01024.json.gz": {"num_bytes": 395533122, "checksum": "1278d928e105ea7d9c397ef1da79dcc8791dfad9177727aba098bd451734ce45"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00810-of-01024.json.gz": {"num_bytes": 397468683, "checksum": "5c6f3e7550827de9d7028decd82320a55722785394ea4951ee78f3ffadb2d4e0"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00811-of-01024.json.gz": {"num_bytes": 397348260, "checksum": "8c1ece72814dd82bf1bb663b76a40c58129c08540195f9b2134eff5837faa366"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00812-of-01024.json.gz": {"num_bytes": 396753479, "checksum": "b3770924d0576f7cd1706771c411f0f288277c6c6c922dc7af4017b665109a88"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00813-of-01024.json.gz": {"num_bytes": 397977743, "checksum": "864040da6f03f4d2ed2a9eae4daedf304e0d27196f0b522cee4e8fee55f9ea71"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00814-of-01024.json.gz": {"num_bytes": 396168620, "checksum": "542986bb3b75ffcfc853af11a80edb6a31e12527d2588f1c5b2119fe35d3f150"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00815-of-01024.json.gz": {"num_bytes": 397639162, "checksum": "a617c2f27306ce5de74ab756cbf74707fddeb0aa92277b66d0cd65be230f386a"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00816-of-01024.json.gz": {"num_bytes": 398296204, "checksum": "174a2e77e6562384cc4e7459ebf536db5cf4b530e4f1d7714e60d082ac7a19c6"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00817-of-01024.json.gz": {"num_bytes": 396112543, "checksum": "95af2c4f32efb4ed2a41cfa38dd2be09d51d4b0dc53ca8763309503f0276d56b"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00818-of-01024.json.gz": {"num_bytes": 398371592, "checksum": "67789e3525f2daf6af2551df12a50341c3ef51c89a9c714a8def76209b5b7460"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00819-of-01024.json.gz": {"num_bytes": 396751420, "checksum": "07431a263e2bb92c048fadbab74ce1399f76fc57a04d7f9e90cb33aa60a4c5e9"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00820-of-01024.json.gz": {"num_bytes": 399213859, "checksum": "83c03df95869973c2ed46c909c0e92e7ecd75317c06b09e447a62b592421d1c7"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00821-of-01024.json.gz": {"num_bytes": 398408628, "checksum": "b5cb8c52a8713c5291ccf29c171e9bd9b57a54211392a19e8f31182d1053a032"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00822-of-01024.json.gz": {"num_bytes": 395429180, "checksum": "8c47bf7a0d2b9c84d255df0e7da058fba2b4ca6da3c20cbdfe5a686e01cf5c45"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00823-of-01024.json.gz": {"num_bytes": 395437149, "checksum": "62818e45f34e70728494c74daa583e30c70aebf91c2f057470039f6d35059691"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00824-of-01024.json.gz": {"num_bytes": 394503147, "checksum": "e9fd88994b23531ba26e6859ec1985798a2ab9b300c2fdb1e202ac553ab305b0"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00825-of-01024.json.gz": {"num_bytes": 398841091, "checksum": "77ad5a9ac5e3c1d1180981bffbbdbf8a429854001d990258c615e0e16c8a9f6a"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00826-of-01024.json.gz": {"num_bytes": 397404278, "checksum": "06a39374c1cda19cc4b034c4877e1fd3bdc84290fdb621fdcdc77f3c5eea9a47"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00827-of-01024.json.gz": {"num_bytes": 399316947, "checksum": "fd27a73b130c1cf8256f22212e23799d0dd31281cd29bcf9bb658bcda457b66e"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00828-of-01024.json.gz": {"num_bytes": 397514415, "checksum": "3e7d199d05f885e8bba769d21a55a3f2ef2114b66ed738428ceb506fdf272ff2"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00829-of-01024.json.gz": {"num_bytes": 397251538, "checksum": "91650563e9520b2d1ec2cd726304b781b4156ffb68bc172635a53f425fa6bb0a"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00830-of-01024.json.gz": {"num_bytes": 397653118, "checksum": "893ef017cbf7d46c99d9c69ba74344cfc2800bb23faf93e7400c0c282422945f"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00831-of-01024.json.gz": {"num_bytes": 397299276, "checksum": "4eb3c91e52547f3b4af586f5bbdb0cdaf6a345b202a09c6aabff5c5f628b2948"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00832-of-01024.json.gz": {"num_bytes": 396915924, "checksum": "9fffd46fc1f1bce010484f2850102e2e153c5695c277efb67f65811630c2493d"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00833-of-01024.json.gz": {"num_bytes": 397652261, "checksum": "3b89df9375a906c96eb1e21a6572a07de2f5d875996c01c744933984edb1af1a"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00834-of-01024.json.gz": {"num_bytes": 396070735, "checksum": "b758b4cbfdfb799a8615ec9c3678b27dcd9b1d63af4f272879e0dae84cac9d63"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00835-of-01024.json.gz": {"num_bytes": 398028152, "checksum": "6e07f1e6a099aa496fef3015514fe5f3cc665c742f8a783389c7da4ce0e0e72d"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00836-of-01024.json.gz": {"num_bytes": 395941604, "checksum": "6bef1291a741ea5976749456185a3e3a03c3fcc9ac00370f28672ab39c552db8"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00837-of-01024.json.gz": {"num_bytes": 398655070, "checksum": "b0b7e1c826302417630c3e1b1877bf106beefb5a7a11feb9bbf1ac3712714fed"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00838-of-01024.json.gz": {"num_bytes": 396374435, "checksum": "3e9bdde8b73397a5fce143e91c92f9e66f46b45edfb30da1cac400b9aa7b2ecc"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00839-of-01024.json.gz": {"num_bytes": 396388725, "checksum": "4154322b97c600742660125e6458787e603cf1a44b49267f4d1c569387fd132e"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00840-of-01024.json.gz": {"num_bytes": 397564603, "checksum": "f9560028196fc934378389e355101e5e7f8fde9e5c921722704a18b24ebc5804"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00841-of-01024.json.gz": {"num_bytes": 397001678, "checksum": "0dad99ac959765280e6bf6d9d1a1468ef9dc9cc781e8f5bb832f7295e4e79f69"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00842-of-01024.json.gz": {"num_bytes": 397139167, "checksum": "e81fd683da081349629a0a7ae8ff7813351ed23caf4ef87041b64524034abc83"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00843-of-01024.json.gz": {"num_bytes": 396044889, "checksum": "d8e3a5b4148c7e86dea50ee5ba89ef55629d3550fd926c41754e5a26e7e52c36"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00844-of-01024.json.gz": {"num_bytes": 397365441, "checksum": "c4d2ffe853b55464961b707b6d0264d6852817077204a0380c906184c077012c"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00845-of-01024.json.gz": {"num_bytes": 396477802, "checksum": "7b3c4d435eca57a0fad05c106ec5928750aa01d95047618a3bc84e5342e912c4"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00846-of-01024.json.gz": {"num_bytes": 395983616, "checksum": "bdad2ba411291435ac0cdd083e46aa8369499f014a788fa85ed8c419fe9cb2de"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00847-of-01024.json.gz": {"num_bytes": 397646062, "checksum": "3f6bddcefcceaa4184161432e4f0b9292ae4fe7dac3079d4191a31a38f48c7bf"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00848-of-01024.json.gz": {"num_bytes": 395958111, "checksum": "5ed10d926e5fd1dcbc777df82391eb3ba57276c7303d488d6f3591022d20cc4a"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00849-of-01024.json.gz": {"num_bytes": 396960036, "checksum": "ab82adc6f66ab0403cbbb38859009a460e6c8c38c789bc2b2420da8b87096a9d"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00850-of-01024.json.gz": {"num_bytes": 396603592, "checksum": "5a6aa59a01504f5655d429dd5cb3ebc39e3994b22cbaeb5b09ceb29a26b94031"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00851-of-01024.json.gz": {"num_bytes": 396511886, "checksum": "f1954da7e217d893a0237a0f431dd2a9071723e543bf0f4943ce38fab048a44e"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00852-of-01024.json.gz": {"num_bytes": 397626831, "checksum": "f5cdcd7ec4f3c855a1006f9278ed4df50574a3fa7aa1c5a2e255ea5fa1a770cd"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00853-of-01024.json.gz": {"num_bytes": 395811873, "checksum": "24b1033da877ebddc09cfe2d3325868448dab9083b5147d6cfc4fa63ab402a94"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00854-of-01024.json.gz": {"num_bytes": 396513614, "checksum": "419952e0bc38cce474190c0b9ea581ccbce77da5e045dd60f5ff1fa1d2833d19"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00855-of-01024.json.gz": {"num_bytes": 396493352, "checksum": "3d2b529871c625fc9c1c59b9d5cede2a77e609041f1ea044d68ac16e9fa6a30c"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00856-of-01024.json.gz": {"num_bytes": 396852729, "checksum": "a3b56e6171fc2b14ebe67f6a71af688ea6135597bb8f8cf83e2fb460727aa5eb"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00857-of-01024.json.gz": {"num_bytes": 396428653, "checksum": "de550a5d608bffde45c149bc0d4c1165cbd3b5baab3d3529f006a02aba6d53e7"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00858-of-01024.json.gz": {"num_bytes": 397039613, "checksum": "11374c2685676ac2eb3dd0d281b44b512ff1d2968ab320d9c857b44304eb8ab8"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00859-of-01024.json.gz": {"num_bytes": 396515194, "checksum": "64879e565e5c467e630566ab75524bb300d58798c814637ffebd15646544cd5e"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00860-of-01024.json.gz": {"num_bytes": 397764125, "checksum": "7e22be61b3413c8fca2414087655b7ef7bef2ab5ee373fee74d13c8fb991675b"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00861-of-01024.json.gz": {"num_bytes": 395314420, "checksum": "29c451c69c8c05f6eee2741b9ef6c241f551257a45da8342a1d6bb341f80314a"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00862-of-01024.json.gz": {"num_bytes": 397763845, "checksum": "679668616899f548fb35da32c3e5f121002670cc3296c0c90f5bf45eb3ea1d79"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00863-of-01024.json.gz": {"num_bytes": 397356206, "checksum": "43c5b3af2173d4293396f336ec363aa2f31580b65128f44ca8bb891f2022859c"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00864-of-01024.json.gz": {"num_bytes": 395463092, "checksum": "77b7b6299955f4869e5db994fa6b20fe3007cf8cf2b6609442fb1ed49284cee6"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00865-of-01024.json.gz": {"num_bytes": 396909291, "checksum": "7eca0e82842b52f99640ab574e4b2446309aba6ac262f980fc6d249a337d06a4"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00866-of-01024.json.gz": {"num_bytes": 397587651, "checksum": "931014d99ab2a765ebf90e876694647c265ca5e6bf2b459eb027d6b06643a8ac"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00867-of-01024.json.gz": {"num_bytes": 395992645, "checksum": "0976a5389aed40e4bca89cf22382cf121390c75bd755437be474c097c8fee0ed"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00868-of-01024.json.gz": {"num_bytes": 397789857, "checksum": "6ffd848d165290a746a21767e79a9f046b70534aaf7b14fc01f9365e4e3f7d93"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00869-of-01024.json.gz": {"num_bytes": 398124116, "checksum": "5fb85058bdf40c0ee6cf748cda7483b1b3cfad18c26a90c2150c2a3f30ceeeca"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00870-of-01024.json.gz": {"num_bytes": 396432487, "checksum": "89d50aaa3620eac4ad593a403ea637b2ff090361ead05c3aa8c7a3351c66ad65"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00871-of-01024.json.gz": {"num_bytes": 397484772, "checksum": "490f4104981a9ab3ef04600a4865b9a2a18239e335d7fb7fff79ec1b7a225318"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00872-of-01024.json.gz": {"num_bytes": 397240896, "checksum": "d344994866bc49475f66e9937636afa787e1ff560e3f62dc1a0e4d0220d6ed39"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00873-of-01024.json.gz": {"num_bytes": 395450398, "checksum": "5d3b320aab1f7f09450531649666ded1aba8a9bbcf0f47992c43cb40a6d7a929"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00874-of-01024.json.gz": {"num_bytes": 396365056, "checksum": "346aae20204537ba2f4a865ca80b5d1c6da1e3a3b78d306d7570a69f185cc4fb"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00875-of-01024.json.gz": {"num_bytes": 396679348, "checksum": "ba81f9c1650d30853edbb9886dde84658c254dee5a3ac1062484f7194cd413f6"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00876-of-01024.json.gz": {"num_bytes": 398278881, "checksum": "88fb38aad7cadd76c818dbe7a372144dfe17d110f7d2123a80d14686fb43a6dd"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00877-of-01024.json.gz": {"num_bytes": 397051868, "checksum": "049e4a62056c98284b35d10a74ad5ef7014265a6dccb99a71f93a409933a685f"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00878-of-01024.json.gz": {"num_bytes": 396132123, "checksum": "bb7b97a82bd6d31612de66a03af35d404b15808b925e7fd94bd0a8e9e928b927"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00879-of-01024.json.gz": {"num_bytes": 396520374, "checksum": "2a56fed53aa022e6a7956f604d54d99af89a15b6c7fc6b037f94d347f1d15f51"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00880-of-01024.json.gz": {"num_bytes": 397004524, "checksum": "1cadef434909d4508a9a6bf40d6a9323256f3089615a5d2963c83040d5f549f8"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00881-of-01024.json.gz": {"num_bytes": 397336334, "checksum": "0e36dcd0eb1773eec15ffd0fbbe8951343bb6961dd1838b51e74da2e055db176"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00882-of-01024.json.gz": {"num_bytes": 394949798, "checksum": "78c99406cb921c2b8f5b86e4e7eeed24c799678732e5a5450db6b12b7ceeef61"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00883-of-01024.json.gz": {"num_bytes": 398647721, "checksum": "f0e7a0a9970c7fdb5f629771e76bb06bf62b79e9cbf5008e866f954dd436401b"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00884-of-01024.json.gz": {"num_bytes": 396040500, "checksum": "05272a55eb2840f94a7dcc30a8d09b957511b983b0fc3fa618a8995bc594d055"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00885-of-01024.json.gz": {"num_bytes": 396460591, "checksum": "27511aa50410260d261866dc970b897b10a95dd4dfd92b0bc3a5fc41e6c75335"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00886-of-01024.json.gz": {"num_bytes": 396149133, "checksum": "e66ba9c7ceca631a4b43ecff1e151524a209368f298ca83624476ee9144cc3cd"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00887-of-01024.json.gz": {"num_bytes": 397164216, "checksum": "95e341054bd8a21e7f49e4a5aaa5fbe51517ff631e66e67ff1cdaea6e3178002"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00888-of-01024.json.gz": {"num_bytes": 398216402, "checksum": "6fef57de31fa1692d8a4021b317554688657fad3f55dc144e2971d63083e7879"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00889-of-01024.json.gz": {"num_bytes": 396976936, "checksum": "36da1bd0eaa27ca6e8510a3c005695fbbd7b0fedf63f077e3787590d4b1af625"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00890-of-01024.json.gz": {"num_bytes": 396903125, "checksum": "6bbbe5db2c0938efe5f8afe7b30765f45cedc9fd4209bb7826c489381175bc5e"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00891-of-01024.json.gz": {"num_bytes": 396404354, "checksum": "47601b1b1a0a725c32ae0c32364f7ac188b7e8c68d29a2dffbe1a4dbe39393f4"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00892-of-01024.json.gz": {"num_bytes": 398144052, "checksum": "a7b6bdafa5a226c22ccdf97c873e4915ed8dd8b59e2820a4dc62f600b4710175"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00893-of-01024.json.gz": {"num_bytes": 397990484, "checksum": "12f08cfa1fb4f94a3d7d9584cc3f5ae9fa518cc095e4cb07939d02ecfb7ffd9b"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00894-of-01024.json.gz": {"num_bytes": 398271782, "checksum": "004bf46ac7c8d7770b458ec341322f5cef643926aff9255954f08faa1dd43d53"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00895-of-01024.json.gz": {"num_bytes": 395489909, "checksum": "3ea14b3dbd7a4c9cb7aad83d1311d335714aaea5b2dd0374debd63c56d02dcbb"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00896-of-01024.json.gz": {"num_bytes": 397589097, "checksum": "c0f1c7e54bf7a808f66d2acc9aec79f1ce936ba480f5d1e379c6853714413175"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00897-of-01024.json.gz": {"num_bytes": 399215096, "checksum": "20958123acf2d578448a5166f1209b0452db33ed395cfe512015106bf99ad31d"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00898-of-01024.json.gz": {"num_bytes": 397044516, "checksum": "46c5145069d861c04b2ac1afe80c4c4453f91869f6cb6a1d9f7b648f1b08942e"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00899-of-01024.json.gz": {"num_bytes": 397687759, "checksum": "2a3923d8ff2ce0eab5978a8e0198bc2d1512cfa19c69e673e048b8eaa72f82b6"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00900-of-01024.json.gz": {"num_bytes": 395192267, "checksum": "9cc72deeea7fbc0fa3782c41938d66315923dd9f53d89f47c00f85f93e454ce5"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00901-of-01024.json.gz": {"num_bytes": 397806320, "checksum": "8cfff74f280636416f523c271f75e5704a570db4cddb8a70d033158868c21347"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00902-of-01024.json.gz": {"num_bytes": 398450537, "checksum": "7df8804eb5ecb79177001f9ce3c66f0ad20cccd8151e817816e9342d07c392be"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00903-of-01024.json.gz": {"num_bytes": 396733151, "checksum": "89551a52d1e97b4ec3007f8c43191c1ae1475d0ba5b48d20818a12c85b0add74"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00904-of-01024.json.gz": {"num_bytes": 397497719, "checksum": "2bcde59dfaa642722969d1401a4ce43a35c57930bb1d664371efece1e2e91c32"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00905-of-01024.json.gz": {"num_bytes": 395760696, "checksum": "ec844272b0666a455dfe0cab065e00df44e8da2156a03797100418307c96830c"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00906-of-01024.json.gz": {"num_bytes": 398496346, "checksum": "ff68909d470edef08929a91068e1de02841c16a000fbbd17ef042cb76f1fff37"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00907-of-01024.json.gz": {"num_bytes": 397085405, "checksum": "a9b26676af61a6a1355225bce5bbcd67aeaf0fb7dc2209f30235b275536baa85"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00908-of-01024.json.gz": {"num_bytes": 397037103, "checksum": "e86688677a46103b0b224333faf1b4f89da062e4ec0ee35752c91ff9772697c7"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00909-of-01024.json.gz": {"num_bytes": 397394775, "checksum": "93082177607900bfce7fc53f1665a831093bb50caea33e014f327181579c0012"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00910-of-01024.json.gz": {"num_bytes": 396668466, "checksum": "dcfe639607c18a309e2c91864a6912dce3851abd62bbed3ba16390899e637327"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00911-of-01024.json.gz": {"num_bytes": 397926997, "checksum": "aa995c38d953237b1d6d53be7237958a00ca2dbab4a753c7c4404849fb416d5d"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00912-of-01024.json.gz": {"num_bytes": 397810240, "checksum": "e3f17ac285e8c9b04713713a957602a63e176f476d4a67018012e9cf2a3e5a84"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00913-of-01024.json.gz": {"num_bytes": 397143597, "checksum": "4082ab833be47cf881693ea4442e3940625e0d2c1117e15234886fdfa779bce3"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00914-of-01024.json.gz": {"num_bytes": 396398347, "checksum": "7c62dfd17b21ff64af640e4aca8fea0240998596d11ca551a3ab045d5041fcac"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00915-of-01024.json.gz": {"num_bytes": 398622100, "checksum": "69abe67cda4b1613d5f741804ccdb294cd5f457027818d9366db8cf2f5f40871"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00916-of-01024.json.gz": {"num_bytes": 397387266, "checksum": "6effa83cbf3345fd7e41e432ef82156bb1334f2cf17589bce313aebee9727131"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00917-of-01024.json.gz": {"num_bytes": 399730979, "checksum": "f0d0ff1ae76a84c07647fa1517410533862f1927fa85dbf38017dabf4607bc1f"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00918-of-01024.json.gz": {"num_bytes": 396895902, "checksum": "84cc56e725be31047d0b6a025cfacefc462f4a1a546feaa34af95a6f25a4e1a7"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00919-of-01024.json.gz": {"num_bytes": 395247578, "checksum": "daa3156989ddaa9a7eba228848697ccf6a385679359ab765881d2293bef107aa"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00920-of-01024.json.gz": {"num_bytes": 398305242, "checksum": "2a9e02ef643962f6009e42304b983c87bae7b74c1edcbf8e6808b320ea7ea776"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00921-of-01024.json.gz": {"num_bytes": 396446011, "checksum": "f83526ad11d81820fce4231e3303d613dbbe56a8fae878d9442c8d7e98023437"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00922-of-01024.json.gz": {"num_bytes": 398010331, "checksum": "e47cb9d7550644ef807c3ea9e19ca4aa1df54eb908b54651bf0e17f0ded9157d"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00923-of-01024.json.gz": {"num_bytes": 399160018, "checksum": "470401e5b0777096806113a36dcb92b8d453d6e8f5f4f0b15df2788e382ca03f"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00924-of-01024.json.gz": {"num_bytes": 396880756, "checksum": "c86e546c68bf8458951fa723c086d6efa5b210f53cd4fcb2de4b9efc7a71a275"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00925-of-01024.json.gz": {"num_bytes": 396806561, "checksum": "5d9b1105c0053dc9530c911046f4da458f41d92c771282d0df8a3a22838feaec"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00926-of-01024.json.gz": {"num_bytes": 397479994, "checksum": "c3253305ac4ef226501e4fd4a6acfc6067a76c084ad852eb2a9f5916aa3d51a2"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00927-of-01024.json.gz": {"num_bytes": 397083225, "checksum": "8931df0ee597f72ea3592d0a4d236ce655a92cf4e7eb9298145f496246c18c21"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00928-of-01024.json.gz": {"num_bytes": 398000839, "checksum": "5e29e75231bdb413dedd1211bd87e9fc3f4ab8bba41999afc1ddcddc16f4599a"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00929-of-01024.json.gz": {"num_bytes": 397731309, "checksum": "03f7a9199b7927a6d78a8aa4eed32c250d32dc409e3bb2847d7db948ee63d46c"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00930-of-01024.json.gz": {"num_bytes": 398133003, "checksum": "b22a79dc228697394d0ce25b7d31112f9e1a6508cdc4b57af35e84e65167bfeb"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00931-of-01024.json.gz": {"num_bytes": 396694508, "checksum": "dbbc65db3d442f9ace85498a3b27bb598c20cea171b3de17d409f9b989c262d5"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00932-of-01024.json.gz": {"num_bytes": 396255463, "checksum": "02af4162b084004e99dc6862c88749545593e342a83523597cada140e57a0ab7"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00933-of-01024.json.gz": {"num_bytes": 399013035, "checksum": "dc4d3b4f03c36a8f1393ba15195c3f64b128862b812839689fa387e708ffabaa"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00934-of-01024.json.gz": {"num_bytes": 396593138, "checksum": "02a5a8e02b2636c9e912a9ef8a79ececde4f4fc92bea74e59791d181bec104cd"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00935-of-01024.json.gz": {"num_bytes": 396748502, "checksum": "05d1d6290580d5c74b906ab03fe6773ecaaa1ff3be84dfdef48d1a2e7f5e1120"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00936-of-01024.json.gz": {"num_bytes": 397737673, "checksum": "351d3543b1457da9719061948a1b4bdd79be8a0b786ecd6a9a8cc0db49cd2181"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00937-of-01024.json.gz": {"num_bytes": 395377872, "checksum": "d431b01bddcf911d7da5bad74a78d0d1527d60d9720f77868ef08e1a65850986"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00938-of-01024.json.gz": {"num_bytes": 397193715, "checksum": "bff5e755b174e3608ba72b39898a2bb5e9ca6d3362b70bd66143566aeff52690"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00939-of-01024.json.gz": {"num_bytes": 398044482, "checksum": "03facf22c376f03a8078e99d1dcc1c22ed5d7e179de472019cae894f40c7a4ad"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00940-of-01024.json.gz": {"num_bytes": 398894204, "checksum": "3d3a2125262ee8ca498cd54db52fe626d010a2a93c000ea2b45f931e491ea9e5"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00941-of-01024.json.gz": {"num_bytes": 396758197, "checksum": "b3957de08e7779d8ec23af02a6d709189796314c70a99f46c90d0bfbd14ad561"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00942-of-01024.json.gz": {"num_bytes": 398181993, "checksum": "74aec8dec794c79683dfe43d8aece4c1c47c5389aa6d4bea847ac461cb5ba21f"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00943-of-01024.json.gz": {"num_bytes": 396271547, "checksum": "231f63d05f81d249f618768c9f712cc31314dacf55a6004902a0e7d0bfb13724"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00944-of-01024.json.gz": {"num_bytes": 396603419, "checksum": "d5661730f3ed6cc5bbc5d935a6f1ac7d241b40c52dc83775a421e7a1a672f518"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00945-of-01024.json.gz": {"num_bytes": 396596660, "checksum": "3b5aeb0786dddf0b9cabe2ca071283b276822e2861d8688e38f927595c159b02"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00946-of-01024.json.gz": {"num_bytes": 399900563, "checksum": "6d5549970af2c6987583477991552e1944b411642782c07d17eb52f91e714a1b"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00947-of-01024.json.gz": {"num_bytes": 395391489, "checksum": "f5544ecb42c385cd5d5120c82140e4a36051f6a401d89ce30c8f2fc08cd69804"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00948-of-01024.json.gz": {"num_bytes": 399257562, "checksum": "1448cca7f1b9824adcf8437a33d14a7e95b705396611f82e7aba9a69e0a25118"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00949-of-01024.json.gz": {"num_bytes": 396371965, "checksum": "a7eb228f1d1ff2744af3d1a1358a94611cd92c25d81edac0e209b9f81c8a0a60"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00950-of-01024.json.gz": {"num_bytes": 398022110, "checksum": "8651693d2180e518039da487f638c532c53f6d79a33356922b2d8706aa6a83cc"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00951-of-01024.json.gz": {"num_bytes": 396224338, "checksum": "c46bc8aa1621153fbd913b5d0b23a82352a28b36ec997c4df4b92dcc6ef26895"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00952-of-01024.json.gz": {"num_bytes": 397581207, "checksum": "02775930e3c420978a9d2785ee0137c3963dba7bc34538b2155eb38dd6ee89a0"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00953-of-01024.json.gz": {"num_bytes": 397045599, "checksum": "9d54940cb594de6e0f8593f64293e96375f0a5c56f3569c72720476bcef1f1a5"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00954-of-01024.json.gz": {"num_bytes": 395457873, "checksum": "3c12a1c3061164f345d9e402bed28be9af84ef56d5df1b22a3cf9f818ed47ae8"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00955-of-01024.json.gz": {"num_bytes": 396450938, "checksum": "45db78bea4fae6cd69d900c581fccda873d2aa9f24ac5e9dfc18b486c15c3788"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00956-of-01024.json.gz": {"num_bytes": 397120474, "checksum": "7db7ea23446bd8a66737546c5daa0c2dec7bd5c4743f52eb53685ccbf54d9b17"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00957-of-01024.json.gz": {"num_bytes": 397403279, "checksum": "89de2950bc3f7dd4f95d8a0b7cba19e9678bfbc23175bc22d9f9599ec1ad9cd0"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00958-of-01024.json.gz": {"num_bytes": 396861933, "checksum": "f325478647cbec9d79bff2266672144147276a82f665d3014c5d2fa9c112c387"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00959-of-01024.json.gz": {"num_bytes": 398439950, "checksum": "70d786bb337c012269caf6aeea3bf9604d279d3e4335294c72ca6cb5a9fbd951"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00960-of-01024.json.gz": {"num_bytes": 395684257, "checksum": "e1d170b0a4d6954a920ef3923688a7dbf40398609ed2ae04b2635df9ceb07821"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00961-of-01024.json.gz": {"num_bytes": 397526287, "checksum": "47b90e3747f35bf67c872d65d843f6dd9bfca15dcb769b31bf3586c6645858bd"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00962-of-01024.json.gz": {"num_bytes": 397473683, "checksum": "d0ddb2c104f515144265bd3eed526a65ada46f848183688b420694751b113272"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00963-of-01024.json.gz": {"num_bytes": 397964876, "checksum": "74725b631c1699b1166589eaebb66374c031b170eab3ab359230cd4a23a8ae79"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00964-of-01024.json.gz": {"num_bytes": 396523661, "checksum": "fa0d49a2cc726628d9a1b5ae2ace52ee90401af8ae15add27c3f4566dd99a79b"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00965-of-01024.json.gz": {"num_bytes": 399289514, "checksum": "11fb1878a8b204181f7f776a764f5e9e577d0fe62d4b2e4ce2164ce9fcc30b8f"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00966-of-01024.json.gz": {"num_bytes": 397411408, "checksum": "5646014ca3c99f53bd13183187b1e6e8f84cb6c846d6f1f3a3c82edb4accc47e"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00967-of-01024.json.gz": {"num_bytes": 395095282, "checksum": "b799b17f36d85235eaf1bed9f4f760a22b75fca736744218e44fae5917a2286c"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00968-of-01024.json.gz": {"num_bytes": 397189410, "checksum": "8d9748f5a92a9e0b836fe74b962bd2da04b62a0a2943ea5e440cef19166a5479"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00969-of-01024.json.gz": {"num_bytes": 395651742, "checksum": "f42c71219641fa302692698b4944864f27b7f87d4477a86babe23745dad72715"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00970-of-01024.json.gz": {"num_bytes": 396180197, "checksum": "383d9586f27579b4a97c5901013b3e025f10dc813047d65158d6621430803aec"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00971-of-01024.json.gz": {"num_bytes": 396574555, "checksum": "d2c9700fbac454d3b3a42b2a3c4eb0111eb7cca7cab3d545b0912aba60415c91"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00972-of-01024.json.gz": {"num_bytes": 399639122, "checksum": "5d59e643bf20156a28e5e9dfcd811c5a6c3779e1875f375db09a0fa1871dcc90"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00973-of-01024.json.gz": {"num_bytes": 395456709, "checksum": "8b22e82588e30f30f664895b9716cbb0cf38d5ff4331d3be31ab25663c634a00"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00974-of-01024.json.gz": {"num_bytes": 396693438, "checksum": "5fba4f9d634d968f15d5d4fb29d253646494e3e125aaf1c2f8fab38a7e60180b"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00975-of-01024.json.gz": {"num_bytes": 395697641, "checksum": "b4c5fceb9fa2397a9b7c75249bd3386b8dbf999d5b52521051a86e067d698448"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00976-of-01024.json.gz": {"num_bytes": 397172005, "checksum": "093aa01a944a222828656d31dacd8ecd57a24a51d361a8742514bb6af009dce9"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00977-of-01024.json.gz": {"num_bytes": 396182407, "checksum": "1beef6e248c00abee5f8952641b12d3f5b12d58adc05c8d461c0a073a6ca9b39"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00978-of-01024.json.gz": {"num_bytes": 396180428, "checksum": "0f2bb125af300de2c9fe347899673a4bd2842ba8298146bfe94c9eddc41893cf"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00979-of-01024.json.gz": {"num_bytes": 396479117, "checksum": "1fe9d0e54b9be79722e6483e386801263ca51d6e9ad925dabbb58a38c4df877e"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00980-of-01024.json.gz": {"num_bytes": 395119279, "checksum": "0f262ff2d4701497f6fd6d4f9d3cb1aa3a730ad6bef1961d890a3b0cb4747ee8"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00981-of-01024.json.gz": {"num_bytes": 398285798, "checksum": "a295b85e63c176cecd9f5222ba417eeda307e41847eb38c61dec9b83101a8256"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00982-of-01024.json.gz": {"num_bytes": 397811687, "checksum": "2a3a0e0f454dd72a68ed1dd71c508a9b24fb2349ffdfc588cbfcef728cbaff05"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00983-of-01024.json.gz": {"num_bytes": 397069906, "checksum": "5b4256392755c4dd79cd37cd6ede645a9a549c4436acd27495e974ebe1d80bc7"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00984-of-01024.json.gz": {"num_bytes": 397670152, "checksum": "68d4f5dbb3fa349a6811edce8056eb297e771cb9c9939c3a84d30c6ba3ad9dc2"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00985-of-01024.json.gz": {"num_bytes": 397949975, "checksum": "6ba478b8a1ebf3b1dd67ed7b4a055cc9cc3c01bc90c1852aea8f5a99f6c07e69"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00986-of-01024.json.gz": {"num_bytes": 397730984, "checksum": "a39a23589cc434e573613e3ead44f33adb005c2c13cea8b33601647c97300fce"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00987-of-01024.json.gz": {"num_bytes": 399173506, "checksum": "eab46d9d0a0cf05dc5ba475017d98f02f1cfd756c8e707d9823a0463713ebf23"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00988-of-01024.json.gz": {"num_bytes": 398674037, "checksum": "88749d380aac85314df66448542b696e9ae6f61f1b27dc395556737f59ad9024"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00989-of-01024.json.gz": {"num_bytes": 395313344, "checksum": "bc565b662396e3ab4e108635e01873014515663bd5216926a59ae80f6cd4273b"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00990-of-01024.json.gz": {"num_bytes": 398567254, "checksum": "e9b9bd97a30ccac353a2386babbd01c3a3bbede8c07bc28d17aecc7ef5af6330"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00991-of-01024.json.gz": {"num_bytes": 396958611, "checksum": "505ab5458d5e52d656048284fd22cc0fcd16e49ba19331669239be37645cb04e"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00992-of-01024.json.gz": {"num_bytes": 396102263, "checksum": "59ac5b2b04f224be04a4ceac6a16e29a33681f19cd40cbce3d3e8eb961b9f33f"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00993-of-01024.json.gz": {"num_bytes": 396935362, "checksum": "c804f2311de9f7ae5691280e16261b9f8385ef9a71929b2111dfade532b6bdd7"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00994-of-01024.json.gz": {"num_bytes": 398832432, "checksum": "594727bdc3756e678bd4d156216712ed6c8fc98d3f8e9594cfbed10b2e414554"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00995-of-01024.json.gz": {"num_bytes": 396699737, "checksum": "bb3c73c6d48aebf9c60cde56944faa5bb6727db4cc48ae23d67650742462c42d"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00996-of-01024.json.gz": {"num_bytes": 398059244, "checksum": "ac1a7e6e2c2a5468c704f5a2318b5617dd4ce140b98271e2034e00015db6cd76"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00997-of-01024.json.gz": {"num_bytes": 397439167, "checksum": "ce9664b29c86c05d3541aee377acdca7a32ef8f0220e0b4b6bf18276b692529f"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00998-of-01024.json.gz": {"num_bytes": 397383159, "checksum": "1b4db1b59255f106dd2af7510112eef6d6b611d9f9e000a0e585b623fdb8ae98"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.00999-of-01024.json.gz": {"num_bytes": 396339114, "checksum": "ee5e1508704b03f0a9cb3c4bfb578c08fb83a4d20760e3b40f101c58cbbb3ec7"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.01000-of-01024.json.gz": {"num_bytes": 395172166, "checksum": "f8cbf0bd9c2b90e588942048848fbfa1a20cf775364cb9c84b4d5dd7cf19e603"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.01001-of-01024.json.gz": {"num_bytes": 396629363, "checksum": "7cad3f9a28e5988ef91073c48e9d85ea7030289690f817545cfa9f1165dd33d9"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.01002-of-01024.json.gz": {"num_bytes": 396507390, "checksum": "b4ae1017913509855d6d8d4413ff3de4a8d519d91f354b6e5b5267219d20658b"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.01003-of-01024.json.gz": {"num_bytes": 397652598, "checksum": "0c115446c159d27e6e1354173ebec29e6dff5f38c4d2ddb46c07c450523309c9"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.01004-of-01024.json.gz": {"num_bytes": 397408971, "checksum": "f0b559a832a9ee50225fe1417d936d6b898026d80a105b976deaeae75f9e30a0"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.01005-of-01024.json.gz": {"num_bytes": 397753911, "checksum": "e001c9285ade7de6ac23716b596ddcc733f05bd6abd7e1a67874894c93fbd43a"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.01006-of-01024.json.gz": {"num_bytes": 397962701, "checksum": "acf13433824104e4bfc3a8aaf8805eb16712cd97b2dc1d48e7d771bee4bd41c0"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.01007-of-01024.json.gz": {"num_bytes": 395966285, "checksum": "4c6069f6a95d036fd3e05a4246db932ad5ab89b9470274f23a17df0b77b9b717"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.01008-of-01024.json.gz": {"num_bytes": 397075505, "checksum": "9b3b9c0cd4ee02e18a5d22142183874586da8fd23b4f97033e354f9681d150a2"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.01009-of-01024.json.gz": {"num_bytes": 396881470, "checksum": "14d2d7cf2ebf3b2c73bad4a6099fa1d2b1cb341b100976b03232fb664a7d020e"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.01010-of-01024.json.gz": {"num_bytes": 397471393, "checksum": "01e6f56bebe0c874d82135f551a6b917759c41af48d127df181267dc9b8f6486"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.01011-of-01024.json.gz": {"num_bytes": 398092801, "checksum": "ead5b6b13bd09136fccd9548c224398401bda0ca7ff62ca4db852760760f13d3"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.01012-of-01024.json.gz": {"num_bytes": 397831436, "checksum": "daa2d1507f9b56de0c4aa9d86d93259c1e6f73f0cdfd553ce075a16807dbcb56"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.01013-of-01024.json.gz": {"num_bytes": 395098326, "checksum": "c2b21a1a56e9879335c72008919e8f7998dcc1e8df2258fdf2196ea86194e3cc"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.01014-of-01024.json.gz": {"num_bytes": 396164077, "checksum": "0df125946c83c66c6961eae2aa45ad7eea7038d808281d633ce30686a8245e01"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.01015-of-01024.json.gz": {"num_bytes": 397895284, "checksum": "f6f6eee8fc113b7e717654b9305cc5129c3ee1ce9f263b91f0202762f078a526"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.01016-of-01024.json.gz": {"num_bytes": 397723033, "checksum": "48426df1f4665d3179251904c96a0e73c041ed5b57885b4dd852809e632685b6"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.01017-of-01024.json.gz": {"num_bytes": 396761053, "checksum": "f33cf2d744585e0338b29a5a5638752123b7b59f9ae3b723cf7e7b536f9f80ed"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.01018-of-01024.json.gz": {"num_bytes": 396562520, "checksum": "72adb0869cac573282c4bd938cdff556f659540dd4a0a6663711974cb2dc147a"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.01019-of-01024.json.gz": {"num_bytes": 397564701, "checksum": "3b64235effaf41ad61698b2c28f4d73ced1b6ec6b6d79e0f52314176fa0feb12"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.01020-of-01024.json.gz": {"num_bytes": 396053080, "checksum": "b16b9f815823d176f94388d4c482652ac656aa763ec738ccd8c8a2a3bdefc1e9"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.01021-of-01024.json.gz": {"num_bytes": 394731398, "checksum": "f4c0044abadd339055bf13843938eef4c066856757250fc15f77060fc0881ba6"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.01022-of-01024.json.gz": {"num_bytes": 396548645, "checksum": "5ecd8432526eda57065e6161f0618a19cd5993c7dfe86575775f1bf01836f750"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-train.01023-of-01024.json.gz": {"num_bytes": 396863581, "checksum": "c6cd29b8f6067152ccd584ded81df1f9cb905515d48815b8a546d104ec7a3565"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-validation.00000-of-00008.json.gz": {"num_bytes": 50774357, "checksum": "7cd6c8b1072af3f3ca3fa160d9411960908142743b101f7229223e6658acb42c"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-validation.00001-of-00008.json.gz": {"num_bytes": 51252663, "checksum": "d36ef5fc04b24117a19d992de06400e5f290f11786be99be9de68818f7495694"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-validation.00002-of-00008.json.gz": {"num_bytes": 50860289, "checksum": "ab8b3dee7c0698c3cc3a74f159d85495b6bb9529600ef9246bec218ae6775e28"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-validation.00003-of-00008.json.gz": {"num_bytes": 50141661, "checksum": "54d62c9359000b99713a8a0a0fdfa415f1c09824555526f01dc7217b068542ad"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-validation.00004-of-00008.json.gz": {"num_bytes": 51141505, "checksum": "c11e31de558613237533b41354ca29f0635b599a1c9232517dbf4c2cb1197319"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-validation.00005-of-00008.json.gz": {"num_bytes": 50797157, "checksum": "20d39c0f52c34a3148c0a235238ed3849576ed895c3a43cb47b0159bf233c7d5"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-validation.00006-of-00008.json.gz": {"num_bytes": 50158887, "checksum": "754a2b7f134bf45f17db7450d5c0eaf2b8824e4a6072be7b20db434f9cb7968f"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/en.noblocklist/c4-validation.00007-of-00008.json.gz": {"num_bytes": 50232244, "checksum": "f90c1d79c51ee1a009dc05930fc40e9ee4c3840ca2412cc129855156aaddc279"}}, "download_size": 407016751197, "post_processing_size": null, "dataset_size": 2060282008734, "size_in_bytes": 2467298759931}, "realnewslike": {"description": "A colossal, cleaned version of Common Crawl's web crawl corpus.\n\nBased on Common Crawl dataset: \"https://commoncrawl.org\".\n\nThis is the processed version of Google's C4 dataset by AllenAI.\n\n", "citation": "\n@article{2019t5,\n author = {Colin Raffel and Noam Shazeer and Adam Roberts and Katherine Lee and Sharan Narang and Michael Matena and Yanqi Zhou and Wei Li and Peter J. Liu},\n title = {Exploring the Limits of Transfer Learning with a Unified Text-to-Text Transformer},\n journal = {arXiv e-prints},\n year = {2019},\n archivePrefix = {arXiv},\n eprint = {1910.10683},\n}\n", "homepage": "https://github.com/allenai/allennlp/discussions/5056", "license": "", "features": {"text": {"dtype": "string", "id": null, "_type": "Value"}, "timestamp": {"dtype": "string", "id": null, "_type": "Value"}, "url": {"dtype": "string", "id": null, "_type": "Value"}}, "post_processed": null, "supervised_keys": null, "task_templates": null, "builder_name": "c4", "config_name": "realnewslike", "version": "0.0.0", "splits": {"train": {"name": "train", "num_bytes": 38165657946, "num_examples": 13799838, "dataset_name": "c4"}, "validation": {"name": "validation", "num_bytes": 37875873, "num_examples": 13863, "dataset_name": "c4"}}, "download_checksums": {"https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00000-of-00512.json.gz": {"num_bytes": 30085821, "checksum": "6666a680b0a34eb8756dcb5fd2b12f0078237f3502e8a513bd3e5b71bb92be00"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00001-of-00512.json.gz": {"num_bytes": 30065900, "checksum": "61c3f9ab763067f76d9bea349d86efb97af7539d481b5d2807f362204971c327"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00002-of-00512.json.gz": {"num_bytes": 30028880, "checksum": "3aa4405d957ed42d10d643efe7c0f51b05e8f29cf4ad8783448083c1cd3f2a24"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00003-of-00512.json.gz": {"num_bytes": 30136880, "checksum": "f6eb49e4c0d691e67fe96ddeb3f8370c5e63a7297a31a8da0c58f5cb3a9f6061"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00004-of-00512.json.gz": {"num_bytes": 30110499, "checksum": "6e0908780f555f4b74c6a5055e2c9708333a8466f0b8723a8ea38cc04828ce44"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00005-of-00512.json.gz": {"num_bytes": 30097927, "checksum": "a333562df3fcd4c5ccf51b4c00e11f6619ac4a28a878383aefad277bd30131a6"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00006-of-00512.json.gz": {"num_bytes": 30013820, "checksum": "7c436cd0993077187988239cf74c3e64de440dacad62ba4b02bd4ac0a8d219b6"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00007-of-00512.json.gz": {"num_bytes": 30557005, "checksum": "dc9e43681c404fef1741e9608295b8dfae0953473993f3fc44fb83af07a6b82b"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00008-of-00512.json.gz": {"num_bytes": 30369535, "checksum": "8de7a4005acdb60436b4e5d7274084e28df3aee31a5457c6837452094544c541"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00009-of-00512.json.gz": {"num_bytes": 30033048, "checksum": "32310a6c74cbee1dbb8b196e0cfad41f79e88e48d8f04c88692d42506113b903"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00010-of-00512.json.gz": {"num_bytes": 29948345, "checksum": "b7df217de849e26ecce5ed7a35b6e6238fcc1c08e969023f209307842dd496c0"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00011-of-00512.json.gz": {"num_bytes": 30558885, "checksum": "82e5428aaeecf27141a7105e48b78dc02516ae6ebc3d6cd4ef13963316279e1f"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00012-of-00512.json.gz": {"num_bytes": 29888513, "checksum": "f3d7e496b7c85ed7d020c8f8a24a0b27f9b2535abdb22b45c08441a29398c44c"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00013-of-00512.json.gz": {"num_bytes": 29936292, "checksum": "bf04d82f0cdddc09ce4aecd9f71910b9858badaf6456253d43d89e6a8c56cba7"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00014-of-00512.json.gz": {"num_bytes": 30169338, "checksum": "15b4611513154de0dfc1c9d470326fd053adf70de814ecfe8ba7ccee66de947e"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00015-of-00512.json.gz": {"num_bytes": 30071363, "checksum": "887bdea83bdefc50786c93e8014d1d49999f8090ff15168598c884cd0724fec2"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00016-of-00512.json.gz": {"num_bytes": 30451660, "checksum": "288ad0d553d54052354be506f87878fa7c54b0fa65811c6e456b3262e1d117e1"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00017-of-00512.json.gz": {"num_bytes": 29940254, "checksum": "b13ad58ae9f38598cb9d560e3ab34c1d0200db73fe86da12230e50086b532463"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00018-of-00512.json.gz": {"num_bytes": 30282186, "checksum": "5a67e71955ab2d8f6531bd3949cd8ab71f4ff91863ea5a6ec3e7b33c31a05dd6"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00019-of-00512.json.gz": {"num_bytes": 30373907, "checksum": "a70682315a0cfe0af815c7b2abbcd63310fabbc33ad6e19daad19f1f51506955"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00020-of-00512.json.gz": {"num_bytes": 30104199, "checksum": "980e544ce130a06e9e99ec906342eb0ab8aeaa96ac26eca01c56ebb463f5d688"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00021-of-00512.json.gz": {"num_bytes": 29733696, "checksum": "a69729b8f3ccb9db12476a31917783c1c6e036e7bbbb4089f430362aef71f467"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00022-of-00512.json.gz": {"num_bytes": 30012894, "checksum": "589e698fe450e22cba47813a5a28da5393e79702a528f6a8469f72f6d630caad"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00023-of-00512.json.gz": {"num_bytes": 30024851, "checksum": "2a7b036c38fb4d2df6535631018c23d001931e5bf8d8a815fd5b2f9343ec4529"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00024-of-00512.json.gz": {"num_bytes": 29906809, "checksum": "7e512306cb6ebb0b0c3e96ceb16dade9e1e1f484e754bebd0078e7f545fc5b6a"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00025-of-00512.json.gz": {"num_bytes": 30332268, "checksum": "b636b91fcd9a91ce05b8cbeea6f591a0e916175ab23b0cfaf688171c8a98ae8c"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00026-of-00512.json.gz": {"num_bytes": 30288490, "checksum": "9e2f8e2a37dcfe66873cc5355740448ef75a1de2deeb2d8c047c3c3a7ee485c0"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00027-of-00512.json.gz": {"num_bytes": 29897688, "checksum": "882616d1e8ca66c0b6e7aa2ccb18d9239021603ab1b9486638a9a3447ddebe0b"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00028-of-00512.json.gz": {"num_bytes": 30201690, "checksum": "0312b12f50c64fbe7b894a28e0940089ad57af95df8116cd7d43c0435ec2e79b"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00029-of-00512.json.gz": {"num_bytes": 30237920, "checksum": "1e8677140186b219d32e764889dcc344ccac9db51685363324d1bc13ddef2bb7"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00030-of-00512.json.gz": {"num_bytes": 30048903, "checksum": "43558e81c291cbf53a5b6a016aecb0e07e26a98b8fb32f4a000037b281afa363"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00031-of-00512.json.gz": {"num_bytes": 30294528, "checksum": "c33ae8a2fad7e5264d093fbe89ed1611357110a4f0f26dd5a93a4dc15560f205"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00032-of-00512.json.gz": {"num_bytes": 29868168, "checksum": "5dc2a8f96db8da87607efc0b708e6a2172530f0c9b43665dc01286109b5c55bc"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00033-of-00512.json.gz": {"num_bytes": 30105916, "checksum": "c4cdc2b39a86eff251f903d7f3d39605b721615aeffa6a2753f3588b7dbef6c4"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00034-of-00512.json.gz": {"num_bytes": 30126174, "checksum": "6d874182112b0881dc929c0182a30ec4f9f1633372a2b822200a7b1faaf4f1bf"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00035-of-00512.json.gz": {"num_bytes": 30084101, "checksum": "5bea17f0cd4dd888f5d8a2d4092138e4777d80493a1f410d618d4cedf353b914"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00036-of-00512.json.gz": {"num_bytes": 30095974, "checksum": "6e7f42f3012d8ca7500c7e2ec82d27c26b3cd8bb5b8b66a7fc8355d77284f433"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00037-of-00512.json.gz": {"num_bytes": 30239345, "checksum": "54ee45bf25152060679bab3e5fc6f5cb5a3add6acd2664cb152f88c223f83239"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00038-of-00512.json.gz": {"num_bytes": 30247683, "checksum": "f738a2f0f156f7bd897d9d822748d4192a5fe46b566c7288ed5b840c4ffeda64"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00039-of-00512.json.gz": {"num_bytes": 30057005, "checksum": "60235900d69579334660c153c4fe384c08f14f4e729a06a1e8247e8b4ab8a213"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00040-of-00512.json.gz": {"num_bytes": 30185136, "checksum": "5a059d64fd6a1b42a2faeb4088db327c47f9e8328737ab74a0e0457f84433374"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00041-of-00512.json.gz": {"num_bytes": 30314653, "checksum": "2cfdc460c8dd0fb4766191ef2aec0af856af7c95d11eb3f1d731f63b71db4daa"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00042-of-00512.json.gz": {"num_bytes": 30123256, "checksum": "64e59b8ebde3c12b0a1d218a302252b96aeb5bb4976927463101a9509579ec22"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00043-of-00512.json.gz": {"num_bytes": 30057043, "checksum": "edd200b97394f15f9cf0a6289406a83b42c3d6f961456f031f5814db4f6d482a"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00044-of-00512.json.gz": {"num_bytes": 30029900, "checksum": "1b2980f21ee5cffb271591adc8eaa414438841426442f194b5f4b703356f4e5e"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00045-of-00512.json.gz": {"num_bytes": 30367170, "checksum": "83967210891345b831956722e8dcd29cf55fb17b786c85c2dd2778528ab4d1c2"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00046-of-00512.json.gz": {"num_bytes": 30105866, "checksum": "6921ac4854e2eacaeb4be07669faab85f2bab33f744c7efae1ce17be25176bb5"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00047-of-00512.json.gz": {"num_bytes": 29957618, "checksum": "e8eba2ba9f51e76a06a2df43b6b120c47b6e41f61e46a2e3331518ebb2d0c84b"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00048-of-00512.json.gz": {"num_bytes": 30329887, "checksum": "6af9c44a53d7eb9df9d86ee4d895fb9f7f2b9b3863fd30aae325e79fb792a10c"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00049-of-00512.json.gz": {"num_bytes": 30116207, "checksum": "57dc1e94f73b55e0be5690b01d61188a62186ea9f5f85b556ecef3bcaa36fb92"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00050-of-00512.json.gz": {"num_bytes": 30236341, "checksum": "eb75bdf0e63e798838b3d7abfc6a3bfab5de2ba39af833c38048dfe39c1175b1"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00051-of-00512.json.gz": {"num_bytes": 30357091, "checksum": "f48b1f5e07311ca9d69787019a56ad849932e6868d1f7778681cf7e4cc9fc562"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00052-of-00512.json.gz": {"num_bytes": 29944959, "checksum": "debf9490c057f11e404898b4a57cb424c1eb523fa90bb7899b1317f970481638"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00053-of-00512.json.gz": {"num_bytes": 30240416, "checksum": "9e847a5c6eb80e5c045fbb405729c695911674bd8d29b1d0be0791303d02f41d"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00054-of-00512.json.gz": {"num_bytes": 30174556, "checksum": "65a80db1cdde9153e08277ad2d9074dfba1682c0f771fbb9f4aa8f88ca557f43"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00055-of-00512.json.gz": {"num_bytes": 30134394, "checksum": "beb8d280d322520ded21aec92ae087867d0bce64aac4e243a127a88f143ff578"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00056-of-00512.json.gz": {"num_bytes": 29891026, "checksum": "82fceaec35a2456487a59ae652d72f41a940d2d6bafdc4f05a6e02bcd7ed4dc9"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00057-of-00512.json.gz": {"num_bytes": 29920525, "checksum": "e4fd55ba5fb2825ef4209aec87706ecdd3db040242c6aacfc82f350765fbeff8"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00058-of-00512.json.gz": {"num_bytes": 30060421, "checksum": "3cfc894a1853e3d1f2daa314873b7919fa52b7208b590637f8face6536305770"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00059-of-00512.json.gz": {"num_bytes": 30038488, "checksum": "4f06ab7b5ce8e8c696445db4a3e32896b6396e3f67d7414a593e7398d752e564"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00060-of-00512.json.gz": {"num_bytes": 30129718, "checksum": "7923385ee0c6801073feb10437ee3c59e5f5dfe82c2311ad8c4ec670dcc0ec87"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00061-of-00512.json.gz": {"num_bytes": 30130505, "checksum": "5cd682e148b8488775622098214fc2009ef9c95355f46341bd78434f1b560fa2"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00062-of-00512.json.gz": {"num_bytes": 29968130, "checksum": "53562fc23501f3a1d11c8ae6a59e719d6f4e67db8b8ea1d55e2b1b80849afd08"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00063-of-00512.json.gz": {"num_bytes": 30116532, "checksum": "008cc5c0cb7d60e84ffdfe2132f6bb49aafbb31083fd026067b3859326ca64fb"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00064-of-00512.json.gz": {"num_bytes": 30236194, "checksum": "8f9eee169071e80c94c248f1c37b7fa631bd75a7f6e401f6a963aecd8815910b"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00065-of-00512.json.gz": {"num_bytes": 30077312, "checksum": "8c5e18ea3575cd350e98d062ef88d3fd1df068e4bd410be8732723bda03656c0"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00066-of-00512.json.gz": {"num_bytes": 29920862, "checksum": "e377b8112dc6ff6834607c27b927636429e887f4ab8edc0824363941b7bb311d"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00067-of-00512.json.gz": {"num_bytes": 30278223, "checksum": "ec2c2ac74cc3f4f814d645410cccda266151949dd36aae518b8082b948b47edb"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00068-of-00512.json.gz": {"num_bytes": 29940464, "checksum": "ddfc16a17cabf48a2c59fa8ef25ccd12d899d3462d08b45f2a301567ccc105c4"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00069-of-00512.json.gz": {"num_bytes": 29903118, "checksum": "66d9d1791cda56607b2561199503cef216df86b28d4519d5862905671a4ec4c5"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00070-of-00512.json.gz": {"num_bytes": 30082323, "checksum": "8072d3bd5e19c005493c0332b73ca5be253397f54be90be1bb7b2ef8df7ad117"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00071-of-00512.json.gz": {"num_bytes": 30128276, "checksum": "b7c68af5a6dcac3fbb3dcbe12123d1045a79baf657a8b3bdada60c1a97404c48"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00072-of-00512.json.gz": {"num_bytes": 30458419, "checksum": "cfe5c6ae2ad1531271b0039042e033bdd7caf9604bfa219980ca27513cea755f"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00073-of-00512.json.gz": {"num_bytes": 30366974, "checksum": "a132f5e85376b0d0a06c6ae6af9c226dcbc98394461578c4fbc6cd439ba6e721"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00074-of-00512.json.gz": {"num_bytes": 29987779, "checksum": "f905e808b50908a7d2a7f0944e7e6c01ffd97ec16e5f0b6ed7169a60d66b0100"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00075-of-00512.json.gz": {"num_bytes": 30070204, "checksum": "b57458683803936f6bc03b06fc26be9d1a09ba09517b5c1518676f468e404595"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00076-of-00512.json.gz": {"num_bytes": 30129238, "checksum": "81e88ec53e39d6191e40e5852564f592b745abf99c71ff78302292632f636792"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00077-of-00512.json.gz": {"num_bytes": 30051399, "checksum": "218b0f6e219e42113e35d99458861f8511266dee6c17d9e2780a17af8877f822"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00078-of-00512.json.gz": {"num_bytes": 30144230, "checksum": "c0a337619559362e0e1cd0fe87c9ced5c987313a7f3cb65eb44f8b861c41c616"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00079-of-00512.json.gz": {"num_bytes": 30544297, "checksum": "27e257efda6adbce01585b3b6cdeefa95d31f607012fed5dd4310bfb5a790ba7"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00080-of-00512.json.gz": {"num_bytes": 30188866, "checksum": "26411f1a0a7b299d0bf6cf78db04b0bcc617894cd87d59e54614f3258dd393ee"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00081-of-00512.json.gz": {"num_bytes": 30418881, "checksum": "87a659f6b24560a754ccbfb6aee019484e48e3ddc7955a6c7a18aa9098952cfe"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00082-of-00512.json.gz": {"num_bytes": 30086460, "checksum": "708fe5108042b957688817625c84059c11700b18ddcea3814b86b6c8c66af8a5"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00083-of-00512.json.gz": {"num_bytes": 30138639, "checksum": "8d8681519538afdb7622b677ca5d3ae2a643382bae9639e3ad90c82d36477653"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00084-of-00512.json.gz": {"num_bytes": 30228150, "checksum": "db708760b9d45e0b20c8dde9b0008f01761d9bb0f37a194845b4d097a60e477c"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00085-of-00512.json.gz": {"num_bytes": 30004564, "checksum": "19ba55c7cbc44ae30a6497373fc15b548e5c45667f790c392857f6fdaa7e2bf6"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00086-of-00512.json.gz": {"num_bytes": 29696360, "checksum": "4cb07dd259a084818f9a79a4fe4fb7b24ea1adda0cd4fd405ba003e7bd481f12"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00087-of-00512.json.gz": {"num_bytes": 29927300, "checksum": "7c3c07dbc9c57881a3c1abab85a927f1ba609c58da9dcec22d7415079cd336b6"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00088-of-00512.json.gz": {"num_bytes": 30038333, "checksum": "59158c87d7e9e5011516f98dec1313758072ca6685c7ad9df5ee4a075d9ff8a2"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00089-of-00512.json.gz": {"num_bytes": 30223506, "checksum": "d3f39f7e90b4a82257779290a3f2de5619049d69b2169577f1e3c81791d85419"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00090-of-00512.json.gz": {"num_bytes": 30266969, "checksum": "88ed3237aadff809cec186fa378e176774d3f32aef1a6d8bfdbc530f64e8aed4"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00091-of-00512.json.gz": {"num_bytes": 29885840, "checksum": "b9a247993a8eec31b3f853d1329ae79da29397dd27eb4acdc196b71c091335e3"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00092-of-00512.json.gz": {"num_bytes": 29942337, "checksum": "3d83cc54c06cad8effdb7a38ed6666b5d912e6fffcf4c82471af064b0aabe05e"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00093-of-00512.json.gz": {"num_bytes": 30129376, "checksum": "d72ed9855fa86ceb4089435da3d78e8d4151b92185f828329b534d1adf3821db"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00094-of-00512.json.gz": {"num_bytes": 29613450, "checksum": "f61f74aa65a81616b97cbc34a8be1b563f83f69709642b8156eb76cdda02103f"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00095-of-00512.json.gz": {"num_bytes": 30469526, "checksum": "926d1ba2e4b191e75b0bce0cbe4c15f95f244445ec03a6095c009c34e36f897e"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00096-of-00512.json.gz": {"num_bytes": 30126036, "checksum": "e74818ad94e408498644dc71f1ed967f356f539418222f1dfea467a21c99badc"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00097-of-00512.json.gz": {"num_bytes": 30374980, "checksum": "d9cc8827ee38bddd1a31e48b2b0064a567520e3c0f2e1be745acef57d267e4d5"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00098-of-00512.json.gz": {"num_bytes": 29928579, "checksum": "090ad37fd9eaeb53308599f2da1053b19b1c6478adaea5a8a1c35d6c35340111"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00099-of-00512.json.gz": {"num_bytes": 29901456, "checksum": "c0e7d9a7cbc3b9b940077508441e471a1eb70e822479fcad726b900e6c196382"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00100-of-00512.json.gz": {"num_bytes": 30033459, "checksum": "b62033de618191de3200205e6e40725baf045e403060d10417211d47854d6bb0"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00101-of-00512.json.gz": {"num_bytes": 30280468, "checksum": "8726d092785856ec690dcd8a9edcd968cd04af1cfafe8a83192e3c0782f02b4a"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00102-of-00512.json.gz": {"num_bytes": 29805195, "checksum": "248edf4dd6c9a1137c7b45ab0b5a05a5fc93fd14cec17a5da4d758b9f7b359df"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00103-of-00512.json.gz": {"num_bytes": 29995494, "checksum": "d66b75c3f08a0db141d2c0162eb3dbc351e656ba1ba480e77eda051435d1390f"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00104-of-00512.json.gz": {"num_bytes": 30318447, "checksum": "09bd2068c20d33783f39322c95756fd3dbd0da91f4380fae3822cb33b7d06779"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00105-of-00512.json.gz": {"num_bytes": 30209523, "checksum": "0a399ecb1116890e1a0189cd2842d64d8ed53213b1623ae38229a6ac4f5c1c76"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00106-of-00512.json.gz": {"num_bytes": 30476739, "checksum": "540f682a7c977d20f920b5af1ec7e40c14a0d54f1718b43271e22dece9cdce16"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00107-of-00512.json.gz": {"num_bytes": 30203291, "checksum": "0dd51deb74ab391c54b20862f7df561f74d00be2ee4fc13987f91771870c099b"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00108-of-00512.json.gz": {"num_bytes": 30265100, "checksum": "172b09a108b154014077a415f644cd16db6a66f178bf780c120a6c4fecc3c0a8"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00109-of-00512.json.gz": {"num_bytes": 30342649, "checksum": "214a8f147f2d77ec0f3889b0a2d782e5d44230878359e695e9523561e6723a1d"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00110-of-00512.json.gz": {"num_bytes": 30152418, "checksum": "dc0d34ce7918b80ecef3528ec2b063edf7b12223c453ac7fb9d39232fecd81d7"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00111-of-00512.json.gz": {"num_bytes": 30160329, "checksum": "d0594cb69d26f0e853575d86f92b1aa233b5bb236804a2f496a792fa031014ee"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00112-of-00512.json.gz": {"num_bytes": 30428351, "checksum": "2b0542d973bab88e696fb9efbe042167600da397d776ef65344dce868bbcb0b9"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00113-of-00512.json.gz": {"num_bytes": 30200133, "checksum": "10dcb929692795fefcf4623040191d9cb6199fbb3b164648b62b9867e8392379"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00114-of-00512.json.gz": {"num_bytes": 30205273, "checksum": "f16631d5bcbbe133a01675286ca7667400ecc7e6df13d728015381d21ec71cfc"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00115-of-00512.json.gz": {"num_bytes": 30164849, "checksum": "bed27819db4bb7e02cb42cdda18acd232659a2eaa43eed910ba26d686cb3f837"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00116-of-00512.json.gz": {"num_bytes": 30117752, "checksum": "4eb4bec7adac3c2f431d356212f8a9d47136f0011f5f9e71dd29d82b1b823e2a"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00117-of-00512.json.gz": {"num_bytes": 30062588, "checksum": "79639624734885b3051b10f052f5486d7124bbc4bcd18d99348f3683ee2fc54f"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00118-of-00512.json.gz": {"num_bytes": 30125828, "checksum": "e922a4a5332a4182ddcf6ac8ba910024fe4fa878b524f7368b27373f75bbfe44"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00119-of-00512.json.gz": {"num_bytes": 30156741, "checksum": "a44aba8779b99ace2f212789389af058d12dfb0706221b296676d5e10528dd78"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00120-of-00512.json.gz": {"num_bytes": 30489925, "checksum": "82bec41bbea7bc5ddb67b3bccea51122da7d0922768f8bda7a0c9d489bd20cdb"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00121-of-00512.json.gz": {"num_bytes": 29606989, "checksum": "b49238f5b75aaf876657826cfbd4346d250f564a86bdb010aa1e85b44a969229"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00122-of-00512.json.gz": {"num_bytes": 29770557, "checksum": "0803ccbd505db47cd09b20d86cc6ad459c7a8d1c583a5ee756b0397369d8b6fc"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00123-of-00512.json.gz": {"num_bytes": 30248121, "checksum": "d73a1bf285a0355bd61a25891cd8c5fd9da66535ec515dc7e1602a769b994727"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00124-of-00512.json.gz": {"num_bytes": 30131013, "checksum": "65d2dcc7e63a28e1911717d149b907d0c74fda6e36db2840353a0290f7880324"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00125-of-00512.json.gz": {"num_bytes": 30348971, "checksum": "5dee3c7afe0364ccb8e36647d01e78ffe61690f29f29aa033efac9a0413c2a47"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00126-of-00512.json.gz": {"num_bytes": 30370074, "checksum": "1dc04b3755291842711623d1d6cf042e2d66987103a0c708f01c9136a8c42db6"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00127-of-00512.json.gz": {"num_bytes": 30320846, "checksum": "e31a27ba25bdf13e6f929fd38d53409dd3f50be78ad955b69b1956709de5aedb"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00128-of-00512.json.gz": {"num_bytes": 30076235, "checksum": "122ee9d293428a7a823c17b3a432b5b2198fa2a68bbb246b97e981bd09f78f0c"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00129-of-00512.json.gz": {"num_bytes": 30569486, "checksum": "918bf43ce3ab54d535dd02cbcd09f1081890be3287e23fd81bfa032beec61ebc"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00130-of-00512.json.gz": {"num_bytes": 30280169, "checksum": "ab0a53e8c10dfdd139281175b5fcfe3090fa238fcb383e27b1dcdfdbbe8a879c"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00131-of-00512.json.gz": {"num_bytes": 30338899, "checksum": "e54771e12a6f3583c3accf9bcc01b598819231f367e7f80cbd44cf6683c5c852"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00132-of-00512.json.gz": {"num_bytes": 29969011, "checksum": "f69d7052ca7657fdebe547a6e196b109285d5d4e4f1a68f3900a37ba6fecc22f"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00133-of-00512.json.gz": {"num_bytes": 30179558, "checksum": "cf2130dedafd8f47e97661a5b1555813433e3f7293b5c5cb222cf551d90a0604"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00134-of-00512.json.gz": {"num_bytes": 30080257, "checksum": "1a32902fc21633ae8d41e4e5518804f4c719dc8729b866ebc32d3c36fdadbc10"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00135-of-00512.json.gz": {"num_bytes": 30284972, "checksum": "6e3a78e7a530d91ee4578caf462a4c685a5f221f0cd8eb9639c9067e2b655a7f"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00136-of-00512.json.gz": {"num_bytes": 30130265, "checksum": "defc57340cbaa5f325994a91b5134789c84a76a4ca7b9fdbf993b0e634735f05"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00137-of-00512.json.gz": {"num_bytes": 30146793, "checksum": "7ce5035f452eb2e1adeff36d0c6d6d65c245d139a86ef48bbe10c5275975183b"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00138-of-00512.json.gz": {"num_bytes": 30180265, "checksum": "298849a53a8ea0e68d01cc137195bc36d686077bed722e1198337a1dee3c51cf"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00139-of-00512.json.gz": {"num_bytes": 30398387, "checksum": "ef2ac4b8f195141a79a357d934d5d97bd4d2c64027ec7509b5873a4ae32fcb9d"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00140-of-00512.json.gz": {"num_bytes": 29652990, "checksum": "290f1c99b696e345aaa6ac6d5a882a87dcf5d3939b08ba859a359d2459498785"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00141-of-00512.json.gz": {"num_bytes": 30083642, "checksum": "fb6a38388a25261d86fbd8ffea63e06bcbcbd6846a4eb6f13fd09d7fe5a1fbc3"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00142-of-00512.json.gz": {"num_bytes": 30131064, "checksum": "b61ccf6166ea4b777629bdc07d543f299bf7569deab18228ec5bb9edc8cd3eb5"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00143-of-00512.json.gz": {"num_bytes": 30244435, "checksum": "22812c50efdfcf2c0fdcf593639dfea09ffee8068321c30effc669c8234d4f3b"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00144-of-00512.json.gz": {"num_bytes": 29725094, "checksum": "79cfa65a3115193629d16606643d90dcf27d3108c320cc9e364ba19fdb9fb1d6"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00145-of-00512.json.gz": {"num_bytes": 30335033, "checksum": "e836f0bc9acba85fd1721d19cc24054e97defb0d12678bdc0d086f40deb9b1a6"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00146-of-00512.json.gz": {"num_bytes": 29905680, "checksum": "bf684871a235078390d6c6bb03fc2d5bbffec2b095806df652a19baf5e67135d"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00147-of-00512.json.gz": {"num_bytes": 29852459, "checksum": "0e716de5b3b09ec287b039be0f0dd6edd7d541aa6d3f9d2be18768e1cd5f4cd8"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00148-of-00512.json.gz": {"num_bytes": 30364788, "checksum": "4cef624e6b7c2b73dbfb47227e31681223a5a9369c4b7daef8606b796f010dd1"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00149-of-00512.json.gz": {"num_bytes": 30096278, "checksum": "fb448ccc7412f5ca8667004a70f3dd6e1b5e6cb7f6facc06564bd22b1d815593"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00150-of-00512.json.gz": {"num_bytes": 29776995, "checksum": "1e14268cf723bc7336b33896537643d21dbefc1f05ffd5201feb5fb1130f9683"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00151-of-00512.json.gz": {"num_bytes": 30205172, "checksum": "797224cf74063fbcaec741535278ccce141e6dbbdd69a2191d07f89816ab14fa"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00152-of-00512.json.gz": {"num_bytes": 29845034, "checksum": "77eeb2353f544c714deea68d4a781b498c40d7c1e27db3aade4987b381ca29c0"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00153-of-00512.json.gz": {"num_bytes": 30258796, "checksum": "0fc581e92e70dda031d72a4aa0bbd65b1e9b28884f0ef5dd5e895cbecb270609"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00154-of-00512.json.gz": {"num_bytes": 30249734, "checksum": "ba10dd0a24bded170541e23078264b82b35bc99e402db594e2335e31905ededf"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00155-of-00512.json.gz": {"num_bytes": 30198742, "checksum": "fe285ac893126062bcbc20df75a9f65c57d3a7391354fa7e62b7f6a7122d6e77"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00156-of-00512.json.gz": {"num_bytes": 30168323, "checksum": "d21826b71bc85dbc496dd947ae9ee79d62885cffb3fa7c47409feee6ab247f17"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00157-of-00512.json.gz": {"num_bytes": 30241978, "checksum": "fc41765301b62849eda0b7b08f792e45f03db458fb92063af70c43d7cd0d0bb6"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00158-of-00512.json.gz": {"num_bytes": 29959715, "checksum": "1eded3ce0bc099c7e198e9277719d578c3fb6c425bb2110cb0ca6ce469d1d19f"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00159-of-00512.json.gz": {"num_bytes": 30109595, "checksum": "eccaab5b694c2f0017fe1d423637872d5587f6deb316796f7c0ff5517fa28178"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00160-of-00512.json.gz": {"num_bytes": 30201741, "checksum": "4ceee71372da6112101665f5bbf942a85f065feaab924c6e3f83498169bbe255"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00161-of-00512.json.gz": {"num_bytes": 30176266, "checksum": "6ed829daaad190b2d50b626d840edb750a063afad95315ffe7604a193183a489"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00162-of-00512.json.gz": {"num_bytes": 30018118, "checksum": "dcf8509a55213425a41706e5209ad411afb715fb9cd8c1a8b8edca23fab7d6cd"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00163-of-00512.json.gz": {"num_bytes": 30236016, "checksum": "d93cfaabcc7197637f233896b5799527f27d5b2dc60f0f0411ee51f05f09c500"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00164-of-00512.json.gz": {"num_bytes": 30150055, "checksum": "cc7de5ed3c774ff1dc350fbb5167dc1610c4f9a0dbc7c5d60ed4cf08aaf23ce3"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00165-of-00512.json.gz": {"num_bytes": 30348056, "checksum": "b41c4a3b7b4e96262fe5c87d06fbeb000dc48cc1d304a475bb4f4e1af84a9afb"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00166-of-00512.json.gz": {"num_bytes": 30015834, "checksum": "0a0821b7628b9b019995a9f34223e2960ded84331ce1bb55089838becb8a170a"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00167-of-00512.json.gz": {"num_bytes": 30282254, "checksum": "1285af56d024efe2166fa892878d471948e1d4c996922c7673e3c0f7f0f76bef"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00168-of-00512.json.gz": {"num_bytes": 29815124, "checksum": "29ec54ed647725ca3b9aec3bae341151a8e2b708cf21cd87b4389329298442b8"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00169-of-00512.json.gz": {"num_bytes": 30346843, "checksum": "1791e3f8371a63f9f849b7bf430e70d3f4011dbdef572c166cc5d49d06162fd7"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00170-of-00512.json.gz": {"num_bytes": 30175685, "checksum": "de8f82986addfc64b88fd3041d7ee6fdb64e6f770758146dc4c9309df348e965"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00171-of-00512.json.gz": {"num_bytes": 30145505, "checksum": "0dda47f679666862de6343e1109ed92866a42e8fa129ee69e9f0b73f18b6aecb"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00172-of-00512.json.gz": {"num_bytes": 30009998, "checksum": "2990dae6c16b7d60652439bed8b80ee4cf93972f33d8511d3d6aabaddfeca5cd"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00173-of-00512.json.gz": {"num_bytes": 30062185, "checksum": "e154a969bba2bf9430e0c8307561de78599fd2bd527cb1f15bbaf8f8e88cdf23"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00174-of-00512.json.gz": {"num_bytes": 30055129, "checksum": "e714ae153e8a927c88fe577d4c27017985d3ed7f3d0f5470f9a5f25c2e901a9c"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00175-of-00512.json.gz": {"num_bytes": 30091082, "checksum": "5f47c663d1e15d94fb0057d303048be990c713f3285ada2c6233137b1d84d60f"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00176-of-00512.json.gz": {"num_bytes": 30235767, "checksum": "20b05e4e99e5a05f6a4c29b304803b895bb8816caea6203643723ca587d66128"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00177-of-00512.json.gz": {"num_bytes": 30071950, "checksum": "29294e4b224df4695c9342c6f23d5495de9a0ca6a1be7217aa2211506e8ac7bc"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00178-of-00512.json.gz": {"num_bytes": 29932121, "checksum": "6022ed3b2ceef02324e40d3c7407622c95ead2cd3d3c41ab15ff9dd218265673"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00179-of-00512.json.gz": {"num_bytes": 30119251, "checksum": "42fa0aa883d9db4303a4981e4e308b2432b031fbccc98c3e1994ec775ba8023e"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00180-of-00512.json.gz": {"num_bytes": 30175456, "checksum": "6fb2ebd61524846f6b1f746f9c6356045623beb4b685fe265a23446037c9cd9f"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00181-of-00512.json.gz": {"num_bytes": 30029564, "checksum": "b779d721bb135fceaeddebb0dad1bdb43c9067a5e8595b3d544dfa7a084eb9f4"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00182-of-00512.json.gz": {"num_bytes": 30437016, "checksum": "b388fc0e862d7f6bb5b879ff7c69c301038faf5b542f6b40cbea4e2096a41e6a"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00183-of-00512.json.gz": {"num_bytes": 29994048, "checksum": "8208eeca7bc76f8b1786c95939d321ca0c7ae190b1f12dae86738810e412aa8b"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00184-of-00512.json.gz": {"num_bytes": 30338616, "checksum": "49859e75d999f65de99f9236e649a81989360f0328ba684671057b0dd7cf5e79"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00185-of-00512.json.gz": {"num_bytes": 30088874, "checksum": "ff6d32fdd471d3076a9367c175baab84a5d699ccd6dcfe00c755f0b714ca6074"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00186-of-00512.json.gz": {"num_bytes": 30193681, "checksum": "82508ed104fc57de3062258eaea57854ab9e1934437a88dc0d8a9921f3641bbc"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00187-of-00512.json.gz": {"num_bytes": 30171163, "checksum": "409d6576b25ad27455c755e5484e3f51d5d9788962efabe1c32e06bb3febacab"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00188-of-00512.json.gz": {"num_bytes": 30060432, "checksum": "fae94de96fa2962ef51e2ea90a5f760a5cee5de249bfd9f56d7c7b4e5c20f6de"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00189-of-00512.json.gz": {"num_bytes": 30180741, "checksum": "25293d5cba09980086f380d9e9ab44543adbbdcd05ed08601248b3a2b16d118c"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00190-of-00512.json.gz": {"num_bytes": 30207152, "checksum": "ccfee160de15df5d88f0ff5a898a0c5b2d0ef4ebd6e6832715a9ef8a9904f88f"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00191-of-00512.json.gz": {"num_bytes": 30143987, "checksum": "4c579619e465d9d97451801147202826a3855e772ea6dc4e9968e43ce2b8c05d"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00192-of-00512.json.gz": {"num_bytes": 30072097, "checksum": "9c32ecb6d4ec9feb27c5b642879b464e68ca8804db161219503f624e7ca1166f"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00193-of-00512.json.gz": {"num_bytes": 30172886, "checksum": "8442ddc3843c72aa169ca67801ff865ff85e4183beb38faa664f4f1d1c22a5d8"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00194-of-00512.json.gz": {"num_bytes": 30037105, "checksum": "2942ecacb22cb9a2953c68f21ddf3368cd47ab1f2b2d8e1f5c76b1c849b28d91"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00195-of-00512.json.gz": {"num_bytes": 30014854, "checksum": "9e5c6815a5734403a7062bb27b2565d433a3520a401c836ac3f16e743a1dd949"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00196-of-00512.json.gz": {"num_bytes": 30020510, "checksum": "792712f0073c158b5f96f7a99d97970fca3819b69739d34d7d2b7f4b8b407b7f"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00197-of-00512.json.gz": {"num_bytes": 30072566, "checksum": "3ece37e2d0d0b26fbd839b5d3facdfd70844945a06867fb68b141f6b1378462b"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00198-of-00512.json.gz": {"num_bytes": 30036679, "checksum": "c3f37a9b89987dde4578b394b5c3916c2d4fd87e0902309b4c81af19b1d2d5ea"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00199-of-00512.json.gz": {"num_bytes": 30195178, "checksum": "ae01bb5515097a083afd498d8530e788d99671e7cf802c4402957d6252b2ec77"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00200-of-00512.json.gz": {"num_bytes": 30064374, "checksum": "2399d4869f3a8bb4a9adced5ec548a9a3fde1d4fbc4e3abd9a0a3b495fb9a8ef"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00201-of-00512.json.gz": {"num_bytes": 30136711, "checksum": "5c922040697bad8d7807d79f34f2b667eea63ceefba89b2d413fcd4d66497607"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00202-of-00512.json.gz": {"num_bytes": 29962983, "checksum": "e4df518d612a8614de73d5944a31d22ad06ec9ecd26fb52e500df71fe363c1be"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00203-of-00512.json.gz": {"num_bytes": 30178998, "checksum": "e84a98a176451fc82d940a64cdec821e320a648780edba6466b74a1966eca47e"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00204-of-00512.json.gz": {"num_bytes": 29988832, "checksum": "c6dc56388bc7c57cbdee8280895ab80da7b4d49c9a0101a685229c50cad2e2e1"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00205-of-00512.json.gz": {"num_bytes": 30229414, "checksum": "e7e5175b6a7372377ba3a0db439911e189db459787d48588183ac1a0198c5fa7"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00206-of-00512.json.gz": {"num_bytes": 29914929, "checksum": "eb263433133660ebe219cd5817dea3b546ef2fba0e15396b2768d7091117cdea"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00207-of-00512.json.gz": {"num_bytes": 29912800, "checksum": "7f8a5f62ba5912b64af5b02bd987b4d81727223ef8eff110022e89d01961366f"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00208-of-00512.json.gz": {"num_bytes": 29900590, "checksum": "bc2af142244601bb7a96859dfd9885196940e675ca217cfc7c73ac9c614ea938"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00209-of-00512.json.gz": {"num_bytes": 30242768, "checksum": "fa51a4337faecfc790ca925802f87f10761552e16578b880ced80497f62bba60"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00210-of-00512.json.gz": {"num_bytes": 30039857, "checksum": "3adf7482ec6a3ad106c8edca3645a94032c33f84fcd26bd9876f2b8a1f6b5722"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00211-of-00512.json.gz": {"num_bytes": 29846856, "checksum": "8e931aaa9c1f069c0eca0b4605277610df9d2d0c07a0dbe6191fb7081b0e642a"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00212-of-00512.json.gz": {"num_bytes": 30022172, "checksum": "21c8bba1c83544c27977b22b077fd77f8df9cd06bc4eb5e9e9a532c511498d36"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00213-of-00512.json.gz": {"num_bytes": 29877918, "checksum": "b64ebaa088df5c6230e69f207267a038705c38f4d327970e9117979e1c13d1ed"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00214-of-00512.json.gz": {"num_bytes": 29906552, "checksum": "55d833a2b78ad564e6532d1acd14511e8b48d703030e3bbc92d7c835c1ed38c7"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00215-of-00512.json.gz": {"num_bytes": 30075441, "checksum": "999c77c136d3df83601e33c823f389b133f33c4c0b03736ceace617b526cb293"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00216-of-00512.json.gz": {"num_bytes": 30507152, "checksum": "0b23d4e57eaa101c78bab46151add537668d2722bf0c50470c1b434ec3389ae1"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00217-of-00512.json.gz": {"num_bytes": 30044236, "checksum": "6abacfd53e231a38c714d436018cef9a58f53320026c2ebb27d6caf08f02d7ac"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00218-of-00512.json.gz": {"num_bytes": 30047926, "checksum": "01120ef69493d84c44d112a41c69a851edaf89232679366e812f240fd26a0e47"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00219-of-00512.json.gz": {"num_bytes": 30349211, "checksum": "c4fc219559f0f076f634fc6812d4b13c229908c1ae45c3b74c059fb3b8124f63"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00220-of-00512.json.gz": {"num_bytes": 30063445, "checksum": "11f712439d54ef062cfa1225328fc4faaef5f6c9c0b0d87a0a81d25a71350e28"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00221-of-00512.json.gz": {"num_bytes": 30115660, "checksum": "9a344857ef4f9d141b57df38e25f717153b773436d72c23e10289ffe67c315eb"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00222-of-00512.json.gz": {"num_bytes": 30134562, "checksum": "227cd1847a948e388b404b5cda9289f05510d4e22f0ae5ec4d5a87a8f7f98a45"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00223-of-00512.json.gz": {"num_bytes": 30120819, "checksum": "e0029aa6b612a98f76e37d82107fcb90f2b57ae8d52beea172b5153b76334f20"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00224-of-00512.json.gz": {"num_bytes": 30371365, "checksum": "1ce5242d163ca12dbb22655eb841bf80750b552353af4f84973285d823d0add5"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00225-of-00512.json.gz": {"num_bytes": 30319212, "checksum": "71cb82bb95107a7e0b7777a5fcaa0f76b465ba828ac47401babcf7289eeb2335"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00226-of-00512.json.gz": {"num_bytes": 30020940, "checksum": "b7b8d98ade41f52ece23e896bdc4c19ad034a92ba18adb5fac85c7271afbfa65"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00227-of-00512.json.gz": {"num_bytes": 30109958, "checksum": "b2ec382f44caf4e8e46fef2faf6bd2e4000420e6da2eb12a5d9f6e7efb4e1564"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00228-of-00512.json.gz": {"num_bytes": 29940895, "checksum": "ff86264683d0fdf9d689aa30e7889c4ceed21098b7c60a220db92d396614cb1d"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00229-of-00512.json.gz": {"num_bytes": 30080588, "checksum": "3a5502cedd61501055eb16adb6ef861c75880524c5468a69cd346bc03e98e219"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00230-of-00512.json.gz": {"num_bytes": 30376399, "checksum": "6d3a4171a1febe9149f6900e3cca5a38046ca9d59214b548a4ef9de7de754bbd"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00231-of-00512.json.gz": {"num_bytes": 30031670, "checksum": "a2c8d9bb3eb260d5d8a7dcafc4703540332e2896e5127372d380d7efbd567a3a"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00232-of-00512.json.gz": {"num_bytes": 30132612, "checksum": "c9dec917eff4d72c684d6f8373ca66839061e29d25f0aa5fd6fb7de5c30df469"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00233-of-00512.json.gz": {"num_bytes": 30178285, "checksum": "1eb83b8eb7e72b2b3e55420436bb17521b989d0627da46f8cc61fe9f420fd464"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00234-of-00512.json.gz": {"num_bytes": 29991258, "checksum": "5e14e2a9e8c0aba73feb9134c694e99baf57357bb524877322ff5181eedef1f2"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00235-of-00512.json.gz": {"num_bytes": 30045172, "checksum": "50a118a072498b5338802cceacb97a9aa9242252e8d76d305cf5f0d928fd4af6"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00236-of-00512.json.gz": {"num_bytes": 30403542, "checksum": "7d7605576975232579e422a1b72625ad6f9d714d27770725dc7b99ba258e1985"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00237-of-00512.json.gz": {"num_bytes": 30242989, "checksum": "22d152fa02c5a959e978ea4887dd873dfef7267af0a577b4d796ff0cb52d5c56"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00238-of-00512.json.gz": {"num_bytes": 30214634, "checksum": "6d0af6f396fa21867e899a7678c633e47bfe79bcbda29b8072c5d32ab20a9aa3"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00239-of-00512.json.gz": {"num_bytes": 30255546, "checksum": "d35a93632638b6283053b121f0f30d47ea20b2747d871c3dd0beb13f4ffbcad9"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00240-of-00512.json.gz": {"num_bytes": 30347604, "checksum": "fd052d532fcfe811d96f8433f79a684f68f76ec42bd959c76ae3b63aec0b2c3e"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00241-of-00512.json.gz": {"num_bytes": 30135691, "checksum": "12c80c41dc4d6313bce4a171999ecda93ffc59f2c70cca363bce214cd12dc9f7"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00242-of-00512.json.gz": {"num_bytes": 30229834, "checksum": "fca5b81914ac0c5fe0b0c1a554a1e62c64af5c98740df1f8ce8f48f2a62b6a48"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00243-of-00512.json.gz": {"num_bytes": 30053753, "checksum": "ba41c505579524e9d244354a70060c9a0131007e0b129f03e628bb7b7b512ca9"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00244-of-00512.json.gz": {"num_bytes": 30216889, "checksum": "54a391c1d2de7627e739f3cd94eeccd50a80d56a40606f7c5392f6098df456cf"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00245-of-00512.json.gz": {"num_bytes": 29887569, "checksum": "c3263ea7e16e0036961dad28fef57ce4f0495219e59b4e800af82b67b3c6c506"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00246-of-00512.json.gz": {"num_bytes": 29906815, "checksum": "a3dcc92aed81708434edee84397010eae4ffeaa38b39aaf3919256f72deee625"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00247-of-00512.json.gz": {"num_bytes": 30074896, "checksum": "019e983a95908651bfae83e37bda5200b3888b03ab235fc8db2d5b16742f028f"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00248-of-00512.json.gz": {"num_bytes": 30108081, "checksum": "6f68835ec02cf899f8f44a795b1e3117956ff5bb6c8946435d9861ae7a112df3"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00249-of-00512.json.gz": {"num_bytes": 29957882, "checksum": "9bed6b7f56d93fa3973d4f177dde0973fa0eb6fe17d8d85279d865531613f963"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00250-of-00512.json.gz": {"num_bytes": 29822284, "checksum": "1848bef8d11360df55a576c64147e519327b1178f77d3ec14ab9522b33b1c423"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00251-of-00512.json.gz": {"num_bytes": 29956462, "checksum": "425f69c361a8671cf571df577ac0cfafb4894de494360084b7cbe9cb8869bc3f"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00252-of-00512.json.gz": {"num_bytes": 29733712, "checksum": "7198e831e75eff1e116513f9cbe098c071f051c545b41d1943211a1d996a3c67"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00253-of-00512.json.gz": {"num_bytes": 30450662, "checksum": "0452804e723c919bd3c84217bb1dfc8764112fd70c5581f84520df7592f28ae9"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00254-of-00512.json.gz": {"num_bytes": 29944765, "checksum": "dbbff2253d70094537de481344e5706315271fdfce7ebaddc8d277ed05ddfe24"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00255-of-00512.json.gz": {"num_bytes": 30321363, "checksum": "79173dd85d535cee71afb52f7775bbf7289509bc555efe21a8700d36f7e5da25"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00256-of-00512.json.gz": {"num_bytes": 29982818, "checksum": "bacd191568e72da06c564fc7476225ce83440de6aea6c85ebe7f5279f1c15846"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00257-of-00512.json.gz": {"num_bytes": 30338592, "checksum": "998287203665559c27a66e889611ed716b7a389e403b2e857086f548b2c47b39"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00258-of-00512.json.gz": {"num_bytes": 29911193, "checksum": "ed9829f41a71cc187d0ddfeafc9cbde8e362b52914c988708a1a5ffbd3c152af"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00259-of-00512.json.gz": {"num_bytes": 30227794, "checksum": "2fe86814499a3379601a179acca1d440b3c79467827ce9ef9787e1ab311904e0"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00260-of-00512.json.gz": {"num_bytes": 30206902, "checksum": "c4efdad05d3f5e9f27884399ab0ec82081c26486e87f0ed5408a9eb80b223daf"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00261-of-00512.json.gz": {"num_bytes": 30035514, "checksum": "e47675a956a626a32b1870c61e6f98c3cfe9cc571901cf477abae982b4e63c96"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00262-of-00512.json.gz": {"num_bytes": 30406718, "checksum": "ae19c1389e26562322f745bafbd7839e7a95b3169743d48baa7ae7f2db2a0b5e"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00263-of-00512.json.gz": {"num_bytes": 30266531, "checksum": "289c9fee87f12ea22ad5329f80cb379e5e9c22c5cb6639077748958228c62bf7"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00264-of-00512.json.gz": {"num_bytes": 30100823, "checksum": "7c65dd5d90c6df49ca2dcbfdbf1b9fbb0789cb32043795942d88c5f2d7a99869"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00265-of-00512.json.gz": {"num_bytes": 29957109, "checksum": "e3a1b501b2cc3f5f2667ef179d7876db602daedefd0cd741c0898679b24984e6"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00266-of-00512.json.gz": {"num_bytes": 30196603, "checksum": "9337dd8240f168da5f6a8b57c5c169a2a400a9a160eccc8a6e44e7b32004ff19"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00267-of-00512.json.gz": {"num_bytes": 30304605, "checksum": "513eea4e78c399cc045e25f13bb5f77ddb6c9b606522bed8216945c529894e8a"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00268-of-00512.json.gz": {"num_bytes": 30312562, "checksum": "0503c5bf6848213c5fcb81a5c94307fc010d910a8989e104ad5fedca58c76f7e"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00269-of-00512.json.gz": {"num_bytes": 30045257, "checksum": "59bd3011d12d7d70b5fd64bc2dd2016b1a9ca6f0d210dbb3e6c202bbbf74ced5"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00270-of-00512.json.gz": {"num_bytes": 30027628, "checksum": "8d3ecf4c61acafc49b624d08b6aa31340643e030f6c2248f689e8a17d355359e"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00271-of-00512.json.gz": {"num_bytes": 30014730, "checksum": "b2e4820a0a7287786f802b3b40602c8ca77c7813b5f50db8a336b89b89bbdf37"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00272-of-00512.json.gz": {"num_bytes": 30145705, "checksum": "20c73e4a9056a5201621a4799b86c323c5136af43caa63a74298a5c3bee890a6"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00273-of-00512.json.gz": {"num_bytes": 30165945, "checksum": "8f07a91b6b40444635d869b94558fa68e3593626808bc6122d4e17403cf76101"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00274-of-00512.json.gz": {"num_bytes": 30097947, "checksum": "9530522c841d8f09ccb89f4f0238f7b9048c211e85b27449fb3c09d3bd2bab7b"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00275-of-00512.json.gz": {"num_bytes": 30296359, "checksum": "51a358db81805a20df4f920baacf3adea05209282f800fbedfc7fa49638a072e"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00276-of-00512.json.gz": {"num_bytes": 30311407, "checksum": "a51253cf73fb200053eb5fd5eca398a7a070fcaa27fc99b23389d09eef7fe5ba"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00277-of-00512.json.gz": {"num_bytes": 30372345, "checksum": "cc4f6d9040d8c4909d4ea5b661a7e54ba4775ff1c7c55db1ff686a56d428e2a5"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00278-of-00512.json.gz": {"num_bytes": 30379507, "checksum": "1052defa657524e1211e67d775a32243b164eda431c4c6ed351f0c6727f21b16"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00279-of-00512.json.gz": {"num_bytes": 30195406, "checksum": "6f4fdc92c516ad779fd521afba7d8d5bcd40672e63028f43f70fff4d7605f5ba"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00280-of-00512.json.gz": {"num_bytes": 29902057, "checksum": "c26f89efd0977465f45fe321036d88e2d6ca3ee1edc4bafe4b40ad1895cfc0e3"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00281-of-00512.json.gz": {"num_bytes": 29779702, "checksum": "094139d741b7a47faaaaf50093ab4edbef6ad1943985c6f453ce45a67a95b190"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00282-of-00512.json.gz": {"num_bytes": 30063500, "checksum": "280d69bfc795f1502a9e744d53d1a189051a1e771042721f8e6f74f6559e25a7"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00283-of-00512.json.gz": {"num_bytes": 29956350, "checksum": "505e49b7eeab46c77a324959eeff103f8899da1efc4d0fef5c0e6c6f8879a721"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00284-of-00512.json.gz": {"num_bytes": 30146285, "checksum": "9b075f2cfdb9a90fcdc7f779a52b0c5dad36385214844d4fd9df1e528ae78b6a"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00285-of-00512.json.gz": {"num_bytes": 30160056, "checksum": "d9b9f3cbb9ce2a0a0a1a2f7ce91e98621d48a7a900c278aeef437dc6c0a7cdf0"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00286-of-00512.json.gz": {"num_bytes": 29844025, "checksum": "6de9ff1013484662305e414725be2d0a4a1873a941250b95b80b5dea8919cf95"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00287-of-00512.json.gz": {"num_bytes": 30089218, "checksum": "444ff132c4a5330653b7319d34b2c7f4ae3b960d8b510cbd7389e3881f65ac5d"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00288-of-00512.json.gz": {"num_bytes": 30092170, "checksum": "46dc5b3b84e4387ad718fdf96b751354d7048e898ec664e0d3bdfc21ee841ec2"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00289-of-00512.json.gz": {"num_bytes": 30365397, "checksum": "b42e35746112198143ac18509e4f0148772db75e19f5eea9ed0d7e2849dbba48"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00290-of-00512.json.gz": {"num_bytes": 30275920, "checksum": "25d99877235c4b9dacd5d1dd7e9d16bba76cdf6cb1725fa617209142873dca0f"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00291-of-00512.json.gz": {"num_bytes": 30125784, "checksum": "51da68b6f2751a83e2534c342b6e9d69c419fb606b44c42b872d69f5f726df3c"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00292-of-00512.json.gz": {"num_bytes": 30201021, "checksum": "1e0a42b5e7ea7049c3c86b96d37c5d1c36f3ba2e2dab02145a897ef056fa6a87"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00293-of-00512.json.gz": {"num_bytes": 30124224, "checksum": "8c744f5c6eb92c0de70649cd773c0ad147bc7a1487b2ae7f1107bce9d19da601"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00294-of-00512.json.gz": {"num_bytes": 30074708, "checksum": "b3cfa4c4408c1a9f39b48e18a62e112ec3c132b226efe0850f9e58e2a517aa97"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00295-of-00512.json.gz": {"num_bytes": 29990007, "checksum": "012f63e147d22e34249e930975a2d8958a8d0b17350a9f6e368d702189b40d5b"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00296-of-00512.json.gz": {"num_bytes": 30093755, "checksum": "5573859cc485ae4535b83fd408dcc6a82f644832c93e6125db9a16dd6ded338f"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00297-of-00512.json.gz": {"num_bytes": 30078472, "checksum": "25e694485171ba1347ccbd7916c1b87a0d46acfd13795a8aabb1cb57b5eb1221"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00298-of-00512.json.gz": {"num_bytes": 30327122, "checksum": "6d6832cb3b1c86b6392bc9ca52f69a0bb16bf71c3c7664d9fe668ee259a40a30"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00299-of-00512.json.gz": {"num_bytes": 30214180, "checksum": "9f3c3d87a525874ea117e36e0b30d7f5cc6c64564506808058a0788d74943634"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00300-of-00512.json.gz": {"num_bytes": 29895171, "checksum": "e99d296965da2f731ea660889ce834cd1d21edf427298bab3a059ff3ebc64a2d"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00301-of-00512.json.gz": {"num_bytes": 30131063, "checksum": "e5eeb0f237cf986134c946bb3c2a4b5483fb9c88b3c2b16b9db26135043036d6"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00302-of-00512.json.gz": {"num_bytes": 30184609, "checksum": "4ac9bf5ca6fac7f7293238852424340326347ceaa6f5dfa6fddef8003421bebd"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00303-of-00512.json.gz": {"num_bytes": 29956412, "checksum": "559019fe1ef1f7e77ac53ad98b3556965ebc524ecb80bbc3f26255d5ae6e3609"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00304-of-00512.json.gz": {"num_bytes": 29974071, "checksum": "3c54edc4b6a7e34048cbbadb55cb3b16496a4e6e7334b4ede4e1368daf4c5301"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00305-of-00512.json.gz": {"num_bytes": 30338106, "checksum": "1c91c0c5bcc2bec0a698318ad6f576a06db7885c20ed7f36782427b80580a75a"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00306-of-00512.json.gz": {"num_bytes": 30178986, "checksum": "fff99f2758c2de57ccbfbfc6388f67e624d00d4a6cccb5820a7a8f5fcf02d386"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00307-of-00512.json.gz": {"num_bytes": 29493455, "checksum": "5d08c6e3909e21bed456ff9d06c983f14d3a277cb399a91047a692184f87c4c3"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00308-of-00512.json.gz": {"num_bytes": 30228844, "checksum": "04bffac195e24383d06b0ab9ebf019959a4e7abe8e8e6a0cdfbf0a8e7c23c899"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00309-of-00512.json.gz": {"num_bytes": 30351688, "checksum": "3ce14d5104d1318c6a16d042735f0a71f4452897de60d17408181ec5b135bbb2"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00310-of-00512.json.gz": {"num_bytes": 29993012, "checksum": "afad2f39bf4cb932e50d9a0be93940b423e7abcc3d67dac15b1939e4e40f4ce4"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00311-of-00512.json.gz": {"num_bytes": 30448951, "checksum": "a049c31ef6304084d33cb7bdd2e21ada0c60b40b1002b2369e60d36a5098c4b0"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00312-of-00512.json.gz": {"num_bytes": 30034189, "checksum": "557d1e88400a6d1d8ee4d717a959239edacbdd3e18d8cd20c5c85b77174dc302"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00313-of-00512.json.gz": {"num_bytes": 30066486, "checksum": "e4823ea1e9a59d5db84564a5b90c28fd8058450f238c60ad689ffd6b673d65f8"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00314-of-00512.json.gz": {"num_bytes": 30397706, "checksum": "1b4c0653e7ccf7fda0a53d8cbd5ddd57322ac83822e9d05bbdb9eb8ac979cf50"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00315-of-00512.json.gz": {"num_bytes": 30219107, "checksum": "9c364c9cab4ff7acdd1818b13de2f36713df8fa6c504ba15cdf47fe8e3c30206"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00316-of-00512.json.gz": {"num_bytes": 30098661, "checksum": "84dd8a8739b5abc39d8180f0894b1fbf2930d6d333d7c86b646f40763327397c"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00317-of-00512.json.gz": {"num_bytes": 30178992, "checksum": "16e4791b4e5ab3719dacf79fedb0b88ed54346372874c37ccb71d86bc419edc3"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00318-of-00512.json.gz": {"num_bytes": 30022982, "checksum": "98345a826aab12bdaf5e639205d5dcdc1da8fecd7cafc1982df89ac8d4df7ebf"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00319-of-00512.json.gz": {"num_bytes": 30360409, "checksum": "d53a39019a1627b42ae6bff68e283d37d0bb5f48b328c2c5cdcc1a3897f4e992"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00320-of-00512.json.gz": {"num_bytes": 30347267, "checksum": "c343a0eedf58484055e58762802ae8cc05f2cdb0b923785c493d056a2cbdb015"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00321-of-00512.json.gz": {"num_bytes": 29967877, "checksum": "cc5795d254ad749ccfe613034927bdf95529545ae1f277b694dd24a5996aca83"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00322-of-00512.json.gz": {"num_bytes": 29885538, "checksum": "d5eaaa1eea983bd37ed34651e6c16b746ff7c92e48038b234149fa6d04d3d866"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00323-of-00512.json.gz": {"num_bytes": 30308848, "checksum": "a42cfaef5e088fd6b24dfc121084a6cd038f5b0bfaecb9f33997ab22a97fb155"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00324-of-00512.json.gz": {"num_bytes": 30351634, "checksum": "0e2e6933f93466e9c8fe966f7770fe4c34caf182c713dad3206f4132eed1d41d"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00325-of-00512.json.gz": {"num_bytes": 30077168, "checksum": "77cdbf7040ce7f38d735fef41813ce63aaa16fcd87fce80e6ca6bd56d350c369"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00326-of-00512.json.gz": {"num_bytes": 30031750, "checksum": "8d994c2dc1b766e3270dce3f0b8f6f8fe22d5c1e0e9780e1bfed52c1292b8641"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00327-of-00512.json.gz": {"num_bytes": 29845765, "checksum": "f6279e351d016769d6fb5482d01a15ba054d5fe6f9f1c4e92c0663cef0083002"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00328-of-00512.json.gz": {"num_bytes": 30253188, "checksum": "2ea84aafd94d1843a2cc4428279dbb079c6ae0aae6c00f90ee4b5ace3c827afd"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00329-of-00512.json.gz": {"num_bytes": 30124922, "checksum": "49e3d91126d53eada7bbd87bfe9eaae74f059c69cd70a3a3b8101f49c1aca154"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00330-of-00512.json.gz": {"num_bytes": 30026414, "checksum": "07442fc4f7fb1732362293bc15a6754d70ecf4743392cf89c4497b3cd96269fd"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00331-of-00512.json.gz": {"num_bytes": 29961847, "checksum": "f437c6f5f758a5d32c8fc949037060259162864c29aeaabf37032e79f5a1cf0b"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00332-of-00512.json.gz": {"num_bytes": 30167166, "checksum": "96018497eb6dec020436c1333ff81980a64fb615997855fdd8cf35fe3f658db6"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00333-of-00512.json.gz": {"num_bytes": 30192963, "checksum": "1c12ea6b9031049dbc84e4da6b5fdedf480e989385d758c88322c415a1cabbb0"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00334-of-00512.json.gz": {"num_bytes": 29847008, "checksum": "c269285f15f626b4b15a7d1705ffa08e3f4d49ce13de8174b72f9f6276a1c6af"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00335-of-00512.json.gz": {"num_bytes": 30262244, "checksum": "179ee564e6fc644d9ee139bdb02d470a1172221b0f6e510ee5935683500f8257"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00336-of-00512.json.gz": {"num_bytes": 30262910, "checksum": "317933afdd8dc8a3a355e44ee3d84bbab12a2f30c98ea1172dde7074ed4c0557"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00337-of-00512.json.gz": {"num_bytes": 30155329, "checksum": "c5b850399252ec41b0fd9cb2da87ce25e5a44df9f44c6ed9d8c559a5729e5a0f"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00338-of-00512.json.gz": {"num_bytes": 29952961, "checksum": "48083123ba97a6212e0501799bd01936f0795bdd4d9c2710b9aa67d54b29037e"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00339-of-00512.json.gz": {"num_bytes": 30403399, "checksum": "313b60f985dcf591f34d351b758eedace655b6c6d3946dd2ddc55f34a9a97ae9"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00340-of-00512.json.gz": {"num_bytes": 29917484, "checksum": "2c72290f3bd51dea2a2877d68a968dc2b75dadf99ab3cc2230e41be45f3515d3"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00341-of-00512.json.gz": {"num_bytes": 29905522, "checksum": "1acd83a0da4a7a4912b589dbeb68b37396d0454371b2b71af4ae18b854d482ce"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00342-of-00512.json.gz": {"num_bytes": 30022369, "checksum": "8756be42335bba12d06de63e247659f8d603a092ff342360dfed645aec135c47"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00343-of-00512.json.gz": {"num_bytes": 30229313, "checksum": "863e29987a3ccfa08e14ae987c81367a53b9fe08795184db086117a9555e058b"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00344-of-00512.json.gz": {"num_bytes": 29924335, "checksum": "aa9003a7cc3527fb658fd807c78890587a8b35634a1f0838bc221a6374205d20"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00345-of-00512.json.gz": {"num_bytes": 30229482, "checksum": "a7e88b015bcf7761217e9b3ffd413f13cac48f6afe083353436de6cbd0d0018d"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00346-of-00512.json.gz": {"num_bytes": 30029147, "checksum": "b862ea62ac032c203c0038c061a44edabe4644be03b876ec7322e96762374940"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00347-of-00512.json.gz": {"num_bytes": 29808182, "checksum": "62915b86cbbf61a76f73d05509a8e839aae0b965134ef79022377625df7ef741"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00348-of-00512.json.gz": {"num_bytes": 30091116, "checksum": "6c384c2c6bc8340b88e085f8bbc2616be68c96fa7b8b88306b4500367d053a49"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00349-of-00512.json.gz": {"num_bytes": 29867618, "checksum": "bfb19508ecf8bd4d9a8847f0edab5acde6896182c27da706a6f2863bec43c152"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00350-of-00512.json.gz": {"num_bytes": 29723106, "checksum": "a645c62c94de9018175f15a0b38aa8bd2484601ee189b7c27d589288eb5af97e"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00351-of-00512.json.gz": {"num_bytes": 30047620, "checksum": "991061a23834e6bb3dc0595cf0e8328e07746d10fbf7a7ba397c1410cb66175a"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00352-of-00512.json.gz": {"num_bytes": 29808328, "checksum": "6c8e377a6cc82e81d66e2be3d23c1cdd42480015a68a1db458d542b7ff64ab7d"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00353-of-00512.json.gz": {"num_bytes": 30040117, "checksum": "ead6f32d98a91c47fb9c21334143f02181efb0b831705baeebb9820d069598fe"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00354-of-00512.json.gz": {"num_bytes": 29953984, "checksum": "ba349e503d017abbc1c83da2314c0a4892a9f3e5e480173812578f44d9b5904c"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00355-of-00512.json.gz": {"num_bytes": 30179912, "checksum": "2bfeab794bbe0432db52cc595d25864b17fdb0744a80d6d907f6f2ffc5c56b81"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00356-of-00512.json.gz": {"num_bytes": 30312163, "checksum": "d0dec696d28c601d3a1f75b0b6e6e711e00809f0d5ea915f63cb6d9b7adcc597"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00357-of-00512.json.gz": {"num_bytes": 29931515, "checksum": "d43c75371e32d0c1e65f43acc00aac3ca43762d4c6eb6bb61759ac5fca593a99"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00358-of-00512.json.gz": {"num_bytes": 29739788, "checksum": "96fef1b4a5d6a080ff5d4a10bc90911dcb2ddecb4be91d0c9620e6d2484e3ee3"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00359-of-00512.json.gz": {"num_bytes": 29913841, "checksum": "05b065d2d13b787ddee4707be7e2be46173c23794b9e8c773d0da743f435db17"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00360-of-00512.json.gz": {"num_bytes": 29805295, "checksum": "826104b9f4c2634d128f15564bd4990057dfbbb4066f2a082039d243bab56935"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00361-of-00512.json.gz": {"num_bytes": 29839676, "checksum": "ee5ba4cb14ecee0c857828a866615c6bfe45f67b158173dcac44146a02d97738"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00362-of-00512.json.gz": {"num_bytes": 30154783, "checksum": "d67b49e6fa5dc293fbd3057b7ca0beb7e0bd1ff692cdad7f2dfb7abadc1f4599"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00363-of-00512.json.gz": {"num_bytes": 30126118, "checksum": "6940704da6cde5822d48dc806280b8d57e0593ba299731e68ca9c2a4f7cf65bd"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00364-of-00512.json.gz": {"num_bytes": 30184894, "checksum": "e740b4a0240e691f16a423fd658aa3c7539986695418af3b5a171a48524db74f"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00365-of-00512.json.gz": {"num_bytes": 30386766, "checksum": "5a6a9461ef9ca579a849f6bef4d6225504a885aa797d3b2236ed8df6f5ea72ee"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00366-of-00512.json.gz": {"num_bytes": 30208411, "checksum": "8e0ce2447dfadaa4d41b991a2ce1be63b409e58e88944594dc8591bf9ab41403"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00367-of-00512.json.gz": {"num_bytes": 30266003, "checksum": "04ea00b46a583edea7740d74d719ef7f303b7f3873365b9ff4e94f08ef80832a"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00368-of-00512.json.gz": {"num_bytes": 29993752, "checksum": "38b1a55dd4ff1b504d2dbc0b2ad54fe43ab16c8bdba55bd97f4a55dafa8c83dd"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00369-of-00512.json.gz": {"num_bytes": 29833222, "checksum": "a25c405918920ed00edf5f3007cb8895b59fb67618dfea266b048273303b9592"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00370-of-00512.json.gz": {"num_bytes": 29988999, "checksum": "2812e6d9865d77ca8ac2d1499ba86be1ceed868a1da2bd13fbd0967058a3516c"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00371-of-00512.json.gz": {"num_bytes": 29866636, "checksum": "ecd1d3bdc41c3f41f8c9d3a63c75766c173f70ff117af748a08c221ca4273b18"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00372-of-00512.json.gz": {"num_bytes": 30296883, "checksum": "723d2c5ebbdd95ab84c53e458d81944b6907d08c7aec67300f012880624d0010"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00373-of-00512.json.gz": {"num_bytes": 30310322, "checksum": "ae45d088521f2faf9852cb169962176e84bbb81d5ba157d4228d348f7fcf60f4"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00374-of-00512.json.gz": {"num_bytes": 30340527, "checksum": "9b09c9e1b424fd05540b720c5a85f71eea43d743dc4ebb318e839125ccac9383"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00375-of-00512.json.gz": {"num_bytes": 30193692, "checksum": "c3ca4bb179cadf872f25f1cdb5c3667933bb8dfb7af21068a24b1b09c961dfa8"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00376-of-00512.json.gz": {"num_bytes": 30184130, "checksum": "5d801f4bc20c4c6d8821ccfff06cb5dfe4214e571734feacbea3325462afa280"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00377-of-00512.json.gz": {"num_bytes": 30259301, "checksum": "ebf08508c24e29a8a14b72248f090d765b02ee7a31296811d0391f2a2e73c046"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00378-of-00512.json.gz": {"num_bytes": 29650049, "checksum": "c13e994e68b938ca069d2d412e7891cbaf2ee205d65b1c17c6acfea01adce157"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00379-of-00512.json.gz": {"num_bytes": 30265211, "checksum": "667da6f0650dd684aa50bc691b5783968ae8cab847dea14fc8d8bfe203e351f4"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00380-of-00512.json.gz": {"num_bytes": 30429631, "checksum": "7cf0e9ae00bec72f571d152730107efdd944176818600517fb2d0412a859d366"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00381-of-00512.json.gz": {"num_bytes": 29889471, "checksum": "f781b3128e92c54365be7771695555378067a65fb922e04062ab6f3f092ec827"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00382-of-00512.json.gz": {"num_bytes": 30029894, "checksum": "2d133def2bc4b840312ebe5c466c9f22729b67aa4c2a41dda2e6a9a55ddcddbb"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00383-of-00512.json.gz": {"num_bytes": 30249255, "checksum": "e8610abf7e2bd70b1067a1b2dbf392ac32be156945502629228969974d3899b2"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00384-of-00512.json.gz": {"num_bytes": 30362665, "checksum": "f217071bd0c1b1bddb3342c85064d7ebb54bcde2512997636f0638a0b3641588"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00385-of-00512.json.gz": {"num_bytes": 30080234, "checksum": "2db4b15c7391b6e6d3791721ee574d09101df597110feebc59e4f0aff4df6c26"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00386-of-00512.json.gz": {"num_bytes": 29897704, "checksum": "035daed74487c5262b8cfbefdfaefd17f2834c7b4a1d293934d755e059b58f5b"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00387-of-00512.json.gz": {"num_bytes": 30072139, "checksum": "73013fbd06eaf94a7c8a0f0de420f83bed56655fb2d4e5d93972e8ca1847d130"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00388-of-00512.json.gz": {"num_bytes": 30123843, "checksum": "5db846c3d0b36774ce771ddfa8c53a915767926a2ad48222256d839326336f19"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00389-of-00512.json.gz": {"num_bytes": 30278955, "checksum": "9e4c590e67b2fbd357af955e39864ffe73dda201d76759935fda80b10b463500"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00390-of-00512.json.gz": {"num_bytes": 30013591, "checksum": "90974ba6eff489e0f4f52187b6241120740c782945e86525cb5d1e551a54e322"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00391-of-00512.json.gz": {"num_bytes": 29925212, "checksum": "10fcd62813434e2557b5861fd8604f534952561065bee9dc525b1cd3f5b2730f"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00392-of-00512.json.gz": {"num_bytes": 30016498, "checksum": "da88b36bd3f15551d8fad115a86f111cc5c3d9a3c6fa9497214aabec7bcd6aad"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00393-of-00512.json.gz": {"num_bytes": 30061083, "checksum": "1ed9881020f240e1277e6513bc2abf24ea48e9cb0046d7e87a6d3669c8b42a0f"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00394-of-00512.json.gz": {"num_bytes": 30043459, "checksum": "a35c3de1b0c982df8471705574e6eb7cc730fff122ff17d1381f2c7b9f20d6bd"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00395-of-00512.json.gz": {"num_bytes": 29921106, "checksum": "f4cf52f8d6a1288773cc366469df140f885b233fb6aa1cb75387a450d88ec94f"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00396-of-00512.json.gz": {"num_bytes": 30024980, "checksum": "5ebe04e54e4242d52aacb4c2e107dd10e609d5a7a6ff0425d9952bed98ef4921"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00397-of-00512.json.gz": {"num_bytes": 30096825, "checksum": "3ac381004d8257aa50fb28f0fd2171abbb93ad825c3f43422b9dbec6e1c6f31b"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00398-of-00512.json.gz": {"num_bytes": 30059739, "checksum": "40c38af325f4d01ae7c74aa9cd8f8d1c96c6af851175f80d3c50d85c5f5d3585"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00399-of-00512.json.gz": {"num_bytes": 30049826, "checksum": "2ba0109b2d5b88422250bcbd2494cc6e11528710f38fa6e83a1f699b840b68a7"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00400-of-00512.json.gz": {"num_bytes": 29953506, "checksum": "010610ba3af3dbfbcf2fac93136b7066fc58eb914dce9ae999722d0cfec4d331"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00401-of-00512.json.gz": {"num_bytes": 30271141, "checksum": "29587bb4be2c367f6479705b5c3c28716affeefc857ac1f77e4c33e55264def0"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00402-of-00512.json.gz": {"num_bytes": 29861236, "checksum": "8e399149c335ec599f881fada448c9b4be22326357153c74b0de627078f1d43c"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00403-of-00512.json.gz": {"num_bytes": 30175831, "checksum": "0d2800836914a1e2ef4a1aaea6e70d19699fc2555582ec670223177cac05a4fa"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00404-of-00512.json.gz": {"num_bytes": 30097682, "checksum": "f9665e9199978b123feb962ce347b30cc1520626c32dfef0ca3cd8895a45e445"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00405-of-00512.json.gz": {"num_bytes": 29810961, "checksum": "8ea29cf9f7774a16a4c2aaeff1b6353de2951073676a9c411f19b0a5fb755b07"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00406-of-00512.json.gz": {"num_bytes": 29963498, "checksum": "90b10c91f6e0006576ec9b426c424e50fc1726c25ae8eb91bf91bb9001ade2e8"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00407-of-00512.json.gz": {"num_bytes": 30089554, "checksum": "cfa905514e4f19c4eb82e438f5eb987731004476f026f4bebbeeafbe519ec85f"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00408-of-00512.json.gz": {"num_bytes": 30148002, "checksum": "dddada59e2ef306cdf83b7c9ce3c912792237852053a4ea683224438a242c5ff"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00409-of-00512.json.gz": {"num_bytes": 29989174, "checksum": "907667ac304b6cca7100a9606e915c003fee43f1640d5b01405beb16eac4c379"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00410-of-00512.json.gz": {"num_bytes": 30519580, "checksum": "acd5cd2ecc46927046c81c9bb3459dd72a98e346ebb59c13c0db08fbb60961a0"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00411-of-00512.json.gz": {"num_bytes": 30408107, "checksum": "6a9c2d42717f853cd4a76fc5275e95e2a584b7465c6059f586f6a06417048a42"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00412-of-00512.json.gz": {"num_bytes": 29699198, "checksum": "29e76bdab47496ed61a102edd3c61c20e60ab52abeb8e6068f7aa4ad1868f4fc"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00413-of-00512.json.gz": {"num_bytes": 30065457, "checksum": "b4a33941d0b994b82e3be351542cb4a832742e050ebbd71481e7ba34c8dcbc3b"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00414-of-00512.json.gz": {"num_bytes": 30342960, "checksum": "4ba7edb3c77a45f0e4cb7e969053db6f44ce8c0a8ef262582512814b1161d9ad"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00415-of-00512.json.gz": {"num_bytes": 30201576, "checksum": "25cb4eb4bdf3cd1b29289a23696be8bd41c5f577294e94607bea7b91252a04fd"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00416-of-00512.json.gz": {"num_bytes": 30021170, "checksum": "60472bd2a2896bfb57baabb583fc6cdd402a1d776f6a4c9bb58ed556e67cd76f"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00417-of-00512.json.gz": {"num_bytes": 30237505, "checksum": "aea8fd33c2acf1cef890549b1f88b18a2eeb37f6d4dd22b552f735811ad0b8a1"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00418-of-00512.json.gz": {"num_bytes": 29999334, "checksum": "93583d771ce7f0e1d044de2919a3ffdd48b7b7dab0cd3b6dc459200dd53d8762"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00419-of-00512.json.gz": {"num_bytes": 30194801, "checksum": "cd36e129487272742f3e60ab6512dd79b3d1ce3c22490d2e47c00c2ae595cfc6"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00420-of-00512.json.gz": {"num_bytes": 29903898, "checksum": "6f18a5ffc7efe5f555b02d3a31ed43714e09e73f7462206220d70450f47cd6f6"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00421-of-00512.json.gz": {"num_bytes": 30015573, "checksum": "cfacef2cffd953425eaf4d7b2b6cf5d2637bf5d58c6ed2bd0002442795c7d36c"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00422-of-00512.json.gz": {"num_bytes": 29966521, "checksum": "14f646b15948cf586ec1abd4bf4bf45bf180913e4d09049fa779bc7a196e455e"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00423-of-00512.json.gz": {"num_bytes": 29972805, "checksum": "ad7d4ab443c7a8122976570891a225a44ff86d2299d70706066633a6204eb0de"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00424-of-00512.json.gz": {"num_bytes": 30317886, "checksum": "37c8bf3b535ea4053aa2424c846e3449f9eb27d5ff999e1e93b6cee0aa975333"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00425-of-00512.json.gz": {"num_bytes": 30059310, "checksum": "674ca5eaf6a88f76881c8a1c48e1e0f93794785ee5ea17fb70f49228d7f39614"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00426-of-00512.json.gz": {"num_bytes": 30182498, "checksum": "988d08cd18162d9a309155d2e75cd4980f76ab4c73ef8286edae94ca4628ebcf"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00427-of-00512.json.gz": {"num_bytes": 30253874, "checksum": "aa8c08a684ea0bbfda9297aea07429172a2fa4a161268b964421796173275b35"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00428-of-00512.json.gz": {"num_bytes": 30055421, "checksum": "b1ed26e826bee7fcbc31cf1c368c9a63eeedbea1c2fd0fb07370b461a03d1a7f"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00429-of-00512.json.gz": {"num_bytes": 29830674, "checksum": "3efdc67ad7a108416dae47886e542da5c2ab1cd7e1aedd25c1c5d4e0607572f6"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00430-of-00512.json.gz": {"num_bytes": 29938000, "checksum": "3221ef5e4c28d44c1da4fa04689f318217991c07aff4fdee5e1091fe8e1162ac"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00431-of-00512.json.gz": {"num_bytes": 29829687, "checksum": "225f4e22df1b45a7dc9fef2f5a44da8f8ee25608cbe34195e21b49c8cd10f3ed"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00432-of-00512.json.gz": {"num_bytes": 30006209, "checksum": "9fc53637db7b16c8cf6f824adf21d4602efab715ad78eab62c4be7981a8bbc1d"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00433-of-00512.json.gz": {"num_bytes": 30656456, "checksum": "6bf7b701dc18f68d0facd7cdea49a26cdcfdd7829d5346eefe555485cfa7f336"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00434-of-00512.json.gz": {"num_bytes": 30138891, "checksum": "793532f72aa41c1dd7c549e9597fe8e73796c53eb5fe410a73de418ec446d686"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00435-of-00512.json.gz": {"num_bytes": 30430276, "checksum": "0d13d345ad12999fb4e7a9675e08bb1c90980fd193ed8530e4258e07bd6ea754"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00436-of-00512.json.gz": {"num_bytes": 30173309, "checksum": "fbce5fadb4b49bf833f77337929d873b2b25c3b564f7622f3672dde7a044e5d0"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00437-of-00512.json.gz": {"num_bytes": 30142240, "checksum": "76c34800a3223f5fe0f1960f3d3c9dd9ecdc2e652493d71ef245415b5027c902"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00438-of-00512.json.gz": {"num_bytes": 29979673, "checksum": "4784c3787d24b9d46ad7c835683c6506c2e55c84835391e2aca0355f032a1888"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00439-of-00512.json.gz": {"num_bytes": 30169105, "checksum": "5012d03e637769d7494bd3cef0a8dfc8b38c995e0d5780089c15d6b1495b3a8e"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00440-of-00512.json.gz": {"num_bytes": 30107004, "checksum": "529beaf4ad0251e35be574b1f623571526ec91a588ebd7df43e9d1cb99445f53"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00441-of-00512.json.gz": {"num_bytes": 30324563, "checksum": "f5e5fbf5e329f5bb0e83f758b8fc76516d65c3f91ad97e328187eaea83e4b667"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00442-of-00512.json.gz": {"num_bytes": 30335681, "checksum": "b8a26ed60f87a87347886b4467aa576ec5e8c106931589a1aa821b99fdabdb54"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00443-of-00512.json.gz": {"num_bytes": 30155655, "checksum": "e27bfb813fd6aba96ada81b095a559f0b7847cd25f7f8973663b19cdc5b8985a"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00444-of-00512.json.gz": {"num_bytes": 30340540, "checksum": "705dec13ba2824d45e801bc2cf3e709d6492b1ff6de2f9ddefb5a57dbdada4ca"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00445-of-00512.json.gz": {"num_bytes": 30248960, "checksum": "09a6b83910369cf269c4f095607fb2f0ac0ec7e25b501f577fe13920a8573ee0"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00446-of-00512.json.gz": {"num_bytes": 30316703, "checksum": "8f88b794c08bb492f50073337a30aafac0d05819505b507ab283dba0cf17d125"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00447-of-00512.json.gz": {"num_bytes": 30184407, "checksum": "38c819df823197bea6d647c3f78bcc15024aabba814cae322c1663c45fa8382e"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00448-of-00512.json.gz": {"num_bytes": 30238484, "checksum": "8c0abfb8dca37a179b01dadd2227206cbe6e5b916d0111c0b00d2edc3951c7f6"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00449-of-00512.json.gz": {"num_bytes": 30143151, "checksum": "9731e9644e5615d5d5ebdbacc6efa6382df856c8763b7485c9a5838864c1332f"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00450-of-00512.json.gz": {"num_bytes": 30122606, "checksum": "3b746f616f21c91277cde8e6d0d7f792ead7874de7ecdf11830a4a56db3dc799"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00451-of-00512.json.gz": {"num_bytes": 30128179, "checksum": "d6cadfc64ee39c9beb93f0bf8c169ca9d9053e0f76e1c9697841438e20dddef3"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00452-of-00512.json.gz": {"num_bytes": 29979326, "checksum": "42de19ffc3ec821fbf5ff686d1b36d189ad9ee5c4553a2ff0d003ee1a754c9c8"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00453-of-00512.json.gz": {"num_bytes": 30118272, "checksum": "22f9b2d3a9f089f1015f74d1ca0aca8f2a4970595326d964817177cbe6859271"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00454-of-00512.json.gz": {"num_bytes": 30018294, "checksum": "17c16895edccbb8b40fcc52cbafc0c15957020eb530e071dcce34544d5958bd1"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00455-of-00512.json.gz": {"num_bytes": 30155903, "checksum": "8b9d49837b309c3389d03dd3bbae92395bf7086134fbc69d28d9fff60a90d4a3"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00456-of-00512.json.gz": {"num_bytes": 30282104, "checksum": "ab63fd2efb0cc883d303241b3488a8135a196db7edc844458cfc1483898ceb3b"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00457-of-00512.json.gz": {"num_bytes": 29920723, "checksum": "dbde2eeef90144b209ef5afa6d5165ad638ae57d919926a379a10fccf6850a61"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00458-of-00512.json.gz": {"num_bytes": 30163167, "checksum": "800307106f5861e0bc246bcaae214e6dadeee849905cac184ecfe6d0b560fa68"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00459-of-00512.json.gz": {"num_bytes": 30248893, "checksum": "3e78d327a9463929f33311e18116f5d1d2ae4926f7a600378875ba854cf5ee47"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00460-of-00512.json.gz": {"num_bytes": 29840067, "checksum": "047568a5dad00b04ca1ea4aa262c7a4af9b61e87bc4ea02ffd5c6c8c049bf8a5"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00461-of-00512.json.gz": {"num_bytes": 30179062, "checksum": "ed8abe7b465bc19150b831632cb7afa298d6cb4beb9b6043a35a0f8afb5f730d"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00462-of-00512.json.gz": {"num_bytes": 30266398, "checksum": "d7b74f5c1c1f7bb489700adcfb7e48400c4fcca7669e2d56396d9fabb5a63b91"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00463-of-00512.json.gz": {"num_bytes": 30158800, "checksum": "224815aee29f6d04ddbc7457c84338eef9b127a767e7b50ed77283ff166d4f93"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00464-of-00512.json.gz": {"num_bytes": 30393915, "checksum": "0dd019fd2c19936ce2e6410b65872f630131c5da7543c8e66fa87547fd1a2209"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00465-of-00512.json.gz": {"num_bytes": 30148939, "checksum": "6d74dc9d74d28c2b8ba8d43ba3d594af0cb176cfa7bf738f3933be2a9c37bb85"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00466-of-00512.json.gz": {"num_bytes": 30268228, "checksum": "0e201327066f28c19b082fe35e4fb3bd76c8fd2d32236d1d6e2309489152aa66"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00467-of-00512.json.gz": {"num_bytes": 30121937, "checksum": "7352e5a9ee66dcbeed2c9e1fbe6c9355f0e5dd1b30b592a9fd5690958945e5a9"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00468-of-00512.json.gz": {"num_bytes": 30004669, "checksum": "53876848336ac57c082c9d5735bc1717f69ef38688b221d5e5ab9cd9cb4ec620"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00469-of-00512.json.gz": {"num_bytes": 30049860, "checksum": "a5a720b38f106dd5d2a2b7647748b52b4531ac12294e3b0d8dbc92062639c0c3"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00470-of-00512.json.gz": {"num_bytes": 29961380, "checksum": "9611764fc4f84b92e86fa6f9ea41464f6c26b07d1c51241b627a3d155e99d163"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00471-of-00512.json.gz": {"num_bytes": 30449164, "checksum": "db508df549d518c3e8b99b2f0098ea93fead1e632f53d8ae2cebff1d3476577c"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00472-of-00512.json.gz": {"num_bytes": 30312620, "checksum": "1993b5e292c6c60a3373aabe896f1a57afaad73fdce0ec60e30696368f7c0afa"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00473-of-00512.json.gz": {"num_bytes": 30406764, "checksum": "913045c61fb5a145379d9fe08c91ea63092b197400c0c87bfa65af91720b563c"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00474-of-00512.json.gz": {"num_bytes": 30078563, "checksum": "c495119e150b083d709ca915abd760683793361ebf3e079b04efc9b7e1900379"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00475-of-00512.json.gz": {"num_bytes": 29860761, "checksum": "50bb5f40d2e91ab136aa63063fff860529c8961f2a38500a645b10339751589e"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00476-of-00512.json.gz": {"num_bytes": 30199778, "checksum": "c969cfbb7ed7716f665b336b2ed9f7b10b532c7adc6d8a347964831a39cfef0e"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00477-of-00512.json.gz": {"num_bytes": 30130742, "checksum": "54c8b89102cf882eda5208544a6c5d317c1defa8d997f9450ebd576e58f91830"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00478-of-00512.json.gz": {"num_bytes": 29901444, "checksum": "f669299d794ecc0523c64ad31af8fcce5cf3f880e87fd73f4c3f434425e9b238"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00479-of-00512.json.gz": {"num_bytes": 30587214, "checksum": "25d0fbd9027deaf140650f0b82a2316c37939f199fe7633b9f643684404f2029"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00480-of-00512.json.gz": {"num_bytes": 30145237, "checksum": "68a29728290e1199ce8d1ac060365bc443ea67c24292b2b04f1b4ca44ca7238d"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00481-of-00512.json.gz": {"num_bytes": 30204159, "checksum": "1605034b89e33f6794c901adac1eb200bb489f76b9bae6bc56b01e9f6ab4c254"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00482-of-00512.json.gz": {"num_bytes": 30430794, "checksum": "2dce9df095e89ea6645fb599f518612511a62b6c475808ad004c32968b19bae8"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00483-of-00512.json.gz": {"num_bytes": 30102412, "checksum": "c7c626977521b0d1f5bcc02c484b3eb4f517ba71006a4802df08a0f4cfb8ea9e"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00484-of-00512.json.gz": {"num_bytes": 30171871, "checksum": "519ed997f1f1f1de7864b0bddf202b25e25bed349f63593a88337262d7705968"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00485-of-00512.json.gz": {"num_bytes": 30049539, "checksum": "8d2314fd3239ba3dfa99962c1d0a38e05edf9194e1faebae88f6b19ecab8fbf7"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00486-of-00512.json.gz": {"num_bytes": 29949995, "checksum": "a7521e09cbe77098c23172427bfb931dd50f0c9d58b034fd1621687849a8d379"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00487-of-00512.json.gz": {"num_bytes": 30345072, "checksum": "ebc6254a4d241afb886b8df20819301121fcb234a32a1dd4ee8ae49571081f92"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00488-of-00512.json.gz": {"num_bytes": 30300622, "checksum": "509bba28ddf770d38554a2e846f2ce0d2af59e3662a6d6ec4dddb75fb509f8d5"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00489-of-00512.json.gz": {"num_bytes": 29949909, "checksum": "996e61f8e674b0a016a568630ee13a7473f99a919437c225a4198d232861e628"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00490-of-00512.json.gz": {"num_bytes": 29995429, "checksum": "9730024ad352eb12f74ac446ed32b9c57898658954be5dd639184fc5264527cb"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00491-of-00512.json.gz": {"num_bytes": 30293919, "checksum": "65b2a7de3284e892441b0fe8e850d89de842355d78fa9944358b1ee5912a948f"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00492-of-00512.json.gz": {"num_bytes": 30115831, "checksum": "26b535c3175bb86ef721593f81d9cf006d4c3749f156c63ccd2a2c04e1201236"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00493-of-00512.json.gz": {"num_bytes": 30187809, "checksum": "a0918223c5523da20bd8230de1985b0a3cbb1e239af3d62a83d720a3a528c567"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00494-of-00512.json.gz": {"num_bytes": 30149878, "checksum": "6e9a5e329f834e41b4a8a9a6809df3243e5bffc580327912288ad7f790b43ab7"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00495-of-00512.json.gz": {"num_bytes": 29711944, "checksum": "3b9ba9d667e1241692ff9a654a68e98e8e94e32244a9419b2542137b63fb4705"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00496-of-00512.json.gz": {"num_bytes": 30114815, "checksum": "24b78cc36bb0abc67c998320e7029b6e7bbbee267a367eb538f23956c13f27a9"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00497-of-00512.json.gz": {"num_bytes": 30048480, "checksum": "29c3606acf298498fc3498bd769544e2879afbd0d5c46cee298cb25058694aac"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00498-of-00512.json.gz": {"num_bytes": 29934973, "checksum": "8afaffea92dfad745be8aa8cd3de0ee97cbcc26fbad6c71d56683aef6a27055f"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00499-of-00512.json.gz": {"num_bytes": 29796509, "checksum": "9cbbd8f6d8fe92207c4cb2f0422284726deca1bde7f30cb01cce7fcd4665b380"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00500-of-00512.json.gz": {"num_bytes": 30221736, "checksum": "902904aa9fadaecbe698402a27b4e68b00813e67b79f84d4c696cd9c72f08f55"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00501-of-00512.json.gz": {"num_bytes": 30108320, "checksum": "76e848f8dbc082158fc5d3a2f7c10cd6e03585667c00efc639f2c6f47d44aeb2"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00502-of-00512.json.gz": {"num_bytes": 30381907, "checksum": "885bbc9788235abf33728737f72f267e60d1f5d4a77493cae76f161651d89579"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00503-of-00512.json.gz": {"num_bytes": 29983805, "checksum": "5134934392b13e3f84dd32dcb1c59f4d5416d6dfd925bf896f3eb61881d82136"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00504-of-00512.json.gz": {"num_bytes": 30041413, "checksum": "4978245a7f545d676bad6edfdfe60ffdad94de47af0fb10649fa39e9b068939e"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00505-of-00512.json.gz": {"num_bytes": 30021620, "checksum": "64933c28ea3f608326f1c6ef56170886767f1ab4f9ecbc4bf3263c7043901fce"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00506-of-00512.json.gz": {"num_bytes": 30260343, "checksum": "84667dbe68ecf1f9bbdaba0e73eca6fe0444f6594a1e9a4b46e9812ae7bce7d0"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00507-of-00512.json.gz": {"num_bytes": 30173739, "checksum": "dd6d44e4f344f3ab1cd61bacced7b5f1429cf6823fc9282452a539012bda028a"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00508-of-00512.json.gz": {"num_bytes": 29903443, "checksum": "4afc46096ac2697867c3a75896c5ceb36617c4c21a749dded58a1ea4565e41df"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00509-of-00512.json.gz": {"num_bytes": 29862664, "checksum": "74a720dc16b389e8122d61aa94bc12a5bc4253ca6f39679781c938e2eb556878"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00510-of-00512.json.gz": {"num_bytes": 29744368, "checksum": "6a302049e7a1668c5fb2e4b5afca518fa53ba1a9dc717015ecb5768e85ec4139"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-train.00511-of-00512.json.gz": {"num_bytes": 29896714, "checksum": "48b89e909c0e33fd59c9623f8517cdfa90fa35a4641f999c6f68e1cc9f2a309f"}, "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/realnewslike/c4-validation.00000-of-00001.json.gz": {"num_bytes": 15284943, "checksum": "42ac859dc1c4d48d165ec602909403e2066ce1d4854149ed70b9ec9cc96dc65f"}}, "download_size": 15435025687, "post_processing_size": null, "dataset_size": 76369191765, "size_in_bytes": 91804217452}} \ No newline at end of file From e8fe47b29f242030de12ab4ac5b0a57daa584aa5 Mon Sep 17 00:00:00 2001 From: Quentin Lhoest Date: Thu, 1 Jul 2021 17:06:13 +0200 Subject: [PATCH 15/19] style --- datasets/c4/c4.py | 4 +--- 1 file changed, 1 insertion(+), 3 deletions(-) diff --git a/datasets/c4/c4.py b/datasets/c4/c4.py index b60abe87f13..993c9233f90 100644 --- a/datasets/c4/c4.py +++ b/datasets/c4/c4.py @@ -40,9 +40,7 @@ "en.noclean": {"train": 7168, "validation": 64}, } -_DATA_URL = ( - "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/{name}/c4-{split}.{index:05d}-of-{n_shards:05d}.json.gz" -) +_DATA_URL = "https://huggingface.co/datasets/allenai/c4/resolve/1ddc917116b730e1859edef32896ec5c16be51d0/{name}/c4-{split}.{index:05d}-of-{n_shards:05d}.json.gz" class C4(datasets.GeneratorBasedBuilder): From 49f46ac84b1eed46dc906094231f801f06b35f08 Mon Sep 17 00:00:00 2001 From: Quentin Lhoest Date: Thu, 1 Jul 2021 18:12:56 +0200 Subject: [PATCH 16/19] revert unused shard filtering in tests --- tests/test_dataset_common.py | 34 ++++++---------------------------- 1 file changed, 6 insertions(+), 28 deletions(-) diff --git a/tests/test_dataset_common.py b/tests/test_dataset_common.py index 359ea706651..5c12a40467f 100644 --- a/tests/test_dataset_common.py +++ b/tests/test_dataset_common.py @@ -76,27 +76,6 @@ def wrapper(self, dataset_name): return test_case -@contextmanager -def prepare_only_one_shard(dataset_builder: DatasetBuilder): - old_split_generators = dataset_builder._split_generators - try: - - def one_shard_split_generators(*args, **kwargs): - split_generators = old_split_generators(*args, **kwargs) - # if there are many shards, only keep the first one - for split_generator in split_generators: - split_generator.gen_kwargs = { - k: v[:1] if v and isinstance(v, list) and isinstance(v[0], str) and "000-of-" in v[0] else v - for k, v in split_generator.gen_kwargs.items() - } - return split_generators - - dataset_builder._split_generators = one_shard_split_generators - yield - finally: - dataset_builder._split_generators = old_split_generators - - def get_packaged_dataset_dummy_data_files(dataset_name, path_to_dummy_data): extensions = {"text": "txt", "json": "json", "pandas": "pkl", "csv": "csv", "parquet": "parquet"} return { @@ -179,13 +158,12 @@ def check_if_url_is_valid(url): dataset_builder.info.dataset_size = one_mega_byte # generate examples from dummy data - with prepare_only_one_shard(dataset_builder): - dataset_builder.download_and_prepare( - dl_manager=mock_dl_manager, - download_mode=GenerateMode.FORCE_REDOWNLOAD, - ignore_verifications=True, - try_from_hf_gcs=False, - ) + dataset_builder.download_and_prepare( + dl_manager=mock_dl_manager, + download_mode=GenerateMode.FORCE_REDOWNLOAD, + ignore_verifications=True, + try_from_hf_gcs=False, + ) # get dataset dataset = dataset_builder.as_dataset(ignore_verifications=True) From ab2aeaae23543bf8c1dac1319fb2800d89669bcb Mon Sep 17 00:00:00 2001 From: Quentin Lhoest Date: Thu, 1 Jul 2021 18:27:11 +0200 Subject: [PATCH 17/19] quality --- tests/test_dataset_common.py | 1 - 1 file changed, 1 deletion(-) diff --git a/tests/test_dataset_common.py b/tests/test_dataset_common.py index 5c12a40467f..49d30c49a49 100644 --- a/tests/test_dataset_common.py +++ b/tests/test_dataset_common.py @@ -17,7 +17,6 @@ import os import tempfile import warnings -from contextlib import contextmanager from functools import wraps from multiprocessing import Pool from typing import List, Optional From c7c291f0928804781fdf095e14a7f6947711ed53 Mon Sep 17 00:00:00 2001 From: Quentin Lhoest <42851186+lhoestq@users.noreply.github.com> Date: Fri, 2 Jul 2021 10:49:50 +0200 Subject: [PATCH 18/19] Update datasets/c4/README.md Co-authored-by: Dirk Groeneveld --- datasets/c4/README.md | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/datasets/c4/README.md b/datasets/c4/README.md index 35621129014..06b3d017efc 100644 --- a/datasets/c4/README.md +++ b/datasets/c4/README.md @@ -116,7 +116,7 @@ The data have several fields: | name | train |validation| |----------------|--------:|---------:| | en |364868892| 364608| -| en.noclocklist |393391519| 393226| +| en.noblocklist |393391519| 393226| | en.noclean | ?| ?| | realnewslike | 13799838| 13863| From 330cea5a991e7d62ce49c066fb6fd8edb9e942b3 Mon Sep 17 00:00:00 2001 From: Quentin Lhoest Date: Fri, 2 Jul 2021 11:15:11 +0200 Subject: [PATCH 19/19] data collection section --- datasets/c4/README.md | 4 +++- 1 file changed, 3 insertions(+), 1 deletion(-) diff --git a/datasets/c4/README.md b/datasets/c4/README.md index 06b3d017efc..cebc50292f2 100644 --- a/datasets/c4/README.md +++ b/datasets/c4/README.md @@ -130,7 +130,9 @@ The data have several fields: #### Initial Data Collection and Normalization -[More Information Needed] +C4 dataset is a collection of about 750GB of English-language text sourced from the public Common Crawl web scrape. It includes heuristics to extract only natural language (as opposed to boilerplate and other gibberish) in addition to extensive deduplication. You can find the code that has been used to build this dataset in [c4.py](https://github.com/tensorflow/datasets/blob/5952d3d60d60e1727786fa7a9a23d24bb463d4d6/tensorflow_datasets/text/c4.py) by Tensorflow Datasets. + +The dataset was explicitly designed to be English only: any page that was not given a probability of at least 99% of being English by [langdetect](https://github.com/Mimino666/langdetect) was discarded. #### Who are the source language producers?