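Update datasets/wikicorpus/wikicorpus.py: yield string example keys (f"{file_idx}_{row_idx}") instead of (file_idx, row_idx) tuples in _generate_examples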

Co-authored-by: Albert Villanova del Moral <8515462+albertvillanova@users.noreply.github.com>
huggingface · Sep 6, 2021 · c1b2857 · c1b2857 · github-actions · Sep 6, 2021
1 parent 382af94
commit c1b2857
Showing 1 changed file with 1 addition and 1 deletion.
diff --git a/datasets/wikicorpus/wikicorpus.py b/datasets/wikicorpus/wikicorpus.py
@@ -159,7 +159,7 @@ def _generate_examples(self, dirpath):
                             pass
                         elif row.startswith("ENDOFARTICLE") or row.startswith("\n"):
                             if len(words) > 1:  # some content besides only (. . Fp 0)
-                                yield (file_idx, row_idx), {
+                                yield f"{file_idx}_{row_idx}", {
                                     "id": example["id"],
                                     "title": example["title"],
                                     "sentence": words,