From fdd8b26187c62acdbd6a1dc45e3d5a959a57c087 Mon Sep 17 00:00:00 2001 From: Trey Saddler <146968939+saddlerto@users.noreply.github.com> Date: Sun, 12 May 2024 14:47:25 -0400 Subject: [PATCH] Add content content/Data/wikitext.md --- content/Data/wikitext.md | 5 +++++ 1 file changed, 5 insertions(+) create mode 100644 content/Data/wikitext.md diff --git a/content/Data/wikitext.md b/content/Data/wikitext.md new file mode 100644 index 0000000..4438303 --- /dev/null +++ b/content/Data/wikitext.md @@ -0,0 +1,5 @@ +--- +{"publish":true,"path":"Data/wikitext.md","permalink":"/data/wikitext/"} +--- + +The WikiText language modeling dataset is a collection of over 100 million tokens extracted from the set of verified Good and Featured articles on Wikipedia. The dataset is available under the Creative Commons Attribution-ShareAlike License. \ No newline at end of file