Type: Dataset
Tags:
Bibtex:
Tags:
Bibtex:
@article{, title= {OpenWebText (Gokaslan's distribution, 2019), GPT-2 Tokenized}, journal= {}, author= {eukaryote31 and Joshua Peterson and Aaron Gokaslan and Vanya Cohen}, year= {}, url= {}, abstract= {Code by eukaryote31 and Joshua Peterson: https://github.com/jcpeterson/openwebtext and https://github.com/eukaryote31/openwebtext. Scraped by Aaron Gokaslan and Vanya Cohen: https://skylion007.github.io/OpenWebTextCorpus/. Tokenized by eukaryote31.}, keywords= {}, terms= {}, license= {}, superseded= {} }