{
  "dataset": "translated-babylm-telugu",
  "input_dir": "../../gpt-2/telugu/data/translated-babylm-telugu/train",
  "vocab_size": 16384,
  "files": [
    "../../gpt-2/telugu/data/translated-babylm-telugu/train/bnc_spoken.train.te.txt",
    "../../gpt-2/telugu/data/translated-babylm-telugu/train/childes.train.te.txt",
    "../../gpt-2/telugu/data/translated-babylm-telugu/train/gutenberg.train.te.txt",
    "../../gpt-2/telugu/data/translated-babylm-telugu/train/open_subtitles.train.te.txt",
    "../../gpt-2/telugu/data/translated-babylm-telugu/train/simple_wiki.train.te.txt",
    "../../gpt-2/telugu/data/translated-babylm-telugu/train/switchboard.train.te.txt"
  ],
  "special_tokens": [
    "",
    "",
    "",
    "",
    "",
    "",
    "",
    "",
    "",
    "",
    "",
    "",
    "",
    "",
    "",
    ""
  ]
}