gpt2-medium / tokenizer_config.json
kimsan0622's picture
Upload tokenizer
a4c3e1b
raw
history blame
261 Bytes
{
"clean_up_tokenization_spaces": true,
"model_max_length": 1000000000000000019884624838656,
"special_tokens": [
"<s>",
"</s>",
"<unk>",
"<sep>",
"<pad>",
"<cls>",
"<mask>"
],
"tokenizer_class": "PreTrainedTokenizerFast"
}