{ "add_prefix_space": false, "added_tokens_decoder": { "0": { "content": "<|endoftext|>", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "1": { "content": "<|im_start|>", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "2": { "content": "<|im_end|>", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "3": { "content": "<repo_name>", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "4": { "content": "<reponame>", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "5": { "content": "<file_sep>", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "6": { "content": "<filename>", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "7": { "content": "<gh_stars>", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "8": { "content": "<issue_start>", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "9": { "content": "<issue_comment>", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "10": { "content": "<issue_closed>", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "11": { "content": "<jupyter_start>", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "12": { "content": "<jupyter_text>", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "13": { "content": "<jupyter_code>", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "14": { "content": "<jupyter_output>", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "15": { "content": "<jupyter_script>", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "16": { 
"content": "<empty_output>", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "20": { "content": "$", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "24": { "content": "(", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "25": { "content": ")", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "28": { "content": ",", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "30": { "content": ".", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "42": { "content": ":", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "423": { "content": "--", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "1969": { "content": "``", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "2113": { "content": "IN", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "3816": { "content": "''", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "5137": { "content": "CC", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "6998": { "content": "CD", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "9324": { "content": "EX", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "9815": { "content": "MD", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "10179": { "content": "TO", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "12041": { "content": "LS", "lstrip": false, "normalized": 
false, "rstrip": false, "single_word": false, "special": true }, "17679": { "content": "DT", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "19668": { "content": "NN", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "22259": { "content": "POS", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "29482": { "content": "RP", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "35991": { "content": "FW", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "45780": { "content": "RB", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "47306": { "content": "WP", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "49152": { "content": "PRP$", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "49153": { "content": "VBG", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "49154": { "content": "VB", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "49155": { "content": "VBP", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "49156": { "content": "VBN", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "49157": { "content": "JJ", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "49158": { "content": "VBZ", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "49159": { "content": "RBR", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "49160": { "content": "VBD", "lstrip": false, "normalized": false, 
"rstrip": false, "single_word": false, "special": true }, "49161": { "content": "NNS", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "49162": { "content": "NNP", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "49163": { "content": "WRB", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "49164": { "content": "PDT", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "49165": { "content": "RBS", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "49166": { "content": "PRP", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "49167": { "content": "WP$", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "49168": { "content": "NNPS", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "49169": { "content": "JJS", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "49170": { "content": "JJR", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "49171": { "content": "SYM", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "49172": { "content": "UH", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "49173": { "content": "WDT", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true } }, "additional_special_tokens": [ "PRP$", "VBG", "FW", "VB", "POS", "''", "VBP", "VBN", "JJ", "WP", "VBZ", "DT", "RP", "$", "NN", ")", "(", "RBR", "VBD", ",", ".", "TO", "LS", "RB", ":", "NNS", "NNP", "``", "WRB", "CC", "PDT", "RBS", "PRP", "CD", "EX", "IN", "WP$", "MD", "NNPS", "--", "JJS", "JJR", "SYM", "UH", 
"WDT" ], "bos_token": "<|endoftext|>", "clean_up_tokenization_spaces": false, "eos_token": "<|endoftext|>", "max_length": 128, "model_max_length": 1000000000000000019884624838656, "pad_token": "<|endoftext|>", "padding": true, "tokenizer_class": "GPT2Tokenizer", "truncation": true, "unk_token": "<|endoftext|>", "vocab_size": 49152 }