kimsan0622
committed on
Commit
•
e2c2c42
1
Parent(s):
6eedadc
Upload tokenizer
Browse files
- tokenizer_config.json +3 -2
tokenizer_config.json
CHANGED
@@ -33,7 +33,8 @@
|
|
33 |
"rstrip": false,
|
34 |
"single_word": false
|
35 |
},
|
36 |
-
"
|
|
|
37 |
"pad_token": {
|
38 |
"__type": "AddedToken",
|
39 |
"content": "<pad>",
|
@@ -50,7 +51,7 @@
|
|
50 |
"rstrip": false,
|
51 |
"single_word": false
|
52 |
},
|
53 |
-
"special_tokens_map_file": "
|
54 |
"tokenizer_class": "RobertaTokenizer",
|
55 |
"trim_offsets": true,
|
56 |
"unk_token": {
|
|
|
33 |
"rstrip": false,
|
34 |
"single_word": false
|
35 |
},
|
36 |
+
"model_max_length": 512,
|
37 |
+
"name_or_path": "out_roberta_base/ckpt_hf",
|
38 |
"pad_token": {
|
39 |
"__type": "AddedToken",
|
40 |
"content": "<pad>",
|
|
|
51 |
"rstrip": false,
|
52 |
"single_word": false
|
53 |
},
|
54 |
+
"special_tokens_map_file": "ke-t5-roberta/special_tokens_map.json",
|
55 |
"tokenizer_class": "RobertaTokenizer",
|
56 |
"trim_offsets": true,
|
57 |
"unk_token": {
|