lilyyellow committed on
Commit
2b502d3
1 Parent(s): 3a0b339

Training in progress, epoch 1

Browse files
config.json CHANGED
@@ -1,165 +1,164 @@
1
  {
2
- "_name_or_path": "/kaggle/working/my_awesome_ner-token_classification_v1.0",
3
  "architectures": [
4
- "ElectraForTokenClassification"
5
  ],
6
  "attention_probs_dropout_prob": 0.1,
 
7
  "classifier_dropout": null,
8
- "embedding_size": 768,
9
- "finetuning_task": "ner",
10
  "hidden_act": "gelu",
11
  "hidden_dropout_prob": 0.1,
12
  "hidden_size": 768,
13
  "id2label": {
14
- "0": "I-ROLE",
15
- "1": "B-LANGUAGE",
16
- "2": "B-RANK",
17
- "3": "I-PHONE",
18
- "4": "I-SONG",
19
- "5": "I-DATETIME",
20
- "6": "I-RANK",
21
- "7": "I-SKILL",
22
- "8": "B-COMMUNICATION",
23
- "9": "B-LAW",
24
- "10": "B-RELIGION",
25
- "11": "I-LAW",
26
- "12": "B-LOCATION",
27
- "13": "B-PRODUCT",
28
- "14": "I-MISCELLANEOUS",
29
- "15": "I-SPORT",
30
- "16": "I-MONEY",
31
- "17": "B-MISCELLANEOUS",
32
- "18": "B-ORGANIZATION",
33
- "19": "B-PHONE",
34
- "20": "I-LANGUAGE",
35
- "21": "B-DATETIME",
36
- "22": "I-EMAIL",
37
- "23": "I-FOOD",
38
- "24": "B-URL",
39
- "25": "I-COMMUNICATION",
40
- "26": "I-LOCATION",
41
- "27": "B-SONG",
42
- "28": "O",
43
- "29": "B-PERSON",
44
- "30": "I-EVENT",
45
- "31": "I-ACTION",
46
- "32": "I-EDUCATION",
47
- "33": "B-GENDER",
48
- "34": "I-COUNTRY",
49
- "35": "B-EVENT",
50
- "36": "B-AGE",
51
- "37": "B-ADDRESS",
52
- "38": "I-ADDRESS",
53
- "39": "B-ANIMAL",
54
- "40": "I-GENDER",
55
- "41": "I-PERSON",
56
- "42": "B-ROLE",
57
- "43": "B-SPORT",
58
- "44": "I-DISEASE",
59
- "45": "B-MONEY",
60
- "46": "I-PRODUCT",
61
- "47": "I-RELIGION",
62
- "48": "I-TRANSPORTATION",
63
- "49": "B-DURATION",
64
- "50": "I-QUANTITY",
65
- "51": "I-AGE",
66
- "52": "B-EMAIL",
67
- "53": "B-IP",
68
- "54": "I-ORGANIZATION",
69
- "55": "B-EDUCATION",
70
- "56": "B-QUANTITY",
71
- "57": "I-DURATION",
72
- "58": "B-COUNTRY",
73
- "59": "B-FOOD",
74
- "60": "B-DISEASE",
75
- "61": "B-TRANSPORTATION",
76
- "62": "B-ACTION",
77
- "63": "I-ANIMAL",
78
- "64": "B-SKILL"
 
79
  },
80
  "initializer_range": 0.02,
81
  "intermediate_size": 3072,
82
  "label2id": {
83
- "B-ACTION": 62,
84
- "B-ADDRESS": 37,
85
- "B-AGE": 36,
86
- "B-ANIMAL": 39,
87
- "B-COMMUNICATION": 8,
88
- "B-COUNTRY": 58,
89
- "B-DATETIME": 21,
90
- "B-DISEASE": 60,
91
- "B-DURATION": 49,
92
- "B-EDUCATION": 55,
93
- "B-EMAIL": 52,
94
- "B-EVENT": 35,
95
- "B-FOOD": 59,
96
- "B-GENDER": 33,
97
- "B-IP": 53,
98
- "B-LANGUAGE": 1,
99
- "B-LAW": 9,
100
- "B-LOCATION": 12,
101
- "B-MISCELLANEOUS": 17,
102
- "B-MONEY": 45,
103
- "B-ORGANIZATION": 18,
104
- "B-PERSON": 29,
105
- "B-PHONE": 19,
106
- "B-PRODUCT": 13,
107
- "B-QUANTITY": 56,
108
- "B-RANK": 2,
109
- "B-RELIGION": 10,
110
- "B-ROLE": 42,
111
- "B-SKILL": 64,
112
- "B-SONG": 27,
113
- "B-SPORT": 43,
114
- "B-TRANSPORTATION": 61,
115
- "B-URL": 24,
116
- "I-ACTION": 31,
117
- "I-ADDRESS": 38,
118
- "I-AGE": 51,
119
- "I-ANIMAL": 63,
120
- "I-COMMUNICATION": 25,
121
- "I-COUNTRY": 34,
122
- "I-DATETIME": 5,
123
- "I-DISEASE": 44,
124
- "I-DURATION": 57,
125
- "I-EDUCATION": 32,
126
- "I-EMAIL": 22,
127
- "I-EVENT": 30,
128
- "I-FOOD": 23,
129
- "I-GENDER": 40,
130
- "I-LANGUAGE": 20,
131
- "I-LAW": 11,
132
- "I-LOCATION": 26,
133
- "I-MISCELLANEOUS": 14,
134
- "I-MONEY": 16,
135
- "I-ORGANIZATION": 54,
136
- "I-PERSON": 41,
137
- "I-PHONE": 3,
138
- "I-PRODUCT": 46,
139
- "I-QUANTITY": 50,
140
- "I-RANK": 6,
141
- "I-RELIGION": 47,
142
- "I-ROLE": 0,
143
- "I-SKILL": 7,
144
- "I-SONG": 4,
145
- "I-SPORT": 15,
146
- "I-TRANSPORTATION": 48,
147
- "O": 28
 
148
  },
149
- "layer_norm_eps": 1e-12,
150
- "max_position_embeddings": 512,
151
- "model_type": "electra",
152
  "num_attention_heads": 12,
153
  "num_hidden_layers": 12,
154
- "pad_token_id": 0,
 
155
  "position_embedding_type": "absolute",
156
- "summary_activation": "gelu",
157
- "summary_last_dropout": 0.1,
158
- "summary_type": "first",
159
- "summary_use_proj": true,
160
  "torch_dtype": "float32",
161
  "transformers_version": "4.41.2",
162
- "type_vocab_size": 2,
163
  "use_cache": true,
164
- "vocab_size": 62000
165
  }
 
1
  {
2
+ "_name_or_path": "FacebookAI/xlm-roberta-base",
3
  "architectures": [
4
+ "XLMRobertaForTokenClassification"
5
  ],
6
  "attention_probs_dropout_prob": 0.1,
7
+ "bos_token_id": 0,
8
  "classifier_dropout": null,
9
+ "eos_token_id": 2,
 
10
  "hidden_act": "gelu",
11
  "hidden_dropout_prob": 0.1,
12
  "hidden_size": 768,
13
  "id2label": {
14
+ "0": "I-IP",
15
+ "1": "I-ROLE",
16
+ "2": "B-LANGUAGE",
17
+ "3": "B-RANK",
18
+ "4": "I-PHONE",
19
+ "5": "I-SONG",
20
+ "6": "I-DATETIME",
21
+ "7": "I-RANK",
22
+ "8": "I-SKILL",
23
+ "9": "B-COMMUNICATION",
24
+ "10": "B-LAW",
25
+ "11": "B-RELIGION",
26
+ "12": "I-LAW",
27
+ "13": "B-LOCATION",
28
+ "14": "B-PRODUCT",
29
+ "15": "I-MISCELLANEOUS",
30
+ "16": "I-SPORT",
31
+ "17": "I-MONEY",
32
+ "18": "B-MISCELLANEOUS",
33
+ "19": "B-ORGANIZATION",
34
+ "20": "B-PHONE",
35
+ "21": "I-LANGUAGE",
36
+ "22": "B-DATETIME",
37
+ "23": "I-EMAIL",
38
+ "24": "I-FOOD",
39
+ "25": "B-URL",
40
+ "26": "I-COMMUNICATION",
41
+ "27": "I-LOCATION",
42
+ "28": "B-SONG",
43
+ "29": "O",
44
+ "30": "B-PERSON",
45
+ "31": "I-EVENT",
46
+ "32": "I-ACTION",
47
+ "33": "I-EDUCATION",
48
+ "34": "B-GENDER",
49
+ "35": "I-COUNTRY",
50
+ "36": "B-EVENT",
51
+ "37": "B-AGE",
52
+ "38": "B-ADDRESS",
53
+ "39": "I-ADDRESS",
54
+ "40": "B-ANIMAL",
55
+ "41": "I-GENDER",
56
+ "42": "I-PERSON",
57
+ "43": "B-ROLE",
58
+ "44": "B-SPORT",
59
+ "45": "I-DISEASE",
60
+ "46": "B-MONEY",
61
+ "47": "I-PRODUCT",
62
+ "48": "I-RELIGION",
63
+ "49": "I-TRANSPORTATION",
64
+ "50": "B-DURATION",
65
+ "51": "I-QUANTITY",
66
+ "52": "I-AGE",
67
+ "53": "B-EMAIL",
68
+ "54": "B-IP",
69
+ "55": "I-ORGANIZATION",
70
+ "56": "B-EDUCATION",
71
+ "57": "B-QUANTITY",
72
+ "58": "I-DURATION",
73
+ "59": "B-COUNTRY",
74
+ "60": "B-FOOD",
75
+ "61": "B-DISEASE",
76
+ "62": "B-TRANSPORTATION",
77
+ "63": "B-ACTION",
78
+ "64": "I-ANIMAL",
79
+ "65": "B-SKILL"
80
  },
81
  "initializer_range": 0.02,
82
  "intermediate_size": 3072,
83
  "label2id": {
84
+ "B-ACTION": 63,
85
+ "B-ADDRESS": 38,
86
+ "B-AGE": 37,
87
+ "B-ANIMAL": 40,
88
+ "B-COMMUNICATION": 9,
89
+ "B-COUNTRY": 59,
90
+ "B-DATETIME": 22,
91
+ "B-DISEASE": 61,
92
+ "B-DURATION": 50,
93
+ "B-EDUCATION": 56,
94
+ "B-EMAIL": 53,
95
+ "B-EVENT": 36,
96
+ "B-FOOD": 60,
97
+ "B-GENDER": 34,
98
+ "B-IP": 54,
99
+ "B-LANGUAGE": 2,
100
+ "B-LAW": 10,
101
+ "B-LOCATION": 13,
102
+ "B-MISCELLANEOUS": 18,
103
+ "B-MONEY": 46,
104
+ "B-ORGANIZATION": 19,
105
+ "B-PERSON": 30,
106
+ "B-PHONE": 20,
107
+ "B-PRODUCT": 14,
108
+ "B-QUANTITY": 57,
109
+ "B-RANK": 3,
110
+ "B-RELIGION": 11,
111
+ "B-ROLE": 43,
112
+ "B-SKILL": 65,
113
+ "B-SONG": 28,
114
+ "B-SPORT": 44,
115
+ "B-TRANSPORTATION": 62,
116
+ "B-URL": 25,
117
+ "I-ACTION": 32,
118
+ "I-ADDRESS": 39,
119
+ "I-AGE": 52,
120
+ "I-ANIMAL": 64,
121
+ "I-COMMUNICATION": 26,
122
+ "I-COUNTRY": 35,
123
+ "I-DATETIME": 6,
124
+ "I-DISEASE": 45,
125
+ "I-DURATION": 58,
126
+ "I-EDUCATION": 33,
127
+ "I-EMAIL": 23,
128
+ "I-EVENT": 31,
129
+ "I-FOOD": 24,
130
+ "I-GENDER": 41,
131
+ "I-IP": 0,
132
+ "I-LANGUAGE": 21,
133
+ "I-LAW": 12,
134
+ "I-LOCATION": 27,
135
+ "I-MISCELLANEOUS": 15,
136
+ "I-MONEY": 17,
137
+ "I-ORGANIZATION": 55,
138
+ "I-PERSON": 42,
139
+ "I-PHONE": 4,
140
+ "I-PRODUCT": 47,
141
+ "I-QUANTITY": 51,
142
+ "I-RANK": 7,
143
+ "I-RELIGION": 48,
144
+ "I-ROLE": 1,
145
+ "I-SKILL": 8,
146
+ "I-SONG": 5,
147
+ "I-SPORT": 16,
148
+ "I-TRANSPORTATION": 49,
149
+ "O": 29
150
  },
151
+ "layer_norm_eps": 1e-05,
152
+ "max_position_embeddings": 514,
153
+ "model_type": "xlm-roberta",
154
  "num_attention_heads": 12,
155
  "num_hidden_layers": 12,
156
+ "output_past": true,
157
+ "pad_token_id": 1,
158
  "position_embedding_type": "absolute",
 
 
 
 
159
  "torch_dtype": "float32",
160
  "transformers_version": "4.41.2",
161
+ "type_vocab_size": 1,
162
  "use_cache": true,
163
+ "vocab_size": 250002
164
  }
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a0d81a21d2e0cbd7b5630d221ad6cc07e5dbd84224606cc36ec026600ed7c42a
3
- size 532490884
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:efaffc0ad114d65bb28b9f3b3c6d9a7e91ab49e64889ea6735d146f25fcedb05
3
+ size 1110039296
special_tokens_map.json CHANGED
@@ -1,37 +1,15 @@
1
  {
2
- "cls_token": {
3
- "content": "[CLS]",
4
- "lstrip": false,
5
- "normalized": false,
6
- "rstrip": false,
7
- "single_word": false
8
- },
9
  "mask_token": {
10
- "content": "[MASK]",
11
- "lstrip": false,
12
- "normalized": false,
13
- "rstrip": false,
14
- "single_word": false
15
- },
16
- "pad_token": {
17
- "content": "[PAD]",
18
- "lstrip": false,
19
  "normalized": false,
20
  "rstrip": false,
21
  "single_word": false
22
  },
23
- "sep_token": {
24
- "content": "[SEP]",
25
- "lstrip": false,
26
- "normalized": false,
27
- "rstrip": false,
28
- "single_word": false
29
- },
30
- "unk_token": {
31
- "content": "[UNK]",
32
- "lstrip": false,
33
- "normalized": false,
34
- "rstrip": false,
35
- "single_word": false
36
- }
37
  }
 
1
  {
2
+ "bos_token": "<s>",
3
+ "cls_token": "<s>",
4
+ "eos_token": "</s>",
 
 
 
 
5
  "mask_token": {
6
+ "content": "<mask>",
7
+ "lstrip": true,
 
 
 
 
 
 
 
8
  "normalized": false,
9
  "rstrip": false,
10
  "single_word": false
11
  },
12
+ "pad_token": "<pad>",
13
+ "sep_token": "</s>",
14
+ "unk_token": "<unk>"
 
 
 
 
 
 
 
 
 
 
 
15
  }
tokenizer.json CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5166e09320d5dea01a72734268a6136a5d53f2fe55980b6ba0fc19db6e003f72
3
- size 1394857
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3a56def25aa40facc030ea8b0b87f3688e4b3c39eb8b45d5702b3a1300fe2a20
3
+ size 17082734
tokenizer_config.json CHANGED
@@ -1,7 +1,7 @@
1
  {
2
  "added_tokens_decoder": {
3
  "0": {
4
- "content": "[PAD]",
5
  "lstrip": false,
6
  "normalized": false,
7
  "rstrip": false,
@@ -9,7 +9,7 @@
9
  "special": true
10
  },
11
  "1": {
12
- "content": "[UNK]",
13
  "lstrip": false,
14
  "normalized": false,
15
  "rstrip": false,
@@ -17,7 +17,7 @@
17
  "special": true
18
  },
19
  "2": {
20
- "content": "[CLS]",
21
  "lstrip": false,
22
  "normalized": false,
23
  "rstrip": false,
@@ -25,40 +25,30 @@
25
  "special": true
26
  },
27
  "3": {
28
- "content": "[SEP]",
29
  "lstrip": false,
30
  "normalized": false,
31
  "rstrip": false,
32
  "single_word": false,
33
  "special": true
34
  },
35
- "4": {
36
- "content": "[MASK]",
37
- "lstrip": false,
38
  "normalized": false,
39
  "rstrip": false,
40
  "single_word": false,
41
  "special": true
42
  }
43
  },
 
44
  "clean_up_tokenization_spaces": true,
45
- "cls_token": "[CLS]",
46
- "do_basic_tokenize": true,
47
- "do_lower_case": false,
48
- "mask_token": "[MASK]",
49
- "max_length": 256,
50
- "model_max_length": 1000000000000000019884624838656,
51
- "never_split": null,
52
- "pad_to_multiple_of": null,
53
- "pad_token": "[PAD]",
54
- "pad_token_type_id": 0,
55
- "padding_side": "right",
56
- "sep_token": "[SEP]",
57
- "stride": 0,
58
- "strip_accents": null,
59
- "tokenize_chinese_chars": true,
60
- "tokenizer_class": "ElectraTokenizer",
61
- "truncation_side": "right",
62
- "truncation_strategy": "longest_first",
63
- "unk_token": "[UNK]"
64
  }
 
1
  {
2
  "added_tokens_decoder": {
3
  "0": {
4
+ "content": "<s>",
5
  "lstrip": false,
6
  "normalized": false,
7
  "rstrip": false,
 
9
  "special": true
10
  },
11
  "1": {
12
+ "content": "<pad>",
13
  "lstrip": false,
14
  "normalized": false,
15
  "rstrip": false,
 
17
  "special": true
18
  },
19
  "2": {
20
+ "content": "</s>",
21
  "lstrip": false,
22
  "normalized": false,
23
  "rstrip": false,
 
25
  "special": true
26
  },
27
  "3": {
28
+ "content": "<unk>",
29
  "lstrip": false,
30
  "normalized": false,
31
  "rstrip": false,
32
  "single_word": false,
33
  "special": true
34
  },
35
+ "250001": {
36
+ "content": "<mask>",
37
+ "lstrip": true,
38
  "normalized": false,
39
  "rstrip": false,
40
  "single_word": false,
41
  "special": true
42
  }
43
  },
44
+ "bos_token": "<s>",
45
  "clean_up_tokenization_spaces": true,
46
+ "cls_token": "<s>",
47
+ "eos_token": "</s>",
48
+ "mask_token": "<mask>",
49
+ "model_max_length": 512,
50
+ "pad_token": "<pad>",
51
+ "sep_token": "</s>",
52
+ "tokenizer_class": "XLMRobertaTokenizer",
53
+ "unk_token": "<unk>"
 
 
 
 
 
 
 
 
 
 
 
54
  }
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5fdc78b473a44c34f1608a33ccf2450f0b2ae50f37d6b0b618bab6bc8079730b
3
  size 5112
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:03eac65ea888e69c8dca7f7c772b61c29227c3029ba2741695d7f5820a6f3e7d
3
  size 5112