sujit27 committed on
Commit
b9d0e99
·
1 Parent(s): bd28ebb

NER-bert-large-wnut-v1

Browse files
.gitattributes CHANGED
@@ -33,3 +33,5 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
 
 
 
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
+ mnist_test.csv filter=lfs diff=lfs merge=lfs -text
37
+ mnist_train_small.csv filter=lfs diff=lfs merge=lfs -text
README.md ADDED
@@ -0,0 +1,131 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ license: apache-2.0
3
+ base_model: bert-large-uncased
4
+ tags:
5
+ - generated_from_trainer
6
+ datasets:
7
+ - wnut_17
8
+ metrics:
9
+ - precision
10
+ - recall
11
+ - f1
12
+ - accuracy
13
+ model-index:
14
+ - name: sample_data
15
+ results:
16
+ - task:
17
+ name: Token Classification
18
+ type: token-classification
19
+ dataset:
20
+ name: wnut_17
21
+ type: wnut_17
22
+ config: wnut_17
23
+ split: validation
24
+ args: wnut_17
25
+ metrics:
26
+ - name: Precision
27
+ type: precision
28
+ value: 0.7290715372907154
29
+ - name: Recall
30
+ type: recall
31
+ value: 0.5729665071770335
32
+ - name: F1
33
+ type: f1
34
+ value: 0.6416610850636303
35
+ - name: Accuracy
36
+ type: accuracy
37
+ value: 0.9602644796236252
38
+ ---
39
+
40
+ <!-- This model card has been generated automatically according to the information the Trainer had access to. You
41
+ should probably proofread and complete it, then remove this comment. -->
42
+
43
+ # sample_data
44
+
45
+ This model is a fine-tuned version of [bert-large-uncased](https://huggingface.co/bert-large-uncased) on the wnut_17 dataset.
46
+ It achieves the following results on the evaluation set:
47
+ - Loss: 0.2684
48
+ - Precision: 0.7291
49
+ - Recall: 0.5730
50
+ - F1: 0.6417
51
+ - Accuracy: 0.9603
52
+
53
+ ## Model description
54
+
55
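+ A BERT-large (uncased) model with a token-classification head, fine-tuned for named-entity recognition. It predicts BIO tags for six entity types: corporation, creative-work, group, location, person and product.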
56
+
57
+ ## Intended uses & limitations
58
+
59
+ More information needed
60
+
61
+ ## Training and evaluation data
62
+
63
+ The model was fine-tuned on the wnut_17 dataset; the metrics reported above were computed on its validation split.
64
+
65
+ ## Training procedure
66
+
67
+ ### Training hyperparameters
68
+
69
+ The following hyperparameters were used during training:
70
+ - learning_rate: 2e-05
71
+ - train_batch_size: 16
72
+ - eval_batch_size: 16
73
+ - seed: 42
74
+ - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
75
+ - lr_scheduler_type: linear
76
+ - num_epochs: 5
77
+
78
+ ### Training results
79
+
80
+ | Training Loss | Epoch | Step | Validation Loss | Precision | Recall | F1 | Accuracy |
81
+ |:-------------:|:-----:|:----:|:---------------:|:---------:|:------:|:------:|:--------:|
82
+ | 0.6403 | 0.12 | 25 | 0.4914 | 0.0 | 0.0 | 0.0 | 0.9205 |
83
+ | 0.334 | 0.23 | 50 | 0.4539 | 0.0 | 0.0 | 0.0 | 0.9205 |
84
+ | 0.2346 | 0.35 | 75 | 0.3556 | 0.4118 | 0.0419 | 0.0760 | 0.9236 |
85
+ | 0.2352 | 0.47 | 100 | 0.2936 | 0.4337 | 0.2464 | 0.3143 | 0.9341 |
86
+ | 0.1725 | 0.59 | 125 | 0.2898 | 0.4983 | 0.3421 | 0.4057 | 0.9372 |
87
+ | 0.1449 | 0.7 | 150 | 0.2858 | 0.4606 | 0.3493 | 0.3973 | 0.9399 |
88
+ | 0.1548 | 0.82 | 175 | 0.2487 | 0.5699 | 0.3900 | 0.4631 | 0.9435 |
89
+ | 0.1429 | 0.94 | 200 | 0.3071 | 0.6888 | 0.3469 | 0.4614 | 0.9415 |
90
+ | 0.1506 | 1.06 | 225 | 0.2252 | 0.4820 | 0.4952 | 0.4885 | 0.9465 |
91
+ | 0.1196 | 1.17 | 250 | 0.2512 | 0.5463 | 0.4940 | 0.5188 | 0.9485 |
92
+ | 0.1062 | 1.29 | 275 | 0.2916 | 0.6395 | 0.4605 | 0.5355 | 0.9495 |
93
+ | 0.0983 | 1.41 | 300 | 0.2402 | 0.6199 | 0.5443 | 0.5796 | 0.9497 |
94
+ | 0.1068 | 1.53 | 325 | 0.2470 | 0.6018 | 0.4773 | 0.5324 | 0.9504 |
95
+ | 0.0879 | 1.64 | 350 | 0.2360 | 0.6468 | 0.5586 | 0.5995 | 0.9511 |
96
+ | 0.0928 | 1.76 | 375 | 0.2267 | 0.6126 | 0.5467 | 0.5777 | 0.9514 |
97
+ | 0.1045 | 1.88 | 400 | 0.2258 | 0.6934 | 0.5060 | 0.5851 | 0.9542 |
98
+ | 0.0933 | 2.0 | 425 | 0.2403 | 0.6954 | 0.5108 | 0.5890 | 0.9547 |
99
+ | 0.0497 | 2.11 | 450 | 0.2539 | 0.6460 | 0.5371 | 0.5865 | 0.9554 |
100
+ | 0.0607 | 2.23 | 475 | 0.3065 | 0.7293 | 0.4737 | 0.5743 | 0.9523 |
101
+ | 0.0857 | 2.35 | 500 | 0.2565 | 0.6770 | 0.4964 | 0.5728 | 0.9545 |
102
+ | 0.0513 | 2.46 | 525 | 0.2569 | 0.6931 | 0.5323 | 0.6022 | 0.9569 |
103
+ | 0.0697 | 2.58 | 550 | 0.2273 | 0.7193 | 0.5670 | 0.6341 | 0.9566 |
104
+ | 0.0446 | 2.7 | 575 | 0.2361 | 0.6348 | 0.5634 | 0.5970 | 0.9580 |
105
+ | 0.0498 | 2.82 | 600 | 0.2544 | 0.7109 | 0.5323 | 0.6088 | 0.9579 |
106
+ | 0.0464 | 2.93 | 625 | 0.2576 | 0.7237 | 0.5514 | 0.6259 | 0.9589 |
107
+ | 0.0441 | 3.05 | 650 | 0.2691 | 0.7321 | 0.5490 | 0.6275 | 0.9586 |
108
+ | 0.0524 | 3.17 | 675 | 0.2368 | 0.6947 | 0.5825 | 0.6337 | 0.9603 |
109
+ | 0.0335 | 3.29 | 700 | 0.2488 | 0.6991 | 0.5670 | 0.6262 | 0.9594 |
110
+ | 0.0349 | 3.4 | 725 | 0.2564 | 0.7084 | 0.5347 | 0.6094 | 0.9580 |
111
+ | 0.026 | 3.52 | 750 | 0.2523 | 0.7085 | 0.5610 | 0.6262 | 0.9594 |
112
+ | 0.0314 | 3.64 | 775 | 0.2647 | 0.7335 | 0.5467 | 0.6265 | 0.9584 |
113
+ | 0.0213 | 3.76 | 800 | 0.2551 | 0.7032 | 0.5754 | 0.6329 | 0.9603 |
114
+ | 0.0312 | 3.87 | 825 | 0.2470 | 0.7034 | 0.5957 | 0.6451 | 0.9606 |
115
+ | 0.0313 | 3.99 | 850 | 0.2693 | 0.7421 | 0.5610 | 0.6390 | 0.9598 |
116
+ | 0.0243 | 4.11 | 875 | 0.2699 | 0.7345 | 0.5658 | 0.6392 | 0.9598 |
117
+ | 0.0289 | 4.23 | 900 | 0.2535 | 0.7143 | 0.5682 | 0.6329 | 0.9603 |
118
+ | 0.0226 | 4.34 | 925 | 0.2581 | 0.7205 | 0.5706 | 0.6368 | 0.9602 |
119
+ | 0.0173 | 4.46 | 950 | 0.2644 | 0.7145 | 0.5718 | 0.6352 | 0.9601 |
120
+ | 0.0139 | 4.58 | 975 | 0.2705 | 0.7164 | 0.5682 | 0.6338 | 0.9600 |
121
+ | 0.0243 | 4.69 | 1000 | 0.2615 | 0.7116 | 0.5813 | 0.6399 | 0.9606 |
122
+ | 0.0222 | 4.81 | 1025 | 0.2642 | 0.7229 | 0.5742 | 0.64 | 0.9606 |
123
+ | 0.0112 | 4.93 | 1050 | 0.2684 | 0.7291 | 0.5730 | 0.6417 | 0.9603 |
124
+
125
+
126
+ ### Framework versions
127
+
128
+ - Transformers 4.33.2
129
+ - Pytorch 2.0.1+cu118
130
+ - Datasets 2.14.5
131
+ - Tokenizers 0.13.3
anscombe.json ADDED
@@ -0,0 +1,49 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ [
2
+ {"Series":"I", "X":10.0, "Y":8.04},
3
+ {"Series":"I", "X":8.0, "Y":6.95},
4
+ {"Series":"I", "X":13.0, "Y":7.58},
5
+ {"Series":"I", "X":9.0, "Y":8.81},
6
+ {"Series":"I", "X":11.0, "Y":8.33},
7
+ {"Series":"I", "X":14.0, "Y":9.96},
8
+ {"Series":"I", "X":6.0, "Y":7.24},
9
+ {"Series":"I", "X":4.0, "Y":4.26},
10
+ {"Series":"I", "X":12.0, "Y":10.84},
11
+ {"Series":"I", "X":7.0, "Y":4.81},
12
+ {"Series":"I", "X":5.0, "Y":5.68},
13
+
14
+ {"Series":"II", "X":10.0, "Y":9.14},
15
+ {"Series":"II", "X":8.0, "Y":8.14},
16
+ {"Series":"II", "X":13.0, "Y":8.74},
17
+ {"Series":"II", "X":9.0, "Y":8.77},
18
+ {"Series":"II", "X":11.0, "Y":9.26},
19
+ {"Series":"II", "X":14.0, "Y":8.10},
20
+ {"Series":"II", "X":6.0, "Y":6.13},
21
+ {"Series":"II", "X":4.0, "Y":3.10},
22
+ {"Series":"II", "X":12.0, "Y":9.13},
23
+ {"Series":"II", "X":7.0, "Y":7.26},
24
+ {"Series":"II", "X":5.0, "Y":4.74},
25
+
26
+ {"Series":"III", "X":10.0, "Y":7.46},
27
+ {"Series":"III", "X":8.0, "Y":6.77},
28
+ {"Series":"III", "X":13.0, "Y":12.74},
29
+ {"Series":"III", "X":9.0, "Y":7.11},
30
+ {"Series":"III", "X":11.0, "Y":7.81},
31
+ {"Series":"III", "X":14.0, "Y":8.84},
32
+ {"Series":"III", "X":6.0, "Y":6.08},
33
+ {"Series":"III", "X":4.0, "Y":5.39},
34
+ {"Series":"III", "X":12.0, "Y":8.15},
35
+ {"Series":"III", "X":7.0, "Y":6.42},
36
+ {"Series":"III", "X":5.0, "Y":5.73},
37
+
38
+ {"Series":"IV", "X":8.0, "Y":6.58},
39
+ {"Series":"IV", "X":8.0, "Y":5.76},
40
+ {"Series":"IV", "X":8.0, "Y":7.71},
41
+ {"Series":"IV", "X":8.0, "Y":8.84},
42
+ {"Series":"IV", "X":8.0, "Y":8.47},
43
+ {"Series":"IV", "X":8.0, "Y":7.04},
44
+ {"Series":"IV", "X":8.0, "Y":5.25},
45
+ {"Series":"IV", "X":19.0, "Y":12.50},
46
+ {"Series":"IV", "X":8.0, "Y":5.56},
47
+ {"Series":"IV", "X":8.0, "Y":7.91},
48
+ {"Series":"IV", "X":8.0, "Y":6.89}
49
+ ]
california_housing_test.csv ADDED
The diff for this file is too large to render. See raw diff
 
california_housing_train.csv ADDED
The diff for this file is too large to render. See raw diff
 
config.json ADDED
@@ -0,0 +1,56 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "bert-large-uncased",
3
+ "architectures": [
4
+ "BertForTokenClassification"
5
+ ],
6
+ "attention_probs_dropout_prob": 0.1,
7
+ "classifier_dropout": null,
8
+ "gradient_checkpointing": false,
9
+ "hidden_act": "gelu",
10
+ "hidden_dropout_prob": 0.1,
11
+ "hidden_size": 1024,
12
+ "id2label": {
13
+ "0": "O",
14
+ "1": "B-corporation",
15
+ "2": "I-corporation",
16
+ "3": "B-creative-work",
17
+ "4": "I-creative-work",
18
+ "5": "B-group",
19
+ "6": "I-group",
20
+ "7": "B-location",
21
+ "8": "I-location",
22
+ "9": "B-person",
23
+ "10": "I-person",
24
+ "11": "B-product",
25
+ "12": "I-product"
26
+ },
27
+ "initializer_range": 0.02,
28
+ "intermediate_size": 4096,
29
+ "label2id": {
30
+ "B-corporation": 1,
31
+ "B-creative-work": 3,
32
+ "B-group": 5,
33
+ "B-location": 7,
34
+ "B-person": 9,
35
+ "B-product": 11,
36
+ "I-corporation": 2,
37
+ "I-creative-work": 4,
38
+ "I-group": 6,
39
+ "I-location": 8,
40
+ "I-person": 10,
41
+ "I-product": 12,
42
+ "O": 0
43
+ },
44
+ "layer_norm_eps": 1e-12,
45
+ "max_position_embeddings": 512,
46
+ "model_type": "bert",
47
+ "num_attention_heads": 16,
48
+ "num_hidden_layers": 24,
49
+ "pad_token_id": 0,
50
+ "position_embedding_type": "absolute",
51
+ "torch_dtype": "float32",
52
+ "transformers_version": "4.33.2",
53
+ "type_vocab_size": 2,
54
+ "use_cache": true,
55
+ "vocab_size": 30522
56
+ }
mnist_test.csv ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:51c292478d94ec3a01461bdfa82eb0885d262eb09e615679b2d69dedb6ad09e7
3
+ size 18289443
mnist_train_small.csv ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1ef64781aa03180f4f5ce504314f058f5d0227277df86060473d973cf43b033e
3
+ size 36523880
pytorch_model.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cae9c83d13291be565ef89cbe180235243c8689318b96b4d9110159413b6ce0a
3
+ size 1336556201
special_tokens_map.json ADDED
@@ -0,0 +1,7 @@
 
 
 
 
 
 
 
 
1
+ {
2
+ "cls_token": "[CLS]",
3
+ "mask_token": "[MASK]",
4
+ "pad_token": "[PAD]",
5
+ "sep_token": "[SEP]",
6
+ "unk_token": "[UNK]"
7
+ }
tokenizer.json ADDED
The diff for this file is too large to render. See raw diff
 
tokenizer_config.json ADDED
@@ -0,0 +1,13 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "clean_up_tokenization_spaces": true,
3
+ "cls_token": "[CLS]",
4
+ "do_lower_case": true,
5
+ "mask_token": "[MASK]",
6
+ "model_max_length": 512,
7
+ "pad_token": "[PAD]",
8
+ "sep_token": "[SEP]",
9
+ "strip_accents": null,
10
+ "tokenize_chinese_chars": true,
11
+ "tokenizer_class": "BertTokenizer",
12
+ "unk_token": "[UNK]"
13
+ }
training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2df789abcb23d846539f6371973af479722c2fa03f3c133903a9334565c80156
3
+ size 4027
vocab.txt ADDED
The diff for this file is too large to render. See raw diff