Training in progress, epoch 1

Files changed (8) hide show

README.md CHANGED Viewed

@@ -12,8 +12,6 @@ metrics:
 model-index:
 - name: legal_ai_India_ner_results
   results: []
-datasets:
-- opennyaiorg/InLegalNER
 ---
 <!-- This model card has been generated automatically according to the information the Trainer had access to. You
@@ -69,4 +67,4 @@ The following hyperparameters were used during training:
 - Transformers 4.48.3
 - Pytorch 2.5.1+cu124
 - Datasets 3.3.2
-- Tokenizers 0.21.0

 model-index:
 - name: legal_ai_India_ner_results
   results: []
 ---
 <!-- This model card has been generated automatically according to the information the Trainer had access to. You
 - Transformers 4.48.3
 - Pytorch 2.5.1+cu124
 - Datasets 3.3.2
+- Tokenizers 0.21.0

config.json CHANGED Viewed

@@ -1,11 +1,12 @@
 {
-  "_name_or_path": "bert-base-uncased",
   "architectures": [
     "BertForTokenClassification"
   ],
   "attention_probs_dropout_prob": 0.1,
   "classifier_dropout": null,
-  "gradient_checkpointing": false,
   "hidden_act": "gelu",
   "hidden_dropout_prob": 0.1,
   "hidden_size": 768,
@@ -78,6 +79,7 @@
   "model_type": "bert",
   "num_attention_heads": 12,
   "num_hidden_layers": 12,
   "pad_token_id": 0,
   "position_embedding_type": "absolute",
   "torch_dtype": "float32",

 {
+  "_name_or_path": "nlpaueb/legal-bert-base-uncased",
   "architectures": [
     "BertForTokenClassification"
   ],
   "attention_probs_dropout_prob": 0.1,
+  "bos_token_id": 0,
   "classifier_dropout": null,
+  "eos_token_ids": 0,
   "hidden_act": "gelu",
   "hidden_dropout_prob": 0.1,
   "hidden_size": 768,
   "model_type": "bert",
   "num_attention_heads": 12,
   "num_hidden_layers": 12,
+  "output_past": true,
   "pad_token_id": 0,
   "position_embedding_type": "absolute",
   "torch_dtype": "float32",

model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:2a13c8d5b13bb4d332da4f2c94e3c8c8cfcf4bdb017ff954a323ddc411e92296
 size 435679140

 version https://git-lfs.github.com/spec/v1
+oid sha256:2f75cc7c4cda143f865686ed735a7de23c4f63539d3c2c2e5cc9a8fd0511a8e3
 size 435679140

runs/Feb24_19-47-23_92734c0b55b6/events.out.tfevents.1740426444.92734c0b55b6.23332.0 ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:e01f078ad3b58b67f36ae98f60370075fe14052151a430c1c3a45c1c3abf9980
+size 7108

tokenizer.json CHANGED Viewed

The diff for this file is too large to render. See raw diff

tokenizer_config.json CHANGED Viewed

@@ -41,12 +41,14 @@
       "special": true
     }
   },
-  "clean_up_tokenization_spaces": false,
   "cls_token": "[CLS]",
   "do_lower_case": true,
   "extra_special_tokens": {},
   "mask_token": "[MASK]",
   "model_max_length": 512,
   "pad_token": "[PAD]",
   "sep_token": "[SEP]",
   "strip_accents": null,

       "special": true
     }
   },
+  "clean_up_tokenization_spaces": true,
   "cls_token": "[CLS]",
+  "do_basic_tokenize": true,
   "do_lower_case": true,
   "extra_special_tokens": {},
   "mask_token": "[MASK]",
   "model_max_length": 512,
+  "never_split": null,
   "pad_token": "[PAD]",
   "sep_token": "[SEP]",
   "strip_accents": null,

training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:1093ffd5ba32861a7f15a2bd54cfd6b3dc481ea2d0f7cf85ffe86121c3ab5bbd
 size 5368

 version https://git-lfs.github.com/spec/v1
+oid sha256:9ab82ecbbfc924de502d97edef152d751a6b63dbf64bbc4cafb77376dc525e54
 size 5368

vocab.txt CHANGED Viewed

The diff for this file is too large to render. See raw diff