qsnell committed on
Commit
70fa02f
1 Parent(s): a53d91c

Training complete!

Browse files
README.md CHANGED
@@ -1,4 +1,5 @@
1
  ---
 
2
  base_model: google/pegasus-cnn_dailymail
3
  tags:
4
  - generated_from_trainer
@@ -16,7 +17,7 @@ should probably proofread and complete it, then remove this comment. -->
16
 
17
  This model is a fine-tuned version of [google/pegasus-cnn_dailymail](https://huggingface.co/google/pegasus-cnn_dailymail) on the samsum dataset.
18
  It achieves the following results on the evaluation set:
19
- - Loss: 1.4882
20
 
21
  ## Model description
22
 
@@ -48,14 +49,14 @@ The following hyperparameters were used during training:
48
 
49
  ### Training results
50
 
51
- | Training Loss | Epoch | Step | Validation Loss |
52
- |:-------------:|:-----:|:----:|:---------------:|
53
- | 1.6287 | 0.54 | 500 | 1.4882 |
54
 
55
 
56
  ### Framework versions
57
 
58
- - Transformers 4.34.1
59
- - Pytorch 2.1.0+cu121
60
- - Datasets 2.14.6
61
- - Tokenizers 0.14.1
 
1
  ---
2
+ library_name: transformers
3
  base_model: google/pegasus-cnn_dailymail
4
  tags:
5
  - generated_from_trainer
 
17
 
18
  This model is a fine-tuned version of [google/pegasus-cnn_dailymail](https://huggingface.co/google/pegasus-cnn_dailymail) on the samsum dataset.
19
  It achieves the following results on the evaluation set:
20
+ - Loss: 1.4854
21
 
22
  ## Model description
23
 
 
49
 
50
  ### Training results
51
 
52
+ | Training Loss | Epoch | Step | Validation Loss |
53
+ |:-------------:|:------:|:----:|:---------------:|
54
+ | 1.6718 | 0.5430 | 500 | 1.4854 |
55
 
56
 
57
  ### Framework versions
58
 
59
+ - Transformers 4.45.2
60
+ - Pytorch 2.4.1+cu121
61
+ - Datasets 3.0.1
62
+ - Tokenizers 0.20.0
config.json CHANGED
@@ -36,20 +36,20 @@
36
  "LABEL_1": 1,
37
  "LABEL_2": 2
38
  },
39
- "length_penalty": 0.8,
40
- "max_length": 128,
41
  "max_position_embeddings": 1024,
42
- "min_length": 32,
43
  "model_type": "pegasus",
44
  "normalize_before": true,
45
  "normalize_embedding": false,
46
- "num_beams": 8,
47
  "num_hidden_layers": 16,
48
  "pad_token_id": 0,
49
  "scale_embedding": true,
50
  "static_position_embeddings": true,
51
  "torch_dtype": "float32",
52
- "transformers_version": "4.34.1",
53
  "use_cache": true,
54
  "vocab_size": 96103
55
  }
 
36
  "LABEL_1": 1,
37
  "LABEL_2": 2
38
  },
39
+ "length_penalty": null,
40
+ "max_length": null,
41
  "max_position_embeddings": 1024,
42
+ "min_length": null,
43
  "model_type": "pegasus",
44
  "normalize_before": true,
45
  "normalize_embedding": false,
46
+ "num_beams": null,
47
  "num_hidden_layers": 16,
48
  "pad_token_id": 0,
49
  "scale_embedding": true,
50
  "static_position_embeddings": true,
51
  "torch_dtype": "float32",
52
+ "transformers_version": "4.45.2",
53
  "use_cache": true,
54
  "vocab_size": 96103
55
  }
generation_config.json CHANGED
@@ -9,5 +9,5 @@
9
  "min_length": 32,
10
  "num_beams": 8,
11
  "pad_token_id": 0,
12
- "transformers_version": "4.34.1"
13
  }
 
9
  "min_length": 32,
10
  "num_beams": 8,
11
  "pad_token_id": 0,
12
+ "transformers_version": "4.45.2"
13
  }
model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2e9be6c317ece041a28bc5b2ff16f4760b5f11672e0c0525cd1d75c917d024a9
3
+ size 2283652852
runs/Oct20_16-23-43_84cda4c74c56/1666283033.8020647/events.out.tfevents.1666283033.84cda4c74c56.90220.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:88a01358ab07ad10fafe3a325e38d84ac86af3d8b757c66649a53ffdde601aaa
3
+ size 5409
runs/Oct20_16-23-43_84cda4c74c56/1666284074.368571/events.out.tfevents.1666284074.84cda4c74c56.90220.3 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8dbf5e452f66496634a0dac9cc0105c887d918e28e5810bc0baeedcc5a4e0646
3
+ size 5409
runs/Oct20_16-23-43_84cda4c74c56/events.out.tfevents.1666283033.84cda4c74c56.90220.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ef8060d3346ed4b3fe8113942a43c84a659c2a2d40f723969c4e10e0d3b1723a
3
+ size 4334
runs/Oct20_16-23-43_84cda4c74c56/events.out.tfevents.1666284074.84cda4c74c56.90220.2 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ea7c996c6e19f9ba652917fd3b589388c8b881096acc0108c66f549f2410c20c
3
+ size 4334
runs/Oct20_17-47-06_84cda4c74c56/1666288033.7993069/events.out.tfevents.1666288033.84cda4c74c56.90773.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3ac5d4d0519af3ce680bf20c99acfe9ab3f3644a351c9d5a1340d43bcb778113
3
+ size 5409
runs/Oct20_17-47-06_84cda4c74c56/events.out.tfevents.1666288033.84cda4c74c56.90773.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d3650cf17756eae45416a6e9c5765b805a40dc1af08bd0c7cc0c5699cea1edd1
3
+ size 4334
runs/Oct20_18-21-43_84cda4c74c56/1666290111.0084915/events.out.tfevents.1666290111.84cda4c74c56.91035.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b7025589276cd324fa6d34e5d56a88069d724e98fd076be3ebdee08342034ca2
3
+ size 5409
runs/Oct20_18-21-43_84cda4c74c56/events.out.tfevents.1666290110.84cda4c74c56.91035.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cb3e7f59e35a1e6899f52a62dab36ec762cea88782728a6912f50da88512ba12
3
+ size 4334
runs/Oct20_19-44-18_84cda4c74c56/1666295059.7752225/events.out.tfevents.1666295059.84cda4c74c56.91609.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8d7167bcd6dfbc3788675b0a8c8126fe1ef61b7ed013b25564ee0410250dd9b1
3
+ size 5409
runs/Oct20_19-44-18_84cda4c74c56/events.out.tfevents.1666295059.84cda4c74c56.91609.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ba06b4377d7ea98307f691f36be98720643a724ce12b095a8a76406ee7c72ee3
3
+ size 4335
tokenizer.json CHANGED
The diff for this file is too large to render. See raw diff
 
tokenizer_config.json CHANGED
@@ -847,6 +847,14 @@
847
  "rstrip": false,
848
  "single_word": false,
849
  "special": true
 
 
 
 
 
 
 
 
850
  }
851
  },
852
  "additional_special_tokens": [
@@ -953,7 +961,7 @@
953
  "<unk_101>",
954
  "<unk_102>"
955
  ],
956
- "clean_up_tokenization_spaces": true,
957
  "eos_token": "</s>",
958
  "full_tokenizer_file": null,
959
  "mask_token": "<mask_2>",
 
847
  "rstrip": false,
848
  "single_word": false,
849
  "special": true
850
+ },
851
+ "106": {
852
+ "content": "<n>",
853
+ "lstrip": false,
854
+ "normalized": false,
855
+ "rstrip": false,
856
+ "single_word": false,
857
+ "special": false
858
  }
859
  },
860
  "additional_special_tokens": [
 
961
  "<unk_101>",
962
  "<unk_102>"
963
  ],
964
+ "clean_up_tokenization_spaces": false,
965
  "eos_token": "</s>",
966
  "full_tokenizer_file": null,
967
  "mask_token": "<mask_2>",
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:01e49aad50515f1e4d0b690698e786a4654676e51f8dc9c96f3b5f9f0f9d19c9
3
- size 4472
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:904b9775eb3570ba7d2326c89fe0a83e3fbb5917ab1aa8ec7fd2a761cea9c5ba
3
+ size 5176