Thalesian committed on
Commit
0677cfb
·
verified ·
1 Parent(s): 6ef1988

End of training

Browse files
README.md CHANGED
@@ -9,14 +9,11 @@ model-index:
9
  <!-- This model card has been generated automatically according to the information the Trainer had access to. You
10
  should probably proofread and complete it, then remove this comment. -->
11
 
12
- [<img src="https://raw.githubusercontent.com/wandb/assets/main/wandb-github-badge-28.svg" alt="Visualize in Weights & Biases" width="200" height="32"/>](https://wandb.ai/thalesian-university-of-new-mexico-press/huggingface/runs/fxb2lxiz)
13
- [<img src="https://raw.githubusercontent.com/wandb/assets/main/wandb-github-badge-28.svg" alt="Visualize in Weights & Biases" width="200" height="32"/>](https://wandb.ai/thalesian-university-of-new-mexico-press/huggingface/runs/fxb2lxiz)
14
- [<img src="https://raw.githubusercontent.com/wandb/assets/main/wandb-github-badge-28.svg" alt="Visualize in Weights & Biases" width="200" height="32"/>](https://wandb.ai/thalesian-university-of-new-mexico-press/huggingface/runs/fxb2lxiz)
15
  # train_2
16
 
17
  This model was trained from scratch on the None dataset.
18
  It achieves the following results on the evaluation set:
19
- - Loss: 1.2508
20
 
21
  ## Model description
22
 
@@ -46,22 +43,17 @@ The following hyperparameters were used during training:
46
 
47
  ### Training results
48
 
49
- | Training Loss | Epoch | Step | Validation Loss |
50
- |:-------------:|:-----:|:----:|:---------------:|
51
- | No log | 1.0 | 392 | 4.1375 |
52
- | 0.5941 | 2.0 | 784 | 2.4509 |
53
- | 0.426 | 3.0 | 1176 | 2.0721 |
54
- | 0.3098 | 4.0 | 1568 | 1.8114 |
55
- | 0.3098 | 5.0 | 1960 | 1.5420 |
56
- | 0.2603 | 6.0 | 2352 | 1.4022 |
57
- | 0.2282 | 7.0 | 2744 | 1.3290 |
58
- | 0.2031 | 8.0 | 3136 | 1.2715 |
59
- | 0.1889 | 9.0 | 3528 | 1.2754 |
60
- | 0.1889 | 10.0 | 3920 | 1.2582 |
61
- | 0.1798 | 11.0 | 4312 | 1.2484 |
62
- | 0.1727 | 12.0 | 4704 | 1.2436 |
63
- | 0.1662 | 13.0 | 5096 | 1.2506 |
64
- | 0.1662 | 14.0 | 5488 | 1.2508 |
65
 
66
 
67
  ### Framework versions
 
9
  <!-- This model card has been generated automatically according to the information the Trainer had access to. You
10
  should probably proofread and complete it, then remove this comment. -->
11
 
 
 
 
12
  # train_2
13
 
14
  This model was trained from scratch on the None dataset.
15
  It achieves the following results on the evaluation set:
16
+ - Loss: 0.1708
17
 
18
  ## Model description
19
 
 
43
 
44
  ### Training results
45
 
46
+ | Training Loss | Epoch | Step | Validation Loss |
47
+ |:-------------:|:-----:|:-----:|:---------------:|
48
+ | 0.4186 | 1.0 | 1840 | 1.7597 |
49
+ | 0.0999 | 2.0 | 3680 | 0.4629 |
50
+ | 0.0711 | 3.0 | 5520 | 0.2730 |
51
+ | 0.059 | 4.0 | 7360 | 0.1899 |
52
+ | 0.0474 | 5.0 | 9200 | 0.1696 |
53
+ | 0.0469 | 6.0 | 11040 | 0.1704 |
54
+ | 0.0437 | 7.0 | 12880 | 0.1680 |
55
+ | 0.0429 | 8.0 | 14720 | 0.1691 |
56
+ | 0.0436 | 9.0 | 16560 | 0.1708 |
 
 
 
 
 
57
 
58
 
59
  ### Framework versions
added_tokens.json CHANGED
@@ -1,27 +1,248 @@
1
  {
2
- "\\": 32118,
3
- "¡": 32103,
4
- "§": 32119,
5
- "×": 32106,
6
- "æ": 32123,
7
- "ø": 32108,
8
- "ห€": 32116,
9
- "หฝ": 32107,
10
- "โ€": 32101,
11
- "โ€น": 32113,
12
- "โ€นโ€น": 32111,
13
- "โ€บ": 32115,
14
- "โ€บโ€บ": 32117,
15
- "โ„": 32102,
16
- "โ†": 32112,
17
- "→": 32124,
18
- "โ‰ˆ": 32114,
19
- "โŒˆ": 32100,
20
- "โŒ‰": 32121,
21
- "ใ€ˆ": 32110,
22
- "ใ€ˆใ€ˆ": 32105,
23
- "ใ€‰": 32120,
24
- "ใ€‰ใ€‰": 32122,
25
- "๐’€น": 32109,
26
- "๐’‘ฑ": 32104
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
27
  }
 
1
  {
2
+ "±": 32276,
3
+ "→": 32184,
4
+ "โŒœ": 32163,
5
+ "โŒ": 32144,
6
+ "โ—": 32321,
7
+ "โŸฆ": 32233,
8
+ "โŸง": 32295,
9
+ "๐€€": 32195,
10
+ "๐€": 32270,
11
+ "๐€‚": 32181,
12
+ "๐€ƒ": 32302,
13
+ "๐€„": 32248,
14
+ "๐€…": 32228,
15
+ "๐€†": 32204,
16
+ "๐€‡": 32310,
17
+ "๐€ˆ": 32326,
18
+ "๐€‰": 32281,
19
+ "๐€Š": 32111,
20
+ "๐€‹": 32238,
21
+ "๐€": 32196,
22
+ "๐€Ž": 32173,
23
+ "๐€": 32199,
24
+ "๐€": 32297,
25
+ "๐€‘": 32191,
26
+ "๐€’": 32104,
27
+ "๐€“": 32234,
28
+ "๐€”": 32283,
29
+ "๐€•": 32132,
30
+ "๐€–": 32227,
31
+ "๐€—": 32215,
32
+ "๐€˜": 32306,
33
+ "๐€™": 32193,
34
+ "๐€š": 32219,
35
+ "๐€›": 32330,
36
+ "๐€œ": 32300,
37
+ "๐€": 32143,
38
+ "๐€ž": 32293,
39
+ "๐€Ÿ": 32338,
40
+ "๐€ ": 32171,
41
+ "๐€ก": 32246,
42
+ "๐€ข": 32258,
43
+ "๐€ฃ": 32182,
44
+ "๐€ค": 32155,
45
+ "๐€ฅ": 32209,
46
+ "๐€ฆ": 32141,
47
+ "๐€จ": 32315,
48
+ "๐€ฉ": 32136,
49
+ "๐€ช": 32139,
50
+ "๐€ซ": 32266,
51
+ "๐€ฌ": 32220,
52
+ "๐€ญ": 32203,
53
+ "๐€ฎ": 32116,
54
+ "๐€ฏ": 32124,
55
+ "๐€ฐ": 32296,
56
+ "๐€ฑ": 32334,
57
+ "๐€ฒ": 32287,
58
+ "๐€ณ": 32103,
59
+ "๐€ด": 32202,
60
+ "๐€ต": 32229,
61
+ "๐€ถ": 32113,
62
+ "๐€ท": 32255,
63
+ "๐€ธ": 32187,
64
+ "๐€น": 32211,
65
+ "๐€บ": 32249,
66
+ "๐€ผ": 32254,
67
+ "๐€ฝ": 32301,
68
+ "๐€ฟ": 32210,
69
+ "๐€": 32218,
70
+ "๐": 32117,
71
+ "๐‚": 32162,
72
+ "๐ƒ": 32178,
73
+ "๐„": 32190,
74
+ "๐…": 32168,
75
+ "๐†": 32134,
76
+ "๐‡": 32123,
77
+ "๐ˆ": 32110,
78
+ "๐‰": 32277,
79
+ "๐Š": 32333,
80
+ "๐‹": 32235,
81
+ "๐Œ": 32305,
82
+ "๐": 32325,
83
+ "๐": 32291,
84
+ "๐‘": 32152,
85
+ "๐’": 32183,
86
+ "๐“": 32328,
87
+ "๐”": 32274,
88
+ "๐•": 32304,
89
+ "๐–": 32292,
90
+ "๐—": 32331,
91
+ "๐˜": 32336,
92
+ "๐™": 32201,
93
+ "๐š": 32118,
94
+ "๐›": 32282,
95
+ "๐œ": 32114,
96
+ "๐": 32284,
97
+ "๐‚€": 32128,
98
+ "๐‚": 32174,
99
+ "๐‚‚": 32157,
100
+ "๐‚ƒ": 32180,
101
+ "๐‚„": 32129,
102
+ "๐‚…": 32243,
103
+ "๐‚†": 32320,
104
+ "๐‚‡": 32253,
105
+ "๐‚ˆ": 32261,
106
+ "๐‚‰": 32247,
107
+ "๐‚Š": 32311,
108
+ "๐‚‹": 32151,
109
+ "๐‚Œ": 32179,
110
+ "๐‚": 32275,
111
+ "๐‚Ž": 32316,
112
+ "๐‚": 32250,
113
+ "๐‚": 32186,
114
+ "๐‚‘": 32327,
115
+ "๐‚’": 32225,
116
+ "๐‚”": 32236,
117
+ "๐‚•": 32329,
118
+ "๐‚–": 32341,
119
+ "๐‚—": 32122,
120
+ "๐‚š": 32245,
121
+ "๐‚›": 32102,
122
+ "๐‚œ": 32332,
123
+ "๐‚": 32322,
124
+ "๐‚ž": 32205,
125
+ "๐‚Ÿ": 32137,
126
+ "๐‚ก": 32165,
127
+ "๐‚ข": 32154,
128
+ "๐‚ฃ": 32299,
129
+ "๐‚ฅ": 32323,
130
+ "๐‚ฆ": 32192,
131
+ "๐‚ง": 32140,
132
+ "๐‚จ": 32164,
133
+ "๐‚ฉ": 32115,
134
+ "๐‚ช": 32214,
135
+ "๐‚ซ": 32231,
136
+ "๐‚ฌ": 32232,
137
+ "๐‚ญ": 32288,
138
+ "๐‚ฎ": 32101,
139
+ "๐‚ฏ": 32206,
140
+ "๐‚ฐ": 32264,
141
+ "๐‚ฑ": 32172,
142
+ "๐‚ฒ": 32212,
143
+ "๐‚ณ": 32268,
144
+ "๐‚ด": 32133,
145
+ "๐‚ต": 32112,
146
+ "๐‚ถ": 32127,
147
+ "๐‚ท": 32257,
148
+ "๐‚ธ": 32242,
149
+ "๐‚น": 32313,
150
+ "๐‚บ": 32142,
151
+ "๐‚ป": 32138,
152
+ "๐‚ผ": 32175,
153
+ "๐‚ฝ": 32230,
154
+ "๐‚พ": 32273,
155
+ "๐‚ฟ": 32240,
156
+ "๐ƒ€": 32109,
157
+ "๐ƒ": 32344,
158
+ "๐ƒ‚": 32105,
159
+ "๐ƒ„": 32149,
160
+ "๐ƒ†": 32216,
161
+ "๐ƒ‡": 32263,
162
+ "๐ƒˆ": 32312,
163
+ "๐ƒ‰": 32125,
164
+ "๐ƒŠ": 32221,
165
+ "๐ƒŒ": 32318,
166
+ "๐ƒ": 32213,
167
+ "๐ƒŽ": 32239,
168
+ "๐ƒ": 32335,
169
+ "๐ƒ": 32290,
170
+ "๐ƒ‘": 32197,
171
+ "๐ƒ“": 32100,
172
+ "๐ƒ”": 32161,
173
+ "๐ƒ•": 32207,
174
+ "๐ƒ—": 32251,
175
+ "๐ƒ™": 32267,
176
+ "๐ƒš": 32226,
177
+ "๐ƒ›": 32272,
178
+ "๐ƒœ": 32224,
179
+ "๐ƒ": 32298,
180
+ "๐ƒž": 32170,
181
+ "๐ƒŸ": 32339,
182
+ "๐ƒ ": 32166,
183
+ "๐ƒก": 32107,
184
+ "๐ƒข": 32271,
185
+ "๐ƒฃ": 32317,
186
+ "๐ƒค": 32135,
187
+ "๐ƒฅ": 32309,
188
+ "๐ƒฆ": 32252,
189
+ "๐ƒง": 32237,
190
+ "๐ƒจ": 32194,
191
+ "๐ƒฉ": 32177,
192
+ "๐ƒช": 32185,
193
+ "๐ƒซ": 32223,
194
+ "๐ƒฌ": 32269,
195
+ "๐ƒญ": 32189,
196
+ "๐ƒฎ": 32150,
197
+ "๐ƒฏ": 32167,
198
+ "๐ƒฐ": 32106,
199
+ "๐ƒฑ": 32222,
200
+ "๐ƒฒ": 32153,
201
+ "๐ƒณ": 32121,
202
+ "๐ƒด": 32208,
203
+ "๐ƒต": 32345,
204
+ "๐ƒถ": 32265,
205
+ "๐ƒท": 32126,
206
+ "๐ƒธ": 32198,
207
+ "๐ƒน": 32131,
208
+ "๐„ˆ": 32280,
209
+ "๐„‰": 32286,
210
+ "๐„Š": 32342,
211
+ "๐„‹": 32285,
212
+ "๐„Œ": 32217,
213
+ "๐„": 32259,
214
+ "๐„Ž": 32256,
215
+ "๐„": 32340,
216
+ "๐„": 32120,
217
+ "๐„‘": 32188,
218
+ "๐„’": 32260,
219
+ "๐„“": 32147,
220
+ "๐„”": 32119,
221
+ "๐„•": 32308,
222
+ "๐„–": 32160,
223
+ "๐„—": 32337,
224
+ "๐„˜": 32176,
225
+ "๐„™": 32294,
226
+ "๐„š": 32289,
227
+ "๐„›": 32319,
228
+ "๐„œ": 32159,
229
+ "๐„": 32200,
230
+ "๐„ž": 32244,
231
+ "๐„Ÿ": 32156,
232
+ "๐„ก": 32130,
233
+ "๐„ข": 32314,
234
+ "๐„ฃ": 32324,
235
+ "๐„ค": 32108,
236
+ "๐„ฅ": 32343,
237
+ "๐„ง": 32158,
238
+ "๐„ช": 32307,
239
+ "๐„ซ": 32169,
240
+ "๐„ท": 32145,
241
+ "๐„ธ": 32262,
242
+ "๐„น": 32279,
243
+ "๐„บ": 32146,
244
+ "๐„ผ": 32148,
245
+ "๐„ฝ": 32278,
246
+ "๐„พ": 32241,
247
+ "๐„ฟ": 32303
248
  }
config.json CHANGED
@@ -1,5 +1,5 @@
1
  {
2
- "_name_or_path": "/Users/lee/GitHub/results/HIT-T5/train_1/checkpoint-5875",
3
  "architectures": [
4
  "T5ForConditionalGeneration"
5
  ],
@@ -57,5 +57,5 @@
57
  "torch_dtype": "float32",
58
  "transformers_version": "4.44.0.dev0",
59
  "use_cache": true,
60
- "vocab_size": 32125
61
  }
 
1
  {
2
+ "_name_or_path": "/Users/lee/GitHub/results/GMY-T5/train_1/checkpoint-22831",
3
  "architectures": [
4
  "T5ForConditionalGeneration"
5
  ],
 
57
  "torch_dtype": "float32",
58
  "transformers_version": "4.44.0.dev0",
59
  "use_cache": true,
60
+ "vocab_size": 32346
61
  }
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c264eeb9f12489cb48bd49ed69bfba358cad96d942dfef553df30e9833c465ad
3
- size 891635496
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:775f88e543813d588848756191faf45933a549fc9179a682de772be4a21afae7
3
+ size 892314408
runs/Feb07_04-32-52_Lees-MacBook-Pro.local/events.out.tfevents.1738927972.Lees-MacBook-Pro.local ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:942b1f04bdab5b1b528a3aae69faf6574a62dc03269cf1adc17081a3dc5fe63b
3
+ size 15801
special_tokens_map.json CHANGED
@@ -101,7 +101,25 @@
101
  "<extra_id_98>",
102
  "<extra_id_99>"
103
  ],
104
- "eos_token": "</s>",
105
- "pad_token": "<pad>",
106
- "unk_token": "<unk>"
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
107
  }
 
101
  "<extra_id_98>",
102
  "<extra_id_99>"
103
  ],
104
+ "eos_token": {
105
+ "content": "</s>",
106
+ "lstrip": false,
107
+ "normalized": false,
108
+ "rstrip": false,
109
+ "single_word": false
110
+ },
111
+ "pad_token": {
112
+ "content": "<pad>",
113
+ "lstrip": false,
114
+ "normalized": false,
115
+ "rstrip": false,
116
+ "single_word": false
117
+ },
118
+ "unk_token": {
119
+ "content": "<unk>",
120
+ "lstrip": false,
121
+ "normalized": false,
122
+ "rstrip": false,
123
+ "single_word": false
124
+ }
125
  }
tokenizer.json CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:fab1cdd3cf5f0f65cc1647be02cbcf585afe3d843684e73caadae054d39c5a58
3
- size 2426650
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a4d3f7b0755307dea535dfe79c9df3f0810c6792c1b19e60aa79c12b0513d5e4
3
+ size 2466441
tokenizer_config.json CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:05509d70d28d3db8681d538447fec4a0890d35edf606f27f4b23c6507cd42ccb
3
- size 25005
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f955f64689f3aefc3b7074ccae4f46f2b231d2cc9b544465bbfaf2c376e3b689
3
+ size 62605
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2edd421734d0d356b12d24edacc16024cec326606a2aa9dd0bd3205b0185c9f2
3
  size 5432
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2d8448f9ced35d49c60331bf55d861a0d6b81145453f8a78f002ad520788632a
3
  size 5432