sumuks commited on
Commit
321170b
·
verified ·
1 Parent(s): bf6ef4a

Training in progress, step 1500

Browse files
Files changed (2) hide show
  1. adapter_model.safetensors +1 -1
  2. trainer_log.jsonl +51 -0
adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5e94b87a58ad23a41943016a5384a0c5eea2b7a27c9024ce7df4f5ac4d217a6a
3
  size 645976488
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:474afdde13b45825aaa1e00f7ef60f5109d1cc33fdd07da07dfbb299b2104720
3
  size 645976488
trainer_log.jsonl CHANGED
@@ -99,3 +99,54 @@
99
  {"current_steps": 980, "total_steps": 1770, "loss": 1.6289, "lr": 2.467953871623073e-05, "epoch": 1.6610169491525424, "percentage": 55.37, "elapsed_time": "0:33:46", "remaining_time": "0:27:13"}
100
  {"current_steps": 990, "total_steps": 1770, "loss": 1.6339, "lr": 2.4186642632977697e-05, "epoch": 1.6779661016949152, "percentage": 55.93, "elapsed_time": "0:34:06", "remaining_time": "0:26:52"}
101
  {"current_steps": 1000, "total_steps": 1770, "loss": 1.6172, "lr": 2.3694062876185738e-05, "epoch": 1.694915254237288, "percentage": 56.5, "elapsed_time": "0:34:26", "remaining_time": "0:26:31"}
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
99
  {"current_steps": 980, "total_steps": 1770, "loss": 1.6289, "lr": 2.467953871623073e-05, "epoch": 1.6610169491525424, "percentage": 55.37, "elapsed_time": "0:33:46", "remaining_time": "0:27:13"}
100
  {"current_steps": 990, "total_steps": 1770, "loss": 1.6339, "lr": 2.4186642632977697e-05, "epoch": 1.6779661016949152, "percentage": 55.93, "elapsed_time": "0:34:06", "remaining_time": "0:26:52"}
101
  {"current_steps": 1000, "total_steps": 1770, "loss": 1.6172, "lr": 2.3694062876185738e-05, "epoch": 1.694915254237288, "percentage": 56.5, "elapsed_time": "0:34:26", "remaining_time": "0:26:31"}
102
+ {"current_steps": 1010, "total_steps": 1770, "loss": 1.6169, "lr": 2.3201991017257007e-05, "epoch": 1.711864406779661, "percentage": 57.06, "elapsed_time": "0:35:11", "remaining_time": "0:26:28"}
103
+ {"current_steps": 1020, "total_steps": 1770, "loss": 1.6156, "lr": 2.2710618430064843e-05, "epoch": 1.7288135593220337, "percentage": 57.63, "elapsed_time": "0:35:31", "remaining_time": "0:26:07"}
104
+ {"current_steps": 1030, "total_steps": 1770, "loss": 1.6348, "lr": 2.222013621652565e-05, "epoch": 1.7457627118644068, "percentage": 58.19, "elapsed_time": "0:35:51", "remaining_time": "0:25:45"}
105
+ {"current_steps": 1040, "total_steps": 1770, "loss": 1.6162, "lr": 2.173073513227667e-05, "epoch": 1.7627118644067796, "percentage": 58.76, "elapsed_time": "0:36:12", "remaining_time": "0:25:24"}
106
+ {"current_steps": 1050, "total_steps": 1770, "loss": 1.6162, "lr": 2.1242605512488248e-05, "epoch": 1.7796610169491527, "percentage": 59.32, "elapsed_time": "0:36:32", "remaining_time": "0:25:03"}
107
+ {"current_steps": 1060, "total_steps": 1770, "loss": 1.6146, "lr": 2.0755937197839802e-05, "epoch": 1.7966101694915255, "percentage": 59.89, "elapsed_time": "0:36:52", "remaining_time": "0:24:42"}
108
+ {"current_steps": 1070, "total_steps": 1770, "loss": 1.6178, "lr": 2.0270919460688055e-05, "epoch": 1.8135593220338984, "percentage": 60.45, "elapsed_time": "0:37:13", "remaining_time": "0:24:21"}
109
+ {"current_steps": 1080, "total_steps": 1770, "loss": 1.6287, "lr": 1.9787740931456165e-05, "epoch": 1.8305084745762712, "percentage": 61.02, "elapsed_time": "0:37:33", "remaining_time": "0:23:59"}
110
+ {"current_steps": 1090, "total_steps": 1770, "loss": 1.6348, "lr": 1.9306589525272756e-05, "epoch": 1.847457627118644, "percentage": 61.58, "elapsed_time": "0:37:54", "remaining_time": "0:23:38"}
111
+ {"current_steps": 1100, "total_steps": 1770, "loss": 1.6295, "lr": 1.8827652368888888e-05, "epoch": 1.8644067796610169, "percentage": 62.15, "elapsed_time": "0:38:14", "remaining_time": "0:23:17"}
112
+ {"current_steps": 1110, "total_steps": 1770, "loss": 1.629, "lr": 1.835111572790183e-05, "epoch": 1.8813559322033897, "percentage": 62.71, "elapsed_time": "0:38:34", "remaining_time": "0:22:56"}
113
+ {"current_steps": 1120, "total_steps": 1770, "loss": 1.6127, "lr": 1.7877164934313628e-05, "epoch": 1.8983050847457628, "percentage": 63.28, "elapsed_time": "0:38:55", "remaining_time": "0:22:35"}
114
+ {"current_steps": 1130, "total_steps": 1770, "loss": 1.6345, "lr": 1.740598431445282e-05, "epoch": 1.9152542372881356, "percentage": 63.84, "elapsed_time": "0:39:15", "remaining_time": "0:22:14"}
115
+ {"current_steps": 1140, "total_steps": 1770, "loss": 1.6291, "lr": 1.6937757117287278e-05, "epoch": 1.9322033898305084, "percentage": 64.41, "elapsed_time": "0:39:36", "remaining_time": "0:21:53"}
116
+ {"current_steps": 1150, "total_steps": 1770, "loss": 1.6311, "lr": 1.6472665443155983e-05, "epoch": 1.9491525423728815, "percentage": 64.97, "elapsed_time": "0:39:56", "remaining_time": "0:21:32"}
117
+ {"current_steps": 1160, "total_steps": 1770, "loss": 1.6082, "lr": 1.6010890172947606e-05, "epoch": 1.9661016949152543, "percentage": 65.54, "elapsed_time": "0:40:16", "remaining_time": "0:21:10"}
118
+ {"current_steps": 1170, "total_steps": 1770, "loss": 1.6266, "lr": 1.5552610897753292e-05, "epoch": 1.9830508474576272, "percentage": 66.1, "elapsed_time": "0:40:37", "remaining_time": "0:20:49"}
119
+ {"current_steps": 1180, "total_steps": 1770, "loss": 1.6265, "lr": 1.509800584902108e-05, "epoch": 2.0, "percentage": 66.67, "elapsed_time": "0:40:57", "remaining_time": "0:20:28"}
120
+ {"current_steps": 1190, "total_steps": 1770, "loss": 1.5776, "lr": 1.4647251829239139e-05, "epoch": 2.016949152542373, "percentage": 67.23, "elapsed_time": "0:41:17", "remaining_time": "0:20:07"}
121
+ {"current_steps": 1200, "total_steps": 1770, "loss": 1.5922, "lr": 1.4200524143174677e-05, "epoch": 2.0338983050847457, "percentage": 67.8, "elapsed_time": "0:41:38", "remaining_time": "0:19:46"}
122
+ {"current_steps": 1200, "total_steps": 1770, "eval_loss": 1.6305924654006958, "epoch": 2.0338983050847457, "percentage": 67.8, "elapsed_time": "0:41:42", "remaining_time": "0:19:48"}
123
+ {"current_steps": 1210, "total_steps": 1770, "loss": 1.5948, "lr": 1.3757996529695411e-05, "epoch": 2.0508474576271185, "percentage": 68.36, "elapsed_time": "0:42:02", "remaining_time": "0:19:27"}
124
+ {"current_steps": 1220, "total_steps": 1770, "loss": 1.5884, "lr": 1.331984109420001e-05, "epoch": 2.0677966101694913, "percentage": 68.93, "elapsed_time": "0:42:23", "remaining_time": "0:19:06"}
125
+ {"current_steps": 1230, "total_steps": 1770, "loss": 1.6067, "lr": 1.2886228241683749e-05, "epoch": 2.084745762711864, "percentage": 69.49, "elapsed_time": "0:42:43", "remaining_time": "0:18:45"}
126
+ {"current_steps": 1240, "total_steps": 1770, "loss": 1.6103, "lr": 1.2457326610465642e-05, "epoch": 2.1016949152542375, "percentage": 70.06, "elapsed_time": "0:43:03", "remaining_time": "0:18:24"}
127
+ {"current_steps": 1250, "total_steps": 1770, "loss": 1.5979, "lr": 1.2033303006602444e-05, "epoch": 2.1186440677966103, "percentage": 70.62, "elapsed_time": "0:43:24", "remaining_time": "0:18:03"}
128
+ {"current_steps": 1260, "total_steps": 1770, "loss": 1.5786, "lr": 1.1614322339015484e-05, "epoch": 2.135593220338983, "percentage": 71.19, "elapsed_time": "0:43:44", "remaining_time": "0:17:42"}
129
+ {"current_steps": 1270, "total_steps": 1770, "loss": 1.5903, "lr": 1.1200547555355067e-05, "epoch": 2.152542372881356, "percentage": 71.75, "elapsed_time": "0:44:04", "remaining_time": "0:17:21"}
130
+ {"current_steps": 1280, "total_steps": 1770, "loss": 1.5913, "lr": 1.0792139578627865e-05, "epoch": 2.169491525423729, "percentage": 72.32, "elapsed_time": "0:44:25", "remaining_time": "0:17:00"}
131
+ {"current_steps": 1290, "total_steps": 1770, "loss": 1.592, "lr": 1.0389257244611602e-05, "epoch": 2.1864406779661016, "percentage": 72.88, "elapsed_time": "0:44:45", "remaining_time": "0:16:39"}
132
+ {"current_steps": 1300, "total_steps": 1770, "loss": 1.5968, "lr": 9.992057240081487e-06, "epoch": 2.2033898305084745, "percentage": 73.45, "elapsed_time": "0:45:06", "remaining_time": "0:16:18"}
133
+ {"current_steps": 1310, "total_steps": 1770, "loss": 1.5893, "lr": 9.600694041872518e-06, "epoch": 2.2203389830508473, "percentage": 74.01, "elapsed_time": "0:45:26", "remaining_time": "0:15:57"}
134
+ {"current_steps": 1320, "total_steps": 1770, "loss": 1.5861, "lr": 9.215319856801158e-06, "epoch": 2.23728813559322, "percentage": 74.58, "elapsed_time": "0:45:46", "remaining_time": "0:15:36"}
135
+ {"current_steps": 1330, "total_steps": 1770, "loss": 1.606, "lr": 8.836084562469921e-06, "epoch": 2.2542372881355934, "percentage": 75.14, "elapsed_time": "0:46:07", "remaining_time": "0:15:15"}
136
+ {"current_steps": 1340, "total_steps": 1770, "loss": 1.5911, "lr": 8.463135648977773e-06, "epoch": 2.2711864406779663, "percentage": 75.71, "elapsed_time": "0:46:27", "remaining_time": "0:14:54"}
137
+ {"current_steps": 1350, "total_steps": 1770, "loss": 1.5832, "lr": 8.096618161559142e-06, "epoch": 2.288135593220339, "percentage": 76.27, "elapsed_time": "0:46:47", "remaining_time": "0:14:33"}
138
+ {"current_steps": 1360, "total_steps": 1770, "loss": 1.5868, "lr": 7.736674644173695e-06, "epoch": 2.305084745762712, "percentage": 76.84, "elapsed_time": "0:47:08", "remaining_time": "0:14:12"}
139
+ {"current_steps": 1370, "total_steps": 1770, "loss": 1.5788, "lr": 7.383445084068907e-06, "epoch": 2.3220338983050848, "percentage": 77.4, "elapsed_time": "0:47:28", "remaining_time": "0:13:51"}
140
+ {"current_steps": 1380, "total_steps": 1770, "loss": 1.5769, "lr": 7.037066857337058e-06, "epoch": 2.3389830508474576, "percentage": 77.97, "elapsed_time": "0:47:48", "remaining_time": "0:13:30"}
141
+ {"current_steps": 1390, "total_steps": 1770, "loss": 1.5676, "lr": 6.69767467548762e-06, "epoch": 2.3559322033898304, "percentage": 78.53, "elapsed_time": "0:48:09", "remaining_time": "0:13:09"}
142
+ {"current_steps": 1400, "total_steps": 1770, "loss": 1.5896, "lr": 6.365400533056012e-06, "epoch": 2.3728813559322033, "percentage": 79.1, "elapsed_time": "0:48:29", "remaining_time": "0:12:48"}
143
+ {"current_steps": 1410, "total_steps": 1770, "loss": 1.5698, "lr": 6.040373656269041e-06, "epoch": 2.389830508474576, "percentage": 79.66, "elapsed_time": "0:48:49", "remaining_time": "0:12:28"}
144
+ {"current_steps": 1420, "total_steps": 1770, "loss": 1.5881, "lr": 5.722720452786928e-06, "epoch": 2.406779661016949, "percentage": 80.23, "elapsed_time": "0:49:10", "remaining_time": "0:12:07"}
145
+ {"current_steps": 1430, "total_steps": 1770, "loss": 1.5864, "lr": 5.412564462541544e-06, "epoch": 2.423728813559322, "percentage": 80.79, "elapsed_time": "0:49:30", "remaining_time": "0:11:46"}
146
+ {"current_steps": 1440, "total_steps": 1770, "loss": 1.592, "lr": 5.110026309689922e-06, "epoch": 2.440677966101695, "percentage": 81.36, "elapsed_time": "0:49:50", "remaining_time": "0:11:25"}
147
+ {"current_steps": 1450, "total_steps": 1770, "loss": 1.5912, "lr": 4.815223655701812e-06, "epoch": 2.457627118644068, "percentage": 81.92, "elapsed_time": "0:50:11", "remaining_time": "0:11:04"}
148
+ {"current_steps": 1460, "total_steps": 1770, "loss": 1.5732, "lr": 4.5282711535994115e-06, "epoch": 2.4745762711864407, "percentage": 82.49, "elapsed_time": "0:50:31", "remaining_time": "0:10:43"}
149
+ {"current_steps": 1470, "total_steps": 1770, "loss": 1.5994, "lr": 4.2492804033671145e-06, "epoch": 2.4915254237288136, "percentage": 83.05, "elapsed_time": "0:50:51", "remaining_time": "0:10:22"}
150
+ {"current_steps": 1480, "total_steps": 1770, "loss": 1.5906, "lr": 3.978359908548746e-06, "epoch": 2.5084745762711864, "percentage": 83.62, "elapsed_time": "0:51:12", "remaining_time": "0:10:01"}
151
+ {"current_steps": 1490, "total_steps": 1770, "loss": 1.593, "lr": 3.71561503404885e-06, "epoch": 2.5254237288135593, "percentage": 84.18, "elapsed_time": "0:51:32", "remaining_time": "0:09:41"}
152
+ {"current_steps": 1500, "total_steps": 1770, "loss": 1.6067, "lr": 3.4611479651548457e-06, "epoch": 2.542372881355932, "percentage": 84.75, "elapsed_time": "0:51:52", "remaining_time": "0:09:20"}