sumuks committed on
Commit
bf6ef4a
·
verified ·
1 Parent(s): 3f4d53f

Training in progress, step 1000

Browse files
Files changed (2) hide show
  1. adapter_model.safetensors +1 -1
  2. trainer_log.jsonl +51 -0
adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f509c157b1a48dbcfe3c6436b6488702ec21e641507c405cbe8ef94110a6dc36
3
  size 645976488
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5e94b87a58ad23a41943016a5384a0c5eea2b7a27c9024ce7df4f5ac4d217a6a
3
  size 645976488
trainer_log.jsonl CHANGED
@@ -48,3 +48,54 @@
48
  {"current_steps": 480, "total_steps": 1770, "loss": 1.6888, "lr": 4.5667864871793345e-05, "epoch": 0.8135593220338984, "percentage": 27.12, "elapsed_time": "0:16:18", "remaining_time": "0:43:49"}
49
  {"current_steps": 490, "total_steps": 1770, "loss": 1.6675, "lr": 4.538647406141308e-05, "epoch": 0.8305084745762712, "percentage": 27.68, "elapsed_time": "0:16:38", "remaining_time": "0:43:29"}
50
  {"current_steps": 500, "total_steps": 1770, "loss": 1.6828, "lr": 4.509715465598344e-05, "epoch": 0.847457627118644, "percentage": 28.25, "elapsed_time": "0:16:59", "remaining_time": "0:43:08"}
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
48
  {"current_steps": 480, "total_steps": 1770, "loss": 1.6888, "lr": 4.5667864871793345e-05, "epoch": 0.8135593220338984, "percentage": 27.12, "elapsed_time": "0:16:18", "remaining_time": "0:43:49"}
49
  {"current_steps": 490, "total_steps": 1770, "loss": 1.6675, "lr": 4.538647406141308e-05, "epoch": 0.8305084745762712, "percentage": 27.68, "elapsed_time": "0:16:38", "remaining_time": "0:43:29"}
50
  {"current_steps": 500, "total_steps": 1770, "loss": 1.6828, "lr": 4.509715465598344e-05, "epoch": 0.847457627118644, "percentage": 28.25, "elapsed_time": "0:16:59", "remaining_time": "0:43:08"}
51
+ {"current_steps": 510, "total_steps": 1770, "loss": 1.6713, "lr": 4.480001917601185e-05, "epoch": 0.864406779661017, "percentage": 28.81, "elapsed_time": "0:17:43", "remaining_time": "0:43:47"}
52
+ {"current_steps": 520, "total_steps": 1770, "loss": 1.6544, "lr": 4.449518318179029e-05, "epoch": 0.8813559322033898, "percentage": 29.38, "elapsed_time": "0:18:03", "remaining_time": "0:43:25"}
53
+ {"current_steps": 530, "total_steps": 1770, "loss": 1.6679, "lr": 4.418276522845231e-05, "epoch": 0.8983050847457628, "percentage": 29.94, "elapsed_time": "0:18:24", "remaining_time": "0:43:03"}
54
+ {"current_steps": 540, "total_steps": 1770, "loss": 1.6704, "lr": 4.386288681986516e-05, "epoch": 0.9152542372881356, "percentage": 30.51, "elapsed_time": "0:18:44", "remaining_time": "0:42:41"}
55
+ {"current_steps": 550, "total_steps": 1770, "loss": 1.6759, "lr": 4.353567236137521e-05, "epoch": 0.9322033898305084, "percentage": 31.07, "elapsed_time": "0:19:05", "remaining_time": "0:42:20"}
56
+ {"current_steps": 560, "total_steps": 1770, "loss": 1.6617, "lr": 4.3201249111424877e-05, "epoch": 0.9491525423728814, "percentage": 31.64, "elapsed_time": "0:19:25", "remaining_time": "0:41:58"}
57
+ {"current_steps": 570, "total_steps": 1770, "loss": 1.6632, "lr": 4.2859747132060006e-05, "epoch": 0.9661016949152542, "percentage": 32.2, "elapsed_time": "0:19:45", "remaining_time": "0:41:36"}
58
+ {"current_steps": 580, "total_steps": 1770, "loss": 1.6841, "lr": 4.251129923834685e-05, "epoch": 0.9830508474576272, "percentage": 32.77, "elapsed_time": "0:20:06", "remaining_time": "0:41:15"}
59
+ {"current_steps": 590, "total_steps": 1770, "loss": 1.6448, "lr": 4.215604094671835e-05, "epoch": 1.0, "percentage": 33.33, "elapsed_time": "0:20:26", "remaining_time": "0:40:53"}
60
+ {"current_steps": 600, "total_steps": 1770, "loss": 1.6261, "lr": 4.1794110422269825e-05, "epoch": 1.0169491525423728, "percentage": 33.9, "elapsed_time": "0:20:47", "remaining_time": "0:40:31"}
61
+ {"current_steps": 600, "total_steps": 1770, "eval_loss": 1.6485204696655273, "epoch": 1.0169491525423728, "percentage": 33.9, "elapsed_time": "0:20:51", "remaining_time": "0:40:40"}
62
+ {"current_steps": 610, "total_steps": 1770, "loss": 1.6501, "lr": 4.142564842502461e-05, "epoch": 1.0338983050847457, "percentage": 34.46, "elapsed_time": "0:21:11", "remaining_time": "0:40:18"}
63
+ {"current_steps": 620, "total_steps": 1770, "loss": 1.6435, "lr": 4.1050798255190405e-05, "epoch": 1.0508474576271187, "percentage": 35.03, "elapsed_time": "0:21:32", "remaining_time": "0:39:57"}
64
+ {"current_steps": 630, "total_steps": 1770, "loss": 1.6567, "lr": 4.0669705697427754e-05, "epoch": 1.0677966101694916, "percentage": 35.59, "elapsed_time": "0:21:52", "remaining_time": "0:39:35"}
65
+ {"current_steps": 640, "total_steps": 1770, "loss": 1.6527, "lr": 4.0282518964152296e-05, "epoch": 1.0847457627118644, "percentage": 36.16, "elapsed_time": "0:22:13", "remaining_time": "0:39:13"}
66
+ {"current_steps": 650, "total_steps": 1770, "loss": 1.6408, "lr": 3.988938863789278e-05, "epoch": 1.1016949152542372, "percentage": 36.72, "elapsed_time": "0:22:33", "remaining_time": "0:38:52"}
67
+ {"current_steps": 660, "total_steps": 1770, "loss": 1.6441, "lr": 3.949046761272736e-05, "epoch": 1.11864406779661, "percentage": 37.29, "elapsed_time": "0:22:53", "remaining_time": "0:38:30"}
68
+ {"current_steps": 670, "total_steps": 1770, "loss": 1.6454, "lr": 3.908591103482088e-05, "epoch": 1.1355932203389831, "percentage": 37.85, "elapsed_time": "0:23:14", "remaining_time": "0:38:09"}
69
+ {"current_steps": 680, "total_steps": 1770, "loss": 1.6689, "lr": 3.867587624208627e-05, "epoch": 1.152542372881356, "percentage": 38.42, "elapsed_time": "0:23:34", "remaining_time": "0:37:47"}
70
+ {"current_steps": 690, "total_steps": 1770, "loss": 1.6475, "lr": 3.826052270299356e-05, "epoch": 1.1694915254237288, "percentage": 38.98, "elapsed_time": "0:23:55", "remaining_time": "0:37:26"}
71
+ {"current_steps": 700, "total_steps": 1770, "loss": 1.6469, "lr": 3.784001195455027e-05, "epoch": 1.1864406779661016, "percentage": 39.55, "elapsed_time": "0:24:15", "remaining_time": "0:37:04"}
72
+ {"current_steps": 710, "total_steps": 1770, "loss": 1.6335, "lr": 3.7414507539477315e-05, "epoch": 1.2033898305084745, "percentage": 40.11, "elapsed_time": "0:24:35", "remaining_time": "0:36:43"}
73
+ {"current_steps": 720, "total_steps": 1770, "loss": 1.6289, "lr": 3.698417494260494e-05, "epoch": 1.2203389830508475, "percentage": 40.68, "elapsed_time": "0:24:56", "remaining_time": "0:36:22"}
74
+ {"current_steps": 730, "total_steps": 1770, "loss": 1.6428, "lr": 3.654918152651319e-05, "epoch": 1.2372881355932204, "percentage": 41.24, "elapsed_time": "0:25:16", "remaining_time": "0:36:00"}
75
+ {"current_steps": 740, "total_steps": 1770, "loss": 1.6592, "lr": 3.610969646644222e-05, "epoch": 1.2542372881355932, "percentage": 41.81, "elapsed_time": "0:25:37", "remaining_time": "0:35:39"}
76
+ {"current_steps": 750, "total_steps": 1770, "loss": 1.6251, "lr": 3.566589068449761e-05, "epoch": 1.271186440677966, "percentage": 42.37, "elapsed_time": "0:25:57", "remaining_time": "0:35:18"}
77
+ {"current_steps": 760, "total_steps": 1770, "loss": 1.6708, "lr": 3.5217936783176216e-05, "epoch": 1.288135593220339, "percentage": 42.94, "elapsed_time": "0:26:17", "remaining_time": "0:34:57"}
78
+ {"current_steps": 770, "total_steps": 1770, "loss": 1.6334, "lr": 3.476600897823864e-05, "epoch": 1.305084745762712, "percentage": 43.5, "elapsed_time": "0:26:38", "remaining_time": "0:34:35"}
79
+ {"current_steps": 780, "total_steps": 1770, "loss": 1.6475, "lr": 3.431028303095415e-05, "epoch": 1.3220338983050848, "percentage": 44.07, "elapsed_time": "0:26:58", "remaining_time": "0:34:14"}
80
+ {"current_steps": 790, "total_steps": 1770, "loss": 1.6418, "lr": 3.385093617974458e-05, "epoch": 1.3389830508474576, "percentage": 44.63, "elapsed_time": "0:27:19", "remaining_time": "0:33:53"}
81
+ {"current_steps": 800, "total_steps": 1770, "loss": 1.6296, "lr": 3.338814707125377e-05, "epoch": 1.3559322033898304, "percentage": 45.2, "elapsed_time": "0:27:39", "remaining_time": "0:33:32"}
82
+ {"current_steps": 810, "total_steps": 1770, "loss": 1.636, "lr": 3.2922095690869224e-05, "epoch": 1.3728813559322033, "percentage": 45.76, "elapsed_time": "0:27:59", "remaining_time": "0:33:10"}
83
+ {"current_steps": 820, "total_steps": 1770, "loss": 1.6156, "lr": 3.2452963292723305e-05, "epoch": 1.3898305084745763, "percentage": 46.33, "elapsed_time": "0:28:20", "remaining_time": "0:32:49"}
84
+ {"current_steps": 830, "total_steps": 1770, "loss": 1.6474, "lr": 3.1980932329200756e-05, "epoch": 1.4067796610169492, "percentage": 46.89, "elapsed_time": "0:28:40", "remaining_time": "0:32:28"}
85
+ {"current_steps": 840, "total_steps": 1770, "loss": 1.6356, "lr": 3.150618637998041e-05, "epoch": 1.423728813559322, "percentage": 47.46, "elapsed_time": "0:29:01", "remaining_time": "0:32:07"}
86
+ {"current_steps": 850, "total_steps": 1770, "loss": 1.6396, "lr": 3.1028910080638354e-05, "epoch": 1.4406779661016949, "percentage": 48.02, "elapsed_time": "0:29:21", "remaining_time": "0:31:46"}
87
+ {"current_steps": 860, "total_steps": 1770, "loss": 1.6402, "lr": 3.054928905084049e-05, "epoch": 1.457627118644068, "percentage": 48.59, "elapsed_time": "0:29:41", "remaining_time": "0:31:25"}
88
+ {"current_steps": 870, "total_steps": 1770, "loss": 1.6282, "lr": 3.006750982215234e-05, "epoch": 1.4745762711864407, "percentage": 49.15, "elapsed_time": "0:30:02", "remaining_time": "0:31:04"}
89
+ {"current_steps": 880, "total_steps": 1770, "loss": 1.6402, "lr": 2.9583759765494267e-05, "epoch": 1.4915254237288136, "percentage": 49.72, "elapsed_time": "0:30:22", "remaining_time": "0:30:43"}
90
+ {"current_steps": 890, "total_steps": 1770, "loss": 1.6392, "lr": 2.9098227018270134e-05, "epoch": 1.5084745762711864, "percentage": 50.28, "elapsed_time": "0:30:42", "remaining_time": "0:30:22"}
91
+ {"current_steps": 900, "total_steps": 1770, "loss": 1.6472, "lr": 2.8611100411198037e-05, "epoch": 1.5254237288135593, "percentage": 50.85, "elapsed_time": "0:31:03", "remaining_time": "0:30:01"}
92
+ {"current_steps": 910, "total_steps": 1770, "loss": 1.6215, "lr": 2.8122569394871225e-05, "epoch": 1.542372881355932, "percentage": 51.41, "elapsed_time": "0:31:23", "remaining_time": "0:29:40"}
93
+ {"current_steps": 920, "total_steps": 1770, "loss": 1.6313, "lr": 2.763282396607803e-05, "epoch": 1.559322033898305, "percentage": 51.98, "elapsed_time": "0:31:43", "remaining_time": "0:29:19"}
94
+ {"current_steps": 930, "total_steps": 1770, "loss": 1.6452, "lr": 2.7142054593909422e-05, "epoch": 1.576271186440678, "percentage": 52.54, "elapsed_time": "0:32:04", "remaining_time": "0:28:58"}
95
+ {"current_steps": 940, "total_steps": 1770, "loss": 1.6386, "lr": 2.6650452145682762e-05, "epoch": 1.5932203389830508, "percentage": 53.11, "elapsed_time": "0:32:24", "remaining_time": "0:28:37"}
96
+ {"current_steps": 950, "total_steps": 1770, "loss": 1.6301, "lr": 2.615820781271075e-05, "epoch": 1.6101694915254239, "percentage": 53.67, "elapsed_time": "0:32:45", "remaining_time": "0:28:16"}
97
+ {"current_steps": 960, "total_steps": 1770, "loss": 1.6247, "lr": 2.566551303594437e-05, "epoch": 1.6271186440677967, "percentage": 54.24, "elapsed_time": "0:33:05", "remaining_time": "0:27:55"}
98
+ {"current_steps": 970, "total_steps": 1770, "loss": 1.6387, "lr": 2.5172559431518727e-05, "epoch": 1.6440677966101696, "percentage": 54.8, "elapsed_time": "0:33:25", "remaining_time": "0:27:34"}
99
+ {"current_steps": 980, "total_steps": 1770, "loss": 1.6289, "lr": 2.467953871623073e-05, "epoch": 1.6610169491525424, "percentage": 55.37, "elapsed_time": "0:33:46", "remaining_time": "0:27:13"}
100
+ {"current_steps": 990, "total_steps": 1770, "loss": 1.6339, "lr": 2.4186642632977697e-05, "epoch": 1.6779661016949152, "percentage": 55.93, "elapsed_time": "0:34:06", "remaining_time": "0:26:52"}
101
+ {"current_steps": 1000, "total_steps": 1770, "loss": 1.6172, "lr": 2.3694062876185738e-05, "epoch": 1.694915254237288, "percentage": 56.5, "elapsed_time": "0:34:26", "remaining_time": "0:26:31"}