Upload folder using huggingface_hub
Browse filesThis view is limited to 50 files because it contains too many changes.
See raw diff
- added_tokens.json +24 -0
- checkpoint-10000/added_tokens.json +24 -0
- checkpoint-10000/config.json +203 -0
- checkpoint-10000/generation_config.json +14 -0
- checkpoint-10000/global_step10000/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt +3 -0
- checkpoint-10000/global_step10000/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt +3 -0
- checkpoint-10000/global_step10000/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt +3 -0
- checkpoint-10000/global_step10000/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt +3 -0
- checkpoint-10000/global_step10000/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt +3 -0
- checkpoint-10000/global_step10000/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt +3 -0
- checkpoint-10000/global_step10000/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt +3 -0
- checkpoint-10000/global_step10000/bf16_zero_pp_rank_16_mp_rank_00_optim_states.pt +3 -0
- checkpoint-10000/global_step10000/bf16_zero_pp_rank_17_mp_rank_00_optim_states.pt +3 -0
- checkpoint-10000/global_step10000/bf16_zero_pp_rank_18_mp_rank_00_optim_states.pt +3 -0
- checkpoint-10000/global_step10000/bf16_zero_pp_rank_19_mp_rank_00_optim_states.pt +3 -0
- checkpoint-10000/global_step10000/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt +3 -0
- checkpoint-10000/global_step10000/bf16_zero_pp_rank_20_mp_rank_00_optim_states.pt +3 -0
- checkpoint-10000/global_step10000/bf16_zero_pp_rank_21_mp_rank_00_optim_states.pt +3 -0
- checkpoint-10000/global_step10000/bf16_zero_pp_rank_22_mp_rank_00_optim_states.pt +3 -0
- checkpoint-10000/global_step10000/bf16_zero_pp_rank_23_mp_rank_00_optim_states.pt +3 -0
- checkpoint-10000/global_step10000/bf16_zero_pp_rank_24_mp_rank_00_optim_states.pt +3 -0
- checkpoint-10000/global_step10000/bf16_zero_pp_rank_25_mp_rank_00_optim_states.pt +3 -0
- checkpoint-10000/global_step10000/bf16_zero_pp_rank_26_mp_rank_00_optim_states.pt +3 -0
- checkpoint-10000/global_step10000/bf16_zero_pp_rank_27_mp_rank_00_optim_states.pt +3 -0
- checkpoint-10000/global_step10000/bf16_zero_pp_rank_28_mp_rank_00_optim_states.pt +3 -0
- checkpoint-10000/global_step10000/bf16_zero_pp_rank_29_mp_rank_00_optim_states.pt +3 -0
- checkpoint-10000/global_step10000/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt +3 -0
- checkpoint-10000/global_step10000/bf16_zero_pp_rank_30_mp_rank_00_optim_states.pt +3 -0
- checkpoint-10000/global_step10000/bf16_zero_pp_rank_31_mp_rank_00_optim_states.pt +3 -0
- checkpoint-10000/global_step10000/bf16_zero_pp_rank_32_mp_rank_00_optim_states.pt +3 -0
- checkpoint-10000/global_step10000/bf16_zero_pp_rank_33_mp_rank_00_optim_states.pt +3 -0
- checkpoint-10000/global_step10000/bf16_zero_pp_rank_34_mp_rank_00_optim_states.pt +3 -0
- checkpoint-10000/global_step10000/bf16_zero_pp_rank_35_mp_rank_00_optim_states.pt +3 -0
- checkpoint-10000/global_step10000/bf16_zero_pp_rank_36_mp_rank_00_optim_states.pt +3 -0
- checkpoint-10000/global_step10000/bf16_zero_pp_rank_37_mp_rank_00_optim_states.pt +3 -0
- checkpoint-10000/global_step10000/bf16_zero_pp_rank_38_mp_rank_00_optim_states.pt +3 -0
- checkpoint-10000/global_step10000/bf16_zero_pp_rank_39_mp_rank_00_optim_states.pt +3 -0
- checkpoint-10000/global_step10000/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt +3 -0
- checkpoint-10000/global_step10000/bf16_zero_pp_rank_40_mp_rank_00_optim_states.pt +3 -0
- checkpoint-10000/global_step10000/bf16_zero_pp_rank_41_mp_rank_00_optim_states.pt +3 -0
- checkpoint-10000/global_step10000/bf16_zero_pp_rank_42_mp_rank_00_optim_states.pt +3 -0
- checkpoint-10000/global_step10000/bf16_zero_pp_rank_43_mp_rank_00_optim_states.pt +3 -0
- checkpoint-10000/global_step10000/bf16_zero_pp_rank_44_mp_rank_00_optim_states.pt +3 -0
- checkpoint-10000/global_step10000/bf16_zero_pp_rank_45_mp_rank_00_optim_states.pt +3 -0
- checkpoint-10000/global_step10000/bf16_zero_pp_rank_46_mp_rank_00_optim_states.pt +3 -0
- checkpoint-10000/global_step10000/bf16_zero_pp_rank_47_mp_rank_00_optim_states.pt +3 -0
- checkpoint-10000/global_step10000/bf16_zero_pp_rank_48_mp_rank_00_optim_states.pt +3 -0
- checkpoint-10000/global_step10000/bf16_zero_pp_rank_49_mp_rank_00_optim_states.pt +3 -0
- checkpoint-10000/global_step10000/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt +3 -0
- checkpoint-10000/global_step10000/bf16_zero_pp_rank_50_mp_rank_00_optim_states.pt +3 -0
added_tokens.json
ADDED
@@ -0,0 +1,24 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"</tool_call>": 151658,
|
3 |
+
"<tool_call>": 151657,
|
4 |
+
"<|box_end|>": 151649,
|
5 |
+
"<|box_start|>": 151648,
|
6 |
+
"<|endoftext|>": 151643,
|
7 |
+
"<|file_sep|>": 151664,
|
8 |
+
"<|fim_middle|>": 151660,
|
9 |
+
"<|fim_pad|>": 151662,
|
10 |
+
"<|fim_prefix|>": 151659,
|
11 |
+
"<|fim_suffix|>": 151661,
|
12 |
+
"<|im_end|>": 151645,
|
13 |
+
"<|im_start|>": 151644,
|
14 |
+
"<|image_pad|>": 151655,
|
15 |
+
"<|object_ref_end|>": 151647,
|
16 |
+
"<|object_ref_start|>": 151646,
|
17 |
+
"<|quad_end|>": 151651,
|
18 |
+
"<|quad_start|>": 151650,
|
19 |
+
"<|repo_name|>": 151663,
|
20 |
+
"<|video_pad|>": 151656,
|
21 |
+
"<|vision_end|>": 151653,
|
22 |
+
"<|vision_pad|>": 151654,
|
23 |
+
"<|vision_start|>": 151652
|
24 |
+
}
|
checkpoint-10000/added_tokens.json
ADDED
@@ -0,0 +1,24 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"</tool_call>": 151658,
|
3 |
+
"<tool_call>": 151657,
|
4 |
+
"<|box_end|>": 151649,
|
5 |
+
"<|box_start|>": 151648,
|
6 |
+
"<|endoftext|>": 151643,
|
7 |
+
"<|file_sep|>": 151664,
|
8 |
+
"<|fim_middle|>": 151660,
|
9 |
+
"<|fim_pad|>": 151662,
|
10 |
+
"<|fim_prefix|>": 151659,
|
11 |
+
"<|fim_suffix|>": 151661,
|
12 |
+
"<|im_end|>": 151645,
|
13 |
+
"<|im_start|>": 151644,
|
14 |
+
"<|image_pad|>": 151655,
|
15 |
+
"<|object_ref_end|>": 151647,
|
16 |
+
"<|object_ref_start|>": 151646,
|
17 |
+
"<|quad_end|>": 151651,
|
18 |
+
"<|quad_start|>": 151650,
|
19 |
+
"<|repo_name|>": 151663,
|
20 |
+
"<|video_pad|>": 151656,
|
21 |
+
"<|vision_end|>": 151653,
|
22 |
+
"<|vision_pad|>": 151654,
|
23 |
+
"<|vision_start|>": 151652
|
24 |
+
}
|
checkpoint-10000/config.json
ADDED
@@ -0,0 +1,203 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_name_or_path": "/mnt/bn/tiktok-mm-4/aiic/users/brianli/prod/checkpoints/LLaVA-OV-Qwen2-Mammoth-VL-8B",
|
3 |
+
"add_faster_video": false,
|
4 |
+
"add_time_instruction": false,
|
5 |
+
"architectures": [
|
6 |
+
"LlavaQwenForCausalLM"
|
7 |
+
],
|
8 |
+
"attention_dropout": 0.0,
|
9 |
+
"bos_token_id": 151643,
|
10 |
+
"eos_token_id": 151645,
|
11 |
+
"faster_token_stride": 10,
|
12 |
+
"force_sample": false,
|
13 |
+
"hidden_act": "silu",
|
14 |
+
"hidden_size": 3584,
|
15 |
+
"image_aspect_ratio": "anyres_max_4",
|
16 |
+
"image_crop_resolution": null,
|
17 |
+
"image_grid_pinpoints": [
|
18 |
+
[
|
19 |
+
384,
|
20 |
+
384
|
21 |
+
],
|
22 |
+
[
|
23 |
+
384,
|
24 |
+
768
|
25 |
+
],
|
26 |
+
[
|
27 |
+
384,
|
28 |
+
1152
|
29 |
+
],
|
30 |
+
[
|
31 |
+
384,
|
32 |
+
1536
|
33 |
+
],
|
34 |
+
[
|
35 |
+
384,
|
36 |
+
1920
|
37 |
+
],
|
38 |
+
[
|
39 |
+
384,
|
40 |
+
2304
|
41 |
+
],
|
42 |
+
[
|
43 |
+
768,
|
44 |
+
384
|
45 |
+
],
|
46 |
+
[
|
47 |
+
768,
|
48 |
+
768
|
49 |
+
],
|
50 |
+
[
|
51 |
+
768,
|
52 |
+
1152
|
53 |
+
],
|
54 |
+
[
|
55 |
+
768,
|
56 |
+
1536
|
57 |
+
],
|
58 |
+
[
|
59 |
+
768,
|
60 |
+
1920
|
61 |
+
],
|
62 |
+
[
|
63 |
+
768,
|
64 |
+
2304
|
65 |
+
],
|
66 |
+
[
|
67 |
+
1152,
|
68 |
+
384
|
69 |
+
],
|
70 |
+
[
|
71 |
+
1152,
|
72 |
+
768
|
73 |
+
],
|
74 |
+
[
|
75 |
+
1152,
|
76 |
+
1152
|
77 |
+
],
|
78 |
+
[
|
79 |
+
1152,
|
80 |
+
1536
|
81 |
+
],
|
82 |
+
[
|
83 |
+
1152,
|
84 |
+
1920
|
85 |
+
],
|
86 |
+
[
|
87 |
+
1152,
|
88 |
+
2304
|
89 |
+
],
|
90 |
+
[
|
91 |
+
1536,
|
92 |
+
384
|
93 |
+
],
|
94 |
+
[
|
95 |
+
1536,
|
96 |
+
768
|
97 |
+
],
|
98 |
+
[
|
99 |
+
1536,
|
100 |
+
1152
|
101 |
+
],
|
102 |
+
[
|
103 |
+
1536,
|
104 |
+
1536
|
105 |
+
],
|
106 |
+
[
|
107 |
+
1536,
|
108 |
+
1920
|
109 |
+
],
|
110 |
+
[
|
111 |
+
1536,
|
112 |
+
2304
|
113 |
+
],
|
114 |
+
[
|
115 |
+
1920,
|
116 |
+
384
|
117 |
+
],
|
118 |
+
[
|
119 |
+
1920,
|
120 |
+
768
|
121 |
+
],
|
122 |
+
[
|
123 |
+
1920,
|
124 |
+
1152
|
125 |
+
],
|
126 |
+
[
|
127 |
+
1920,
|
128 |
+
1536
|
129 |
+
],
|
130 |
+
[
|
131 |
+
1920,
|
132 |
+
1920
|
133 |
+
],
|
134 |
+
[
|
135 |
+
1920,
|
136 |
+
2304
|
137 |
+
],
|
138 |
+
[
|
139 |
+
2304,
|
140 |
+
384
|
141 |
+
],
|
142 |
+
[
|
143 |
+
2304,
|
144 |
+
768
|
145 |
+
],
|
146 |
+
[
|
147 |
+
2304,
|
148 |
+
1152
|
149 |
+
],
|
150 |
+
[
|
151 |
+
2304,
|
152 |
+
1536
|
153 |
+
],
|
154 |
+
[
|
155 |
+
2304,
|
156 |
+
1920
|
157 |
+
],
|
158 |
+
[
|
159 |
+
2304,
|
160 |
+
2304
|
161 |
+
]
|
162 |
+
],
|
163 |
+
"image_split_resolution": null,
|
164 |
+
"initializer_range": 0.02,
|
165 |
+
"intermediate_size": 18944,
|
166 |
+
"max_position_embeddings": 32768,
|
167 |
+
"max_window_layers": 28,
|
168 |
+
"mm_hidden_size": 1152,
|
169 |
+
"mm_newline_position": "grid",
|
170 |
+
"mm_patch_merge_type": "spatial_unpad",
|
171 |
+
"mm_projector_lr": null,
|
172 |
+
"mm_projector_type": "mlp2x_gelu",
|
173 |
+
"mm_resampler_type": null,
|
174 |
+
"mm_spatial_pool_mode": "bilinear",
|
175 |
+
"mm_spatial_pool_stride": null,
|
176 |
+
"mm_tunable_parts": "mm_vision_tower,mm_mlp_adapter,mm_language_model",
|
177 |
+
"mm_use_im_patch_token": false,
|
178 |
+
"mm_use_im_start_end": false,
|
179 |
+
"mm_vision_select_feature": "patch",
|
180 |
+
"mm_vision_select_layer": -2,
|
181 |
+
"mm_vision_tower": "google/siglip-so400m-patch14-384",
|
182 |
+
"mm_vision_tower_lr": 2e-06,
|
183 |
+
"model_type": "qwen2",
|
184 |
+
"num_attention_heads": 28,
|
185 |
+
"num_hidden_layers": 28,
|
186 |
+
"num_key_value_heads": 4,
|
187 |
+
"pos_skipping_range": 4096,
|
188 |
+
"rms_norm_eps": 1e-06,
|
189 |
+
"rope_scaling": null,
|
190 |
+
"rope_theta": 1000000.0,
|
191 |
+
"sliding_window": 131072,
|
192 |
+
"tie_word_embeddings": false,
|
193 |
+
"tokenizer_model_max_length": 8192,
|
194 |
+
"tokenizer_padding_side": "right",
|
195 |
+
"torch_dtype": "bfloat16",
|
196 |
+
"transformers_version": "4.40.0.dev0",
|
197 |
+
"use_cache": false,
|
198 |
+
"use_mm_proj": true,
|
199 |
+
"use_pos_skipping": false,
|
200 |
+
"use_sliding_window": false,
|
201 |
+
"vision_tower_pretrained": null,
|
202 |
+
"vocab_size": 152064
|
203 |
+
}
|
checkpoint-10000/generation_config.json
ADDED
@@ -0,0 +1,14 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"bos_token_id": 151643,
|
3 |
+
"do_sample": true,
|
4 |
+
"eos_token_id": [
|
5 |
+
151645,
|
6 |
+
151643
|
7 |
+
],
|
8 |
+
"pad_token_id": 151643,
|
9 |
+
"repetition_penalty": 1.05,
|
10 |
+
"temperature": 0.7,
|
11 |
+
"top_k": 20,
|
12 |
+
"top_p": 0.8,
|
13 |
+
"transformers_version": "4.40.0.dev0"
|
14 |
+
}
|
checkpoint-10000/global_step10000/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c77d280c35d8b39d47c70af247cba8255092737de28ab9b6e75384f28005a293
|
3 |
+
size 1505698422
|
checkpoint-10000/global_step10000/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:22d83b3432e72d79879a6781f6d0e1fb12f5e326636077347b1d96c2b171c010
|
3 |
+
size 1505698442
|
checkpoint-10000/global_step10000/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3355b1d6dfe785f1be5b74dad865368c655fd8af10254eb22488932395d6d0f3
|
3 |
+
size 1505698442
|
checkpoint-10000/global_step10000/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:078e00dc8e67489a40ac33906e6840c343b937da3e7da5ad52115a2563092f27
|
3 |
+
size 1505698442
|
checkpoint-10000/global_step10000/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:55850863215c73500af4600e2a05ce46391308d439f7e00ae9a0afd2c7dc8dbd
|
3 |
+
size 1505698442
|
checkpoint-10000/global_step10000/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:85273695e6f4931c3780f2afeebbcd7584cd99e586962ec625f5c1d2b2824596
|
3 |
+
size 1505698442
|
checkpoint-10000/global_step10000/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:652ce75dbf35ac60b6c0461496b1d926118d6399a00491704f1cb8382a7ae6f5
|
3 |
+
size 1505698442
|
checkpoint-10000/global_step10000/bf16_zero_pp_rank_16_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ea2b7aa6567c069510bf57e88fe42b1822c83d5cfbdcf234f1add29b24bad1e7
|
3 |
+
size 1505698442
|
checkpoint-10000/global_step10000/bf16_zero_pp_rank_17_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7247baa13839f2b4bba5f3fad5d9f7955f22a97c2b2bffc2143f5ea2ddf5a043
|
3 |
+
size 1505698442
|
checkpoint-10000/global_step10000/bf16_zero_pp_rank_18_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:681b431132a2ccfef7ef5eb4ea66f33576744262219afd917e40a130cb8523d1
|
3 |
+
size 1505698442
|
checkpoint-10000/global_step10000/bf16_zero_pp_rank_19_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d73fa797c18c2696f68fe1bc57302a0bba98188954a8a5006fc4223810ce0a72
|
3 |
+
size 1505698442
|
checkpoint-10000/global_step10000/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2e62845de302b907743f63de124daa96222af740233385098fbc12884015580e
|
3 |
+
size 1505698422
|
checkpoint-10000/global_step10000/bf16_zero_pp_rank_20_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b1e4a50ec200a12962936a0027d40fa3395120a504c3bc9a5a4d0a1aab5bc74d
|
3 |
+
size 1505698442
|
checkpoint-10000/global_step10000/bf16_zero_pp_rank_21_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5b985c2ad9db06162a547d93b75b805d5127f750ee8a05f274030f7d33982b50
|
3 |
+
size 1505698442
|
checkpoint-10000/global_step10000/bf16_zero_pp_rank_22_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2a440829bb23d3568c9a0c149c02799dd1686950f040e3d3bef225fd81854b80
|
3 |
+
size 1505698442
|
checkpoint-10000/global_step10000/bf16_zero_pp_rank_23_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:767c459afbd0439f4644cb45070f28ba86b131b2051f264ca4a056831e6377a5
|
3 |
+
size 1505698442
|
checkpoint-10000/global_step10000/bf16_zero_pp_rank_24_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8e2efc9b65bfba1748fad101855a4805b80551ad18aae5b61f98ce022e658fe6
|
3 |
+
size 1505698442
|
checkpoint-10000/global_step10000/bf16_zero_pp_rank_25_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d947bd75d9c74397ff4b4ac1cf1f33e8871a61a3480ddf10aadf02bdda6a018a
|
3 |
+
size 1505698442
|
checkpoint-10000/global_step10000/bf16_zero_pp_rank_26_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ec4250ca8abd5e76dbf8183637c5ccf279b94891ed794c5582233e3859e00589
|
3 |
+
size 1505698442
|
checkpoint-10000/global_step10000/bf16_zero_pp_rank_27_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:981ff8cc31901f5340eeee22c144ff4af700d5ac869ae3a53804b1535c52bfbd
|
3 |
+
size 1505698442
|
checkpoint-10000/global_step10000/bf16_zero_pp_rank_28_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f9e9087a20ce5bb798dcabc4ed532dbc6eaa8b3ff7b142776a8a842a756c20ed
|
3 |
+
size 1505698442
|
checkpoint-10000/global_step10000/bf16_zero_pp_rank_29_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7382e877975216a842ae2175e70dac54296f07a460e9d125278784b9d16f3f10
|
3 |
+
size 1505698442
|
checkpoint-10000/global_step10000/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5d4fcdcb85883c7078529088387d725a1d5bba7e6a097b1461bf7de82e2a6645
|
3 |
+
size 1505698422
|
checkpoint-10000/global_step10000/bf16_zero_pp_rank_30_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0f243d2aadd2a410f881765d4c00af20e9abc97fcf29824e03bd1540da7f14f0
|
3 |
+
size 1505698442
|
checkpoint-10000/global_step10000/bf16_zero_pp_rank_31_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cf1ac8268c1fcc27424669f93eb7ce97b0dea540f41c259955f363c3a16ba657
|
3 |
+
size 1505698442
|
checkpoint-10000/global_step10000/bf16_zero_pp_rank_32_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:75484b5980784be3e69e73b8912539cc3bb9b4f3669e4c8d35d5e3123ff8ca1c
|
3 |
+
size 1505698442
|
checkpoint-10000/global_step10000/bf16_zero_pp_rank_33_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f62bb83afdd74df68274d214997d7f85271c0e63fc3ff3266b907d2530ca98e5
|
3 |
+
size 1505698442
|
checkpoint-10000/global_step10000/bf16_zero_pp_rank_34_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3a06d9f6f7c5cd3b350e6a49b814193a839a156eac14ea2787e00781c2801530
|
3 |
+
size 1505698442
|
checkpoint-10000/global_step10000/bf16_zero_pp_rank_35_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9096130d05e3931341d653b0a542cc019614d10dca324aee430ba75b5ef2a7e0
|
3 |
+
size 1505698442
|
checkpoint-10000/global_step10000/bf16_zero_pp_rank_36_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:236097383dfa1379c5d55657dded3800895ade894bc57a78e4173f43fa477c6c
|
3 |
+
size 1505698442
|
checkpoint-10000/global_step10000/bf16_zero_pp_rank_37_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8a127eae3c2337b8442416bd82c53105a275653eeb2edc3b3bfde7b520d55ce3
|
3 |
+
size 1505698442
|
checkpoint-10000/global_step10000/bf16_zero_pp_rank_38_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:302ca4f135f81a6f45718a3fd1d63d6476bf02eae80a3a80730ff07f72153395
|
3 |
+
size 1505698442
|
checkpoint-10000/global_step10000/bf16_zero_pp_rank_39_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8f2cf498c66e90565b50ad702e81646bb6cc91f438fef9d0af2cd68a121311e1
|
3 |
+
size 1505698442
|
checkpoint-10000/global_step10000/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ddf633efbe0d4ece620918e16693aa6aa3322ef4d151285028413eb791d85d63
|
3 |
+
size 1505698422
|
checkpoint-10000/global_step10000/bf16_zero_pp_rank_40_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:95f76460a25996b45fdf8d2ef166c587f196622b04c3e52a72ac3e01ade58c72
|
3 |
+
size 1505698442
|
checkpoint-10000/global_step10000/bf16_zero_pp_rank_41_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f868154cb714e483da172d1f45f421025af5a546dee540f80c69557bd07b8792
|
3 |
+
size 1505698442
|
checkpoint-10000/global_step10000/bf16_zero_pp_rank_42_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d74e9ce025d50380e8f8ecfb8c94f5f9792ad44fae02106cb3e9bc4fec51d6cf
|
3 |
+
size 1505698442
|
checkpoint-10000/global_step10000/bf16_zero_pp_rank_43_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3861238277f269ba273476a6412ec83c49c49f33ce552d2b138dd6364c0e4658
|
3 |
+
size 1505698442
|
checkpoint-10000/global_step10000/bf16_zero_pp_rank_44_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7c06b2bdbbc6a97bbb3d8df4a85ebdc2075242c21b59c02b03f52a823f4cf4a5
|
3 |
+
size 1505698442
|
checkpoint-10000/global_step10000/bf16_zero_pp_rank_45_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7333ce4a3059e9ec710d77f647aa10b2e90d2452e68ff75b16a26ce127951652
|
3 |
+
size 1505698442
|
checkpoint-10000/global_step10000/bf16_zero_pp_rank_46_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b9407c3b852e949ab5e355836a2d70cd35b3437878e8cab35db9c54e21283580
|
3 |
+
size 1505698442
|
checkpoint-10000/global_step10000/bf16_zero_pp_rank_47_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:178ac8edda525257b48614e6ade3e5a2f95fc2d4d84e9ce9f06d6fe19fb4e7a2
|
3 |
+
size 1505698442
|
checkpoint-10000/global_step10000/bf16_zero_pp_rank_48_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:18de407441f528e82c0d6e2d00da413a6170c37b073cb79a15692c08e1a16c3d
|
3 |
+
size 1505698442
|
checkpoint-10000/global_step10000/bf16_zero_pp_rank_49_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6b72663af9b2b4316df9609d1018dc9617a8ca1e7459460845693534c97e1218
|
3 |
+
size 1505698442
|
checkpoint-10000/global_step10000/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:85edd41b9fda89ff5a51c933cb546c218b8e9115008b2426f173fceafde626ae
|
3 |
+
size 1505698422
|
checkpoint-10000/global_step10000/bf16_zero_pp_rank_50_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:68d032e711ba379ccbff18e6ebf1f0fc6d4b225639a899734011577c0caf68d8
|
3 |
+
size 1505698442
|