Muennighoff
commited on
Commit
·
fb8067c
1
Parent(s):
9bae13a
Add
Browse filesThis view is limited to 50 files because it contains too many changes.
See raw diff
- .gitattributes +72 -0
- 1b11b5100m/global_step2891/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt +3 -0
- 1b11b5100m/global_step2891/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt +3 -0
- 1b11b5100m/global_step2891/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt +3 -0
- 1b11b5100m/global_step2891/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt +3 -0
- 1b11b5100m/global_step2891/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt +3 -0
- 1b11b5100m/global_step2891/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt +3 -0
- 1b11b5100m/global_step2891/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt +3 -0
- 1b11b5100m/global_step2891/bf16_zero_pp_rank_16_mp_rank_00_optim_states.pt +3 -0
- 1b11b5100m/global_step2891/bf16_zero_pp_rank_17_mp_rank_00_optim_states.pt +3 -0
- 1b11b5100m/global_step2891/bf16_zero_pp_rank_18_mp_rank_00_optim_states.pt +3 -0
- 1b11b5100m/global_step2891/bf16_zero_pp_rank_19_mp_rank_00_optim_states.pt +3 -0
- 1b11b5100m/global_step2891/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt +3 -0
- 1b11b5100m/global_step2891/bf16_zero_pp_rank_20_mp_rank_00_optim_states.pt +3 -0
- 1b11b5100m/global_step2891/bf16_zero_pp_rank_21_mp_rank_00_optim_states.pt +3 -0
- 1b11b5100m/global_step2891/bf16_zero_pp_rank_22_mp_rank_00_optim_states.pt +3 -0
- 1b11b5100m/global_step2891/bf16_zero_pp_rank_23_mp_rank_00_optim_states.pt +3 -0
- 1b11b5100m/global_step2891/bf16_zero_pp_rank_24_mp_rank_00_optim_states.pt +3 -0
- 1b11b5100m/global_step2891/bf16_zero_pp_rank_25_mp_rank_00_optim_states.pt +3 -0
- 1b11b5100m/global_step2891/bf16_zero_pp_rank_26_mp_rank_00_optim_states.pt +3 -0
- 1b11b5100m/global_step2891/bf16_zero_pp_rank_27_mp_rank_00_optim_states.pt +3 -0
- 1b11b5100m/global_step2891/bf16_zero_pp_rank_28_mp_rank_00_optim_states.pt +3 -0
- 1b11b5100m/global_step2891/bf16_zero_pp_rank_29_mp_rank_00_optim_states.pt +3 -0
- 1b11b5100m/global_step2891/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt +3 -0
- 1b11b5100m/global_step2891/bf16_zero_pp_rank_30_mp_rank_00_optim_states.pt +3 -0
- 1b11b5100m/global_step2891/bf16_zero_pp_rank_31_mp_rank_00_optim_states.pt +3 -0
- 1b11b5100m/global_step2891/bf16_zero_pp_rank_32_mp_rank_00_optim_states.pt +3 -0
- 1b11b5100m/global_step2891/bf16_zero_pp_rank_33_mp_rank_00_optim_states.pt +3 -0
- 1b11b5100m/global_step2891/bf16_zero_pp_rank_34_mp_rank_00_optim_states.pt +3 -0
- 1b11b5100m/global_step2891/bf16_zero_pp_rank_35_mp_rank_00_optim_states.pt +3 -0
- 1b11b5100m/global_step2891/bf16_zero_pp_rank_36_mp_rank_00_optim_states.pt +3 -0
- 1b11b5100m/global_step2891/bf16_zero_pp_rank_37_mp_rank_00_optim_states.pt +3 -0
- 1b11b5100m/global_step2891/bf16_zero_pp_rank_38_mp_rank_00_optim_states.pt +3 -0
- 1b11b5100m/global_step2891/bf16_zero_pp_rank_39_mp_rank_00_optim_states.pt +3 -0
- 1b11b5100m/global_step2891/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt +3 -0
- 1b11b5100m/global_step2891/bf16_zero_pp_rank_40_mp_rank_00_optim_states.pt +3 -0
- 1b11b5100m/global_step2891/bf16_zero_pp_rank_41_mp_rank_00_optim_states.pt +3 -0
- 1b11b5100m/global_step2891/bf16_zero_pp_rank_42_mp_rank_00_optim_states.pt +3 -0
- 1b11b5100m/global_step2891/bf16_zero_pp_rank_43_mp_rank_00_optim_states.pt +3 -0
- 1b11b5100m/global_step2891/bf16_zero_pp_rank_44_mp_rank_00_optim_states.pt +3 -0
- 1b11b5100m/global_step2891/bf16_zero_pp_rank_45_mp_rank_00_optim_states.pt +3 -0
- 1b11b5100m/global_step2891/bf16_zero_pp_rank_46_mp_rank_00_optim_states.pt +3 -0
- 1b11b5100m/global_step2891/bf16_zero_pp_rank_47_mp_rank_00_optim_states.pt +3 -0
- 1b11b5100m/global_step2891/bf16_zero_pp_rank_48_mp_rank_00_optim_states.pt +3 -0
- 1b11b5100m/global_step2891/bf16_zero_pp_rank_49_mp_rank_00_optim_states.pt +3 -0
- 1b11b5100m/global_step2891/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt +3 -0
- 1b11b5100m/global_step2891/bf16_zero_pp_rank_50_mp_rank_00_optim_states.pt +3 -0
- 1b11b5100m/global_step2891/bf16_zero_pp_rank_51_mp_rank_00_optim_states.pt +3 -0
- 1b11b5100m/global_step2891/bf16_zero_pp_rank_52_mp_rank_00_optim_states.pt +3 -0
- 1b11b5100m/global_step2891/bf16_zero_pp_rank_53_mp_rank_00_optim_states.pt +3 -0
.gitattributes
CHANGED
@@ -393,3 +393,75 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
|
|
393 |
146m14b1b5/evaluation/generation/examples.146m14b1b5_gem_xsum_article_DOC_summary_1.jsonl filter=lfs diff=lfs merge=lfs -text
|
394 |
421m3b91b5/evaluation/generation/examples.421m3b91b5_GEM-wiki_lingua_en_tldr_en_5.jsonl filter=lfs diff=lfs merge=lfs -text
|
395 |
421m3b91b5/evaluation/generation/examples.421m3b91b5_gem_xsum_article_DOC_summary_4.jsonl filter=lfs diff=lfs merge=lfs -text
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
393 |
146m14b1b5/evaluation/generation/examples.146m14b1b5_gem_xsum_article_DOC_summary_1.jsonl filter=lfs diff=lfs merge=lfs -text
|
394 |
421m3b91b5/evaluation/generation/examples.421m3b91b5_GEM-wiki_lingua_en_tldr_en_5.jsonl filter=lfs diff=lfs merge=lfs -text
|
395 |
421m3b91b5/evaluation/generation/examples.421m3b91b5_gem_xsum_article_DOC_summary_4.jsonl filter=lfs diff=lfs merge=lfs -text
|
396 |
+
619m22b4b8/evaluation/generation/examples.619m22b4b8_e2e_nlg_cleaned_generate_text_restaurant_5.jsonl filter=lfs diff=lfs merge=lfs -text
|
397 |
+
619m22b4b8/evaluation/generation/examples.619m22b4b8_GEM-wiki_lingua_en_tldr_en_2.jsonl filter=lfs diff=lfs merge=lfs -text
|
398 |
+
1b11b51b5/evaluation/generation/examples.1b11b51b5_GEM-wiki_lingua_en_tldr_en_2.jsonl filter=lfs diff=lfs merge=lfs -text
|
399 |
+
619m22b22b/evaluation/generation/examples.619m22b22b_GEM-web_nlg_en_PALM_prompt_1.jsonl filter=lfs diff=lfs merge=lfs -text
|
400 |
+
619m22b22b/evaluation/generation/examples.619m22b22b_GEM-web_nlg_en_PALM_prompt_2.jsonl filter=lfs diff=lfs merge=lfs -text
|
401 |
+
619m22b4b8/evaluation/generation/examples.619m22b4b8_e2e_nlg_cleaned_generate_text_restaurant_0.jsonl filter=lfs diff=lfs merge=lfs -text
|
402 |
+
619m22b4b8/evaluation/generation/examples.619m22b4b8_GEM-wiki_lingua_en_tldr_en_0.jsonl filter=lfs diff=lfs merge=lfs -text
|
403 |
+
619m22b4b8/evaluation/generation/examples.619m22b4b8_gem_xsum_article_DOC_summary_5.jsonl filter=lfs diff=lfs merge=lfs -text
|
404 |
+
1b11b51b5/evaluation/generation/examples.1b11b51b5_e2e_nlg_cleaned_generate_text_restaurant_5.jsonl filter=lfs diff=lfs merge=lfs -text
|
405 |
+
619m22b22b/evaluation/generation/examples.619m22b22b_GEM-web_nlg_en_PALM_prompt_3.jsonl filter=lfs diff=lfs merge=lfs -text
|
406 |
+
619m22b22b/evaluation/generation/examples.619m22b22b_gem_xsum_article_DOC_summary_2.jsonl filter=lfs diff=lfs merge=lfs -text
|
407 |
+
619m22b4b8/evaluation/generation/examples.619m22b4b8_e2e_nlg_cleaned_generate_text_restaurant_4.jsonl filter=lfs diff=lfs merge=lfs -text
|
408 |
+
619m22b4b8/evaluation/generation/examples.619m22b4b8_GEM-web_nlg_en_PALM_prompt_3.jsonl filter=lfs diff=lfs merge=lfs -text
|
409 |
+
619m22b4b8/evaluation/generation/examples.619m22b4b8_gem_xsum_article_DOC_summary_0.jsonl filter=lfs diff=lfs merge=lfs -text
|
410 |
+
1b11b51b5/evaluation/generation/examples.1b11b51b5_e2e_nlg_cleaned_generate_text_restaurant_0.jsonl filter=lfs diff=lfs merge=lfs -text
|
411 |
+
619m22b22b/evaluation/generation/examples.619m22b22b_GEM-wiki_lingua_en_tldr_en_0.jsonl filter=lfs diff=lfs merge=lfs -text
|
412 |
+
619m22b22b/evaluation/generation/examples.619m22b22b_gem_xsum_article_DOC_summary_4.jsonl filter=lfs diff=lfs merge=lfs -text
|
413 |
+
619m22b4b8/evaluation/generation/examples.619m22b4b8_e2e_nlg_cleaned_generate_text_restaurant_3.jsonl filter=lfs diff=lfs merge=lfs -text
|
414 |
+
619m22b4b8/evaluation/generation/examples.619m22b4b8_gem_xsum_article_DOC_summary_2.jsonl filter=lfs diff=lfs merge=lfs -text
|
415 |
+
1b11b51b5/evaluation/generation/examples.1b11b51b5_GEM-wiki_lingua_en_tldr_en_5.jsonl filter=lfs diff=lfs merge=lfs -text
|
416 |
+
1b11b51b5/evaluation/generation/examples.1b11b51b5_gem_xsum_article_DOC_summary_4.jsonl filter=lfs diff=lfs merge=lfs -text
|
417 |
+
619m22b22b/evaluation/generation/examples.619m22b22b_GEM-wiki_lingua_en_tldr_en_4.jsonl filter=lfs diff=lfs merge=lfs -text
|
418 |
+
619m22b22b/evaluation/generation/examples.619m22b22b_gem_xsum_article_DOC_summary_5.jsonl filter=lfs diff=lfs merge=lfs -text
|
419 |
+
619m22b4b8/evaluation/generation/examples.619m22b4b8_GEM-wiki_lingua_en_tldr_en_4.jsonl filter=lfs diff=lfs merge=lfs -text
|
420 |
+
619m22b4b8/evaluation/generation/examples.619m22b4b8_gem_xsum_article_DOC_summary_4.jsonl filter=lfs diff=lfs merge=lfs -text
|
421 |
+
1b11b51b5/evaluation/generation/examples.1b11b51b5_e2e_nlg_cleaned_generate_text_restaurant_1.jsonl filter=lfs diff=lfs merge=lfs -text
|
422 |
+
1b11b51b5/evaluation/generation/examples.1b11b51b5_GEM-web_nlg_en_PALM_prompt_1.jsonl filter=lfs diff=lfs merge=lfs -text
|
423 |
+
619m22b22b/evaluation/generation/examples.619m22b22b_gem_xsum_article_DOC_summary_0.jsonl filter=lfs diff=lfs merge=lfs -text
|
424 |
+
619m22b4b8/evaluation/generation/examples.619m22b4b8_e2e_nlg_cleaned_generate_text_restaurant_2.jsonl filter=lfs diff=lfs merge=lfs -text
|
425 |
+
1b11b51b5/evaluation/generation/examples.1b11b51b5_GEM-web_nlg_en_PALM_prompt_5.jsonl filter=lfs diff=lfs merge=lfs -text
|
426 |
+
1b11b51b5/evaluation/generation/examples.1b11b51b5_GEM-wiki_lingua_en_tldr_en_1.jsonl filter=lfs diff=lfs merge=lfs -text
|
427 |
+
619m22b22b/evaluation/generation/examples.619m22b22b_e2e_nlg_cleaned_generate_text_restaurant_3.jsonl filter=lfs diff=lfs merge=lfs -text
|
428 |
+
619m22b22b/evaluation/generation/examples.619m22b22b_GEM-wiki_lingua_en_tldr_en_1.jsonl filter=lfs diff=lfs merge=lfs -text
|
429 |
+
1b11b51b5/evaluation/generation/examples.1b11b51b5_gem_xsum_article_DOC_summary_2.jsonl filter=lfs diff=lfs merge=lfs -text
|
430 |
+
1b11b51b5/evaluation/generation/examples.1b11b51b5_gem_xsum_article_DOC_summary_3.jsonl filter=lfs diff=lfs merge=lfs -text
|
431 |
+
619m22b22b/evaluation/generation/examples.619m22b22b_e2e_nlg_cleaned_generate_text_restaurant_4.jsonl filter=lfs diff=lfs merge=lfs -text
|
432 |
+
619m22b4b8/evaluation/generation/examples.619m22b4b8_GEM-wiki_lingua_en_tldr_en_1.jsonl filter=lfs diff=lfs merge=lfs -text
|
433 |
+
1b11b51b5/evaluation/generation/examples.1b11b51b5_e2e_nlg_cleaned_generate_text_restaurant_3.jsonl filter=lfs diff=lfs merge=lfs -text
|
434 |
+
1b11b51b5/evaluation/generation/examples.1b11b51b5_GEM-wiki_lingua_en_tldr_en_0.jsonl filter=lfs diff=lfs merge=lfs -text
|
435 |
+
1b11b51b5/evaluation/generation/examples.1b11b51b5_GEM-wiki_lingua_en_tldr_en_3.jsonl filter=lfs diff=lfs merge=lfs -text
|
436 |
+
1b11b51b5/evaluation/generation/examples.1b11b51b5_gem_xsum_article_DOC_summary_1.jsonl filter=lfs diff=lfs merge=lfs -text
|
437 |
+
619m22b4b8/evaluation/generation/examples.619m22b4b8_gem_xsum_article_DOC_summary_1.jsonl filter=lfs diff=lfs merge=lfs -text
|
438 |
+
619m22b4b8/evaluation/generation/examples.619m22b4b8_GEM-web_nlg_en_PALM_prompt_0.jsonl filter=lfs diff=lfs merge=lfs -text
|
439 |
+
619m22b4b8/evaluation/generation/examples.619m22b4b8_GEM-web_nlg_en_PALM_prompt_4.jsonl filter=lfs diff=lfs merge=lfs -text
|
440 |
+
1b11b51b5/evaluation/generation/examples.1b11b51b5_e2e_nlg_cleaned_generate_text_restaurant_4.jsonl filter=lfs diff=lfs merge=lfs -text
|
441 |
+
1b11b51b5/evaluation/generation/examples.1b11b51b5_GEM-web_nlg_en_PALM_prompt_3.jsonl filter=lfs diff=lfs merge=lfs -text
|
442 |
+
1b11b51b5/evaluation/generation/examples.1b11b51b5_gem_xsum_article_DOC_summary_5.jsonl filter=lfs diff=lfs merge=lfs -text
|
443 |
+
619m22b22b/evaluation/generation/examples.619m22b22b_e2e_nlg_cleaned_generate_text_restaurant_2.jsonl filter=lfs diff=lfs merge=lfs -text
|
444 |
+
619m22b22b/evaluation/generation/examples.619m22b22b_GEM-web_nlg_en_PALM_prompt_0.jsonl filter=lfs diff=lfs merge=lfs -text
|
445 |
+
619m22b22b/evaluation/generation/examples.619m22b22b_GEM-web_nlg_en_PALM_prompt_4.jsonl filter=lfs diff=lfs merge=lfs -text
|
446 |
+
619m22b22b/evaluation/generation/examples.619m22b22b_gem_xsum_article_DOC_summary_1.jsonl filter=lfs diff=lfs merge=lfs -text
|
447 |
+
1b11b51b5/evaluation/generation/examples.1b11b51b5_GEM-web_nlg_en_PALM_prompt_4.jsonl filter=lfs diff=lfs merge=lfs -text
|
448 |
+
1b11b51b5/evaluation/generation/examples.1b11b51b5_GEM-wiki_lingua_en_tldr_en_4.jsonl filter=lfs diff=lfs merge=lfs -text
|
449 |
+
619m22b22b/evaluation/generation/examples.619m22b22b_e2e_nlg_cleaned_generate_text_restaurant_1.jsonl filter=lfs diff=lfs merge=lfs -text
|
450 |
+
619m22b22b/evaluation/generation/examples.619m22b22b_GEM-web_nlg_en_PALM_prompt_5.jsonl filter=lfs diff=lfs merge=lfs -text
|
451 |
+
1b11b51b5/evaluation/generation/examples.1b11b51b5_e2e_nlg_cleaned_generate_text_restaurant_2.jsonl filter=lfs diff=lfs merge=lfs -text
|
452 |
+
1b11b51b5/evaluation/generation/examples.1b11b51b5_gem_xsum_article_DOC_summary_0.jsonl filter=lfs diff=lfs merge=lfs -text
|
453 |
+
619m22b22b/evaluation/generation/examples.619m22b22b_gem_xsum_article_DOC_summary_3.jsonl filter=lfs diff=lfs merge=lfs -text
|
454 |
+
619m22b4b8/evaluation/generation/examples.619m22b4b8_GEM-web_nlg_en_PALM_prompt_5.jsonl filter=lfs diff=lfs merge=lfs -text
|
455 |
+
619m22b22b/evaluation/generation/examples.619m22b22b_e2e_nlg_cleaned_generate_text_restaurant_0.jsonl filter=lfs diff=lfs merge=lfs -text
|
456 |
+
619m22b22b/evaluation/generation/examples.619m22b22b_e2e_nlg_cleaned_generate_text_restaurant_5.jsonl filter=lfs diff=lfs merge=lfs -text
|
457 |
+
619m22b22b/evaluation/generation/examples.619m22b22b_GEM-wiki_lingua_en_tldr_en_5.jsonl filter=lfs diff=lfs merge=lfs -text
|
458 |
+
619m22b4b8/evaluation/generation/examples.619m22b4b8_GEM-wiki_lingua_en_tldr_en_5.jsonl filter=lfs diff=lfs merge=lfs -text
|
459 |
+
619m22b4b8/evaluation/generation/examples.619m22b4b8_gem_xsum_article_DOC_summary_3.jsonl filter=lfs diff=lfs merge=lfs -text
|
460 |
+
619m22b22b/evaluation/generation/examples.619m22b22b_GEM-wiki_lingua_en_tldr_en_3.jsonl filter=lfs diff=lfs merge=lfs -text
|
461 |
+
1b11b51b5/evaluation/generation/examples.1b11b51b5_GEM-web_nlg_en_PALM_prompt_0.jsonl filter=lfs diff=lfs merge=lfs -text
|
462 |
+
1b11b51b5/evaluation/generation/examples.1b11b51b5_GEM-web_nlg_en_PALM_prompt_2.jsonl filter=lfs diff=lfs merge=lfs -text
|
463 |
+
619m22b4b8/evaluation/generation/examples.619m22b4b8_e2e_nlg_cleaned_generate_text_restaurant_1.jsonl filter=lfs diff=lfs merge=lfs -text
|
464 |
+
619m22b4b8/evaluation/generation/examples.619m22b4b8_GEM-wiki_lingua_en_tldr_en_3.jsonl filter=lfs diff=lfs merge=lfs -text
|
465 |
+
619m22b22b/evaluation/generation/examples.619m22b22b_GEM-wiki_lingua_en_tldr_en_2.jsonl filter=lfs diff=lfs merge=lfs -text
|
466 |
+
619m22b4b8/evaluation/generation/examples.619m22b4b8_GEM-web_nlg_en_PALM_prompt_1.jsonl filter=lfs diff=lfs merge=lfs -text
|
467 |
+
619m22b4b8/evaluation/generation/examples.619m22b4b8_GEM-web_nlg_en_PALM_prompt_2.jsonl filter=lfs diff=lfs merge=lfs -text
|
1b11b5100m/global_step2891/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:db1b094cf354e45a778a43db7f54a08f1e27d2634317ff51ef378e3b3838d11d
|
3 |
+
size 205568023
|
1b11b5100m/global_step2891/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3e14beb359551b58199f235c0e02bd941c30fbdb5a9b91fc482c7f38aad63aab
|
3 |
+
size 205568162
|
1b11b5100m/global_step2891/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:181714819a3d922237ce56d03a83cf40b5f4eea572c5e4ce440fc7a4c48ca3f8
|
3 |
+
size 205568226
|
1b11b5100m/global_step2891/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1f911b2985fb7aa44b8d9b35996cbbbd13169d82415f52e507b8022375b28cb1
|
3 |
+
size 205568226
|
1b11b5100m/global_step2891/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e2061299a76f33576b9ce250b9e0bf970feb95fe3fd646c08b0ca2622acb946c
|
3 |
+
size 205568162
|
1b11b5100m/global_step2891/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d57cb598fc1846d6f855d6e5c4e00e82797f1dc13ba2408284b31d1868b07ad5
|
3 |
+
size 205568162
|
1b11b5100m/global_step2891/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:be8e2e530d4ce9483e22589a1fd6dd09da81e41dc24d64a852038309a8cce56e
|
3 |
+
size 205568162
|
1b11b5100m/global_step2891/bf16_zero_pp_rank_16_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1521ee4f6ef261af3bfab5f68be1aa6e728d19afec0ec2b0f0d86df0bb29b052
|
3 |
+
size 205567970
|
1b11b5100m/global_step2891/bf16_zero_pp_rank_17_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:26ebf2a06964504a79969c0b6658aed95cab5640c83ebbcf7a071e49d30a6492
|
3 |
+
size 205568226
|
1b11b5100m/global_step2891/bf16_zero_pp_rank_18_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:698e822cc2f181e5068a1648170148bd2ae1e3c1a5e12c578f4829ccd36b245a
|
3 |
+
size 205568226
|
1b11b5100m/global_step2891/bf16_zero_pp_rank_19_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a879c0b44a323db02107b32bd7b87242a9708b0bc569e8e0a6897be4d9afc12d
|
3 |
+
size 205568226
|
1b11b5100m/global_step2891/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:230d74416f2a36010b0aeed8054e0eee345c5a9449b7196bee1c2f4d78f3429f
|
3 |
+
size 205568151
|
1b11b5100m/global_step2891/bf16_zero_pp_rank_20_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4788c2eb4698566c1676159a357bedaed8a3d881e6f1ba82b48d1cb3b3d46179
|
3 |
+
size 205568226
|
1b11b5100m/global_step2891/bf16_zero_pp_rank_21_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:93e3c08b316a92d5ac6afb52cfe3d2f373bab080dda19b2e19777f5a6cc589d6
|
3 |
+
size 205568034
|
1b11b5100m/global_step2891/bf16_zero_pp_rank_22_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:de8057323ade7890ef81f60f2b74ac6e8d5ac3ae468705ee7edf5de9545f5027
|
3 |
+
size 205568162
|
1b11b5100m/global_step2891/bf16_zero_pp_rank_23_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2c88bf0318aeeb0bb96704665ae829eba1e6dda41d8d85ff5fb7d6cba18e43f9
|
3 |
+
size 205568098
|
1b11b5100m/global_step2891/bf16_zero_pp_rank_24_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:eb032cfe2338ef0eb0a99a66d0391d473838369aeb587c2148d56d4238ad2000
|
3 |
+
size 205568226
|
1b11b5100m/global_step2891/bf16_zero_pp_rank_25_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fcf3795a1825455fa6a229b087838e7fd255e08e53530c1ff50e434b5ba9b583
|
3 |
+
size 205568226
|
1b11b5100m/global_step2891/bf16_zero_pp_rank_26_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1918b9582f6faf60861c22692cb394cfc42bac80d9b8508f117a6ba18d3fd56d
|
3 |
+
size 205568034
|
1b11b5100m/global_step2891/bf16_zero_pp_rank_27_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b877a352589c848a7f208966768ff31cf32c6cc2fee012c7b7404c19fd8ec5d4
|
3 |
+
size 205568162
|
1b11b5100m/global_step2891/bf16_zero_pp_rank_28_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5ad6a10f00b3d074e170bc908f518747d8e2fe08ba7207514ab74247983db776
|
3 |
+
size 205568226
|
1b11b5100m/global_step2891/bf16_zero_pp_rank_29_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1805cf8704c5ab3abe7465a2c03ea6ced18434217c8da107d6a73dc7543f3561
|
3 |
+
size 205568098
|
1b11b5100m/global_step2891/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a4f4918f1bfd75d87896b4fbc003421a8a416cd7a3fcdb0e6cbca0b41f4278f2
|
3 |
+
size 205568151
|
1b11b5100m/global_step2891/bf16_zero_pp_rank_30_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bc838be72907974b7ac55a792e9b3a2afa2d6216764b0dcb3a7a89c2aa0c40e2
|
3 |
+
size 205568226
|
1b11b5100m/global_step2891/bf16_zero_pp_rank_31_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3e3fbf16adb55af4e1c5d3ece6da8e5b84c49e4ecd7714b8238abc6e3cf96b9
|
3 |
+
size 205568162
|
1b11b5100m/global_step2891/bf16_zero_pp_rank_32_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1cc4b6c277db81f6b3c3ec4482357330c64947429ad8636d20a1fb51af9af9c8
|
3 |
+
size 205568226
|
1b11b5100m/global_step2891/bf16_zero_pp_rank_33_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:63c5125b823d77fdfa1d25ac61d6c9471443e12944ea4ee109452318b7514e8f
|
3 |
+
size 205568034
|
1b11b5100m/global_step2891/bf16_zero_pp_rank_34_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d548dd512dbfbb5cfdd7d167a0b9c71a2bf6371e8c83c58f42f70f1a4faa445c
|
3 |
+
size 205568162
|
1b11b5100m/global_step2891/bf16_zero_pp_rank_35_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c4b610733a650e04421cbb5ce99ad503102274b06bdd6dbfbc2db53d40578b6a
|
3 |
+
size 205568290
|
1b11b5100m/global_step2891/bf16_zero_pp_rank_36_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:21474a01f5d09044034f6671f057885aa197ab638d35112507ab55a3163cf8fd
|
3 |
+
size 205568226
|
1b11b5100m/global_step2891/bf16_zero_pp_rank_37_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:101efdd5ec18eff9549a4e35bb4b82efc7c26029cf08c0628ec157f2ca6b1243
|
3 |
+
size 205568098
|
1b11b5100m/global_step2891/bf16_zero_pp_rank_38_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4d6abfd051c4be40295a61e6bfdba7b5bf5c1ee82c5d652c78707259dbca83fd
|
3 |
+
size 205568162
|
1b11b5100m/global_step2891/bf16_zero_pp_rank_39_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a3baa12e7b6b33eac3a6b9c40756ff55b7b3f7fdcd890183f6ccbcc8293a8d3d
|
3 |
+
size 205568098
|
1b11b5100m/global_step2891/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6ea882bebc763dcdba7504b14ee9b7dfd798b89749f255c6fe745a6e3597131e
|
3 |
+
size 205568215
|
1b11b5100m/global_step2891/bf16_zero_pp_rank_40_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6e0f0d104a3aa0059f55d9d758160ef829fdf22a30173bd03e1048d60426940a
|
3 |
+
size 205568162
|
1b11b5100m/global_step2891/bf16_zero_pp_rank_41_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:03c0e65929e60310f9ad4ce7134a844591e29e42dcba804b0965571bc66af6f2
|
3 |
+
size 205568354
|
1b11b5100m/global_step2891/bf16_zero_pp_rank_42_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7c1ce2a4ec7163259fa982a6d28c4ed53cbee68d2ed40361302bde7f85e44d4b
|
3 |
+
size 205568162
|
1b11b5100m/global_step2891/bf16_zero_pp_rank_43_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:25008365654f9c0982e459a840825712eba51106eebcf18db7236f6e0586969e
|
3 |
+
size 205568034
|
1b11b5100m/global_step2891/bf16_zero_pp_rank_44_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e86de698fc9290f7915c8a205e1462457cf6f93df4c17825c91bd35bae100a8a
|
3 |
+
size 205568226
|
1b11b5100m/global_step2891/bf16_zero_pp_rank_45_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:231394627d622c2e6f306ac4507d6834f0e9fc7cbffc8446c0d9de46ee270559
|
3 |
+
size 205568226
|
1b11b5100m/global_step2891/bf16_zero_pp_rank_46_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:44c0991da1a6173b4e6fb3b1f9a2434f3d7fb64a9a2b67cc1cd2c629269c0f21
|
3 |
+
size 205568162
|
1b11b5100m/global_step2891/bf16_zero_pp_rank_47_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0252ba4e649f65ab4196550ec8e794112f27f588c50031a386741977325efee2
|
3 |
+
size 205568162
|
1b11b5100m/global_step2891/bf16_zero_pp_rank_48_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7f637ec37b2c19c5071d4b5e40b4d0fb3e49d094b6a696eaef4e94d3cf714e7d
|
3 |
+
size 205568034
|
1b11b5100m/global_step2891/bf16_zero_pp_rank_49_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3d2510160a1ec149a69c9c280adc4581c89182cdc49dbd8a953ede05c05529e
|
3 |
+
size 205568290
|
1b11b5100m/global_step2891/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3508e9fe28d6d7c837a2cb7ad9fbab8804a060321951fcdffa8929ac67bc0d4c
|
3 |
+
size 205568023
|
1b11b5100m/global_step2891/bf16_zero_pp_rank_50_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c6e4a38516b7e2ba816b6f113649b05b0a7aaacd07feae7afbf74bcfb4f5f284
|
3 |
+
size 205568162
|
1b11b5100m/global_step2891/bf16_zero_pp_rank_51_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6811f003a404942555437e84a0a7de89052aeb0316d0ca5b57f3f8f8f97b7d0f
|
3 |
+
size 205568226
|
1b11b5100m/global_step2891/bf16_zero_pp_rank_52_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0dda45e2e1ee6d6e285503292c83eb4d0fd932e1ceb3145ed13edb8a6a31a70b
|
3 |
+
size 205568290
|
1b11b5100m/global_step2891/bf16_zero_pp_rank_53_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1d83856e3a620a2113c36c4879745b947efa57508e6accb0a8815403645ef087
|
3 |
+
size 205568034
|