neeleshg23 committed on
Commit
36f65f5
·
verified ·
1 Parent(s): 2b82429

Training in progress, step 2500

Browse files
Files changed (3) hide show
  1. config.json +2 -2
  2. model.safetensors +2 -2
  3. training_args.bin +3 -0
config.json CHANGED
@@ -1,5 +1,5 @@
1
  {
2
- "_name_or_path": "./results/checkpoint-10000",
3
  "architectures": [
4
  "MambaForCausalLM"
5
  ],
@@ -24,7 +24,7 @@
24
  "time_step_min": 0.001,
25
  "time_step_rank": 100,
26
  "time_step_scale": 1.0,
27
- "torch_dtype": "float32",
28
  "transformers_version": "4.46.2",
29
  "use_bias": false,
30
  "use_cache": true,
 
1
  {
2
+ "_name_or_path": "neeleshg23/draft-mamba-2-1600",
3
  "architectures": [
4
  "MambaForCausalLM"
5
  ],
 
24
  "time_step_min": 0.001,
25
  "time_step_rank": 100,
26
  "time_step_scale": 1.0,
27
+ "torch_dtype": "bfloat16",
28
  "transformers_version": "4.46.2",
29
  "use_bias": false,
30
  "use_cache": true,
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a7b38269647977e0f44263bc88f49af1c7ab50403e0074befb3b1659faab65d5
3
- size 334235984
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9a5f3700364aa7836e2ef3e15b8d47eef8fc533df9297f97933ed3714451e1ae
3
+ size 167323992
training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:740f3b1e9446d357f909219a84d69f2040974d954b81b82be1b89898329552bb
3
+ size 5240