shreyaspimpalgaonkar committed on
Commit 061ba76 · verified · 1 Parent(s): a054ace

Update config.json

Files changed (1)
config.json +14 -10
config.json CHANGED
@@ -1,15 +1,17 @@
+{
+  "_name_or_path": "sciphi/triplex",
   "architectures": [
-    "sciphi/triplex"
+    "Phi3ForCausalLM"
   ],
-  "attention_bias": false,
   "attention_dropout": 0.0,
   "auto_map": {
-    "AutoConfig": "microsoft/Phi-3-mini-128k-instruct--configuration_phi3.Phi3Config",
-    "AutoModel": "microsoft/Phi-3-mini-128k-instruct--modeling_phi3.Phi3ForCausalLM",
-    "AutoModelForCausalLM": "microsoft/Phi-3-mini-128k-instruct--modeling_phi3.Phi3ForCausalLM"
+    "AutoConfig": "configuration_phi3.Phi3Config",
+    "AutoModelForCausalLM": "modeling_phi3.Phi3ForCausalLM"
   },
   "bos_token_id": 1,
   "embd_pdrop": 0.0,
+  "eos_token_id": 32000,
+  "hidden_act": "silu",
   "hidden_size": 3072,
   "initializer_range": 0.02,
   "intermediate_size": 8192,
@@ -17,6 +19,8 @@
   "model_type": "phi3",
   "num_attention_heads": 32,
   "num_hidden_layers": 32,
+  "num_key_value_heads": 32,
+  "original_max_position_embeddings": 4096,
   "pad_token_id": 32000,
   "resid_pdrop": 0.0,
   "rms_norm_eps": 1e-05,
@@ -121,14 +125,14 @@
       2.8999999999999977,
       3.049999999999997
     ],
-    "type": "yarn"
+    "type": "longrope"
   },
   "rope_theta": 10000.0,
   "sliding_window": 262144,
   "tie_word_embeddings": false,
   "torch_dtype": "bfloat16",
-  "transformers_version": "4.42.3",
-  "use_cache": false,
-
+  "transformers_version": "4.40.2",
+  "use_cache": true,
+  "attention_bias": false,
   "vocab_size": 32064
-}
+}
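
For reference, a minimal sketch of loading the model with this updated config via transformers. It assumes the repository also ships the configuration_phi3.py and modeling_phi3.py files that the new "auto_map" entries point to, which is why trust_remote_code=True is passed; the model id "sciphi/triplex" is taken from "_name_or_path" in the config.

# Minimal sketch: load the updated config and model.
# trust_remote_code=True is needed because "auto_map" now references
# in-repo configuration_phi3.py / modeling_phi3.py (assumed present).
import torch
from transformers import AutoConfig, AutoModelForCausalLM

config = AutoConfig.from_pretrained("sciphi/triplex", trust_remote_code=True)
print(config.architectures)         # ["Phi3ForCausalLM"]
print(config.rope_scaling["type"])  # "longrope"

model = AutoModelForCausalLM.from_pretrained(
    "sciphi/triplex",
    torch_dtype=torch.bfloat16,  # matches "torch_dtype" in the config
    trust_remote_code=True,
)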