eustlb HF staff committed on
Commit
7a0aee6
·
1 Parent(s): 9b6356d

Update max tokens based on 30 sec (max trained sample) * 6.5 tokens/sec

Browse files
Files changed (2) hide show
  1. config.json +2 -1
  2. generation_config.json +3 -1
config.json CHANGED
@@ -5,6 +5,7 @@
5
  "attention_bias": false,
6
  "attention_dropout": 0.0,
7
  "bos_token_id": 1,
 
8
  "decoder_hidden_act": "silu",
9
  "decoder_num_attention_heads": 8,
10
  "decoder_num_hidden_layers": 6,
@@ -19,7 +20,7 @@
19
  "initializer_range": 0.02,
20
  "intermediate_size": 1152,
21
  "is_encoder_decoder": true,
22
- "max_position_embeddings": 512,
23
  "model_type": "moonshine",
24
  "partial_rotary_factor": 0.9,
25
  "rope_scaling": null,
 
5
  "attention_bias": false,
6
  "attention_dropout": 0.0,
7
  "bos_token_id": 1,
8
+ "pad_token_id": 2,
9
  "decoder_hidden_act": "silu",
10
  "decoder_num_attention_heads": 8,
11
  "decoder_num_hidden_layers": 6,
 
20
  "initializer_range": 0.02,
21
  "intermediate_size": 1152,
22
  "is_encoder_decoder": true,
23
+ "max_position_embeddings": 194,
24
  "model_type": "moonshine",
25
  "partial_rotary_factor": 0.9,
26
  "rope_scaling": null,
generation_config.json CHANGED
@@ -2,6 +2,8 @@
2
  "_from_model_config": true,
3
  "bos_token_id": 1,
4
  "decoder_start_token_id": 1,
 
5
  "eos_token_id": 2,
6
- "transformers_version": "4.48.0.dev0"
 
7
  }
 
2
  "_from_model_config": true,
3
  "bos_token_id": 1,
4
  "decoder_start_token_id": 1,
5
+ "pad_token_id": 2,
6
  "eos_token_id": 2,
7
+ "transformers_version": "4.48.0.dev0",
8
+ "max_length": 194
9
  }