maykcaldas committed on
Commit
603e4af
·
1 Parent(s): 5b69007

Upload FlaxBertForPreTraining

Browse files
Files changed (2) hide show
  1. config.json +17 -37
  2. flax_model.msgpack +2 -2
config.json CHANGED
@@ -1,43 +1,23 @@
1
  {
2
- "activation_dropout": 0.0,
3
- "activation_function": "relu",
4
  "architectures": [
5
- "BartModel"
6
  ],
7
- "attention_dropout": 0.0,
8
- "bos_token_id": 14,
9
- "classifier_dropout": 0.0,
10
- "d_model": 1024,
11
- "decoder_attention_heads": 4,
12
- "decoder_ffn_dim": 1024,
13
- "decoder_layerdrop": 0.0,
14
- "decoder_layers": 6,
15
- "decoder_start_token_id": 2,
16
- "dropout": 0.1,
17
- "encoder_attention_heads": 4,
18
- "encoder_ffn_dim": 1024,
19
- "encoder_layerdrop": 0.0,
20
- "encoder_layers": 6,
21
- "eos_token_id": 82,
22
- "forced_eos_token_id": 82,
23
- "id2label": {
24
- "0": "LABEL_0",
25
- "1": "LABEL_1",
26
- "2": "LABEL_2"
27
- },
28
- "init_std": 0.02,
29
- "is_encoder_decoder": true,
30
- "label2id": {
31
- "LABEL_0": 0,
32
- "LABEL_1": 1,
33
- "LABEL_2": 2
34
- },
35
- "max_position_embeddings": 1024,
36
- "model_type": "bart",
37
  "num_hidden_layers": 6,
38
- "pad_token_id": 18,
39
- "scale_embedding": false,
40
- "transformers_version": "4.21.2",
 
41
  "use_cache": true,
42
- "vocab_size": 84
43
  }
 
1
  {
 
 
2
  "architectures": [
3
+ "BertForPreTraining"
4
  ],
5
+ "attention_probs_dropout_prob": 0.1,
6
+ "classifier_dropout": null,
7
+ "hidden_act": "gelu",
8
+ "hidden_dropout_prob": 0.1,
9
+ "hidden_size": 2048,
10
+ "initializer_range": 0.02,
11
+ "intermediate_size": 1024,
12
+ "layer_norm_eps": 1e-12,
13
+ "max_position_embeddings": 512,
14
+ "model_type": "bert",
15
+ "num_attention_heads": 8,
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
16
  "num_hidden_layers": 6,
17
+ "pad_token_id": 4,
18
+ "position_embedding_type": "absolute",
19
+ "transformers_version": "4.25.1",
20
+ "type_vocab_size": 2,
21
  "use_cache": true,
22
+ "vocab_size": 473
23
  }
flax_model.msgpack CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8f30905e2a787c470160818dc6924585c26cc59f06586ae8d6d889fbc8e24c60
3
- size 412066738
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d3b476a0ba630169b9d88d7723db6c410c71c2eebad5dab92695661d7db5e345
3
+ size 545494790