vikp committed on
Commit
8429f44
1 Parent(s): 6352ac1

Upload model

Browse files
Files changed (3) hide show
  1. config.json +13 -13
  2. generation_config.json +0 -1
  3. model.safetensors +2 -2
config.json CHANGED
@@ -1,5 +1,5 @@
1
  {
2
- "_name_or_path": "vikp/order2",
3
  "architectures": [
4
  "OrderVisionEncoderDecoderModel"
5
  ],
@@ -23,7 +23,7 @@
23
  "decoder_attention_heads": 16,
24
  "decoder_ffn_dim": 4096,
25
  "decoder_layerdrop": 0.0,
26
- "decoder_layers": 4,
27
  "decoder_start_token_id": null,
28
  "diversity_penalty": 0.0,
29
  "do_sample": false,
@@ -52,10 +52,11 @@
52
  "LABEL_1": 1
53
  },
54
  "length_penalty": 1.0,
55
- "max_height": 1005,
56
- "max_length": 256,
57
  "max_position_embeddings": 1536,
58
- "max_width": 1005,
 
59
  "min_length": 0,
60
  "model_type": "mbart",
61
  "no_repeat_ngram_size": 0,
@@ -65,7 +66,6 @@
65
  "num_return_sequences": 1,
66
  "output_attentions": false,
67
  "output_hidden_states": false,
68
- "output_scale": 1000,
69
  "output_scores": false,
70
  "pad_token_id": 1,
71
  "prefix": null,
@@ -91,7 +91,7 @@
91
  "typical_p": 1.0,
92
  "use_bfloat16": false,
93
  "use_cache": true,
94
- "vocab_size": 57525
95
  },
96
  "encoder": {
97
  "_name_or_path": "vikp/donut-encoder",
@@ -107,10 +107,10 @@
107
  "cross_attention_hidden_size": null,
108
  "decoder_start_token_id": null,
109
  "depths": [
110
- 3,
111
- 4,
112
  14,
113
- 3
114
  ],
115
  "diversity_penalty": 0.0,
116
  "do_sample": false,
@@ -186,14 +186,14 @@
186
  "torch_dtype": "float32",
187
  "torchscript": false,
188
  "typical_p": 1.0,
189
- "use_2d_embeddings": true,
190
- "use_absolute_embeddings": false,
191
  "use_bfloat16": false,
192
  "window_size": 7
193
  },
194
  "is_encoder_decoder": true,
195
  "model_type": "vision-encoder-decoder",
196
  "tie_word_embeddings": false,
197
- "torch_dtype": "float16",
198
  "transformers_version": "4.36.2"
199
  }
 
1
  {
2
+ "_name_or_path": "vikp/order_hr",
3
  "architectures": [
4
  "OrderVisionEncoderDecoderModel"
5
  ],
 
23
  "decoder_attention_heads": 16,
24
  "decoder_ffn_dim": 4096,
25
  "decoder_layerdrop": 0.0,
26
+ "decoder_layers": 3,
27
  "decoder_start_token_id": null,
28
  "diversity_penalty": 0.0,
29
  "do_sample": false,
 
52
  "LABEL_1": 1
53
  },
54
  "length_penalty": 1.0,
55
+ "max_height": 1285,
56
+ "max_length": 20,
57
  "max_position_embeddings": 1536,
58
+ "max_target_positions": 517,
59
+ "max_width": 1285,
60
  "min_length": 0,
61
  "model_type": "mbart",
62
  "no_repeat_ngram_size": 0,
 
66
  "num_return_sequences": 1,
67
  "output_attentions": false,
68
  "output_hidden_states": false,
 
69
  "output_scores": false,
70
  "pad_token_id": 1,
71
  "prefix": null,
 
91
  "typical_p": 1.0,
92
  "use_bfloat16": false,
93
  "use_cache": true,
94
+ "vocab_size": 261
95
  },
96
  "encoder": {
97
  "_name_or_path": "vikp/donut-encoder",
 
107
  "cross_attention_hidden_size": null,
108
  "decoder_start_token_id": null,
109
  "depths": [
110
+ 2,
111
+ 2,
112
  14,
113
+ 2
114
  ],
115
  "diversity_penalty": 0.0,
116
  "do_sample": false,
 
186
  "torch_dtype": "float32",
187
  "torchscript": false,
188
  "typical_p": 1.0,
189
+ "use_2d_embeddings": false,
190
+ "use_absolute_embeddings": true,
191
  "use_bfloat16": false,
192
  "window_size": 7
193
  },
194
  "is_encoder_decoder": true,
195
  "model_type": "vision-encoder-decoder",
196
  "tie_word_embeddings": false,
197
+ "torch_dtype": "float32",
198
  "transformers_version": "4.36.2"
199
  }
generation_config.json CHANGED
@@ -3,7 +3,6 @@
3
  "bos_token_id": 0,
4
  "eos_token_id": 2,
5
  "forced_eos_token_id": 2,
6
- "max_length": 256,
7
  "pad_token_id": 1,
8
  "transformers_version": "4.36.2"
9
  }
 
3
  "bos_token_id": 0,
4
  "eos_token_id": 2,
5
  "forced_eos_token_id": 2,
 
6
  "pad_token_id": 1,
7
  "transformers_version": "4.36.2"
8
  }
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:bab3677b1d27a835e7f6ca54f719409789a9892f5b56f13b887858fef8415b0b
3
- size 306486136
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:76385baeaf50eab204bbd39b7ee7fb47af2763ff3319a088430f1eecd6776f13
3
+ size 550040752