katuni4ka commited on
Commit
6d9a937
·
verified ·
1 Parent(s): fbb330d

Upload 12 files

Browse files
.gitattributes CHANGED
@@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
 
 
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
+ tokenizer/tokenizer.json filter=lfs diff=lfs merge=lfs -text
model_index.json ADDED
@@ -0,0 +1,24 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_class_name": "SanaPipeline",
3
+ "_diffusers_version": "0.32.1",
4
+ "scheduler": [
5
+ "diffusers",
6
+ "FlowMatchEulerDiscreteScheduler"
7
+ ],
8
+ "text_encoder": [
9
+ "transformers",
10
+ "Gemma2Model"
11
+ ],
12
+ "tokenizer": [
13
+ "transformers",
14
+ "GemmaTokenizer"
15
+ ],
16
+ "transformer": [
17
+ "diffusers",
18
+ "SanaTransformer2DModel"
19
+ ],
20
+ "vae": [
21
+ "diffusers",
22
+ "AutoencoderDC"
23
+ ]
24
+ }
scheduler/scheduler_config.json ADDED
@@ -0,0 +1,16 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_class_name": "FlowMatchEulerDiscreteScheduler",
3
+ "_diffusers_version": "0.32.1",
4
+ "base_image_seq_len": 256,
5
+ "base_shift": 0.5,
6
+ "invert_sigmas": false,
7
+ "max_image_seq_len": 4096,
8
+ "max_shift": 1.15,
9
+ "num_train_timesteps": 1000,
10
+ "shift": 7.0,
11
+ "shift_terminal": null,
12
+ "use_beta_sigmas": false,
13
+ "use_dynamic_shifting": false,
14
+ "use_exponential_sigmas": false,
15
+ "use_karras_sigmas": false
16
+ }
text_encoder/config.json ADDED
@@ -0,0 +1,31 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "architectures": [
3
+ "Gemma2Model"
4
+ ],
5
+ "attention_bias": false,
6
+ "attention_dropout": 0.0,
7
+ "attn_logit_softcapping": 50.0,
8
+ "bos_token_id": 2,
9
+ "cache_implementation": "hybrid",
10
+ "eos_token_id": 1,
11
+ "final_logit_softcapping": 30.0,
12
+ "head_dim": 16,
13
+ "hidden_activation": "gelu_pytorch_tanh",
14
+ "hidden_size": 8,
15
+ "initializer_range": 0.02,
16
+ "intermediate_size": 64,
17
+ "max_position_embeddings": 8192,
18
+ "model_type": "gemma2",
19
+ "num_attention_heads": 2,
20
+ "num_hidden_layers": 1,
21
+ "num_key_value_heads": 2,
22
+ "pad_token_id": 0,
23
+ "query_pre_attn_scalar": 224,
24
+ "rms_norm_eps": 1e-06,
25
+ "rope_theta": 10000.0,
26
+ "sliding_window": 4096,
27
+ "torch_dtype": "float32",
28
+ "transformers_version": "4.46.3",
29
+ "use_cache": true,
30
+ "vocab_size": 256000
31
+ }
text_encoder/model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fe4b97a4752fe2b5752f57a719674799c95d1c6b1c6a6222a4f294c8a7f0c4e8
3
+ size 8203696
tokenizer/special_tokens_map.json ADDED
@@ -0,0 +1,30 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "bos_token": {
3
+ "content": "<bos>",
4
+ "lstrip": false,
5
+ "normalized": false,
6
+ "rstrip": false,
7
+ "single_word": false
8
+ },
9
+ "eos_token": {
10
+ "content": "<eos>",
11
+ "lstrip": false,
12
+ "normalized": false,
13
+ "rstrip": false,
14
+ "single_word": false
15
+ },
16
+ "pad_token": {
17
+ "content": "<pad>",
18
+ "lstrip": false,
19
+ "normalized": false,
20
+ "rstrip": false,
21
+ "single_word": false
22
+ },
23
+ "unk_token": {
24
+ "content": "<unk>",
25
+ "lstrip": false,
26
+ "normalized": false,
27
+ "rstrip": false,
28
+ "single_word": false
29
+ }
30
+ }
tokenizer/tokenizer.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5f7eee611703c5ce5d1eee32d9cdcfe465647b8aff0c1dfb3bed7ad7dbb05060
3
+ size 34362873
tokenizer/tokenizer.model ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6969e64047744a44bb3abfb5c50f8de0f7ed8b571d5444426ef931f651d1a0ef
3
+ size 4241111
tokenizer/tokenizer_config.json ADDED
@@ -0,0 +1,50 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "add_bos_token": true,
3
+ "add_eos_token": false,
4
+ "added_tokens_decoder": {
5
+ "0": {
6
+ "content": "<pad>",
7
+ "lstrip": false,
8
+ "normalized": false,
9
+ "rstrip": false,
10
+ "single_word": false,
11
+ "special": true
12
+ },
13
+ "1": {
14
+ "content": "<eos>",
15
+ "lstrip": false,
16
+ "normalized": false,
17
+ "rstrip": false,
18
+ "single_word": false,
19
+ "special": true
20
+ },
21
+ "2": {
22
+ "content": "<bos>",
23
+ "lstrip": false,
24
+ "normalized": false,
25
+ "rstrip": false,
26
+ "single_word": false,
27
+ "special": true
28
+ },
29
+ "3": {
30
+ "content": "<unk>",
31
+ "lstrip": false,
32
+ "normalized": false,
33
+ "rstrip": false,
34
+ "single_word": false,
35
+ "special": true
36
+ }
37
+ },
38
+ "bos_token": "<bos>",
39
+ "chat_template": "{% for message in messages %}{{'<|im_start|>' + message['role'] + '\n' + message['content'] + '<|im_end|>' + '\n'}}{% endfor %}{% if add_generation_prompt %}{{ '<|im_start|>assistant\n' }}{% endif %}",
40
+ "clean_up_tokenization_spaces": false,
41
+ "eos_token": "<eos>",
42
+ "legacy": null,
43
+ "model_max_length": 1000000000000000019884624838656,
44
+ "pad_token": "<pad>",
45
+ "sp_model_kwargs": {},
46
+ "spaces_between_special_tokens": false,
47
+ "tokenizer_class": "GemmaTokenizer",
48
+ "unk_token": "<unk>",
49
+ "use_default_system_prompt": false
50
+ }
transformer/config.json ADDED
@@ -0,0 +1,21 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_class_name": "SanaTransformer2DModel",
3
+ "_diffusers_version": "0.32.1",
4
+ "attention_bias": false,
5
+ "attention_head_dim": 4,
6
+ "caption_channels": 8,
7
+ "cross_attention_dim": 8,
8
+ "cross_attention_head_dim": 4,
9
+ "dropout": 0.0,
10
+ "in_channels": 4,
11
+ "interpolation_scale": null,
12
+ "mlp_ratio": 2.5,
13
+ "norm_elementwise_affine": false,
14
+ "norm_eps": 1e-06,
15
+ "num_attention_heads": 2,
16
+ "num_cross_attention_heads": 2,
17
+ "num_layers": 2,
18
+ "out_channels": 4,
19
+ "patch_size": 2,
20
+ "sample_size": 32
21
+ }
transformer/diffusion_pytorch_model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:290dbea496c321c14a6d6eff1e8700b98236e81ffddbc55257723cba98f1d3fe
3
+ size 29504
vae/config.json ADDED
@@ -0,0 +1,48 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_class_name": "AutoencoderDC",
3
+ "_diffusers_version": "0.32.1",
4
+ "attention_head_dim": 4,
5
+ "decoder_act_fns": "silu",
6
+ "decoder_block_out_channels": [
7
+ 8,
8
+ 8
9
+ ],
10
+ "decoder_block_types": [
11
+ "ResBlock",
12
+ "EfficientViTBlock"
13
+ ],
14
+ "decoder_layers_per_block": [
15
+ 1,
16
+ 1
17
+ ],
18
+ "decoder_norm_types": "rms_norm",
19
+ "decoder_qkv_multiscales": [
20
+ [],
21
+ [
22
+ 5
23
+ ]
24
+ ],
25
+ "downsample_block_type": "conv",
26
+ "encoder_block_out_channels": [
27
+ 8,
28
+ 8
29
+ ],
30
+ "encoder_block_types": [
31
+ "ResBlock",
32
+ "EfficientViTBlock"
33
+ ],
34
+ "encoder_layers_per_block": [
35
+ 1,
36
+ 1
37
+ ],
38
+ "encoder_qkv_multiscales": [
39
+ [],
40
+ [
41
+ 5
42
+ ]
43
+ ],
44
+ "in_channels": 3,
45
+ "latent_channels": 4,
46
+ "scaling_factor": 0.41407,
47
+ "upsample_block_type": "interpolate"
48
+ }
vae/diffusion_pytorch_model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4ec48485ff48bac9b212007be0398bf69fe296bda1b7538030636aaeacd463ad
3
+ size 43900