2481asd committed on
Commit
8991a12
·
1 Parent(s): e39162b

Delete controlnet

Browse files
Files changed (28) hide show
  1. controlnet/control_v11e_sd15_ip2p.yaml +0 -79
  2. controlnet/control_v11e_sd15_ip2p_fp16.safetensors +0 -3
  3. controlnet/control_v11e_sd15_shuffle.yaml +0 -80
  4. controlnet/control_v11e_sd15_shuffle_fp16.safetensors +0 -3
  5. controlnet/control_v11f1e_sd15_tile.yaml +0 -79
  6. controlnet/control_v11f1e_sd15_tile_fp16.safetensors +0 -3
  7. controlnet/control_v11f1p_sd15_depth.yaml +0 -79
  8. controlnet/control_v11f1p_sd15_depth_fp16.safetensors +0 -3
  9. controlnet/control_v11p_sd15_canny.yaml +0 -79
  10. controlnet/control_v11p_sd15_canny_fp16.safetensors +0 -3
  11. controlnet/control_v11p_sd15_inpaint.yaml +0 -79
  12. controlnet/control_v11p_sd15_inpaint_fp16.safetensors +0 -3
  13. controlnet/control_v11p_sd15_lineart.yaml +0 -79
  14. controlnet/control_v11p_sd15_lineart_fp16.safetensors +0 -3
  15. controlnet/control_v11p_sd15_mlsd.yaml +0 -79
  16. controlnet/control_v11p_sd15_mlsd_fp16.safetensors +0 -3
  17. controlnet/control_v11p_sd15_normalbae.yaml +0 -79
  18. controlnet/control_v11p_sd15_normalbae_fp16.safetensors +0 -3
  19. controlnet/control_v11p_sd15_openpose.yaml +0 -79
  20. controlnet/control_v11p_sd15_openpose_fp16.safetensors +0 -3
  21. controlnet/control_v11p_sd15_scribble.yaml +0 -79
  22. controlnet/control_v11p_sd15_scribble_fp16.safetensors +0 -3
  23. controlnet/control_v11p_sd15_seg.yaml +0 -79
  24. controlnet/control_v11p_sd15_seg_fp16.safetensors +0 -3
  25. controlnet/control_v11p_sd15_softedge.yaml +0 -79
  26. controlnet/control_v11p_sd15_softedge_fp16.safetensors +0 -3
  27. controlnet/control_v11p_sd15s2_lineart_anime.yaml +0 -79
  28. controlnet/control_v11p_sd15s2_lineart_anime_fp16.safetensors +0 -3
controlnet/control_v11e_sd15_ip2p.yaml DELETED
@@ -1,79 +0,0 @@
1
- model:
2
- target: cldm.cldm.ControlLDM
3
- params:
4
- linear_start: 0.00085
5
- linear_end: 0.0120
6
- num_timesteps_cond: 1
7
- log_every_t: 200
8
- timesteps: 1000
9
- first_stage_key: "jpg"
10
- cond_stage_key: "txt"
11
- control_key: "hint"
12
- image_size: 64
13
- channels: 4
14
- cond_stage_trainable: false
15
- conditioning_key: crossattn
16
- monitor: val/loss_simple_ema
17
- scale_factor: 0.18215
18
- use_ema: False
19
- only_mid_control: False
20
-
21
- control_stage_config:
22
- target: cldm.cldm.ControlNet
23
- params:
24
- image_size: 32 # unused
25
- in_channels: 4
26
- hint_channels: 3
27
- model_channels: 320
28
- attention_resolutions: [ 4, 2, 1 ]
29
- num_res_blocks: 2
30
- channel_mult: [ 1, 2, 4, 4 ]
31
- num_heads: 8
32
- use_spatial_transformer: True
33
- transformer_depth: 1
34
- context_dim: 768
35
- use_checkpoint: True
36
- legacy: False
37
-
38
- unet_config:
39
- target: cldm.cldm.ControlledUnetModel
40
- params:
41
- image_size: 32 # unused
42
- in_channels: 4
43
- out_channels: 4
44
- model_channels: 320
45
- attention_resolutions: [ 4, 2, 1 ]
46
- num_res_blocks: 2
47
- channel_mult: [ 1, 2, 4, 4 ]
48
- num_heads: 8
49
- use_spatial_transformer: True
50
- transformer_depth: 1
51
- context_dim: 768
52
- use_checkpoint: True
53
- legacy: False
54
-
55
- first_stage_config:
56
- target: ldm.models.autoencoder.AutoencoderKL
57
- params:
58
- embed_dim: 4
59
- monitor: val/rec_loss
60
- ddconfig:
61
- double_z: true
62
- z_channels: 4
63
- resolution: 256
64
- in_channels: 3
65
- out_ch: 3
66
- ch: 128
67
- ch_mult:
68
- - 1
69
- - 2
70
- - 4
71
- - 4
72
- num_res_blocks: 2
73
- attn_resolutions: []
74
- dropout: 0.0
75
- lossconfig:
76
- target: torch.nn.Identity
77
-
78
- cond_stage_config:
79
- target: ldm.modules.encoders.modules.FrozenCLIPEmbedder
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
controlnet/control_v11e_sd15_ip2p_fp16.safetensors DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:11e7dbe52a73f66e701c1faa77b8a2cb0ee3abd721e1cae31123f5b299093435
3
- size 722601100
 
 
 
 
controlnet/control_v11e_sd15_shuffle.yaml DELETED
@@ -1,80 +0,0 @@
1
- model:
2
- target: cldm.cldm.ControlLDM
3
- params:
4
- linear_start: 0.00085
5
- linear_end: 0.0120
6
- num_timesteps_cond: 1
7
- log_every_t: 200
8
- timesteps: 1000
9
- first_stage_key: "jpg"
10
- cond_stage_key: "txt"
11
- control_key: "hint"
12
- image_size: 64
13
- channels: 4
14
- cond_stage_trainable: false
15
- conditioning_key: crossattn
16
- monitor: val/loss_simple_ema
17
- scale_factor: 0.18215
18
- use_ema: False
19
- only_mid_control: False
20
- global_average_pooling: True
21
-
22
- control_stage_config:
23
- target: cldm.cldm.ControlNet
24
- params:
25
- image_size: 32 # unused
26
- in_channels: 4
27
- hint_channels: 3
28
- model_channels: 320
29
- attention_resolutions: [ 4, 2, 1 ]
30
- num_res_blocks: 2
31
- channel_mult: [ 1, 2, 4, 4 ]
32
- num_heads: 8
33
- use_spatial_transformer: True
34
- transformer_depth: 1
35
- context_dim: 768
36
- use_checkpoint: True
37
- legacy: False
38
-
39
- unet_config:
40
- target: cldm.cldm.ControlledUnetModel
41
- params:
42
- image_size: 32 # unused
43
- in_channels: 4
44
- out_channels: 4
45
- model_channels: 320
46
- attention_resolutions: [ 4, 2, 1 ]
47
- num_res_blocks: 2
48
- channel_mult: [ 1, 2, 4, 4 ]
49
- num_heads: 8
50
- use_spatial_transformer: True
51
- transformer_depth: 1
52
- context_dim: 768
53
- use_checkpoint: True
54
- legacy: False
55
-
56
- first_stage_config:
57
- target: ldm.models.autoencoder.AutoencoderKL
58
- params:
59
- embed_dim: 4
60
- monitor: val/rec_loss
61
- ddconfig:
62
- double_z: true
63
- z_channels: 4
64
- resolution: 256
65
- in_channels: 3
66
- out_ch: 3
67
- ch: 128
68
- ch_mult:
69
- - 1
70
- - 2
71
- - 4
72
- - 4
73
- num_res_blocks: 2
74
- attn_resolutions: []
75
- dropout: 0.0
76
- lossconfig:
77
- target: torch.nn.Identity
78
-
79
- cond_stage_config:
80
- target: ldm.modules.encoders.modules.FrozenCLIPEmbedder
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
controlnet/control_v11e_sd15_shuffle_fp16.safetensors DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:8cc77ae071888abefd6e80bafce3d2574f9f6f8aac7ab205db98fb12a53c1132
3
- size 722601100
 
 
 
 
controlnet/control_v11f1e_sd15_tile.yaml DELETED
@@ -1,79 +0,0 @@
1
- model:
2
- target: cldm.cldm.ControlLDM
3
- params:
4
- linear_start: 0.00085
5
- linear_end: 0.0120
6
- num_timesteps_cond: 1
7
- log_every_t: 200
8
- timesteps: 1000
9
- first_stage_key: "jpg"
10
- cond_stage_key: "txt"
11
- control_key: "hint"
12
- image_size: 64
13
- channels: 4
14
- cond_stage_trainable: false
15
- conditioning_key: crossattn
16
- monitor: val/loss_simple_ema
17
- scale_factor: 0.18215
18
- use_ema: False
19
- only_mid_control: False
20
-
21
- control_stage_config:
22
- target: cldm.cldm.ControlNet
23
- params:
24
- image_size: 32 # unused
25
- in_channels: 4
26
- hint_channels: 3
27
- model_channels: 320
28
- attention_resolutions: [ 4, 2, 1 ]
29
- num_res_blocks: 2
30
- channel_mult: [ 1, 2, 4, 4 ]
31
- num_heads: 8
32
- use_spatial_transformer: True
33
- transformer_depth: 1
34
- context_dim: 768
35
- use_checkpoint: True
36
- legacy: False
37
-
38
- unet_config:
39
- target: cldm.cldm.ControlledUnetModel
40
- params:
41
- image_size: 32 # unused
42
- in_channels: 4
43
- out_channels: 4
44
- model_channels: 320
45
- attention_resolutions: [ 4, 2, 1 ]
46
- num_res_blocks: 2
47
- channel_mult: [ 1, 2, 4, 4 ]
48
- num_heads: 8
49
- use_spatial_transformer: True
50
- transformer_depth: 1
51
- context_dim: 768
52
- use_checkpoint: True
53
- legacy: False
54
-
55
- first_stage_config:
56
- target: ldm.models.autoencoder.AutoencoderKL
57
- params:
58
- embed_dim: 4
59
- monitor: val/rec_loss
60
- ddconfig:
61
- double_z: true
62
- z_channels: 4
63
- resolution: 256
64
- in_channels: 3
65
- out_ch: 3
66
- ch: 128
67
- ch_mult:
68
- - 1
69
- - 2
70
- - 4
71
- - 4
72
- num_res_blocks: 2
73
- attn_resolutions: []
74
- dropout: 0.0
75
- lossconfig:
76
- target: torch.nn.Identity
77
-
78
- cond_stage_config:
79
- target: ldm.modules.encoders.modules.FrozenCLIPEmbedder
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
controlnet/control_v11f1e_sd15_tile_fp16.safetensors DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:2f31868eedb243a77932e3c63907a6ba0a2058b6d65b5c27b89ee1b7f618ea33
3
- size 722601104
 
 
 
 
controlnet/control_v11f1p_sd15_depth.yaml DELETED
@@ -1,79 +0,0 @@
1
- model:
2
- target: cldm.cldm.ControlLDM
3
- params:
4
- linear_start: 0.00085
5
- linear_end: 0.0120
6
- num_timesteps_cond: 1
7
- log_every_t: 200
8
- timesteps: 1000
9
- first_stage_key: "jpg"
10
- cond_stage_key: "txt"
11
- control_key: "hint"
12
- image_size: 64
13
- channels: 4
14
- cond_stage_trainable: false
15
- conditioning_key: crossattn
16
- monitor: val/loss_simple_ema
17
- scale_factor: 0.18215
18
- use_ema: False
19
- only_mid_control: False
20
-
21
- control_stage_config:
22
- target: cldm.cldm.ControlNet
23
- params:
24
- image_size: 32 # unused
25
- in_channels: 4
26
- hint_channels: 3
27
- model_channels: 320
28
- attention_resolutions: [ 4, 2, 1 ]
29
- num_res_blocks: 2
30
- channel_mult: [ 1, 2, 4, 4 ]
31
- num_heads: 8
32
- use_spatial_transformer: True
33
- transformer_depth: 1
34
- context_dim: 768
35
- use_checkpoint: True
36
- legacy: False
37
-
38
- unet_config:
39
- target: cldm.cldm.ControlledUnetModel
40
- params:
41
- image_size: 32 # unused
42
- in_channels: 4
43
- out_channels: 4
44
- model_channels: 320
45
- attention_resolutions: [ 4, 2, 1 ]
46
- num_res_blocks: 2
47
- channel_mult: [ 1, 2, 4, 4 ]
48
- num_heads: 8
49
- use_spatial_transformer: True
50
- transformer_depth: 1
51
- context_dim: 768
52
- use_checkpoint: True
53
- legacy: False
54
-
55
- first_stage_config:
56
- target: ldm.models.autoencoder.AutoencoderKL
57
- params:
58
- embed_dim: 4
59
- monitor: val/rec_loss
60
- ddconfig:
61
- double_z: true
62
- z_channels: 4
63
- resolution: 256
64
- in_channels: 3
65
- out_ch: 3
66
- ch: 128
67
- ch_mult:
68
- - 1
69
- - 2
70
- - 4
71
- - 4
72
- num_res_blocks: 2
73
- attn_resolutions: []
74
- dropout: 0.0
75
- lossconfig:
76
- target: torch.nn.Identity
77
-
78
- cond_stage_config:
79
- target: ldm.modules.encoders.modules.FrozenCLIPEmbedder
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
controlnet/control_v11f1p_sd15_depth_fp16.safetensors DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:1c4a79aa52fb63f607cb9ff479ea5aa1923b6ceb21267bd14b69bd05d7b617be
3
- size 722601100
 
 
 
 
controlnet/control_v11p_sd15_canny.yaml DELETED
@@ -1,79 +0,0 @@
1
- model:
2
- target: cldm.cldm.ControlLDM
3
- params:
4
- linear_start: 0.00085
5
- linear_end: 0.0120
6
- num_timesteps_cond: 1
7
- log_every_t: 200
8
- timesteps: 1000
9
- first_stage_key: "jpg"
10
- cond_stage_key: "txt"
11
- control_key: "hint"
12
- image_size: 64
13
- channels: 4
14
- cond_stage_trainable: false
15
- conditioning_key: crossattn
16
- monitor: val/loss_simple_ema
17
- scale_factor: 0.18215
18
- use_ema: False
19
- only_mid_control: False
20
-
21
- control_stage_config:
22
- target: cldm.cldm.ControlNet
23
- params:
24
- image_size: 32 # unused
25
- in_channels: 4
26
- hint_channels: 3
27
- model_channels: 320
28
- attention_resolutions: [ 4, 2, 1 ]
29
- num_res_blocks: 2
30
- channel_mult: [ 1, 2, 4, 4 ]
31
- num_heads: 8
32
- use_spatial_transformer: True
33
- transformer_depth: 1
34
- context_dim: 768
35
- use_checkpoint: True
36
- legacy: False
37
-
38
- unet_config:
39
- target: cldm.cldm.ControlledUnetModel
40
- params:
41
- image_size: 32 # unused
42
- in_channels: 4
43
- out_channels: 4
44
- model_channels: 320
45
- attention_resolutions: [ 4, 2, 1 ]
46
- num_res_blocks: 2
47
- channel_mult: [ 1, 2, 4, 4 ]
48
- num_heads: 8
49
- use_spatial_transformer: True
50
- transformer_depth: 1
51
- context_dim: 768
52
- use_checkpoint: True
53
- legacy: False
54
-
55
- first_stage_config:
56
- target: ldm.models.autoencoder.AutoencoderKL
57
- params:
58
- embed_dim: 4
59
- monitor: val/rec_loss
60
- ddconfig:
61
- double_z: true
62
- z_channels: 4
63
- resolution: 256
64
- in_channels: 3
65
- out_ch: 3
66
- ch: 128
67
- ch_mult:
68
- - 1
69
- - 2
70
- - 4
71
- - 4
72
- num_res_blocks: 2
73
- attn_resolutions: []
74
- dropout: 0.0
75
- lossconfig:
76
- target: torch.nn.Identity
77
-
78
- cond_stage_config:
79
- target: ldm.modules.encoders.modules.FrozenCLIPEmbedder
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
controlnet/control_v11p_sd15_canny_fp16.safetensors DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:8932b66e15aae835b3490dbf989f56c253104cee08a88bf21283762f557c9f10
3
- size 722601100
 
 
 
 
controlnet/control_v11p_sd15_inpaint.yaml DELETED
@@ -1,79 +0,0 @@
1
- model:
2
- target: cldm.cldm.ControlLDM
3
- params:
4
- linear_start: 0.00085
5
- linear_end: 0.0120
6
- num_timesteps_cond: 1
7
- log_every_t: 200
8
- timesteps: 1000
9
- first_stage_key: "jpg"
10
- cond_stage_key: "txt"
11
- control_key: "hint"
12
- image_size: 64
13
- channels: 4
14
- cond_stage_trainable: false
15
- conditioning_key: crossattn
16
- monitor: val/loss_simple_ema
17
- scale_factor: 0.18215
18
- use_ema: False
19
- only_mid_control: False
20
-
21
- control_stage_config:
22
- target: cldm.cldm.ControlNet
23
- params:
24
- image_size: 32 # unused
25
- in_channels: 4
26
- hint_channels: 3
27
- model_channels: 320
28
- attention_resolutions: [ 4, 2, 1 ]
29
- num_res_blocks: 2
30
- channel_mult: [ 1, 2, 4, 4 ]
31
- num_heads: 8
32
- use_spatial_transformer: True
33
- transformer_depth: 1
34
- context_dim: 768
35
- use_checkpoint: True
36
- legacy: False
37
-
38
- unet_config:
39
- target: cldm.cldm.ControlledUnetModel
40
- params:
41
- image_size: 32 # unused
42
- in_channels: 4
43
- out_channels: 4
44
- model_channels: 320
45
- attention_resolutions: [ 4, 2, 1 ]
46
- num_res_blocks: 2
47
- channel_mult: [ 1, 2, 4, 4 ]
48
- num_heads: 8
49
- use_spatial_transformer: True
50
- transformer_depth: 1
51
- context_dim: 768
52
- use_checkpoint: True
53
- legacy: False
54
-
55
- first_stage_config:
56
- target: ldm.models.autoencoder.AutoencoderKL
57
- params:
58
- embed_dim: 4
59
- monitor: val/rec_loss
60
- ddconfig:
61
- double_z: true
62
- z_channels: 4
63
- resolution: 256
64
- in_channels: 3
65
- out_ch: 3
66
- ch: 128
67
- ch_mult:
68
- - 1
69
- - 2
70
- - 4
71
- - 4
72
- num_res_blocks: 2
73
- attn_resolutions: []
74
- dropout: 0.0
75
- lossconfig:
76
- target: torch.nn.Identity
77
-
78
- cond_stage_config:
79
- target: ldm.modules.encoders.modules.FrozenCLIPEmbedder
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
controlnet/control_v11p_sd15_inpaint_fp16.safetensors DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:677a4fe351edecd40cd0d7cc210a8686b59d4e55207317f12319ef746a7a5a89
3
- size 722601100
 
 
 
 
controlnet/control_v11p_sd15_lineart.yaml DELETED
@@ -1,79 +0,0 @@
1
- model:
2
- target: cldm.cldm.ControlLDM
3
- params:
4
- linear_start: 0.00085
5
- linear_end: 0.0120
6
- num_timesteps_cond: 1
7
- log_every_t: 200
8
- timesteps: 1000
9
- first_stage_key: "jpg"
10
- cond_stage_key: "txt"
11
- control_key: "hint"
12
- image_size: 64
13
- channels: 4
14
- cond_stage_trainable: false
15
- conditioning_key: crossattn
16
- monitor: val/loss_simple_ema
17
- scale_factor: 0.18215
18
- use_ema: False
19
- only_mid_control: False
20
-
21
- control_stage_config:
22
- target: cldm.cldm.ControlNet
23
- params:
24
- image_size: 32 # unused
25
- in_channels: 4
26
- hint_channels: 3
27
- model_channels: 320
28
- attention_resolutions: [ 4, 2, 1 ]
29
- num_res_blocks: 2
30
- channel_mult: [ 1, 2, 4, 4 ]
31
- num_heads: 8
32
- use_spatial_transformer: True
33
- transformer_depth: 1
34
- context_dim: 768
35
- use_checkpoint: True
36
- legacy: False
37
-
38
- unet_config:
39
- target: cldm.cldm.ControlledUnetModel
40
- params:
41
- image_size: 32 # unused
42
- in_channels: 4
43
- out_channels: 4
44
- model_channels: 320
45
- attention_resolutions: [ 4, 2, 1 ]
46
- num_res_blocks: 2
47
- channel_mult: [ 1, 2, 4, 4 ]
48
- num_heads: 8
49
- use_spatial_transformer: True
50
- transformer_depth: 1
51
- context_dim: 768
52
- use_checkpoint: True
53
- legacy: False
54
-
55
- first_stage_config:
56
- target: ldm.models.autoencoder.AutoencoderKL
57
- params:
58
- embed_dim: 4
59
- monitor: val/rec_loss
60
- ddconfig:
61
- double_z: true
62
- z_channels: 4
63
- resolution: 256
64
- in_channels: 3
65
- out_ch: 3
66
- ch: 128
67
- ch_mult:
68
- - 1
69
- - 2
70
- - 4
71
- - 4
72
- num_res_blocks: 2
73
- attn_resolutions: []
74
- dropout: 0.0
75
- lossconfig:
76
- target: torch.nn.Identity
77
-
78
- cond_stage_config:
79
- target: ldm.modules.encoders.modules.FrozenCLIPEmbedder
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
controlnet/control_v11p_sd15_lineart_fp16.safetensors DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:10559106d1bb8196298b7a81565ede9279295d2b2df15165b9dbe189994def56
3
- size 722601100
 
 
 
 
controlnet/control_v11p_sd15_mlsd.yaml DELETED
@@ -1,79 +0,0 @@
1
- model:
2
- target: cldm.cldm.ControlLDM
3
- params:
4
- linear_start: 0.00085
5
- linear_end: 0.0120
6
- num_timesteps_cond: 1
7
- log_every_t: 200
8
- timesteps: 1000
9
- first_stage_key: "jpg"
10
- cond_stage_key: "txt"
11
- control_key: "hint"
12
- image_size: 64
13
- channels: 4
14
- cond_stage_trainable: false
15
- conditioning_key: crossattn
16
- monitor: val/loss_simple_ema
17
- scale_factor: 0.18215
18
- use_ema: False
19
- only_mid_control: False
20
-
21
- control_stage_config:
22
- target: cldm.cldm.ControlNet
23
- params:
24
- image_size: 32 # unused
25
- in_channels: 4
26
- hint_channels: 3
27
- model_channels: 320
28
- attention_resolutions: [ 4, 2, 1 ]
29
- num_res_blocks: 2
30
- channel_mult: [ 1, 2, 4, 4 ]
31
- num_heads: 8
32
- use_spatial_transformer: True
33
- transformer_depth: 1
34
- context_dim: 768
35
- use_checkpoint: True
36
- legacy: False
37
-
38
- unet_config:
39
- target: cldm.cldm.ControlledUnetModel
40
- params:
41
- image_size: 32 # unused
42
- in_channels: 4
43
- out_channels: 4
44
- model_channels: 320
45
- attention_resolutions: [ 4, 2, 1 ]
46
- num_res_blocks: 2
47
- channel_mult: [ 1, 2, 4, 4 ]
48
- num_heads: 8
49
- use_spatial_transformer: True
50
- transformer_depth: 1
51
- context_dim: 768
52
- use_checkpoint: True
53
- legacy: False
54
-
55
- first_stage_config:
56
- target: ldm.models.autoencoder.AutoencoderKL
57
- params:
58
- embed_dim: 4
59
- monitor: val/rec_loss
60
- ddconfig:
61
- double_z: true
62
- z_channels: 4
63
- resolution: 256
64
- in_channels: 3
65
- out_ch: 3
66
- ch: 128
67
- ch_mult:
68
- - 1
69
- - 2
70
- - 4
71
- - 4
72
- num_res_blocks: 2
73
- attn_resolutions: []
74
- dropout: 0.0
75
- lossconfig:
76
- target: torch.nn.Identity
77
-
78
- cond_stage_config:
79
- target: ldm.modules.encoders.modules.FrozenCLIPEmbedder
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
controlnet/control_v11p_sd15_mlsd_fp16.safetensors DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:0d689682fcc9341581b788524ab813cda789acdbc16bdbecbd1b9d2221e119b7
3
- size 722601100
 
 
 
 
controlnet/control_v11p_sd15_normalbae.yaml DELETED
@@ -1,79 +0,0 @@
1
- model:
2
- target: cldm.cldm.ControlLDM
3
- params:
4
- linear_start: 0.00085
5
- linear_end: 0.0120
6
- num_timesteps_cond: 1
7
- log_every_t: 200
8
- timesteps: 1000
9
- first_stage_key: "jpg"
10
- cond_stage_key: "txt"
11
- control_key: "hint"
12
- image_size: 64
13
- channels: 4
14
- cond_stage_trainable: false
15
- conditioning_key: crossattn
16
- monitor: val/loss_simple_ema
17
- scale_factor: 0.18215
18
- use_ema: False
19
- only_mid_control: False
20
-
21
- control_stage_config:
22
- target: cldm.cldm.ControlNet
23
- params:
24
- image_size: 32 # unused
25
- in_channels: 4
26
- hint_channels: 3
27
- model_channels: 320
28
- attention_resolutions: [ 4, 2, 1 ]
29
- num_res_blocks: 2
30
- channel_mult: [ 1, 2, 4, 4 ]
31
- num_heads: 8
32
- use_spatial_transformer: True
33
- transformer_depth: 1
34
- context_dim: 768
35
- use_checkpoint: True
36
- legacy: False
37
-
38
- unet_config:
39
- target: cldm.cldm.ControlledUnetModel
40
- params:
41
- image_size: 32 # unused
42
- in_channels: 4
43
- out_channels: 4
44
- model_channels: 320
45
- attention_resolutions: [ 4, 2, 1 ]
46
- num_res_blocks: 2
47
- channel_mult: [ 1, 2, 4, 4 ]
48
- num_heads: 8
49
- use_spatial_transformer: True
50
- transformer_depth: 1
51
- context_dim: 768
52
- use_checkpoint: True
53
- legacy: False
54
-
55
- first_stage_config:
56
- target: ldm.models.autoencoder.AutoencoderKL
57
- params:
58
- embed_dim: 4
59
- monitor: val/rec_loss
60
- ddconfig:
61
- double_z: true
62
- z_channels: 4
63
- resolution: 256
64
- in_channels: 3
65
- out_ch: 3
66
- ch: 128
67
- ch_mult:
68
- - 1
69
- - 2
70
- - 4
71
- - 4
72
- num_res_blocks: 2
73
- attn_resolutions: []
74
- dropout: 0.0
75
- lossconfig:
76
- target: torch.nn.Identity
77
-
78
- cond_stage_config:
79
- target: ldm.modules.encoders.modules.FrozenCLIPEmbedder
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
controlnet/control_v11p_sd15_normalbae_fp16.safetensors DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:79864bfc3a1df58ed35bd92fc8dd1e4d7b85cac424cc427b9049ddc7647cceec
3
- size 722601100
 
 
 
 
controlnet/control_v11p_sd15_openpose.yaml DELETED
@@ -1,79 +0,0 @@
1
- model:
2
- target: cldm.cldm.ControlLDM
3
- params:
4
- linear_start: 0.00085
5
- linear_end: 0.0120
6
- num_timesteps_cond: 1
7
- log_every_t: 200
8
- timesteps: 1000
9
- first_stage_key: "jpg"
10
- cond_stage_key: "txt"
11
- control_key: "hint"
12
- image_size: 64
13
- channels: 4
14
- cond_stage_trainable: false
15
- conditioning_key: crossattn
16
- monitor: val/loss_simple_ema
17
- scale_factor: 0.18215
18
- use_ema: False
19
- only_mid_control: False
20
-
21
- control_stage_config:
22
- target: cldm.cldm.ControlNet
23
- params:
24
- image_size: 32 # unused
25
- in_channels: 4
26
- hint_channels: 3
27
- model_channels: 320
28
- attention_resolutions: [ 4, 2, 1 ]
29
- num_res_blocks: 2
30
- channel_mult: [ 1, 2, 4, 4 ]
31
- num_heads: 8
32
- use_spatial_transformer: True
33
- transformer_depth: 1
34
- context_dim: 768
35
- use_checkpoint: True
36
- legacy: False
37
-
38
- unet_config:
39
- target: cldm.cldm.ControlledUnetModel
40
- params:
41
- image_size: 32 # unused
42
- in_channels: 4
43
- out_channels: 4
44
- model_channels: 320
45
- attention_resolutions: [ 4, 2, 1 ]
46
- num_res_blocks: 2
47
- channel_mult: [ 1, 2, 4, 4 ]
48
- num_heads: 8
49
- use_spatial_transformer: True
50
- transformer_depth: 1
51
- context_dim: 768
52
- use_checkpoint: True
53
- legacy: False
54
-
55
- first_stage_config:
56
- target: ldm.models.autoencoder.AutoencoderKL
57
- params:
58
- embed_dim: 4
59
- monitor: val/rec_loss
60
- ddconfig:
61
- double_z: true
62
- z_channels: 4
63
- resolution: 256
64
- in_channels: 3
65
- out_ch: 3
66
- ch: 128
67
- ch_mult:
68
- - 1
69
- - 2
70
- - 4
71
- - 4
72
- num_res_blocks: 2
73
- attn_resolutions: []
74
- dropout: 0.0
75
- lossconfig:
76
- target: torch.nn.Identity
77
-
78
- cond_stage_config:
79
- target: ldm.modules.encoders.modules.FrozenCLIPEmbedder
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
controlnet/control_v11p_sd15_openpose_fp16.safetensors DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:4003c1da17b0e4ba444e02140e1c0d83bb24b79e4dcfd613c3a554d38f0f89c7
3
- size 722601100
 
 
 
 
controlnet/control_v11p_sd15_scribble.yaml DELETED
@@ -1,79 +0,0 @@
1
- model:
2
- target: cldm.cldm.ControlLDM
3
- params:
4
- linear_start: 0.00085
5
- linear_end: 0.0120
6
- num_timesteps_cond: 1
7
- log_every_t: 200
8
- timesteps: 1000
9
- first_stage_key: "jpg"
10
- cond_stage_key: "txt"
11
- control_key: "hint"
12
- image_size: 64
13
- channels: 4
14
- cond_stage_trainable: false
15
- conditioning_key: crossattn
16
- monitor: val/loss_simple_ema
17
- scale_factor: 0.18215
18
- use_ema: False
19
- only_mid_control: False
20
-
21
- control_stage_config:
22
- target: cldm.cldm.ControlNet
23
- params:
24
- image_size: 32 # unused
25
- in_channels: 4
26
- hint_channels: 3
27
- model_channels: 320
28
- attention_resolutions: [ 4, 2, 1 ]
29
- num_res_blocks: 2
30
- channel_mult: [ 1, 2, 4, 4 ]
31
- num_heads: 8
32
- use_spatial_transformer: True
33
- transformer_depth: 1
34
- context_dim: 768
35
- use_checkpoint: True
36
- legacy: False
37
-
38
- unet_config:
39
- target: cldm.cldm.ControlledUnetModel
40
- params:
41
- image_size: 32 # unused
42
- in_channels: 4
43
- out_channels: 4
44
- model_channels: 320
45
- attention_resolutions: [ 4, 2, 1 ]
46
- num_res_blocks: 2
47
- channel_mult: [ 1, 2, 4, 4 ]
48
- num_heads: 8
49
- use_spatial_transformer: True
50
- transformer_depth: 1
51
- context_dim: 768
52
- use_checkpoint: True
53
- legacy: False
54
-
55
- first_stage_config:
56
- target: ldm.models.autoencoder.AutoencoderKL
57
- params:
58
- embed_dim: 4
59
- monitor: val/rec_loss
60
- ddconfig:
61
- double_z: true
62
- z_channels: 4
63
- resolution: 256
64
- in_channels: 3
65
- out_ch: 3
66
- ch: 128
67
- ch_mult:
68
- - 1
69
- - 2
70
- - 4
71
- - 4
72
- num_res_blocks: 2
73
- attn_resolutions: []
74
- dropout: 0.0
75
- lossconfig:
76
- target: torch.nn.Identity
77
-
78
- cond_stage_config:
79
- target: ldm.modules.encoders.modules.FrozenCLIPEmbedder
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
controlnet/control_v11p_sd15_scribble_fp16.safetensors DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:99edfd25b54c18c0ab19fba8c5618f741aac1f8c3101e7fa62cce925ad87ae68
3
- size 722601100
 
 
 
 
controlnet/control_v11p_sd15_seg.yaml DELETED
@@ -1,79 +0,0 @@
1
- model:
2
- target: cldm.cldm.ControlLDM
3
- params:
4
- linear_start: 0.00085
5
- linear_end: 0.0120
6
- num_timesteps_cond: 1
7
- log_every_t: 200
8
- timesteps: 1000
9
- first_stage_key: "jpg"
10
- cond_stage_key: "txt"
11
- control_key: "hint"
12
- image_size: 64
13
- channels: 4
14
- cond_stage_trainable: false
15
- conditioning_key: crossattn
16
- monitor: val/loss_simple_ema
17
- scale_factor: 0.18215
18
- use_ema: False
19
- only_mid_control: False
20
-
21
- control_stage_config:
22
- target: cldm.cldm.ControlNet
23
- params:
24
- image_size: 32 # unused
25
- in_channels: 4
26
- hint_channels: 3
27
- model_channels: 320
28
- attention_resolutions: [ 4, 2, 1 ]
29
- num_res_blocks: 2
30
- channel_mult: [ 1, 2, 4, 4 ]
31
- num_heads: 8
32
- use_spatial_transformer: True
33
- transformer_depth: 1
34
- context_dim: 768
35
- use_checkpoint: True
36
- legacy: False
37
-
38
- unet_config:
39
- target: cldm.cldm.ControlledUnetModel
40
- params:
41
- image_size: 32 # unused
42
- in_channels: 4
43
- out_channels: 4
44
- model_channels: 320
45
- attention_resolutions: [ 4, 2, 1 ]
46
- num_res_blocks: 2
47
- channel_mult: [ 1, 2, 4, 4 ]
48
- num_heads: 8
49
- use_spatial_transformer: True
50
- transformer_depth: 1
51
- context_dim: 768
52
- use_checkpoint: True
53
- legacy: False
54
-
55
- first_stage_config:
56
- target: ldm.models.autoencoder.AutoencoderKL
57
- params:
58
- embed_dim: 4
59
- monitor: val/rec_loss
60
- ddconfig:
61
- double_z: true
62
- z_channels: 4
63
- resolution: 256
64
- in_channels: 3
65
- out_ch: 3
66
- ch: 128
67
- ch_mult:
68
- - 1
69
- - 2
70
- - 4
71
- - 4
72
- num_res_blocks: 2
73
- attn_resolutions: []
74
- dropout: 0.0
75
- lossconfig:
76
- target: torch.nn.Identity
77
-
78
- cond_stage_config:
79
- target: ldm.modules.encoders.modules.FrozenCLIPEmbedder
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
controlnet/control_v11p_sd15_seg_fp16.safetensors DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:acd4dd3df2da2f1f2b9dd00f4504cc0d98b20afb608e25f1789a95c0ccdba14a
3
- size 722601100
 
 
 
 
controlnet/control_v11p_sd15_softedge.yaml DELETED
@@ -1,79 +0,0 @@
1
- model:
2
- target: cldm.cldm.ControlLDM
3
- params:
4
- linear_start: 0.00085
5
- linear_end: 0.0120
6
- num_timesteps_cond: 1
7
- log_every_t: 200
8
- timesteps: 1000
9
- first_stage_key: "jpg"
10
- cond_stage_key: "txt"
11
- control_key: "hint"
12
- image_size: 64
13
- channels: 4
14
- cond_stage_trainable: false
15
- conditioning_key: crossattn
16
- monitor: val/loss_simple_ema
17
- scale_factor: 0.18215
18
- use_ema: False
19
- only_mid_control: False
20
-
21
- control_stage_config:
22
- target: cldm.cldm.ControlNet
23
- params:
24
- image_size: 32 # unused
25
- in_channels: 4
26
- hint_channels: 3
27
- model_channels: 320
28
- attention_resolutions: [ 4, 2, 1 ]
29
- num_res_blocks: 2
30
- channel_mult: [ 1, 2, 4, 4 ]
31
- num_heads: 8
32
- use_spatial_transformer: True
33
- transformer_depth: 1
34
- context_dim: 768
35
- use_checkpoint: True
36
- legacy: False
37
-
38
- unet_config:
39
- target: cldm.cldm.ControlledUnetModel
40
- params:
41
- image_size: 32 # unused
42
- in_channels: 4
43
- out_channels: 4
44
- model_channels: 320
45
- attention_resolutions: [ 4, 2, 1 ]
46
- num_res_blocks: 2
47
- channel_mult: [ 1, 2, 4, 4 ]
48
- num_heads: 8
49
- use_spatial_transformer: True
50
- transformer_depth: 1
51
- context_dim: 768
52
- use_checkpoint: True
53
- legacy: False
54
-
55
- first_stage_config:
56
- target: ldm.models.autoencoder.AutoencoderKL
57
- params:
58
- embed_dim: 4
59
- monitor: val/rec_loss
60
- ddconfig:
61
- double_z: true
62
- z_channels: 4
63
- resolution: 256
64
- in_channels: 3
65
- out_ch: 3
66
- ch: 128
67
- ch_mult:
68
- - 1
69
- - 2
70
- - 4
71
- - 4
72
- num_res_blocks: 2
73
- attn_resolutions: []
74
- dropout: 0.0
75
- lossconfig:
76
- target: torch.nn.Identity
77
-
78
- cond_stage_config:
79
- target: ldm.modules.encoders.modules.FrozenCLIPEmbedder
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
controlnet/control_v11p_sd15_softedge_fp16.safetensors DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:e78fea5b4599fec2ecd7e3f14b171feb290b88200c95d569ec0ff59a19bc3478
3
- size 722601100
 
 
 
 
controlnet/control_v11p_sd15s2_lineart_anime.yaml DELETED
@@ -1,79 +0,0 @@
1
- model:
2
- target: cldm.cldm.ControlLDM
3
- params:
4
- linear_start: 0.00085
5
- linear_end: 0.0120
6
- num_timesteps_cond: 1
7
- log_every_t: 200
8
- timesteps: 1000
9
- first_stage_key: "jpg"
10
- cond_stage_key: "txt"
11
- control_key: "hint"
12
- image_size: 64
13
- channels: 4
14
- cond_stage_trainable: false
15
- conditioning_key: crossattn
16
- monitor: val/loss_simple_ema
17
- scale_factor: 0.18215
18
- use_ema: False
19
- only_mid_control: False
20
-
21
- control_stage_config:
22
- target: cldm.cldm.ControlNet
23
- params:
24
- image_size: 32 # unused
25
- in_channels: 4
26
- hint_channels: 3
27
- model_channels: 320
28
- attention_resolutions: [ 4, 2, 1 ]
29
- num_res_blocks: 2
30
- channel_mult: [ 1, 2, 4, 4 ]
31
- num_heads: 8
32
- use_spatial_transformer: True
33
- transformer_depth: 1
34
- context_dim: 768
35
- use_checkpoint: True
36
- legacy: False
37
-
38
- unet_config:
39
- target: cldm.cldm.ControlledUnetModel
40
- params:
41
- image_size: 32 # unused
42
- in_channels: 4
43
- out_channels: 4
44
- model_channels: 320
45
- attention_resolutions: [ 4, 2, 1 ]
46
- num_res_blocks: 2
47
- channel_mult: [ 1, 2, 4, 4 ]
48
- num_heads: 8
49
- use_spatial_transformer: True
50
- transformer_depth: 1
51
- context_dim: 768
52
- use_checkpoint: True
53
- legacy: False
54
-
55
- first_stage_config:
56
- target: ldm.models.autoencoder.AutoencoderKL
57
- params:
58
- embed_dim: 4
59
- monitor: val/rec_loss
60
- ddconfig:
61
- double_z: true
62
- z_channels: 4
63
- resolution: 256
64
- in_channels: 3
65
- out_ch: 3
66
- ch: 128
67
- ch_mult:
68
- - 1
69
- - 2
70
- - 4
71
- - 4
72
- num_res_blocks: 2
73
- attn_resolutions: []
74
- dropout: 0.0
75
- lossconfig:
76
- target: torch.nn.Identity
77
-
78
- cond_stage_config:
79
- target: ldm.modules.encoders.modules.FrozenCLIPEmbedder
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
controlnet/control_v11p_sd15s2_lineart_anime_fp16.safetensors DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:067bf845109afdd1049bd9553d44faed1ad53691bd6b5ac9ee31c87466ef7c27
3
- size 722601100