File size: 2,011 Bytes
1f30907
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
# Location of the pretrained model. Other sections of this file refer back to
# this key through the ${pretrained_model_name_or_path} interpolation.
pretrained_model_name_or_path: './ckpt/img2mvimg'
# Mixed-precision mode (NOTE(review): "bf16" presumably selects bfloat16).
mixed_precision: 'bf16'

# Model initialization settings: which attention variants are enabled and how
# each of them is set up.
init_config:
  # Switches that enable or disable each attention variant.
  enable_cross_attn_lora: false
  enable_cross_attn_ip: false
  enable_self_attn_lora: false
  enable_self_attn_ref: false
  enable_multiview_attn: true

  # Cross-attention settings (LoRA and IP-Adapter).
  init_cross_attn_lora: false
  init_cross_attn_ip: false
  cross_attn_lora_rank: 256  # 0 means not enabled
  cross_attn_lora_only_kv: false
  ipadapter_pretrained_name: 'h94/IP-Adapter'
  ipadapter_subfolder_name: 'models'
  ipadapter_weight_name: 'ip-adapter_sd15.safetensors'
  ipadapter_effect_on: 'all'  # accepted values: all, first

  # Self-attention LoRA settings.
  init_self_attn_lora: false
  self_attn_lora_rank: 256
  self_attn_lora_only_kv: false

  # Self-attention reference settings.
  init_self_attn_ref: false
  self_attn_ref_position: 'attn1'
  self_attn_ref_other_model_name: 'lambdalabs/sd-image-variations-diffusers'
  # NOTE: the key spelling ("crosspond") is kept as-is; it is looked up by name.
  self_attn_ref_pixel_wise_crosspond: false
  self_attn_ref_effect_on: 'all'

  # Multiview attention settings.
  init_multiview_attn: true
  multiview_attn_position: 'attn1'
  use_mv_joint_attn: true
  num_modalities: 1

  # UNet settings.
  # Resolves to the top-level pretrained_model_name_or_path value.
  init_unet_path: '${pretrained_model_name_or_path}'
  cat_condition: true  # concatenate the condition to the input

  # Class-embedding settings.
  init_num_cls_label: 8  # label count used at initialization
  cls_labels: [0, 1, 2, 3]  # labels used by the current task

# List of trainers; each entry names a trainer type and carries its settings.
trainers:
  - trainer_type: 'image2mvimage_trainer'
    trainer:
      # Resolves to the top-level pretrained_model_name_or_path value.
      pretrained_model_name_or_path: '${pretrained_model_name_or_path}'
      # These values match the corresponding entries under init_config.
      attn_config:
        cls_labels: [0, 1, 2, 3]  # labels used by the current task
        enable_cross_attn_lora: false
        enable_cross_attn_ip: false
        enable_self_attn_lora: false
        enable_self_attn_ref: false
        enable_multiview_attn: true
      # Resolutions are deliberately left as quoted strings.
      # NOTE(review): confirm the trainer expects str rather than int here.
      resolution: '256'
      condition_image_resolution: '256'
      # NOTE(review): presumably an offset applied to class labels for the
      # normal-map variant; verify against the trainer implementation.
      normal_cls_offset: 4
      # Dataset column names for the conditioning image and the target image.
      condition_image_column_name: 'conditioning_image'
      image_column_name: 'image'