# control_v11e_sd15_shuffle.yaml
#
# Configuration for a `cldm.cldm.ControlLDM` model together with the four
# component configs it embeds: control_stage_config, unet_config,
# first_stage_config and cond_stage_config.
#
# Each component is described by a `target` (dotted Python path) and, where
# needed, a `params` mapping.
# NOTE(review): presumably the loader imports `target` and passes `params`
# as constructor keyword arguments -- confirm against the consuming code.
#
# NOTE(review): the nesting below was reconstructed from the repeated
# target/params pattern after the original indentation was lost. Verify it
# against the upstream file, in particular that `lossconfig` is a sibling
# of `ddconfig` rather than a child of it.
model:
  target: cldm.cldm.ControlLDM
  params:
    linear_start: 0.00085
    linear_end: 0.0120
    num_timesteps_cond: 1
    log_every_t: 200
    timesteps: 1000
    first_stage_key: "jpg"
    cond_stage_key: "txt"
    control_key: "hint"
    image_size: 64
    channels: 4
    cond_stage_trainable: false
    conditioning_key: crossattn
    monitor: val/loss_simple_ema
    scale_factor: 0.18215
    use_ema: false
    only_mid_control: false
    global_average_pooling: true

    # Control branch.
    control_stage_config:
      target: cldm.cldm.ControlNet
      params:
        image_size: 32  # unused
        in_channels: 4
        hint_channels: 3
        model_channels: 320
        attention_resolutions: [4, 2, 1]
        num_res_blocks: 2
        channel_mult: [1, 2, 4, 4]
        num_heads: 8
        use_spatial_transformer: true
        transformer_depth: 1
        context_dim: 768
        use_checkpoint: true
        legacy: false

    # Main UNet. Apart from out_channels (here) and hint_channels (control
    # branch only), these values are identical to control_stage_config.params.
    # NOTE(review): presumably the two must stay in sync -- confirm.
    unet_config:
      target: cldm.cldm.ControlledUnetModel
      params:
        image_size: 32  # unused
        in_channels: 4
        out_channels: 4
        model_channels: 320
        attention_resolutions: [4, 2, 1]
        num_res_blocks: 2
        channel_mult: [1, 2, 4, 4]
        num_heads: 8
        use_spatial_transformer: true
        transformer_depth: 1
        context_dim: 768
        use_checkpoint: true
        legacy: false

    # First-stage autoencoder.
    first_stage_config:
      target: ldm.models.autoencoder.AutoencoderKL
      params:
        embed_dim: 4
        monitor: val/rec_loss
        ddconfig:
          double_z: true
          z_channels: 4
          resolution: 256
          in_channels: 3
          out_ch: 3
          ch: 128
          ch_mult:
            - 1
            - 2
            - 4
            - 4
          num_res_blocks: 2
          attn_resolutions: []
          dropout: 0.0
        # The loss is configured as torch.nn.Identity.
        lossconfig:
          target: torch.nn.Identity

    # Conditioning encoder; no params are supplied for it.
    cond_stage_config:
      target: ldm.modules.encoders.modules.FrozenCLIPEmbedder