---
# custom_vqgan.yaml
#
# Training configuration with two top-level sections: `model` and `data`.
# Each component is described by a `target` (dotted class path) plus a
# `params` mapping.
# NOTE(review): the nesting below was reconstructed from a flattened copy in
# which indentation had been lost -- confirm it against the consumer's schema.

model:
  base_learning_rate: 4.5e-6
  target: taming.models.vqgan.VQModel
  # Presumably forwarded to the `target` class as constructor arguments --
  # TODO confirm against the training entry point.
  params:
    embed_dim: 256
    n_embed: 1024
    ddconfig:
      double_z: false
      z_channels: 256
      resolution: 256
      in_channels: 3
      out_ch: 3
      ch: 128
      ch_mult: [1, 1, 2, 2, 4]  # num_down = len(ch_mult)-1
      num_res_blocks: 2
      attn_resolutions: [16]
      dropout: 0.0

    lossconfig:
      target: taming.modules.losses.vqperceptual.VQLPIPSWithDiscriminator
      params:
        disc_conditional: false
        disc_in_channels: 3
        disc_start: 10000
        disc_weight: 0.8
        codebook_weight: 1.0

data:
  target: main.DataModuleFromConfig
  params:
    batch_size: 5
    num_workers: 8
    train:
      target: taming.data.custom.CustomTrain
      params:
        # Placeholder path; replace with the real training image list file.
        training_images_list_file: some/training.txt
        size: 256
    validation:
      target: taming.data.custom.CustomTest
      params:
        # Placeholder path; replace with the real test image list file.
        test_images_list_file: some/test.txt
        size: 256