jbeomlee93 committed on
Commit
f8ba65b
1 Parent(s): 7c59b2b

End of training

Browse files
README.md ADDED
@@ -0,0 +1,17 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+
2
+ ---
3
+ license: openrail++
4
+ base_model: diffusers/stable-diffusion-xl-1.0-inpainting-0.1
5
+ tags:
6
+ - stable-diffusion-xl
7
+ - stable-diffusion-xl-diffusers
8
+ - text-to-image
9
+ - diffusers
10
+ - controlnet
11
+ inference: true
12
+ ---
13
+
14
+ # controlnet-jbeomlee93/output_lr1e-6_datav3_modify_size1024_step1000_zoomin_textprompt
15
+
16
+ These are ControlNet weights trained on diffusers/stable-diffusion-xl-1.0-inpainting-0.1 with a new type of conditioning.
17
+
checkpoint-1000/controlnet/config.json ADDED
@@ -0,0 +1,57 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_class_name": "ControlNetModel",
3
+ "_diffusers_version": "0.24.0.dev0",
4
+ "_name_or_path": "diffusers/controlnet-canny-sdxl-1.0",
5
+ "act_fn": "silu",
6
+ "addition_embed_type": "text_time",
7
+ "addition_embed_type_num_heads": 64,
8
+ "addition_time_embed_dim": 256,
9
+ "attention_head_dim": [
10
+ 5,
11
+ 10,
12
+ 20
13
+ ],
14
+ "block_out_channels": [
15
+ 320,
16
+ 640,
17
+ 1280
18
+ ],
19
+ "class_embed_type": null,
20
+ "conditioning_channels": 3,
21
+ "conditioning_embedding_out_channels": [
22
+ 16,
23
+ 32,
24
+ 96,
25
+ 256
26
+ ],
27
+ "controlnet_conditioning_channel_order": "rgb",
28
+ "cross_attention_dim": 2048,
29
+ "down_block_types": [
30
+ "DownBlock2D",
31
+ "CrossAttnDownBlock2D",
32
+ "CrossAttnDownBlock2D"
33
+ ],
34
+ "downsample_padding": 1,
35
+ "encoder_hid_dim": null,
36
+ "encoder_hid_dim_type": null,
37
+ "flip_sin_to_cos": true,
38
+ "freq_shift": 0,
39
+ "global_pool_conditions": false,
40
+ "in_channels": 4,
41
+ "layers_per_block": 2,
42
+ "mid_block_scale_factor": 1,
43
+ "norm_eps": 1e-05,
44
+ "norm_num_groups": 32,
45
+ "num_attention_heads": null,
46
+ "num_class_embeds": null,
47
+ "only_cross_attention": false,
48
+ "projection_class_embeddings_input_dim": 2816,
49
+ "resnet_time_scale_shift": "default",
50
+ "transformer_layers_per_block": [
51
+ 1,
52
+ 2,
53
+ 10
54
+ ],
55
+ "upcast_attention": null,
56
+ "use_linear_projection": true
57
+ }
checkpoint-1000/controlnet/diffusion_pytorch_model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4fe935fb1361055d8694a63c04bd3ede1abbd2e2bea8dc574d7b61c24bbfd138
3
+ size 5004167864
checkpoint-1000/optimizer.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e219c03baa3fa91ef81dd2ea41661cc6f960a9dca549c0da5441d2ac19a5aa43
3
+ size 2510393614
checkpoint-1000/random_states_0.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a81fb3fcb214f6ff8d6e672f4f2ff4a645e1ea680bc2312bbad21b01a1fc8946
3
+ size 16036
checkpoint-1000/scaler.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9d8fdcd0311eba9854fff738038ed4c1a269832665b4d88ba4e4e3d02a1a7e0e
3
+ size 988
checkpoint-1000/scheduler.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3cc9d529863b9458dbb9b91d10c2e89741ffa38f99dbc44be25770289ed29416
3
+ size 1000
checkpoint-500/controlnet/config.json ADDED
@@ -0,0 +1,57 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_class_name": "ControlNetModel",
3
+ "_diffusers_version": "0.24.0.dev0",
4
+ "_name_or_path": "diffusers/controlnet-canny-sdxl-1.0",
5
+ "act_fn": "silu",
6
+ "addition_embed_type": "text_time",
7
+ "addition_embed_type_num_heads": 64,
8
+ "addition_time_embed_dim": 256,
9
+ "attention_head_dim": [
10
+ 5,
11
+ 10,
12
+ 20
13
+ ],
14
+ "block_out_channels": [
15
+ 320,
16
+ 640,
17
+ 1280
18
+ ],
19
+ "class_embed_type": null,
20
+ "conditioning_channels": 3,
21
+ "conditioning_embedding_out_channels": [
22
+ 16,
23
+ 32,
24
+ 96,
25
+ 256
26
+ ],
27
+ "controlnet_conditioning_channel_order": "rgb",
28
+ "cross_attention_dim": 2048,
29
+ "down_block_types": [
30
+ "DownBlock2D",
31
+ "CrossAttnDownBlock2D",
32
+ "CrossAttnDownBlock2D"
33
+ ],
34
+ "downsample_padding": 1,
35
+ "encoder_hid_dim": null,
36
+ "encoder_hid_dim_type": null,
37
+ "flip_sin_to_cos": true,
38
+ "freq_shift": 0,
39
+ "global_pool_conditions": false,
40
+ "in_channels": 4,
41
+ "layers_per_block": 2,
42
+ "mid_block_scale_factor": 1,
43
+ "norm_eps": 1e-05,
44
+ "norm_num_groups": 32,
45
+ "num_attention_heads": null,
46
+ "num_class_embeds": null,
47
+ "only_cross_attention": false,
48
+ "projection_class_embeddings_input_dim": 2816,
49
+ "resnet_time_scale_shift": "default",
50
+ "transformer_layers_per_block": [
51
+ 1,
52
+ 2,
53
+ 10
54
+ ],
55
+ "upcast_attention": null,
56
+ "use_linear_projection": true
57
+ }
checkpoint-500/controlnet/diffusion_pytorch_model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:337bfde5d9a124ab7df4cb72dfa426aeb2f416cd9a24129d8b707dc4775b49b4
3
+ size 5004167864
checkpoint-500/optimizer.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1072826b2b21e35b73aaba7b49b02e7211eba0d7ab762c24babeb3e1cb1df212
3
+ size 2510393614
checkpoint-500/random_states_0.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:de01a9299f232fbd0927ea715881c91897bdbc641d9229a62088913105909ac1
3
+ size 16036
checkpoint-500/scaler.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:18b984273ea2d45b7ffb1d047bb359d93111e41fcad70d16a1b453fd38f72636
3
+ size 988
checkpoint-500/scheduler.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1ff7e0081931acdf638a5b6dc6f89d270dc53395b51e189cd30a4b0fd9d14285
3
+ size 1000
config.json ADDED
@@ -0,0 +1,57 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_class_name": "ControlNetModel",
3
+ "_diffusers_version": "0.24.0.dev0",
4
+ "_name_or_path": "diffusers/controlnet-canny-sdxl-1.0",
5
+ "act_fn": "silu",
6
+ "addition_embed_type": "text_time",
7
+ "addition_embed_type_num_heads": 64,
8
+ "addition_time_embed_dim": 256,
9
+ "attention_head_dim": [
10
+ 5,
11
+ 10,
12
+ 20
13
+ ],
14
+ "block_out_channels": [
15
+ 320,
16
+ 640,
17
+ 1280
18
+ ],
19
+ "class_embed_type": null,
20
+ "conditioning_channels": 3,
21
+ "conditioning_embedding_out_channels": [
22
+ 16,
23
+ 32,
24
+ 96,
25
+ 256
26
+ ],
27
+ "controlnet_conditioning_channel_order": "rgb",
28
+ "cross_attention_dim": 2048,
29
+ "down_block_types": [
30
+ "DownBlock2D",
31
+ "CrossAttnDownBlock2D",
32
+ "CrossAttnDownBlock2D"
33
+ ],
34
+ "downsample_padding": 1,
35
+ "encoder_hid_dim": null,
36
+ "encoder_hid_dim_type": null,
37
+ "flip_sin_to_cos": true,
38
+ "freq_shift": 0,
39
+ "global_pool_conditions": false,
40
+ "in_channels": 4,
41
+ "layers_per_block": 2,
42
+ "mid_block_scale_factor": 1,
43
+ "norm_eps": 1e-05,
44
+ "norm_num_groups": 32,
45
+ "num_attention_heads": null,
46
+ "num_class_embeds": null,
47
+ "only_cross_attention": false,
48
+ "projection_class_embeddings_input_dim": 2816,
49
+ "resnet_time_scale_shift": "default",
50
+ "transformer_layers_per_block": [
51
+ 1,
52
+ 2,
53
+ 10
54
+ ],
55
+ "upcast_attention": null,
56
+ "use_linear_projection": true
57
+ }
diffusion_pytorch_model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4fe935fb1361055d8694a63c04bd3ede1abbd2e2bea8dc574d7b61c24bbfd138
3
+ size 5004167864
logs/sd_xl_train_controlnet/1702515595.3223143/events.out.tfevents.1702515595.pytorch-2-0-0-gpu-ml-p3dn-24xlarge-051a6d0780b7e55a6ff84c63b4cd.269.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:afc87975ff61badebc68fffeefc4374a35992f61d1d8bb62224cc965cd41945f
3
+ size 2665
logs/sd_xl_train_controlnet/1702515595.3654385/hparams.yml ADDED
@@ -0,0 +1,53 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ adam_beta1: 0.9
2
+ adam_beta2: 0.999
3
+ adam_epsilon: 1.0e-08
4
+ adam_weight_decay: 0.01
5
+ allow_tf32: false
6
+ cache_dir: null
7
+ caption_column: text
8
+ checkpointing_steps: 500
9
+ checkpoints_total_limit: null
10
+ conditioning_image_column: conditioning_image
11
+ controlnet_model_name_or_path: diffusers/controlnet-canny-sdxl-1.0
12
+ crops_coords_top_left_h: 0
13
+ crops_coords_top_left_w: 0
14
+ dataloader_num_workers: 0
15
+ dataset_config_name: null
16
+ dataset_name: dataset_JB
17
+ enable_xformers_memory_efficient_attention: true
18
+ gradient_accumulation_steps: 4
19
+ gradient_checkpointing: false
20
+ hub_model_id: null
21
+ hub_token: null
22
+ image_column: image
23
+ learning_rate: 1.0e-06
24
+ logging_dir: logs
25
+ lr_num_cycles: 1
26
+ lr_power: 1.0
27
+ lr_scheduler: constant
28
+ lr_warmup_steps: 500
29
+ max_grad_norm: 1.0
30
+ max_train_samples: null
31
+ max_train_steps: 1000
32
+ mixed_precision: fp16
33
+ num_train_epochs: 4
34
+ num_validation_images: 4
35
+ output_dir: output_lr1e-6_datav3_modify_size1024_step1000_zoomin_textprompt
36
+ pretrained_model_name_or_path: diffusers/stable-diffusion-xl-1.0-inpainting-0.1
37
+ pretrained_vae_model_name_or_path: null
38
+ proportion_empty_prompts: 0
39
+ push_to_hub: true
40
+ report_to: tensorboard
41
+ resolution: 1024
42
+ resume_from_checkpoint: null
43
+ revision: null
44
+ scale_lr: false
45
+ seed: 42
46
+ set_grads_to_none: true
47
+ tokenizer_name: null
48
+ tracker_project_name: sd_xl_train_controlnet
49
+ train_batch_size: 1
50
+ train_data_dir: null
51
+ use_8bit_adam: true
52
+ validation_steps: 10000
53
+ variant: null
logs/sd_xl_train_controlnet/1702516845.1419387/events.out.tfevents.1702516845.pytorch-2-0-0-gpu-ml-p3dn-24xlarge-051a6d0780b7e55a6ff84c63b4cd.681.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:05c68ef42fdab0986de007ffd21e853ba18c426c8043fa35b1a4b0056a68f854
3
+ size 2665
logs/sd_xl_train_controlnet/1702516845.1953154/hparams.yml ADDED
@@ -0,0 +1,53 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ adam_beta1: 0.9
2
+ adam_beta2: 0.999
3
+ adam_epsilon: 1.0e-08
4
+ adam_weight_decay: 0.01
5
+ allow_tf32: false
6
+ cache_dir: null
7
+ caption_column: text
8
+ checkpointing_steps: 500
9
+ checkpoints_total_limit: null
10
+ conditioning_image_column: conditioning_image
11
+ controlnet_model_name_or_path: diffusers/controlnet-canny-sdxl-1.0
12
+ crops_coords_top_left_h: 0
13
+ crops_coords_top_left_w: 0
14
+ dataloader_num_workers: 0
15
+ dataset_config_name: null
16
+ dataset_name: dataset_JB
17
+ enable_xformers_memory_efficient_attention: true
18
+ gradient_accumulation_steps: 4
19
+ gradient_checkpointing: false
20
+ hub_model_id: null
21
+ hub_token: null
22
+ image_column: image
23
+ learning_rate: 1.0e-06
24
+ logging_dir: logs
25
+ lr_num_cycles: 1
26
+ lr_power: 1.0
27
+ lr_scheduler: constant
28
+ lr_warmup_steps: 500
29
+ max_grad_norm: 1.0
30
+ max_train_samples: null
31
+ max_train_steps: 1000
32
+ mixed_precision: fp16
33
+ num_train_epochs: 4
34
+ num_validation_images: 4
35
+ output_dir: output_lr1e-6_datav3_modify_size1024_step1000_zoomin_textprompt
36
+ pretrained_model_name_or_path: diffusers/stable-diffusion-xl-1.0-inpainting-0.1
37
+ pretrained_vae_model_name_or_path: null
38
+ proportion_empty_prompts: 0
39
+ push_to_hub: true
40
+ report_to: tensorboard
41
+ resolution: 1024
42
+ resume_from_checkpoint: null
43
+ revision: null
44
+ scale_lr: false
45
+ seed: 42
46
+ set_grads_to_none: true
47
+ tokenizer_name: null
48
+ tracker_project_name: sd_xl_train_controlnet
49
+ train_batch_size: 1
50
+ train_data_dir: null
51
+ use_8bit_adam: true
52
+ validation_steps: 10000
53
+ variant: null
logs/sd_xl_train_controlnet/events.out.tfevents.1702515595.pytorch-2-0-0-gpu-ml-p3dn-24xlarge-051a6d0780b7e55a6ff84c63b4cd.269.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:264398a240dedae469ec64fa13e46c71f66f5a7aa63b7da312f35b359fad8681
3
+ size 64826
logs/sd_xl_train_controlnet/events.out.tfevents.1702516845.pytorch-2-0-0-gpu-ml-p3dn-24xlarge-051a6d0780b7e55a6ff84c63b4cd.681.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:df8ca83afb8dc24b62284107e1e61c8f4b2d0b68d5df5cd16b124d4ee1a37ddc
3
+ size 334298