fatimaaa1 committed on
Commit
78059ff
1 Parent(s): e0de558

End of training

Browse files
README.md CHANGED
@@ -7,6 +7,11 @@ tags:
7
  - diffusers-training
8
  - stable-diffusion
9
  - stable-diffusion-diffusers
 
 
 
 
 
10
  - text-to-image
11
  - text-to-image
12
  - diffusers-training
 
7
  - diffusers-training
8
  - stable-diffusion
9
  - stable-diffusion-diffusers
10
+ - diffusers
11
+ - dora
12
+ - template:sd-lora
13
+ - stable-diffusion-xl
14
+ - stable-diffusion-xl-diffusers
15
  - text-to-image
16
  - text-to-image
17
  - diffusers-training
checkpoint-500/config.json ADDED
@@ -0,0 +1,69 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_class_name": "UNet2DConditionModel",
3
+ "_diffusers_version": "0.19.0.dev0",
4
+ "act_fn": "silu",
5
+ "addition_embed_type": "text_time",
6
+ "addition_embed_type_num_heads": 64,
7
+ "addition_time_embed_dim": 256,
8
+ "attention_head_dim": [
9
+ 5,
10
+ 10,
11
+ 20
12
+ ],
13
+ "block_out_channels": [
14
+ 320,
15
+ 640,
16
+ 1280
17
+ ],
18
+ "center_input_sample": false,
19
+ "class_embed_type": null,
20
+ "class_embeddings_concat": false,
21
+ "conv_in_kernel": 3,
22
+ "conv_out_kernel": 3,
23
+ "cross_attention_dim": 2048,
24
+ "cross_attention_norm": null,
25
+ "down_block_types": [
26
+ "DownBlock2D",
27
+ "CrossAttnDownBlock2D",
28
+ "CrossAttnDownBlock2D"
29
+ ],
30
+ "downsample_padding": 1,
31
+ "dual_cross_attention": false,
32
+ "encoder_hid_dim": null,
33
+ "encoder_hid_dim_type": null,
34
+ "flip_sin_to_cos": true,
35
+ "freq_shift": 0,
36
+ "in_channels": 4,
37
+ "layers_per_block": 2,
38
+ "mid_block_only_cross_attention": null,
39
+ "mid_block_scale_factor": 1,
40
+ "mid_block_type": "UNetMidBlock2DCrossAttn",
41
+ "norm_eps": 1e-05,
42
+ "norm_num_groups": 32,
43
+ "num_attention_heads": null,
44
+ "num_class_embeds": null,
45
+ "only_cross_attention": false,
46
+ "out_channels": 4,
47
+ "projection_class_embeddings_input_dim": 2816,
48
+ "resnet_out_scale_factor": 1.0,
49
+ "resnet_skip_time_act": false,
50
+ "resnet_time_scale_shift": "default",
51
+ "sample_size": 128,
52
+ "time_cond_proj_dim": null,
53
+ "time_embedding_act_fn": null,
54
+ "time_embedding_dim": null,
55
+ "time_embedding_type": "positional",
56
+ "timestep_post_act": null,
57
+ "transformer_layers_per_block": [
58
+ 1,
59
+ 2,
60
+ 10
61
+ ],
62
+ "up_block_types": [
63
+ "CrossAttnUpBlock2D",
64
+ "CrossAttnUpBlock2D",
65
+ "UpBlock2D"
66
+ ],
67
+ "upcast_attention": null,
68
+ "use_linear_projection": true
69
+ }
checkpoint-500/unet/config.json CHANGED
@@ -1,17 +1,18 @@
1
  {
2
  "_class_name": "UNet2DConditionModel",
3
- "_diffusers_version": "0.28.0.dev0",
4
- "_name_or_path": "CompVis/stable-diffusion-v1-4",
5
  "act_fn": "silu",
6
- "addition_embed_type": null,
7
  "addition_embed_type_num_heads": 64,
8
- "addition_time_embed_dim": null,
9
- "attention_head_dim": 8,
10
- "attention_type": "default",
 
 
 
11
  "block_out_channels": [
12
  320,
13
  640,
14
- 1280,
15
  1280
16
  ],
17
  "center_input_sample": false,
@@ -19,16 +20,14 @@
19
  "class_embeddings_concat": false,
20
  "conv_in_kernel": 3,
21
  "conv_out_kernel": 3,
22
- "cross_attention_dim": 768,
23
  "cross_attention_norm": null,
24
  "down_block_types": [
 
25
  "CrossAttnDownBlock2D",
26
- "CrossAttnDownBlock2D",
27
- "CrossAttnDownBlock2D",
28
- "DownBlock2D"
29
  ],
30
  "downsample_padding": 1,
31
- "dropout": 0.0,
32
  "dual_cross_attention": false,
33
  "encoder_hid_dim": null,
34
  "encoder_hid_dim_type": null,
@@ -45,24 +44,26 @@
45
  "num_class_embeds": null,
46
  "only_cross_attention": false,
47
  "out_channels": 4,
48
- "projection_class_embeddings_input_dim": null,
49
  "resnet_out_scale_factor": 1.0,
50
  "resnet_skip_time_act": false,
51
  "resnet_time_scale_shift": "default",
52
- "reverse_transformer_layers_per_block": null,
53
- "sample_size": 64,
54
  "time_cond_proj_dim": null,
55
  "time_embedding_act_fn": null,
56
  "time_embedding_dim": null,
57
  "time_embedding_type": "positional",
58
  "timestep_post_act": null,
59
- "transformer_layers_per_block": 1,
 
 
 
 
60
  "up_block_types": [
61
- "UpBlock2D",
62
  "CrossAttnUpBlock2D",
63
  "CrossAttnUpBlock2D",
64
- "CrossAttnUpBlock2D"
65
  ],
66
- "upcast_attention": false,
67
- "use_linear_projection": false
68
  }
 
1
  {
2
  "_class_name": "UNet2DConditionModel",
3
+ "_diffusers_version": "0.19.0.dev0",
 
4
  "act_fn": "silu",
5
+ "addition_embed_type": "text_time",
6
  "addition_embed_type_num_heads": 64,
7
+ "addition_time_embed_dim": 256,
8
+ "attention_head_dim": [
9
+ 5,
10
+ 10,
11
+ 20
12
+ ],
13
  "block_out_channels": [
14
  320,
15
  640,
 
16
  1280
17
  ],
18
  "center_input_sample": false,
 
20
  "class_embeddings_concat": false,
21
  "conv_in_kernel": 3,
22
  "conv_out_kernel": 3,
23
+ "cross_attention_dim": 2048,
24
  "cross_attention_norm": null,
25
  "down_block_types": [
26
+ "DownBlock2D",
27
  "CrossAttnDownBlock2D",
28
+ "CrossAttnDownBlock2D"
 
 
29
  ],
30
  "downsample_padding": 1,
 
31
  "dual_cross_attention": false,
32
  "encoder_hid_dim": null,
33
  "encoder_hid_dim_type": null,
 
44
  "num_class_embeds": null,
45
  "only_cross_attention": false,
46
  "out_channels": 4,
47
+ "projection_class_embeddings_input_dim": 2816,
48
  "resnet_out_scale_factor": 1.0,
49
  "resnet_skip_time_act": false,
50
  "resnet_time_scale_shift": "default",
51
+ "sample_size": 128,
 
52
  "time_cond_proj_dim": null,
53
  "time_embedding_act_fn": null,
54
  "time_embedding_dim": null,
55
  "time_embedding_type": "positional",
56
  "timestep_post_act": null,
57
+ "transformer_layers_per_block": [
58
+ 1,
59
+ 2,
60
+ 10
61
+ ],
62
  "up_block_types": [
 
63
  "CrossAttnUpBlock2D",
64
  "CrossAttnUpBlock2D",
65
+ "UpBlock2D"
66
  ],
67
+ "upcast_attention": null,
68
+ "use_linear_projection": true
69
  }