tolgacangoz
committed on
Commit
•
4f3d3a0
1
Parent(s):
e4ec318
Update unet's config file
Browse files
- unet/config.json +12 -12
unet/config.json
CHANGED
@@ -1,13 +1,13 @@
|
|
1 |
{
|
2 |
-
"_class_name": "
|
3 |
"_diffusers_version": "0.31.0.dev0",
|
|
|
4 |
"act_fn": "silu",
|
5 |
-
"addition_embed_type":
|
6 |
"addition_embed_type_num_heads": 64,
|
7 |
"addition_time_embed_dim": null,
|
8 |
-
"attention_bias": true,
|
9 |
"attention_head_dim": 8,
|
10 |
-
"attention_pre_only":
|
11 |
"attention_type": "default",
|
12 |
"block_out_channels": [
|
13 |
256,
|
@@ -20,7 +20,7 @@
|
|
20 |
"conv_in_kernel": 3,
|
21 |
"conv_out_kernel": 3,
|
22 |
"cross_attention_dim": 2048,
|
23 |
-
"cross_attention_norm":
|
24 |
"down_block_types": [
|
25 |
"DownBlock2D",
|
26 |
"CrossAttnDownBlock2D",
|
@@ -29,20 +29,20 @@
|
|
29 |
"downsample_padding": 1,
|
30 |
"dropout": 0.0,
|
31 |
"dual_cross_attention": false,
|
32 |
-
"encoder_hid_dim":
|
33 |
-
"encoder_hid_dim_type":
|
34 |
-
"
|
35 |
-
"ff_norm_type": "group_norm_matryoshka",
|
36 |
-
"flip_sin_to_cos": true,
|
37 |
"freq_shift": 0,
|
38 |
"in_channels": 3,
|
39 |
"layers_per_block": 2,
|
|
|
|
|
40 |
"mid_block_only_cross_attention": null,
|
41 |
"mid_block_scale_factor": 1,
|
42 |
"mid_block_type": "UNetMidBlock2DCrossAttn",
|
43 |
"norm_eps": 1e-05,
|
44 |
"norm_num_groups": 32,
|
45 |
-
"norm_type": "
|
46 |
"num_attention_heads": null,
|
47 |
"num_class_embeds": null,
|
48 |
"only_cross_attention": false,
|
@@ -69,5 +69,5 @@
|
|
69 |
"UpBlock2D"
|
70 |
],
|
71 |
"upcast_attention": false,
|
72 |
-
"use_linear_projection":
|
73 |
}
|
|
|
1 |
{
|
2 |
+
"_class_name": "NestedUNet2DConditionModel",
|
3 |
"_diffusers_version": "0.31.0.dev0",
|
4 |
+
"_name_or_path": "/home/cosmos/Documents/matryoshka/unet",
|
5 |
"act_fn": "silu",
|
6 |
+
"addition_embed_type": "matryoshka",
|
7 |
"addition_embed_type_num_heads": 64,
|
8 |
"addition_time_embed_dim": null,
|
|
|
9 |
"attention_head_dim": 8,
|
10 |
+
"attention_pre_only": false,
|
11 |
"attention_type": "default",
|
12 |
"block_out_channels": [
|
13 |
256,
|
|
|
20 |
"conv_in_kernel": 3,
|
21 |
"conv_out_kernel": 3,
|
22 |
"cross_attention_dim": 2048,
|
23 |
+
"cross_attention_norm": null,
|
24 |
"down_block_types": [
|
25 |
"DownBlock2D",
|
26 |
"CrossAttnDownBlock2D",
|
|
|
29 |
"downsample_padding": 1,
|
30 |
"dropout": 0.0,
|
31 |
"dual_cross_attention": false,
|
32 |
+
"encoder_hid_dim": 2048,
|
33 |
+
"encoder_hid_dim_type": "text_proj",
|
34 |
+
"flip_sin_to_cos": false,
|
|
|
|
|
35 |
"freq_shift": 0,
|
36 |
"in_channels": 3,
|
37 |
"layers_per_block": 2,
|
38 |
+
"masked_cross_attention": false,
|
39 |
+
"micro_conditioning_scale": 64,
|
40 |
"mid_block_only_cross_attention": null,
|
41 |
"mid_block_scale_factor": 1,
|
42 |
"mid_block_type": "UNetMidBlock2DCrossAttn",
|
43 |
"norm_eps": 1e-05,
|
44 |
"norm_num_groups": 32,
|
45 |
+
"norm_type": "layer_norm",
|
46 |
"num_attention_heads": null,
|
47 |
"num_class_embeds": null,
|
48 |
"only_cross_attention": false,
|
|
|
69 |
"UpBlock2D"
|
70 |
],
|
71 |
"upcast_attention": false,
|
72 |
+
"use_linear_projection": false
|
73 |
}
|