ptx0
committed on
Commit
•
02b28ff
1
Parent(s):
6d3949c
30,000 steps (approx. 4 epochs) with terminal SNR on 22k Midjourney 5.1 images, plus 7,200 real photographs as balance data, with complete BLIP captions on all data. BS=4, LR=4e-7 to 1e-8.
Browse files
- config.yaml +1 -1
- model_index.json +1 -1
- scheduler/scheduler_config.json +3 -2
- text_encoder/config.json +2 -2
- text_encoder/model.safetensors +1 -1
- unet/config.json +1 -1
- unet/diffusion_pytorch_model.safetensors +1 -1
- vae/config.json +1 -1
config.yaml
CHANGED
@@ -65,4 +65,4 @@ model:
|
|
65 |
target: ldm.modules.encoders.modules.FrozenOpenCLIPEmbedder
|
66 |
params:
|
67 |
freeze: True
|
68 |
-
layer: "penultimate"
|
|
|
65 |
target: ldm.modules.encoders.modules.FrozenOpenCLIPEmbedder
|
66 |
params:
|
67 |
freeze: True
|
68 |
+
layer: "penultimate"
|
model_index.json
CHANGED
@@ -12,7 +12,7 @@
|
|
12 |
],
|
13 |
"scheduler": [
|
14 |
"diffusers",
|
15 |
-
"
|
16 |
],
|
17 |
"text_encoder": [
|
18 |
"transformers",
|
|
|
12 |
],
|
13 |
"scheduler": [
|
14 |
"diffusers",
|
15 |
+
"DDPMScheduler"
|
16 |
],
|
17 |
"text_encoder": [
|
18 |
"transformers",
|
scheduler/scheduler_config.json
CHANGED
@@ -1,5 +1,5 @@
|
|
1 |
{
|
2 |
-
"_class_name": "
|
3 |
"_diffusers_version": "0.17.0.dev0",
|
4 |
"beta_end": 0.012,
|
5 |
"beta_schedule": "scaled_linear",
|
@@ -14,5 +14,6 @@
|
|
14 |
"skip_prk_steps": true,
|
15 |
"steps_offset": 1,
|
16 |
"thresholding": false,
|
17 |
-
"trained_betas": null
|
|
|
18 |
}
|
|
|
1 |
{
|
2 |
+
"_class_name": "DDPMScheduler",
|
3 |
"_diffusers_version": "0.17.0.dev0",
|
4 |
"beta_end": 0.012,
|
5 |
"beta_schedule": "scaled_linear",
|
|
|
14 |
"skip_prk_steps": true,
|
15 |
"steps_offset": 1,
|
16 |
"thresholding": false,
|
17 |
+
"trained_betas": null,
|
18 |
+
"variance_type": "fixed_small"
|
19 |
}
|
text_encoder/config.json
CHANGED
@@ -1,5 +1,5 @@
|
|
1 |
{
|
2 |
-
"_name_or_path": "/notebooks/
|
3 |
"architectures": [
|
4 |
"CLIPTextModel"
|
5 |
],
|
@@ -20,6 +20,6 @@
|
|
20 |
"pad_token_id": 1,
|
21 |
"projection_dim": 512,
|
22 |
"torch_dtype": "float32",
|
23 |
-
"transformers_version": "4.
|
24 |
"vocab_size": 49408
|
25 |
}
|
|
|
1 |
{
|
2 |
+
"_name_or_path": "/notebooks/datasets/models/checkpoint-30000/text_encoder",
|
3 |
"architectures": [
|
4 |
"CLIPTextModel"
|
5 |
],
|
|
|
20 |
"pad_token_id": 1,
|
21 |
"projection_dim": 512,
|
22 |
"torch_dtype": "float32",
|
23 |
+
"transformers_version": "4.28.1",
|
24 |
"vocab_size": 49408
|
25 |
}
|
text_encoder/model.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1361597016
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0029ad268db15f83a8454ed1d5a99c6d712915f7f1dd04b948264a09efb35f43
|
3 |
size 1361597016
|
unet/config.json
CHANGED
@@ -1,7 +1,7 @@
|
|
1 |
{
|
2 |
"_class_name": "UNet2DConditionModel",
|
3 |
"_diffusers_version": "0.17.0.dev0",
|
4 |
-
"_name_or_path": "/notebooks/
|
5 |
"act_fn": "silu",
|
6 |
"addition_embed_type": null,
|
7 |
"addition_embed_type_num_heads": 64,
|
|
|
1 |
{
|
2 |
"_class_name": "UNet2DConditionModel",
|
3 |
"_diffusers_version": "0.17.0.dev0",
|
4 |
+
"_name_or_path": "/notebooks/datasets/models/checkpoint-30000/unet",
|
5 |
"act_fn": "silu",
|
6 |
"addition_embed_type": null,
|
7 |
"addition_embed_type_num_heads": 64,
|
unet/diffusion_pytorch_model.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 3463726504
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:19b83cdbc9c86dd0cbee9d8bc9dcb76f81615c3fc1a399a7f1c7eebda8c026ed
|
3 |
size 3463726504
|
vae/config.json
CHANGED
@@ -1,7 +1,7 @@
|
|
1 |
{
|
2 |
"_class_name": "AutoencoderKL",
|
3 |
"_diffusers_version": "0.17.0.dev0",
|
4 |
-
"_name_or_path": "/
|
5 |
"act_fn": "silu",
|
6 |
"block_out_channels": [
|
7 |
128,
|
|
|
1 |
{
|
2 |
"_class_name": "AutoencoderKL",
|
3 |
"_diffusers_version": "0.17.0.dev0",
|
4 |
+
"_name_or_path": "/root/.cache/huggingface/hub/models--stabilityai--stable-diffusion-2-1/snapshots/845609e6cf0a060d8cd837297e5c169df5bff72c/vae",
|
5 |
"act_fn": "silu",
|
6 |
"block_out_channels": [
|
7 |
128,
|