ptx0 committed on
Commit
02b28ff
1 Parent(s): 6d3949c

30,000 steps (approx. 4 epochs) with terminal SNR on 22k Midjourney 5.1 images, plus 7,200 real photographs as balance data, with complete BLIP captions on all data. Batch size (BS) = 4, learning rate (LR) = 4e-7 to 1e-8.

Browse files
config.yaml CHANGED
@@ -65,4 +65,4 @@ model:
65
  target: ldm.modules.encoders.modules.FrozenOpenCLIPEmbedder
66
  params:
67
  freeze: True
68
- layer: "penultimate"
 
65
  target: ldm.modules.encoders.modules.FrozenOpenCLIPEmbedder
66
  params:
67
  freeze: True
68
+ layer: "penultimate"
model_index.json CHANGED
@@ -12,7 +12,7 @@
12
  ],
13
  "scheduler": [
14
  "diffusers",
15
- "DDIMScheduler"
16
  ],
17
  "text_encoder": [
18
  "transformers",
 
12
  ],
13
  "scheduler": [
14
  "diffusers",
15
+ "DDPMScheduler"
16
  ],
17
  "text_encoder": [
18
  "transformers",
scheduler/scheduler_config.json CHANGED
@@ -1,5 +1,5 @@
1
  {
2
- "_class_name": "DDIMScheduler",
3
  "_diffusers_version": "0.17.0.dev0",
4
  "beta_end": 0.012,
5
  "beta_schedule": "scaled_linear",
@@ -14,5 +14,6 @@
14
  "skip_prk_steps": true,
15
  "steps_offset": 1,
16
  "thresholding": false,
17
- "trained_betas": null
 
18
  }
 
1
  {
2
+ "_class_name": "DDPMScheduler",
3
  "_diffusers_version": "0.17.0.dev0",
4
  "beta_end": 0.012,
5
  "beta_schedule": "scaled_linear",
 
14
  "skip_prk_steps": true,
15
  "steps_offset": 1,
16
  "thresholding": false,
17
+ "trained_betas": null,
18
+ "variance_type": "fixed_small"
19
  }
text_encoder/config.json CHANGED
@@ -1,5 +1,5 @@
1
  {
2
- "_name_or_path": "/notebooks/images/datasets/models//checkpoint-550/text_encoder",
3
  "architectures": [
4
  "CLIPTextModel"
5
  ],
@@ -20,6 +20,6 @@
20
  "pad_token_id": 1,
21
  "projection_dim": 512,
22
  "torch_dtype": "float32",
23
- "transformers_version": "4.29.2",
24
  "vocab_size": 49408
25
  }
 
1
  {
2
+ "_name_or_path": "/notebooks/datasets/models/checkpoint-30000/text_encoder",
3
  "architectures": [
4
  "CLIPTextModel"
5
  ],
 
20
  "pad_token_id": 1,
21
  "projection_dim": 512,
22
  "torch_dtype": "float32",
23
+ "transformers_version": "4.28.1",
24
  "vocab_size": 49408
25
  }
text_encoder/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d7f8471deacb5f976911bfcf000ec5ea27e912b491dfd5041d2bbeefe88ebf8a
3
  size 1361597016
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0029ad268db15f83a8454ed1d5a99c6d712915f7f1dd04b948264a09efb35f43
3
  size 1361597016
unet/config.json CHANGED
@@ -1,7 +1,7 @@
1
  {
2
  "_class_name": "UNet2DConditionModel",
3
  "_diffusers_version": "0.17.0.dev0",
4
- "_name_or_path": "/notebooks/images/datasets/models//checkpoint-550/unet",
5
  "act_fn": "silu",
6
  "addition_embed_type": null,
7
  "addition_embed_type_num_heads": 64,
 
1
  {
2
  "_class_name": "UNet2DConditionModel",
3
  "_diffusers_version": "0.17.0.dev0",
4
+ "_name_or_path": "/notebooks/datasets/models/checkpoint-30000/unet",
5
  "act_fn": "silu",
6
  "addition_embed_type": null,
7
  "addition_embed_type_num_heads": 64,
unet/diffusion_pytorch_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:644a1dd448e2ac8faba304c89ae1c0f65e9d73ef84144b3d5d3ef22915b81f76
3
  size 3463726504
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:19b83cdbc9c86dd0cbee9d8bc9dcb76f81615c3fc1a399a7f1c7eebda8c026ed
3
  size 3463726504
vae/config.json CHANGED
@@ -1,7 +1,7 @@
1
  {
2
  "_class_name": "AutoencoderKL",
3
  "_diffusers_version": "0.17.0.dev0",
4
- "_name_or_path": "/notebooks/datasets/models/pipeline/vae",
5
  "act_fn": "silu",
6
  "block_out_channels": [
7
  128,
 
1
  {
2
  "_class_name": "AutoencoderKL",
3
  "_diffusers_version": "0.17.0.dev0",
4
+ "_name_or_path": "/root/.cache/huggingface/hub/models--stabilityai--stable-diffusion-2-1/snapshots/845609e6cf0a060d8cd837297e5c169df5bff72c/vae",
5
  "act_fn": "silu",
6
  "block_out_channels": [
7
  128,