Spaces:
Runtime error
Runtime error
fix progress bar
Browse files
- .gitignore +1 -0
- notebooks/test_vae.ipynb +0 -0
- scripts/train_unconditional.py +6 -5
- scripts/train_vae.py +0 -1
.gitignore
CHANGED
@@ -10,3 +10,4 @@ lightning_logs
|
|
10 |
taming
|
11 |
checkpoints
|
12 |
vae_model
|
|
|
|
10 |
taming
|
11 |
checkpoints
|
12 |
vae_model
|
13 |
+
latent-audio-diffusion-*
|
notebooks/test_vae.ipynb
CHANGED
The diff for this file is too large to render.
See raw diff
|
|
scripts/train_unconditional.py
CHANGED
@@ -48,7 +48,8 @@ def main(args):
|
|
48 |
model = DDPMPipeline.from_pretrained(args.from_pretrained).unet
|
49 |
else:
|
50 |
model = UNet2DModel(
|
51 |
-
sample_size=args.resolution,
|
|
|
52 |
in_channels=1 if args.vae is None else 3,
|
53 |
out_channels=1 if args.vae is None else 3,
|
54 |
layers_per_block=2,
|
@@ -211,9 +212,8 @@ def main(args):
|
|
211 |
ema_model.step(model)
|
212 |
optimizer.zero_grad()
|
213 |
|
214 |
-
|
215 |
-
|
216 |
-
global_step += 1
|
217 |
|
218 |
logs = {
|
219 |
"loss": loss.detach().item(),
|
@@ -304,7 +304,8 @@ if __name__ == "__main__":
|
|
304 |
parser.add_argument("--output_dir", type=str, default="ddpm-model-64")
|
305 |
parser.add_argument("--overwrite_output_dir", type=bool, default=False)
|
306 |
parser.add_argument("--cache_dir", type=str, default=None)
|
307 |
-
parser.add_argument("--resolution", type=int, default=
|
|
|
308 |
parser.add_argument("--train_batch_size", type=int, default=16)
|
309 |
parser.add_argument("--eval_batch_size", type=int, default=16)
|
310 |
parser.add_argument("--num_epochs", type=int, default=100)
|
|
|
48 |
model = DDPMPipeline.from_pretrained(args.from_pretrained).unet
|
49 |
else:
|
50 |
model = UNet2DModel(
|
51 |
+
sample_size=args.resolution
|
52 |
+
if args.vae is None else args.latent_resolution,
|
53 |
in_channels=1 if args.vae is None else 3,
|
54 |
out_channels=1 if args.vae is None else 3,
|
55 |
layers_per_block=2,
|
|
|
212 |
ema_model.step(model)
|
213 |
optimizer.zero_grad()
|
214 |
|
215 |
+
progress_bar.update(1)
|
216 |
+
global_step += 1
|
|
|
217 |
|
218 |
logs = {
|
219 |
"loss": loss.detach().item(),
|
|
|
304 |
parser.add_argument("--output_dir", type=str, default="ddpm-model-64")
|
305 |
parser.add_argument("--overwrite_output_dir", type=bool, default=False)
|
306 |
parser.add_argument("--cache_dir", type=str, default=None)
|
307 |
+
parser.add_argument("--resolution", type=int, default=256)
|
308 |
+
parser.add_argument("--latent_resolution", type=int, default=64)
|
309 |
parser.add_argument("--train_batch_size", type=int, default=16)
|
310 |
parser.add_argument("--eval_batch_size", type=int, default=16)
|
311 |
parser.add_argument("--num_epochs", type=int, default=100)
|
scripts/train_vae.py
CHANGED
@@ -3,7 +3,6 @@
|
|
3 |
# convert_original_stable_diffusion_to_diffusers.py
|
4 |
|
5 |
# TODO
|
6 |
-
# add latent resolution as parameter
|
7 |
# grayscale
|
8 |
# update README
|
9 |
|
|
|
3 |
# convert_original_stable_diffusion_to_diffusers.py
|
4 |
|
5 |
# TODO
|
|
|
6 |
# grayscale
|
7 |
# update README
|
8 |
|