Update to use default diffusers training scripts
Browse files
- args.json +0 -60
- unet/diffusion_pytorch_model.bin → checkpoint-500/optimizer.bin +2 -2
- text_encoder/pytorch_model.bin → checkpoint-500/random_states_0.pkl +2 -2
- vae/diffusion_pytorch_model.bin → checkpoint-500/scheduler.bin +2 -2
- checkpoint-500/unet/config.json +66 -0
- checkpoint-500/unet/diffusion_pytorch_model.safetensors +3 -0
- feature_extractor/preprocessor_config.json +1 -1
- logs/dreambooth/1693358976.7018929/events.out.tfevents.1693358976.text-to-image-0.4436.1 +3 -0
- logs/dreambooth/1693358976.70344/hparams.yml +58 -0
- logs/dreambooth/1693366191.0888145/events.out.tfevents.1693366191.text-to-image-0.5967.1 +3 -0
- logs/dreambooth/1693366191.0903463/hparams.yml +58 -0
- logs/dreambooth/1693368952.1649532/events.out.tfevents.1693368952.text-to-image-0.6993.1 +3 -0
- logs/dreambooth/1693368952.1666262/hparams.yml +58 -0
- logs/dreambooth/1693369738.2229948/events.out.tfevents.1693369738.text-to-image-0.7423.1 +3 -0
- logs/dreambooth/1693369738.2245512/hparams.yml +58 -0
- logs/dreambooth/1693369858.7861362/events.out.tfevents.1693369858.text-to-image-0.7601.1 +3 -0
- logs/dreambooth/1693369858.787858/hparams.yml +58 -0
- logs/dreambooth/events.out.tfevents.1693358976.text-to-image-0.4436.0 +3 -0
- logs/dreambooth/events.out.tfevents.1693366191.text-to-image-0.5967.0 +3 -0
- logs/dreambooth/events.out.tfevents.1693368952.text-to-image-0.6993.0 +3 -0
- logs/dreambooth/events.out.tfevents.1693369738.text-to-image-0.7423.0 +3 -0
- logs/dreambooth/events.out.tfevents.1693369858.text-to-image-0.7601.0 +3 -0
- model_index.json +5 -4
- safety_checker/config.json +28 -0
- safety_checker/model.safetensors +3 -0
- samples/0.png +0 -0
- samples/1.png +0 -0
- samples/2.png +0 -0
- samples/3.png +0 -0
- scheduler/scheduler_config.json +3 -6
- text_encoder/config.json +1 -1
- text_encoder/model.safetensors +3 -0
- unet/config.json +15 -1
- unet/diffusion_pytorch_model.safetensors +3 -0
- vae/config.json +4 -3
- vae/diffusion_pytorch_model.safetensors +3 -0
args.json
DELETED
|
@@ -1,60 +0,0 @@
|
|
| 1 |
-
{
|
| 2 |
-
"pretrained_model_name_or_path": "runwayml/stable-diffusion-v1-5",
|
| 3 |
-
"pretrained_vae_name_or_path": "stabilityai/sd-vae-ft-mse",
|
| 4 |
-
"revision": "fp16",
|
| 5 |
-
"tokenizer_name": null,
|
| 6 |
-
"instance_data_dir": null,
|
| 7 |
-
"class_data_dir": null,
|
| 8 |
-
"instance_prompt": null,
|
| 9 |
-
"class_prompt": null,
|
| 10 |
-
"save_sample_prompt": "photo of a rhteddy dog",
|
| 11 |
-
"save_sample_negative_prompt": null,
|
| 12 |
-
"n_save_sample": 4,
|
| 13 |
-
"save_guidance_scale": 7.5,
|
| 14 |
-
"save_infer_steps": 20,
|
| 15 |
-
"pad_tokens": false,
|
| 16 |
-
"with_prior_preservation": true,
|
| 17 |
-
"prior_loss_weight": 1.0,
|
| 18 |
-
"num_class_images": 200,
|
| 19 |
-
"output_dir": "/opt/app-root/src/text-to-image-demo/custom/weights/redhat-dog",
|
| 20 |
-
"seed": 1337,
|
| 21 |
-
"resolution": 512,
|
| 22 |
-
"center_crop": false,
|
| 23 |
-
"train_text_encoder": true,
|
| 24 |
-
"train_batch_size": 1,
|
| 25 |
-
"sample_batch_size": 4,
|
| 26 |
-
"num_train_epochs": 4,
|
| 27 |
-
"max_train_steps": 800,
|
| 28 |
-
"gradient_accumulation_steps": 1,
|
| 29 |
-
"gradient_checkpointing": false,
|
| 30 |
-
"learning_rate": 1e-06,
|
| 31 |
-
"scale_lr": false,
|
| 32 |
-
"lr_scheduler": "constant",
|
| 33 |
-
"lr_warmup_steps": 0,
|
| 34 |
-
"use_8bit_adam": true,
|
| 35 |
-
"adam_beta1": 0.9,
|
| 36 |
-
"adam_beta2": 0.999,
|
| 37 |
-
"adam_weight_decay": 0.01,
|
| 38 |
-
"adam_epsilon": 1e-08,
|
| 39 |
-
"max_grad_norm": 1.0,
|
| 40 |
-
"push_to_hub": false,
|
| 41 |
-
"hub_token": null,
|
| 42 |
-
"hub_model_id": null,
|
| 43 |
-
"logging_dir": "logs",
|
| 44 |
-
"log_interval": 10,
|
| 45 |
-
"save_interval": 10000,
|
| 46 |
-
"save_min_steps": 0,
|
| 47 |
-
"mixed_precision": "fp16",
|
| 48 |
-
"not_cache_latents": false,
|
| 49 |
-
"hflip": false,
|
| 50 |
-
"local_rank": -1,
|
| 51 |
-
"concepts_list": [
|
| 52 |
-
{
|
| 53 |
-
"instance_prompt": "photo of a rhteddy dog",
|
| 54 |
-
"class_prompt": "a photo of dog",
|
| 55 |
-
"instance_data_dir": "/opt/app-root/src/text-to-image-demo/custom/data/instance_dir",
|
| 56 |
-
"class_data_dir": "/opt/app-root/src/text-to-image-demo/custom/data/class_dir"
|
| 57 |
-
}
|
| 58 |
-
],
|
| 59 |
-
"read_prompts_from_txts": false
|
| 60 |
-
}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
unet/diffusion_pytorch_model.bin → checkpoint-500/optimizer.bin
RENAMED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f088d1eff6f69b6b321dea781a1d8279a1fecc1a202bf10ee9e25c7818ce8b54
|
| 3 |
+
size 1725109957
|
text_encoder/pytorch_model.bin → checkpoint-500/random_states_0.pkl
RENAMED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:0e73845fc88bfe687b6a9570caeaba8559d5362f771514e8f1986ac94f92ca79
|
| 3 |
+
size 14663
|
vae/diffusion_pytorch_model.bin → checkpoint-500/scheduler.bin
RENAMED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:6be622d51c3bcf8a1991c02b9778f31d7e3a79a8b22e03e81a36e25205ef4c5b
|
| 3 |
+
size 563
|
checkpoint-500/unet/config.json
ADDED
|
@@ -0,0 +1,66 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"_class_name": "UNet2DConditionModel",
|
| 3 |
+
"_diffusers_version": "0.21.0.dev0",
|
| 4 |
+
"_name_or_path": "runwayml/stable-diffusion-v1-5",
|
| 5 |
+
"act_fn": "silu",
|
| 6 |
+
"addition_embed_type": null,
|
| 7 |
+
"addition_embed_type_num_heads": 64,
|
| 8 |
+
"addition_time_embed_dim": null,
|
| 9 |
+
"attention_head_dim": 8,
|
| 10 |
+
"attention_type": "default",
|
| 11 |
+
"block_out_channels": [
|
| 12 |
+
320,
|
| 13 |
+
640,
|
| 14 |
+
1280,
|
| 15 |
+
1280
|
| 16 |
+
],
|
| 17 |
+
"center_input_sample": false,
|
| 18 |
+
"class_embed_type": null,
|
| 19 |
+
"class_embeddings_concat": false,
|
| 20 |
+
"conv_in_kernel": 3,
|
| 21 |
+
"conv_out_kernel": 3,
|
| 22 |
+
"cross_attention_dim": 768,
|
| 23 |
+
"cross_attention_norm": null,
|
| 24 |
+
"down_block_types": [
|
| 25 |
+
"CrossAttnDownBlock2D",
|
| 26 |
+
"CrossAttnDownBlock2D",
|
| 27 |
+
"CrossAttnDownBlock2D",
|
| 28 |
+
"DownBlock2D"
|
| 29 |
+
],
|
| 30 |
+
"downsample_padding": 1,
|
| 31 |
+
"dual_cross_attention": false,
|
| 32 |
+
"encoder_hid_dim": null,
|
| 33 |
+
"encoder_hid_dim_type": null,
|
| 34 |
+
"flip_sin_to_cos": true,
|
| 35 |
+
"freq_shift": 0,
|
| 36 |
+
"in_channels": 4,
|
| 37 |
+
"layers_per_block": 2,
|
| 38 |
+
"mid_block_only_cross_attention": null,
|
| 39 |
+
"mid_block_scale_factor": 1,
|
| 40 |
+
"mid_block_type": "UNetMidBlock2DCrossAttn",
|
| 41 |
+
"norm_eps": 1e-05,
|
| 42 |
+
"norm_num_groups": 32,
|
| 43 |
+
"num_attention_heads": null,
|
| 44 |
+
"num_class_embeds": null,
|
| 45 |
+
"only_cross_attention": false,
|
| 46 |
+
"out_channels": 4,
|
| 47 |
+
"projection_class_embeddings_input_dim": null,
|
| 48 |
+
"resnet_out_scale_factor": 1.0,
|
| 49 |
+
"resnet_skip_time_act": false,
|
| 50 |
+
"resnet_time_scale_shift": "default",
|
| 51 |
+
"sample_size": 64,
|
| 52 |
+
"time_cond_proj_dim": null,
|
| 53 |
+
"time_embedding_act_fn": null,
|
| 54 |
+
"time_embedding_dim": null,
|
| 55 |
+
"time_embedding_type": "positional",
|
| 56 |
+
"timestep_post_act": null,
|
| 57 |
+
"transformer_layers_per_block": 1,
|
| 58 |
+
"up_block_types": [
|
| 59 |
+
"UpBlock2D",
|
| 60 |
+
"CrossAttnUpBlock2D",
|
| 61 |
+
"CrossAttnUpBlock2D",
|
| 62 |
+
"CrossAttnUpBlock2D"
|
| 63 |
+
],
|
| 64 |
+
"upcast_attention": false,
|
| 65 |
+
"use_linear_projection": false
|
| 66 |
+
}
|
checkpoint-500/unet/diffusion_pytorch_model.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f0f5861887c8c2df8f20e2bc61e4c82c06836e01465c948a24f8f9c27baf1fe0
|
| 3 |
+
size 3438167536
|
feature_extractor/preprocessor_config.json
CHANGED
|
@@ -14,7 +14,7 @@
|
|
| 14 |
0.4578275,
|
| 15 |
0.40821073
|
| 16 |
],
|
| 17 |
-
"image_processor_type": "
|
| 18 |
"image_std": [
|
| 19 |
0.26862954,
|
| 20 |
0.26130258,
|
|
|
|
| 14 |
0.4578275,
|
| 15 |
0.40821073
|
| 16 |
],
|
| 17 |
+
"image_processor_type": "CLIPImageProcessor",
|
| 18 |
"image_std": [
|
| 19 |
0.26862954,
|
| 20 |
0.26130258,
|
logs/dreambooth/1693358976.7018929/events.out.tfevents.1693358976.text-to-image-0.4436.1
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:560a0cdf21039623ed3cd0738493453a526242e4405acb3ba5e0f00215f42562
|
| 3 |
+
size 3007
|
logs/dreambooth/1693358976.70344/hparams.yml
ADDED
|
@@ -0,0 +1,58 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
adam_beta1: 0.9
|
| 2 |
+
adam_beta2: 0.999
|
| 3 |
+
adam_epsilon: 1.0e-08
|
| 4 |
+
adam_weight_decay: 0.01
|
| 5 |
+
allow_tf32: false
|
| 6 |
+
center_crop: false
|
| 7 |
+
checkpointing_steps: 500
|
| 8 |
+
checkpoints_total_limit: null
|
| 9 |
+
class_data_dir: /opt/app-root/src/text-to-image-demo/notebook-output/data/class_dir
|
| 10 |
+
class_labels_conditioning: null
|
| 11 |
+
class_prompt: a photo of dog
|
| 12 |
+
dataloader_num_workers: 0
|
| 13 |
+
enable_xformers_memory_efficient_attention: true
|
| 14 |
+
gradient_accumulation_steps: 1
|
| 15 |
+
gradient_checkpointing: false
|
| 16 |
+
hub_model_id: null
|
| 17 |
+
hub_token: null
|
| 18 |
+
instance_data_dir: /opt/app-root/src/text-to-image-demo/notebook-output/data/instance_dir
|
| 19 |
+
instance_prompt: photo of a rhteddy dog
|
| 20 |
+
learning_rate: 5.0e-06
|
| 21 |
+
local_rank: -1
|
| 22 |
+
logging_dir: logs
|
| 23 |
+
lr_num_cycles: 1
|
| 24 |
+
lr_power: 1.0
|
| 25 |
+
lr_scheduler: constant
|
| 26 |
+
lr_warmup_steps: 0
|
| 27 |
+
max_grad_norm: 1.0
|
| 28 |
+
max_train_steps: 800
|
| 29 |
+
mixed_precision: null
|
| 30 |
+
num_class_images: 200
|
| 31 |
+
num_train_epochs: 4
|
| 32 |
+
num_validation_images: 4
|
| 33 |
+
offset_noise: false
|
| 34 |
+
output_dir: /opt/app-root/src/text-to-image-demo/notebook-output/stable_diffusion_weights/redhat-dog
|
| 35 |
+
pre_compute_text_embeddings: false
|
| 36 |
+
pretrained_model_name_or_path: runwayml/stable-diffusion-v1-5
|
| 37 |
+
prior_generation_precision: null
|
| 38 |
+
prior_loss_weight: 1.0
|
| 39 |
+
push_to_hub: false
|
| 40 |
+
report_to: tensorboard
|
| 41 |
+
resolution: 512
|
| 42 |
+
resume_from_checkpoint: null
|
| 43 |
+
revision: null
|
| 44 |
+
sample_batch_size: 4
|
| 45 |
+
scale_lr: false
|
| 46 |
+
seed: null
|
| 47 |
+
set_grads_to_none: false
|
| 48 |
+
skip_save_text_encoder: false
|
| 49 |
+
text_encoder_use_attention_mask: false
|
| 50 |
+
tokenizer_max_length: null
|
| 51 |
+
tokenizer_name: null
|
| 52 |
+
train_batch_size: 1
|
| 53 |
+
train_text_encoder: false
|
| 54 |
+
use_8bit_adam: false
|
| 55 |
+
validation_prompt: null
|
| 56 |
+
validation_scheduler: DPMSolverMultistepScheduler
|
| 57 |
+
validation_steps: 100
|
| 58 |
+
with_prior_preservation: true
|
logs/dreambooth/1693366191.0888145/events.out.tfevents.1693366191.text-to-image-0.5967.1
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e52753eb744a0c0bc6dc223673b367087abe2d3216feb29b436390b8c04d3670
|
| 3 |
+
size 3007
|
logs/dreambooth/1693366191.0903463/hparams.yml
ADDED
|
@@ -0,0 +1,58 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
adam_beta1: 0.9
|
| 2 |
+
adam_beta2: 0.999
|
| 3 |
+
adam_epsilon: 1.0e-08
|
| 4 |
+
adam_weight_decay: 0.01
|
| 5 |
+
allow_tf32: false
|
| 6 |
+
center_crop: false
|
| 7 |
+
checkpointing_steps: 500
|
| 8 |
+
checkpoints_total_limit: null
|
| 9 |
+
class_data_dir: /opt/app-root/src/text-to-image-demo/notebook-output/data/class_dir
|
| 10 |
+
class_labels_conditioning: null
|
| 11 |
+
class_prompt: a photo of dog
|
| 12 |
+
dataloader_num_workers: 0
|
| 13 |
+
enable_xformers_memory_efficient_attention: true
|
| 14 |
+
gradient_accumulation_steps: 2
|
| 15 |
+
gradient_checkpointing: true
|
| 16 |
+
hub_model_id: null
|
| 17 |
+
hub_token: null
|
| 18 |
+
instance_data_dir: /opt/app-root/src/text-to-image-demo/notebook-output/data/instance_dir
|
| 19 |
+
instance_prompt: photo of a rhteddy dog
|
| 20 |
+
learning_rate: 5.0e-06
|
| 21 |
+
local_rank: -1
|
| 22 |
+
logging_dir: logs
|
| 23 |
+
lr_num_cycles: 1
|
| 24 |
+
lr_power: 1.0
|
| 25 |
+
lr_scheduler: constant
|
| 26 |
+
lr_warmup_steps: 0
|
| 27 |
+
max_grad_norm: 1.0
|
| 28 |
+
max_train_steps: 800
|
| 29 |
+
mixed_precision: null
|
| 30 |
+
num_class_images: 200
|
| 31 |
+
num_train_epochs: 8
|
| 32 |
+
num_validation_images: 4
|
| 33 |
+
offset_noise: false
|
| 34 |
+
output_dir: /opt/app-root/src/text-to-image-demo/notebook-output/stable_diffusion_weights/redhat-dog
|
| 35 |
+
pre_compute_text_embeddings: false
|
| 36 |
+
pretrained_model_name_or_path: runwayml/stable-diffusion-v1-5
|
| 37 |
+
prior_generation_precision: null
|
| 38 |
+
prior_loss_weight: 1.0
|
| 39 |
+
push_to_hub: false
|
| 40 |
+
report_to: tensorboard
|
| 41 |
+
resolution: 512
|
| 42 |
+
resume_from_checkpoint: null
|
| 43 |
+
revision: null
|
| 44 |
+
sample_batch_size: 4
|
| 45 |
+
scale_lr: false
|
| 46 |
+
seed: null
|
| 47 |
+
set_grads_to_none: false
|
| 48 |
+
skip_save_text_encoder: false
|
| 49 |
+
text_encoder_use_attention_mask: false
|
| 50 |
+
tokenizer_max_length: null
|
| 51 |
+
tokenizer_name: null
|
| 52 |
+
train_batch_size: 1
|
| 53 |
+
train_text_encoder: false
|
| 54 |
+
use_8bit_adam: true
|
| 55 |
+
validation_prompt: null
|
| 56 |
+
validation_scheduler: DPMSolverMultistepScheduler
|
| 57 |
+
validation_steps: 100
|
| 58 |
+
with_prior_preservation: true
|
logs/dreambooth/1693368952.1649532/events.out.tfevents.1693368952.text-to-image-0.6993.1
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:5c8858414d41d75e1ac823f3703064604896f8a21316cb5fa7e5e2d847373d04
|
| 3 |
+
size 3007
|
logs/dreambooth/1693368952.1666262/hparams.yml
ADDED
|
@@ -0,0 +1,58 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
adam_beta1: 0.9
|
| 2 |
+
adam_beta2: 0.999
|
| 3 |
+
adam_epsilon: 1.0e-08
|
| 4 |
+
adam_weight_decay: 0.01
|
| 5 |
+
allow_tf32: false
|
| 6 |
+
center_crop: false
|
| 7 |
+
checkpointing_steps: 500
|
| 8 |
+
checkpoints_total_limit: null
|
| 9 |
+
class_data_dir: /opt/app-root/src/text-to-image-demo/notebook-output/data/class_dir
|
| 10 |
+
class_labels_conditioning: null
|
| 11 |
+
class_prompt: a photo of dog
|
| 12 |
+
dataloader_num_workers: 0
|
| 13 |
+
enable_xformers_memory_efficient_attention: true
|
| 14 |
+
gradient_accumulation_steps: 2
|
| 15 |
+
gradient_checkpointing: true
|
| 16 |
+
hub_model_id: null
|
| 17 |
+
hub_token: null
|
| 18 |
+
instance_data_dir: /opt/app-root/src/text-to-image-demo/notebook-output/data/instance_dir
|
| 19 |
+
instance_prompt: photo of a rhteddy dog
|
| 20 |
+
learning_rate: 5.0e-06
|
| 21 |
+
local_rank: -1
|
| 22 |
+
logging_dir: logs
|
| 23 |
+
lr_num_cycles: 1
|
| 24 |
+
lr_power: 1.0
|
| 25 |
+
lr_scheduler: constant
|
| 26 |
+
lr_warmup_steps: 0
|
| 27 |
+
max_grad_norm: 1.0
|
| 28 |
+
max_train_steps: 800
|
| 29 |
+
mixed_precision: null
|
| 30 |
+
num_class_images: 200
|
| 31 |
+
num_train_epochs: 8
|
| 32 |
+
num_validation_images: 4
|
| 33 |
+
offset_noise: false
|
| 34 |
+
output_dir: /opt/app-root/src/text-to-image-demo/notebook-output/stable_diffusion_weights/redhat-dog
|
| 35 |
+
pre_compute_text_embeddings: false
|
| 36 |
+
pretrained_model_name_or_path: runwayml/stable-diffusion-v1-5
|
| 37 |
+
prior_generation_precision: null
|
| 38 |
+
prior_loss_weight: 1.0
|
| 39 |
+
push_to_hub: false
|
| 40 |
+
report_to: tensorboard
|
| 41 |
+
resolution: 512
|
| 42 |
+
resume_from_checkpoint: null
|
| 43 |
+
revision: null
|
| 44 |
+
sample_batch_size: 4
|
| 45 |
+
scale_lr: false
|
| 46 |
+
seed: null
|
| 47 |
+
set_grads_to_none: false
|
| 48 |
+
skip_save_text_encoder: false
|
| 49 |
+
text_encoder_use_attention_mask: false
|
| 50 |
+
tokenizer_max_length: null
|
| 51 |
+
tokenizer_name: null
|
| 52 |
+
train_batch_size: 1
|
| 53 |
+
train_text_encoder: false
|
| 54 |
+
use_8bit_adam: true
|
| 55 |
+
validation_prompt: null
|
| 56 |
+
validation_scheduler: DPMSolverMultistepScheduler
|
| 57 |
+
validation_steps: 100
|
| 58 |
+
with_prior_preservation: true
|
logs/dreambooth/1693369738.2229948/events.out.tfevents.1693369738.text-to-image-0.7423.1
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:9c7f32b60524f38f3881891fc3238ecfdf4f8994ece65aa640eeb24e95198658
|
| 3 |
+
size 3007
|
logs/dreambooth/1693369738.2245512/hparams.yml
ADDED
|
@@ -0,0 +1,58 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
adam_beta1: 0.9
|
| 2 |
+
adam_beta2: 0.999
|
| 3 |
+
adam_epsilon: 1.0e-08
|
| 4 |
+
adam_weight_decay: 0.01
|
| 5 |
+
allow_tf32: false
|
| 6 |
+
center_crop: false
|
| 7 |
+
checkpointing_steps: 500
|
| 8 |
+
checkpoints_total_limit: null
|
| 9 |
+
class_data_dir: /opt/app-root/src/text-to-image-demo/notebook-output/data/class_dir
|
| 10 |
+
class_labels_conditioning: null
|
| 11 |
+
class_prompt: a photo of dog
|
| 12 |
+
dataloader_num_workers: 0
|
| 13 |
+
enable_xformers_memory_efficient_attention: true
|
| 14 |
+
gradient_accumulation_steps: 2
|
| 15 |
+
gradient_checkpointing: true
|
| 16 |
+
hub_model_id: null
|
| 17 |
+
hub_token: null
|
| 18 |
+
instance_data_dir: /opt/app-root/src/text-to-image-demo/notebook-output/data/instance_dir
|
| 19 |
+
instance_prompt: photo of a rhteddy dog
|
| 20 |
+
learning_rate: 5.0e-06
|
| 21 |
+
local_rank: -1
|
| 22 |
+
logging_dir: logs
|
| 23 |
+
lr_num_cycles: 1
|
| 24 |
+
lr_power: 1.0
|
| 25 |
+
lr_scheduler: constant
|
| 26 |
+
lr_warmup_steps: 0
|
| 27 |
+
max_grad_norm: 1.0
|
| 28 |
+
max_train_steps: 800
|
| 29 |
+
mixed_precision: null
|
| 30 |
+
num_class_images: 200
|
| 31 |
+
num_train_epochs: 8
|
| 32 |
+
num_validation_images: 4
|
| 33 |
+
offset_noise: false
|
| 34 |
+
output_dir: /opt/app-root/src/text-to-image-demo/notebook-output/stable_diffusion_weights/redhat-dog
|
| 35 |
+
pre_compute_text_embeddings: false
|
| 36 |
+
pretrained_model_name_or_path: runwayml/stable-diffusion-v1-5
|
| 37 |
+
prior_generation_precision: null
|
| 38 |
+
prior_loss_weight: 1.0
|
| 39 |
+
push_to_hub: false
|
| 40 |
+
report_to: tensorboard
|
| 41 |
+
resolution: 512
|
| 42 |
+
resume_from_checkpoint: null
|
| 43 |
+
revision: null
|
| 44 |
+
sample_batch_size: 4
|
| 45 |
+
scale_lr: false
|
| 46 |
+
seed: null
|
| 47 |
+
set_grads_to_none: false
|
| 48 |
+
skip_save_text_encoder: false
|
| 49 |
+
text_encoder_use_attention_mask: false
|
| 50 |
+
tokenizer_max_length: null
|
| 51 |
+
tokenizer_name: null
|
| 52 |
+
train_batch_size: 1
|
| 53 |
+
train_text_encoder: false
|
| 54 |
+
use_8bit_adam: true
|
| 55 |
+
validation_prompt: null
|
| 56 |
+
validation_scheduler: DPMSolverMultistepScheduler
|
| 57 |
+
validation_steps: 100
|
| 58 |
+
with_prior_preservation: true
|
logs/dreambooth/1693369858.7861362/events.out.tfevents.1693369858.text-to-image-0.7601.1
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:0b077a286ba05bfd2c12c82ee7d7cf4e1c110d75d08934fb77c72c2786f7818d
|
| 3 |
+
size 3007
|
logs/dreambooth/1693369858.787858/hparams.yml
ADDED
|
@@ -0,0 +1,58 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
adam_beta1: 0.9
|
| 2 |
+
adam_beta2: 0.999
|
| 3 |
+
adam_epsilon: 1.0e-08
|
| 4 |
+
adam_weight_decay: 0.01
|
| 5 |
+
allow_tf32: false
|
| 6 |
+
center_crop: false
|
| 7 |
+
checkpointing_steps: 500
|
| 8 |
+
checkpoints_total_limit: null
|
| 9 |
+
class_data_dir: /opt/app-root/src/text-to-image-demo/notebook-output/data/class_dir
|
| 10 |
+
class_labels_conditioning: null
|
| 11 |
+
class_prompt: a photo of dog
|
| 12 |
+
dataloader_num_workers: 0
|
| 13 |
+
enable_xformers_memory_efficient_attention: true
|
| 14 |
+
gradient_accumulation_steps: 2
|
| 15 |
+
gradient_checkpointing: true
|
| 16 |
+
hub_model_id: null
|
| 17 |
+
hub_token: null
|
| 18 |
+
instance_data_dir: /opt/app-root/src/text-to-image-demo/notebook-output/data/instance_dir
|
| 19 |
+
instance_prompt: photo of a rhteddy dog
|
| 20 |
+
learning_rate: 5.0e-06
|
| 21 |
+
local_rank: -1
|
| 22 |
+
logging_dir: logs
|
| 23 |
+
lr_num_cycles: 1
|
| 24 |
+
lr_power: 1.0
|
| 25 |
+
lr_scheduler: constant
|
| 26 |
+
lr_warmup_steps: 0
|
| 27 |
+
max_grad_norm: 1.0
|
| 28 |
+
max_train_steps: 800
|
| 29 |
+
mixed_precision: null
|
| 30 |
+
num_class_images: 200
|
| 31 |
+
num_train_epochs: 8
|
| 32 |
+
num_validation_images: 4
|
| 33 |
+
offset_noise: false
|
| 34 |
+
output_dir: /opt/app-root/src/text-to-image-demo/notebook-output/stable_diffusion_weights/redhat-dog
|
| 35 |
+
pre_compute_text_embeddings: false
|
| 36 |
+
pretrained_model_name_or_path: runwayml/stable-diffusion-v1-5
|
| 37 |
+
prior_generation_precision: null
|
| 38 |
+
prior_loss_weight: 1.0
|
| 39 |
+
push_to_hub: false
|
| 40 |
+
report_to: tensorboard
|
| 41 |
+
resolution: 512
|
| 42 |
+
resume_from_checkpoint: null
|
| 43 |
+
revision: null
|
| 44 |
+
sample_batch_size: 4
|
| 45 |
+
scale_lr: false
|
| 46 |
+
seed: null
|
| 47 |
+
set_grads_to_none: false
|
| 48 |
+
skip_save_text_encoder: false
|
| 49 |
+
text_encoder_use_attention_mask: false
|
| 50 |
+
tokenizer_max_length: null
|
| 51 |
+
tokenizer_name: null
|
| 52 |
+
train_batch_size: 1
|
| 53 |
+
train_text_encoder: false
|
| 54 |
+
use_8bit_adam: true
|
| 55 |
+
validation_prompt: null
|
| 56 |
+
validation_scheduler: DPMSolverMultistepScheduler
|
| 57 |
+
validation_steps: 100
|
| 58 |
+
with_prior_preservation: true
|
logs/dreambooth/events.out.tfevents.1693358976.text-to-image-0.4436.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:11627ca05f2831fbb4cc906fbc98538bd8375b17a302362203385607ed68df79
|
| 3 |
+
size 66986
|
logs/dreambooth/events.out.tfevents.1693366191.text-to-image-0.5967.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:5cce4a92c7044e6b95678faf6d1e42915fff7795e4ac9a7ebeae009c4f3fddfa
|
| 3 |
+
size 133926
|
logs/dreambooth/events.out.tfevents.1693368952.text-to-image-0.6993.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ebc0ae002693c88fff7ce665688e55f809b138323e5997042992f68c0e7277f1
|
| 3 |
+
size 29850
|
logs/dreambooth/events.out.tfevents.1693369738.text-to-image-0.7423.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:92f450e0333ab41c6f808820b9d2996c658785ad4cc3e64ae13212688cd34b02
|
| 3 |
+
size 2906
|
logs/dreambooth/events.out.tfevents.1693369858.text-to-image-0.7601.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e5820131ad19ee973f5856a233d7e8ad264586d5c6b40fcac91feb072d755c1a
|
| 3 |
+
size 133926
|
model_index.json
CHANGED
|
@@ -1,14 +1,15 @@
|
|
| 1 |
{
|
| 2 |
"_class_name": "StableDiffusionPipeline",
|
| 3 |
-
"_diffusers_version": "0.
|
|
|
|
| 4 |
"feature_extractor": [
|
| 5 |
"transformers",
|
| 6 |
-
"
|
| 7 |
],
|
| 8 |
"requires_safety_checker": true,
|
| 9 |
"safety_checker": [
|
| 10 |
-
|
| 11 |
-
|
| 12 |
],
|
| 13 |
"scheduler": [
|
| 14 |
"diffusers",
|
|
|
|
| 1 |
{
|
| 2 |
"_class_name": "StableDiffusionPipeline",
|
| 3 |
+
"_diffusers_version": "0.21.0.dev0",
|
| 4 |
+
"_name_or_path": "runwayml/stable-diffusion-v1-5",
|
| 5 |
"feature_extractor": [
|
| 6 |
"transformers",
|
| 7 |
+
"CLIPImageProcessor"
|
| 8 |
],
|
| 9 |
"requires_safety_checker": true,
|
| 10 |
"safety_checker": [
|
| 11 |
+
"stable_diffusion",
|
| 12 |
+
"StableDiffusionSafetyChecker"
|
| 13 |
],
|
| 14 |
"scheduler": [
|
| 15 |
"diffusers",
|
safety_checker/config.json
ADDED
|
@@ -0,0 +1,28 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"_name_or_path": "/opt/app-root/src/.cache/huggingface/hub/models--runwayml--stable-diffusion-v1-5/snapshots/1d0c4ebf6ff58a5caecab40fa1406526bca4b5b9/safety_checker",
|
| 3 |
+
"architectures": [
|
| 4 |
+
"StableDiffusionSafetyChecker"
|
| 5 |
+
],
|
| 6 |
+
"initializer_factor": 1.0,
|
| 7 |
+
"logit_scale_init_value": 2.6592,
|
| 8 |
+
"model_type": "clip",
|
| 9 |
+
"projection_dim": 768,
|
| 10 |
+
"text_config": {
|
| 11 |
+
"dropout": 0.0,
|
| 12 |
+
"hidden_size": 768,
|
| 13 |
+
"intermediate_size": 3072,
|
| 14 |
+
"model_type": "clip_text_model",
|
| 15 |
+
"num_attention_heads": 12
|
| 16 |
+
},
|
| 17 |
+
"torch_dtype": "float32",
|
| 18 |
+
"transformers_version": "4.32.1",
|
| 19 |
+
"vision_config": {
|
| 20 |
+
"dropout": 0.0,
|
| 21 |
+
"hidden_size": 1024,
|
| 22 |
+
"intermediate_size": 4096,
|
| 23 |
+
"model_type": "clip_vision_model",
|
| 24 |
+
"num_attention_heads": 16,
|
| 25 |
+
"num_hidden_layers": 24,
|
| 26 |
+
"patch_size": 14
|
| 27 |
+
}
|
| 28 |
+
}
|
safety_checker/model.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:fb351a5ded815c3ff744968ad9c6b218d071b9d313d04f35e813b84b4c0ffde8
|
| 3 |
+
size 1215979664
|
samples/0.png
DELETED
|
Binary file (409 kB)
|
|
|
samples/1.png
DELETED
|
Binary file (528 kB)
|
|
|
samples/2.png
DELETED
|
Binary file (404 kB)
|
|
|
samples/3.png
DELETED
|
Binary file (452 kB)
|
|
|
scheduler/scheduler_config.json
CHANGED
|
@@ -1,18 +1,15 @@
|
|
| 1 |
{
|
| 2 |
-
"_class_name": "
|
| 3 |
-
"_diffusers_version": "0.
|
| 4 |
"beta_end": 0.012,
|
| 5 |
"beta_schedule": "scaled_linear",
|
| 6 |
"beta_start": 0.00085,
|
| 7 |
"clip_sample": false,
|
| 8 |
-
"clip_sample_range": 1.0,
|
| 9 |
-
"dynamic_thresholding_ratio": 0.995,
|
| 10 |
"num_train_timesteps": 1000,
|
| 11 |
"prediction_type": "epsilon",
|
| 12 |
-
"sample_max_value": 1.0,
|
| 13 |
"set_alpha_to_one": false,
|
| 14 |
"skip_prk_steps": true,
|
| 15 |
"steps_offset": 1,
|
| 16 |
-
"
|
| 17 |
"trained_betas": null
|
| 18 |
}
|
|
|
|
| 1 |
{
|
| 2 |
+
"_class_name": "PNDMScheduler",
|
| 3 |
+
"_diffusers_version": "0.21.0.dev0",
|
| 4 |
"beta_end": 0.012,
|
| 5 |
"beta_schedule": "scaled_linear",
|
| 6 |
"beta_start": 0.00085,
|
| 7 |
"clip_sample": false,
|
|
|
|
|
|
|
| 8 |
"num_train_timesteps": 1000,
|
| 9 |
"prediction_type": "epsilon",
|
|
|
|
| 10 |
"set_alpha_to_one": false,
|
| 11 |
"skip_prk_steps": true,
|
| 12 |
"steps_offset": 1,
|
| 13 |
+
"timestep_spacing": "leading",
|
| 14 |
"trained_betas": null
|
| 15 |
}
|
text_encoder/config.json
CHANGED
|
@@ -20,6 +20,6 @@
|
|
| 20 |
"pad_token_id": 1,
|
| 21 |
"projection_dim": 768,
|
| 22 |
"torch_dtype": "float32",
|
| 23 |
-
"transformers_version": "4.
|
| 24 |
"vocab_size": 49408
|
| 25 |
}
|
|
|
|
| 20 |
"pad_token_id": 1,
|
| 21 |
"projection_dim": 768,
|
| 22 |
"torch_dtype": "float32",
|
| 23 |
+
"transformers_version": "4.32.1",
|
| 24 |
"vocab_size": 49408
|
| 25 |
}
|
text_encoder/model.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:778d02eb9e707c3fbaae0b67b79ea0d1399b52e624fb634f2f19375ae7c047c3
|
| 3 |
+
size 492265168
|
unet/config.json
CHANGED
|
@@ -1,9 +1,13 @@
|
|
| 1 |
{
|
| 2 |
"_class_name": "UNet2DConditionModel",
|
| 3 |
-
"_diffusers_version": "0.
|
| 4 |
"_name_or_path": "runwayml/stable-diffusion-v1-5",
|
| 5 |
"act_fn": "silu",
|
|
|
|
|
|
|
|
|
|
| 6 |
"attention_head_dim": 8,
|
|
|
|
| 7 |
"block_out_channels": [
|
| 8 |
320,
|
| 9 |
640,
|
|
@@ -16,6 +20,7 @@
|
|
| 16 |
"conv_in_kernel": 3,
|
| 17 |
"conv_out_kernel": 3,
|
| 18 |
"cross_attention_dim": 768,
|
|
|
|
| 19 |
"down_block_types": [
|
| 20 |
"CrossAttnDownBlock2D",
|
| 21 |
"CrossAttnDownBlock2D",
|
|
@@ -24,23 +29,32 @@
|
|
| 24 |
],
|
| 25 |
"downsample_padding": 1,
|
| 26 |
"dual_cross_attention": false,
|
|
|
|
|
|
|
| 27 |
"flip_sin_to_cos": true,
|
| 28 |
"freq_shift": 0,
|
| 29 |
"in_channels": 4,
|
| 30 |
"layers_per_block": 2,
|
|
|
|
| 31 |
"mid_block_scale_factor": 1,
|
| 32 |
"mid_block_type": "UNetMidBlock2DCrossAttn",
|
| 33 |
"norm_eps": 1e-05,
|
| 34 |
"norm_num_groups": 32,
|
|
|
|
| 35 |
"num_class_embeds": null,
|
| 36 |
"only_cross_attention": false,
|
| 37 |
"out_channels": 4,
|
| 38 |
"projection_class_embeddings_input_dim": null,
|
|
|
|
|
|
|
| 39 |
"resnet_time_scale_shift": "default",
|
| 40 |
"sample_size": 64,
|
| 41 |
"time_cond_proj_dim": null,
|
|
|
|
|
|
|
| 42 |
"time_embedding_type": "positional",
|
| 43 |
"timestep_post_act": null,
|
|
|
|
| 44 |
"up_block_types": [
|
| 45 |
"UpBlock2D",
|
| 46 |
"CrossAttnUpBlock2D",
|
|
|
|
| 1 |
{
|
| 2 |
"_class_name": "UNet2DConditionModel",
|
| 3 |
+
"_diffusers_version": "0.21.0.dev0",
|
| 4 |
"_name_or_path": "runwayml/stable-diffusion-v1-5",
|
| 5 |
"act_fn": "silu",
|
| 6 |
+
"addition_embed_type": null,
|
| 7 |
+
"addition_embed_type_num_heads": 64,
|
| 8 |
+
"addition_time_embed_dim": null,
|
| 9 |
"attention_head_dim": 8,
|
| 10 |
+
"attention_type": "default",
|
| 11 |
"block_out_channels": [
|
| 12 |
320,
|
| 13 |
640,
|
|
|
|
| 20 |
"conv_in_kernel": 3,
|
| 21 |
"conv_out_kernel": 3,
|
| 22 |
"cross_attention_dim": 768,
|
| 23 |
+
"cross_attention_norm": null,
|
| 24 |
"down_block_types": [
|
| 25 |
"CrossAttnDownBlock2D",
|
| 26 |
"CrossAttnDownBlock2D",
|
|
|
|
| 29 |
],
|
| 30 |
"downsample_padding": 1,
|
| 31 |
"dual_cross_attention": false,
|
| 32 |
+
"encoder_hid_dim": null,
|
| 33 |
+
"encoder_hid_dim_type": null,
|
| 34 |
"flip_sin_to_cos": true,
|
| 35 |
"freq_shift": 0,
|
| 36 |
"in_channels": 4,
|
| 37 |
"layers_per_block": 2,
|
| 38 |
+
"mid_block_only_cross_attention": null,
|
| 39 |
"mid_block_scale_factor": 1,
|
| 40 |
"mid_block_type": "UNetMidBlock2DCrossAttn",
|
| 41 |
"norm_eps": 1e-05,
|
| 42 |
"norm_num_groups": 32,
|
| 43 |
+
"num_attention_heads": null,
|
| 44 |
"num_class_embeds": null,
|
| 45 |
"only_cross_attention": false,
|
| 46 |
"out_channels": 4,
|
| 47 |
"projection_class_embeddings_input_dim": null,
|
| 48 |
+
"resnet_out_scale_factor": 1.0,
|
| 49 |
+
"resnet_skip_time_act": false,
|
| 50 |
"resnet_time_scale_shift": "default",
|
| 51 |
"sample_size": 64,
|
| 52 |
"time_cond_proj_dim": null,
|
| 53 |
+
"time_embedding_act_fn": null,
|
| 54 |
+
"time_embedding_dim": null,
|
| 55 |
"time_embedding_type": "positional",
|
| 56 |
"timestep_post_act": null,
|
| 57 |
+
"transformer_layers_per_block": 1,
|
| 58 |
"up_block_types": [
|
| 59 |
"UpBlock2D",
|
| 60 |
"CrossAttnUpBlock2D",
|
unet/diffusion_pytorch_model.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:12e61c28a03105f2730232cc88b784e7451ba9c0510b88a31a6255460307be22
|
| 3 |
+
size 3438167536
|
vae/config.json
CHANGED
|
@@ -1,7 +1,7 @@
|
|
| 1 |
{
|
| 2 |
"_class_name": "AutoencoderKL",
|
| 3 |
-
"_diffusers_version": "0.
|
| 4 |
-
"_name_or_path": "
|
| 5 |
"act_fn": "silu",
|
| 6 |
"block_out_channels": [
|
| 7 |
128,
|
|
@@ -15,12 +15,13 @@
|
|
| 15 |
"DownEncoderBlock2D",
|
| 16 |
"DownEncoderBlock2D"
|
| 17 |
],
|
|
|
|
| 18 |
"in_channels": 3,
|
| 19 |
"latent_channels": 4,
|
| 20 |
"layers_per_block": 2,
|
| 21 |
"norm_num_groups": 32,
|
| 22 |
"out_channels": 3,
|
| 23 |
-
"sample_size":
|
| 24 |
"scaling_factor": 0.18215,
|
| 25 |
"up_block_types": [
|
| 26 |
"UpDecoderBlock2D",
|
|
|
|
| 1 |
{
|
| 2 |
"_class_name": "AutoencoderKL",
|
| 3 |
+
"_diffusers_version": "0.21.0.dev0",
|
| 4 |
+
"_name_or_path": "/opt/app-root/src/.cache/huggingface/hub/models--runwayml--stable-diffusion-v1-5/snapshots/1d0c4ebf6ff58a5caecab40fa1406526bca4b5b9/vae",
|
| 5 |
"act_fn": "silu",
|
| 6 |
"block_out_channels": [
|
| 7 |
128,
|
|
|
|
| 15 |
"DownEncoderBlock2D",
|
| 16 |
"DownEncoderBlock2D"
|
| 17 |
],
|
| 18 |
+
"force_upcast": true,
|
| 19 |
"in_channels": 3,
|
| 20 |
"latent_channels": 4,
|
| 21 |
"layers_per_block": 2,
|
| 22 |
"norm_num_groups": 32,
|
| 23 |
"out_channels": 3,
|
| 24 |
+
"sample_size": 512,
|
| 25 |
"scaling_factor": 0.18215,
|
| 26 |
"up_block_types": [
|
| 27 |
"UpDecoderBlock2D",
|
vae/diffusion_pytorch_model.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b4d2b5932bb4151e54e694fd31ccf51fca908223c9485bd56cd0e1d83ad94c49
|
| 3 |
+
size 334643268
|