End of training
Browse files
- README.md +21 -0
- image_0.png +0 -0
- image_1.png +0 -0
- image_2.png +0 -0
- image_3.png +0 -0
- logs/text2image-fine-tune/1698226805.5745053/events.out.tfevents.1698226805.146-235-238-191.296963.1 +3 -0
- logs/text2image-fine-tune/1698226805.575728/hparams.yml +50 -0
- logs/text2image-fine-tune/1698236900.876514/events.out.tfevents.1698236900.146-235-238-191.348206.1 +3 -0
- logs/text2image-fine-tune/1698236900.8777218/hparams.yml +52 -0
- logs/text2image-fine-tune/1698238676.22221/events.out.tfevents.1698238676.146-235-238-191.363907.1 +3 -0
- logs/text2image-fine-tune/1698238676.2234287/hparams.yml +52 -0
- logs/text2image-fine-tune/events.out.tfevents.1698226805.146-235-238-191.296963.0 +3 -0
- logs/text2image-fine-tune/events.out.tfevents.1698236900.146-235-238-191.348206.0 +3 -0
- logs/text2image-fine-tune/events.out.tfevents.1698238676.146-235-238-191.363907.0 +3 -0
- pytorch_lora_weights.safetensors +3 -0
README.md
ADDED
@@ -0,0 +1,21 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
|
2 |
+
---
|
3 |
+
license: creativeml-openrail-m
|
4 |
+
base_model: runwayml/stable-diffusion-v1-5
|
5 |
+
tags:
|
6 |
+
- stable-diffusion
|
7 |
+
- stable-diffusion-diffusers
|
8 |
+
- text-to-image
|
9 |
+
- diffusers
|
10 |
+
- lora
|
11 |
+
inference: true
|
12 |
+
---
|
13 |
+
|
14 |
+
# LoRA text2image fine-tuning - anjakuzev/michael_scott_v2
|
15 |
+
These are LoRA adaptation weights for runwayml/stable-diffusion-v1-5. The weights were fine-tuned on the anjakuzev/michael_scott dataset. Some example images are shown below.
|
16 |
+
|
17 |
+
![img_0](./image_0.png)
|
18 |
+
![img_1](./image_1.png)
|
19 |
+
![img_2](./image_2.png)
|
20 |
+
![img_3](./image_3.png)
|
21 |
+
|
image_0.png
ADDED
image_1.png
ADDED
image_2.png
ADDED
image_3.png
ADDED
logs/text2image-fine-tune/1698226805.5745053/events.out.tfevents.1698226805.146-235-238-191.296963.1
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6ce8c4f5b31a84cec97885432705c9773dd8f0dc055221ff195fc6e161484298
|
3 |
+
size 2447
|
logs/text2image-fine-tune/1698226805.575728/hparams.yml
ADDED
@@ -0,0 +1,50 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
adam_beta1: 0.9
|
2 |
+
adam_beta2: 0.999
|
3 |
+
adam_epsilon: 1.0e-08
|
4 |
+
adam_weight_decay: 0.01
|
5 |
+
allow_tf32: false
|
6 |
+
cache_dir: null
|
7 |
+
caption_column: additional_feature
|
8 |
+
center_crop: true
|
9 |
+
checkpointing_steps: 3000
|
10 |
+
checkpoints_total_limit: null
|
11 |
+
dataloader_num_workers: 8
|
12 |
+
dataset_config_name: null
|
13 |
+
dataset_name: anjakuzev/harry_styles
|
14 |
+
enable_xformers_memory_efficient_attention: false
|
15 |
+
gradient_accumulation_steps: 4
|
16 |
+
gradient_checkpointing: false
|
17 |
+
hub_model_id: anjakuzev/my-text-to-image-model_8
|
18 |
+
hub_token: null
|
19 |
+
image_column: image
|
20 |
+
learning_rate: 0.0001
|
21 |
+
local_rank: -1
|
22 |
+
logging_dir: logs
|
23 |
+
lr_scheduler: cosine
|
24 |
+
lr_warmup_steps: 0
|
25 |
+
max_grad_norm: 1.0
|
26 |
+
max_train_samples: null
|
27 |
+
max_train_steps: 500
|
28 |
+
mixed_precision: null
|
29 |
+
noise_offset: 0
|
30 |
+
num_train_epochs: 50
|
31 |
+
num_validation_images: 4
|
32 |
+
output_dir: diffusers/output
|
33 |
+
prediction_type: null
|
34 |
+
pretrained_model_name_or_path: runwayml/stable-diffusion-v1-5
|
35 |
+
push_to_hub: true
|
36 |
+
random_flip: true
|
37 |
+
rank: 4
|
38 |
+
report_to: tensorboard
|
39 |
+
resolution: 512
|
40 |
+
resume_from_checkpoint: null
|
41 |
+
revision: null
|
42 |
+
scale_lr: false
|
43 |
+
seed: 42
|
44 |
+
snr_gamma: null
|
45 |
+
train_batch_size: 1
|
46 |
+
train_data_dir: null
|
47 |
+
use_8bit_adam: false
|
48 |
+
validation_epochs: 1
|
49 |
+
validation_prompt: Generate an image of Harry Styles with wavy hair and sharp facial
|
50 |
+
features. He should be wearing contemporary formal attire with a confident expression.
|
logs/text2image-fine-tune/1698236900.876514/events.out.tfevents.1698236900.146-235-238-191.348206.1
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2e4d83bb95e9aee0cc7044f129c8a5b09908559fdcdebfd9d8b448e8eb9ab555
|
3 |
+
size 2598
|
logs/text2image-fine-tune/1698236900.8777218/hparams.yml
ADDED
@@ -0,0 +1,52 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
adam_beta1: 0.9
|
2 |
+
adam_beta2: 0.999
|
3 |
+
adam_epsilon: 1.0e-08
|
4 |
+
adam_weight_decay: 0.01
|
5 |
+
allow_tf32: false
|
6 |
+
cache_dir: null
|
7 |
+
caption_column: additional_feature
|
8 |
+
center_crop: true
|
9 |
+
checkpointing_steps: 3000
|
10 |
+
checkpoints_total_limit: null
|
11 |
+
dataloader_num_workers: 8
|
12 |
+
dataset_config_name: null
|
13 |
+
dataset_name: anjakuzev/michael_scott
|
14 |
+
enable_xformers_memory_efficient_attention: false
|
15 |
+
gradient_accumulation_steps: 4
|
16 |
+
gradient_checkpointing: false
|
17 |
+
hub_model_id: anjakuzev/michael_scott
|
18 |
+
hub_token: null
|
19 |
+
image_column: image
|
20 |
+
learning_rate: 0.0001
|
21 |
+
local_rank: -1
|
22 |
+
logging_dir: logs
|
23 |
+
lr_scheduler: cosine
|
24 |
+
lr_warmup_steps: 0
|
25 |
+
max_grad_norm: 1.0
|
26 |
+
max_train_samples: null
|
27 |
+
max_train_steps: 500
|
28 |
+
mixed_precision: null
|
29 |
+
noise_offset: 0
|
30 |
+
num_train_epochs: 56
|
31 |
+
num_validation_images: 4
|
32 |
+
output_dir: diffusers/output
|
33 |
+
prediction_type: null
|
34 |
+
pretrained_model_name_or_path: runwayml/stable-diffusion-v1-5
|
35 |
+
push_to_hub: true
|
36 |
+
random_flip: true
|
37 |
+
rank: 4
|
38 |
+
report_to: tensorboard
|
39 |
+
resolution: 512
|
40 |
+
resume_from_checkpoint: null
|
41 |
+
revision: null
|
42 |
+
scale_lr: false
|
43 |
+
seed: 42
|
44 |
+
snr_gamma: null
|
45 |
+
train_batch_size: 1
|
46 |
+
train_data_dir: null
|
47 |
+
use_8bit_adam: false
|
48 |
+
validation_epochs: 1
|
49 |
+
validation_prompt: Generate an image of Michael Scott with short dark hair and deep-set
|
50 |
+
eyes. He should be wearing professional attire, including a dark suit jacket and
|
51 |
+
tie. His expression should range from jovial and smiling to deep in thought or surprised.
|
52 |
+
The setting should hint at a workplace environment, preferably an office.
|
logs/text2image-fine-tune/1698238676.22221/events.out.tfevents.1698238676.146-235-238-191.363907.1
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cd75d423570be1533fa29584136148e13190b6ec94f4cb03efa0234eec77c858
|
3 |
+
size 2601
|
logs/text2image-fine-tune/1698238676.2234287/hparams.yml
ADDED
@@ -0,0 +1,52 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
adam_beta1: 0.9
|
2 |
+
adam_beta2: 0.999
|
3 |
+
adam_epsilon: 1.0e-08
|
4 |
+
adam_weight_decay: 0.01
|
5 |
+
allow_tf32: false
|
6 |
+
cache_dir: null
|
7 |
+
caption_column: additional_feature
|
8 |
+
center_crop: true
|
9 |
+
checkpointing_steps: 3000
|
10 |
+
checkpoints_total_limit: null
|
11 |
+
dataloader_num_workers: 8
|
12 |
+
dataset_config_name: null
|
13 |
+
dataset_name: anjakuzev/michael_scott
|
14 |
+
enable_xformers_memory_efficient_attention: false
|
15 |
+
gradient_accumulation_steps: 4
|
16 |
+
gradient_checkpointing: false
|
17 |
+
hub_model_id: anjakuzev/michael_scott_v2
|
18 |
+
hub_token: null
|
19 |
+
image_column: image
|
20 |
+
learning_rate: 0.0001
|
21 |
+
local_rank: -1
|
22 |
+
logging_dir: logs
|
23 |
+
lr_scheduler: cosine
|
24 |
+
lr_warmup_steps: 0
|
25 |
+
max_grad_norm: 1.0
|
26 |
+
max_train_samples: null
|
27 |
+
max_train_steps: 800
|
28 |
+
mixed_precision: null
|
29 |
+
noise_offset: 0
|
30 |
+
num_train_epochs: 89
|
31 |
+
num_validation_images: 4
|
32 |
+
output_dir: diffusers/output
|
33 |
+
prediction_type: null
|
34 |
+
pretrained_model_name_or_path: runwayml/stable-diffusion-v1-5
|
35 |
+
push_to_hub: true
|
36 |
+
random_flip: true
|
37 |
+
rank: 4
|
38 |
+
report_to: tensorboard
|
39 |
+
resolution: 512
|
40 |
+
resume_from_checkpoint: null
|
41 |
+
revision: null
|
42 |
+
scale_lr: false
|
43 |
+
seed: 1337
|
44 |
+
snr_gamma: null
|
45 |
+
train_batch_size: 1
|
46 |
+
train_data_dir: null
|
47 |
+
use_8bit_adam: false
|
48 |
+
validation_epochs: 1
|
49 |
+
validation_prompt: Generate an image of Michael Scott with short dark hair and deep-set
|
50 |
+
eyes. He should be wearing professional attire, including a dark suit jacket and
|
51 |
+
tie. His expression should range from jovial and smiling to deep in thought or surprised.
|
52 |
+
The setting should hint at a workplace environment, preferably an office.
|
logs/text2image-fine-tune/events.out.tfevents.1698226805.146-235-238-191.296963.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b8065922af2ac88de65a6467d27d647cc097a4ff7851d16dee5de51ab37ef873
|
3 |
+
size 568
|
logs/text2image-fine-tune/events.out.tfevents.1698236900.146-235-238-191.348206.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:dedc254ab9261a7eb5042d54765f181d021af5eba3f9a14567f24a0ad71e55c3
|
3 |
+
size 77564499
|
logs/text2image-fine-tune/events.out.tfevents.1698238676.146-235-238-191.363907.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ce325528dc7dd7d7c9ca32ab112003c21974d8e7b1273484c2c3bc157973076a
|
3 |
+
size 119833604
|
pytorch_lora_weights.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f8b7589a45554b63dde858037d4671e9da224e2e1c63187efd090644e8b0c48f
|
3 |
+
size 3227336
|