anjakuzev committed on
Commit
33c54bb
1 Parent(s): d14c4eb

End of training

Browse files
README.md ADDED
@@ -0,0 +1,21 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+
2
+ ---
3
+ license: creativeml-openrail-m
4
+ base_model: runwayml/stable-diffusion-v1-5
5
+ tags:
6
+ - stable-diffusion
7
+ - stable-diffusion-diffusers
8
+ - text-to-image
9
+ - diffusers
10
+ - lora
11
+ inference: true
12
+ ---
13
+
14
+ # LoRA text2image fine-tuning - anjakuzev/michael_scott_v2
15
+ These are LoRA adaptation weights for runwayml/stable-diffusion-v1-5. The weights were fine-tuned on the anjakuzev/michael_scott dataset. Some example images are shown below.
16
+
17
+ ![img_0](./image_0.png)
18
+ ![img_1](./image_1.png)
19
+ ![img_2](./image_2.png)
20
+ ![img_3](./image_3.png)
21
+
image_0.png ADDED
image_1.png ADDED
image_2.png ADDED
image_3.png ADDED
logs/text2image-fine-tune/1698226805.5745053/events.out.tfevents.1698226805.146-235-238-191.296963.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6ce8c4f5b31a84cec97885432705c9773dd8f0dc055221ff195fc6e161484298
3
+ size 2447
logs/text2image-fine-tune/1698226805.575728/hparams.yml ADDED
@@ -0,0 +1,50 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ adam_beta1: 0.9
2
+ adam_beta2: 0.999
3
+ adam_epsilon: 1.0e-08
4
+ adam_weight_decay: 0.01
5
+ allow_tf32: false
6
+ cache_dir: null
7
+ caption_column: additional_feature
8
+ center_crop: true
9
+ checkpointing_steps: 3000
10
+ checkpoints_total_limit: null
11
+ dataloader_num_workers: 8
12
+ dataset_config_name: null
13
+ dataset_name: anjakuzev/harry_styles
14
+ enable_xformers_memory_efficient_attention: false
15
+ gradient_accumulation_steps: 4
16
+ gradient_checkpointing: false
17
+ hub_model_id: anjakuzev/my-text-to-image-model_8
18
+ hub_token: null
19
+ image_column: image
20
+ learning_rate: 0.0001
21
+ local_rank: -1
22
+ logging_dir: logs
23
+ lr_scheduler: cosine
24
+ lr_warmup_steps: 0
25
+ max_grad_norm: 1.0
26
+ max_train_samples: null
27
+ max_train_steps: 500
28
+ mixed_precision: null
29
+ noise_offset: 0
30
+ num_train_epochs: 50
31
+ num_validation_images: 4
32
+ output_dir: diffusers/output
33
+ prediction_type: null
34
+ pretrained_model_name_or_path: runwayml/stable-diffusion-v1-5
35
+ push_to_hub: true
36
+ random_flip: true
37
+ rank: 4
38
+ report_to: tensorboard
39
+ resolution: 512
40
+ resume_from_checkpoint: null
41
+ revision: null
42
+ scale_lr: false
43
+ seed: 42
44
+ snr_gamma: null
45
+ train_batch_size: 1
46
+ train_data_dir: null
47
+ use_8bit_adam: false
48
+ validation_epochs: 1
49
+ validation_prompt: Generate an image of Harry Styles with wavy hair and sharp facial
50
+ features. He should be wearing contemporary formal attire with a confident expression.
logs/text2image-fine-tune/1698236900.876514/events.out.tfevents.1698236900.146-235-238-191.348206.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2e4d83bb95e9aee0cc7044f129c8a5b09908559fdcdebfd9d8b448e8eb9ab555
3
+ size 2598
logs/text2image-fine-tune/1698236900.8777218/hparams.yml ADDED
@@ -0,0 +1,52 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ adam_beta1: 0.9
2
+ adam_beta2: 0.999
3
+ adam_epsilon: 1.0e-08
4
+ adam_weight_decay: 0.01
5
+ allow_tf32: false
6
+ cache_dir: null
7
+ caption_column: additional_feature
8
+ center_crop: true
9
+ checkpointing_steps: 3000
10
+ checkpoints_total_limit: null
11
+ dataloader_num_workers: 8
12
+ dataset_config_name: null
13
+ dataset_name: anjakuzev/michael_scott
14
+ enable_xformers_memory_efficient_attention: false
15
+ gradient_accumulation_steps: 4
16
+ gradient_checkpointing: false
17
+ hub_model_id: anjakuzev/michael_scott
18
+ hub_token: null
19
+ image_column: image
20
+ learning_rate: 0.0001
21
+ local_rank: -1
22
+ logging_dir: logs
23
+ lr_scheduler: cosine
24
+ lr_warmup_steps: 0
25
+ max_grad_norm: 1.0
26
+ max_train_samples: null
27
+ max_train_steps: 500
28
+ mixed_precision: null
29
+ noise_offset: 0
30
+ num_train_epochs: 56
31
+ num_validation_images: 4
32
+ output_dir: diffusers/output
33
+ prediction_type: null
34
+ pretrained_model_name_or_path: runwayml/stable-diffusion-v1-5
35
+ push_to_hub: true
36
+ random_flip: true
37
+ rank: 4
38
+ report_to: tensorboard
39
+ resolution: 512
40
+ resume_from_checkpoint: null
41
+ revision: null
42
+ scale_lr: false
43
+ seed: 42
44
+ snr_gamma: null
45
+ train_batch_size: 1
46
+ train_data_dir: null
47
+ use_8bit_adam: false
48
+ validation_epochs: 1
49
+ validation_prompt: Generate an image of Michael Scott with short dark hair and deep-set
50
+ eyes. He should be wearing professional attire, including a dark suit jacket and
51
+ tie. His expression should range from jovial and smiling to deep in thought or surprised.
52
+ The setting should hint at a workplace environment, preferably an office.
logs/text2image-fine-tune/1698238676.22221/events.out.tfevents.1698238676.146-235-238-191.363907.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cd75d423570be1533fa29584136148e13190b6ec94f4cb03efa0234eec77c858
3
+ size 2601
logs/text2image-fine-tune/1698238676.2234287/hparams.yml ADDED
@@ -0,0 +1,52 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ adam_beta1: 0.9
2
+ adam_beta2: 0.999
3
+ adam_epsilon: 1.0e-08
4
+ adam_weight_decay: 0.01
5
+ allow_tf32: false
6
+ cache_dir: null
7
+ caption_column: additional_feature
8
+ center_crop: true
9
+ checkpointing_steps: 3000
10
+ checkpoints_total_limit: null
11
+ dataloader_num_workers: 8
12
+ dataset_config_name: null
13
+ dataset_name: anjakuzev/michael_scott
14
+ enable_xformers_memory_efficient_attention: false
15
+ gradient_accumulation_steps: 4
16
+ gradient_checkpointing: false
17
+ hub_model_id: anjakuzev/michael_scott_v2
18
+ hub_token: null
19
+ image_column: image
20
+ learning_rate: 0.0001
21
+ local_rank: -1
22
+ logging_dir: logs
23
+ lr_scheduler: cosine
24
+ lr_warmup_steps: 0
25
+ max_grad_norm: 1.0
26
+ max_train_samples: null
27
+ max_train_steps: 800
28
+ mixed_precision: null
29
+ noise_offset: 0
30
+ num_train_epochs: 89
31
+ num_validation_images: 4
32
+ output_dir: diffusers/output
33
+ prediction_type: null
34
+ pretrained_model_name_or_path: runwayml/stable-diffusion-v1-5
35
+ push_to_hub: true
36
+ random_flip: true
37
+ rank: 4
38
+ report_to: tensorboard
39
+ resolution: 512
40
+ resume_from_checkpoint: null
41
+ revision: null
42
+ scale_lr: false
43
+ seed: 1337
44
+ snr_gamma: null
45
+ train_batch_size: 1
46
+ train_data_dir: null
47
+ use_8bit_adam: false
48
+ validation_epochs: 1
49
+ validation_prompt: Generate an image of Michael Scott with short dark hair and deep-set
50
+ eyes. He should be wearing professional attire, including a dark suit jacket and
51
+ tie. His expression should range from jovial and smiling to deep in thought or surprised.
52
+ The setting should hint at a workplace environment, preferably an office.
logs/text2image-fine-tune/events.out.tfevents.1698226805.146-235-238-191.296963.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b8065922af2ac88de65a6467d27d647cc097a4ff7851d16dee5de51ab37ef873
3
+ size 568
logs/text2image-fine-tune/events.out.tfevents.1698236900.146-235-238-191.348206.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dedc254ab9261a7eb5042d54765f181d021af5eba3f9a14567f24a0ad71e55c3
3
+ size 77564499
logs/text2image-fine-tune/events.out.tfevents.1698238676.146-235-238-191.363907.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ce325528dc7dd7d7c9ca32ab112003c21974d8e7b1273484c2c3bc157973076a
3
+ size 119833604
pytorch_lora_weights.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f8b7589a45554b63dde858037d4671e9da224e2e1c63187efd090644e8b0c48f
3
+ size 3227336