zhangyi617 committed on
Commit
1e316c3
·
verified ·
1 Parent(s): b8fd670

End of training

Browse files
.gitattributes CHANGED
@@ -33,3 +33,7 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
 
 
 
 
 
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
+ image_0.png filter=lfs diff=lfs merge=lfs -text
37
+ image_1.png filter=lfs diff=lfs merge=lfs -text
38
+ image_2.png filter=lfs diff=lfs merge=lfs -text
39
+ image_3.png filter=lfs diff=lfs merge=lfs -text
README.md ADDED
@@ -0,0 +1,43 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ base_model: runwayml/stable-diffusion-v1-5
3
+ library_name: diffusers
4
+ license: creativeml-openrail-m
5
+ inference: true
6
+ tags:
7
+ - stable-diffusion
8
+ - stable-diffusion-diffusers
9
+ - text-to-image
10
+ - diffusers
11
+ - diffusers-training
12
+ - lora
13
+ ---
14
+
15
+ <!-- This model card has been generated automatically according to the information the training script had access to. You
16
+ should probably proofread and complete it, then remove this comment. -->
17
+
18
+
19
+ # LoRA text2image fine-tuning - zhangyi617/sd15_naruto_text_0.005_mix_0.8
20
+ These are LoRA adaptation weights for runwayml/stable-diffusion-v1-5. The weights were fine-tuned on the lambdalabs/naruto-blip-captions dataset. Some example images are shown below.
21
+
22
+ ![img_0](./image_0.png)
23
+ ![img_1](./image_1.png)
24
+ ![img_2](./image_2.png)
25
+ ![img_3](./image_3.png)
26
+
27
+
28
+
29
+ ## Intended uses & limitations
30
+
31
+ #### How to use
32
+
33
+ ```python
34
+ # TODO: add an example code snippet for running this diffusion pipeline
35
+ ```
36
+
37
+ #### Limitations and bias
38
+
39
+ [TODO: provide examples of latent issues and potential remediations]
40
+
41
+ ## Training details
42
+
43
+ [TODO: describe the data used to train the model]
checkpoint-6000/model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:27b8ff4c244fa60a0f03776d1d14c713af85e60a71de1b53b3b31100a55002a2
3
+ size 1722353544
checkpoint-6000/optimizer.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fa3c4b5cea55cfd1afdda07ed02be7d93b7dd37bf4f47e86ee482879098c548b
3
+ size 6592523
checkpoint-6000/pytorch_lora_weights.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:64e33902d7330ac36596c3174561af8234656e04381237da0a0474faf80b5446
3
+ size 3226184
checkpoint-6000/random_states_0.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:119b45dc050f67f8ac6ef9a1863bdb7ed8b76bba0c35c5bbd6d2ea7c00967bee
3
+ size 14821
checkpoint-6000/scaler.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7bb2b51b22f222dc6df63edb791d76de5de25b8bb724e885f8753e34cfb8ae10
3
+ size 1383
checkpoint-6000/scheduler.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2cd36bc98fdcd79a93149a23d5d1fe1a31ea2e04bc414545257bbcc4e0ffd739
3
+ size 1401
image_0.png ADDED

Git LFS Details

  • SHA256: 715fde221607efc4616321a101341f2eead351d39a7efabc1ade6cff4c2138cc
  • Pointer size: 131 Bytes
  • Size of remote file: 423 kB
image_1.png ADDED

Git LFS Details

  • SHA256: 3f0f269cb05e1f42dfa23cf0a816be5659b1a6c5e7ef7d80c4d23015121f3d83
  • Pointer size: 131 Bytes
  • Size of remote file: 399 kB
image_2.png ADDED

Git LFS Details

  • SHA256: 68473f7e9309b26bc9e154d11d0727df8e80c9192d4da1c5269b31ca2b1f286a
  • Pointer size: 131 Bytes
  • Size of remote file: 386 kB
image_3.png ADDED

Git LFS Details

  • SHA256: cc5bd4e2381599696bd982003eeb9018acb3ed6751198378c57283bdf76cd23b
  • Pointer size: 131 Bytes
  • Size of remote file: 466 kB
logs/text2image-fine-tune/1770849359.1233923/events.out.tfevents.1770849359.wmgubws17.wmgds.wmg.warwick.ac.uk.1346513.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:23364a3e71d8ec3d4ff4723dc71a9f7becaaf0390a5647171204836461792ddd
3
+ size 2545
logs/text2image-fine-tune/1770849359.1247902/hparams.yml ADDED
@@ -0,0 +1,53 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ adam_beta1: 0.9
2
+ adam_beta2: 0.999
3
+ adam_epsilon: 1.0e-08
4
+ adam_weight_decay: 0.01
5
+ allow_tf32: false
6
+ alpha: 0.8
7
+ cache_dir: null
8
+ caption_column: text
9
+ center_crop: true
10
+ checkpointing_steps: 6000
11
+ checkpoints_total_limit: null
12
+ dataloader_num_workers: 8
13
+ dataset_config_name: null
14
+ dataset_name: lambdalabs/naruto-blip-captions
15
+ enable_xformers_memory_efficient_attention: false
16
+ epsilon_m: 0.005
17
+ gradient_accumulation_steps: 1
18
+ gradient_checkpointing: false
19
+ hub_model_id: sd15_naruto_text_0.005_mix_0.8
20
+ hub_token: null
21
+ image_column: image
22
+ image_interpolation_mode: lanczos
23
+ learning_rate: 0.0001
24
+ local_rank: -1
25
+ logging_dir: logs
26
+ lr_scheduler: cosine
27
+ lr_warmup_steps: 0
28
+ max_grad_norm: 1.0
29
+ max_train_samples: null
30
+ max_train_steps: 6120
31
+ mixed_precision: fp16
32
+ noise_offset: 0
33
+ num_train_epochs: 20
34
+ num_validation_images: 4
35
+ output_dir: output_models/sd15_naruto_text_0.005_mix_0.8
36
+ prediction_type: null
37
+ pretrained_model_name_or_path: runwayml/stable-diffusion-v1-5
38
+ push_to_hub: true
39
+ random_flip: true
40
+ rank: 4
41
+ report_to: tensorboard
42
+ resolution: 512
43
+ resume_from_checkpoint: null
44
+ revision: null
45
+ scale_lr: false
46
+ seed: 42
47
+ snr_gamma: null
48
+ train_batch_size: 4
49
+ train_data_dir: null
50
+ use_8bit_adam: false
51
+ validation_epochs: 1
52
+ validation_prompt: a car is driving down the road with another car
53
+ variant: null
logs/text2image-fine-tune/1770849377.587789/events.out.tfevents.1770849377.wmgubws17.wmgds.wmg.warwick.ac.uk.1347184.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:04d3211a991b5309dc13dd0bafb67be2758be385e0bd8c78bba3aef457575511
3
+ size 2545
logs/text2image-fine-tune/1770849377.5892653/hparams.yml ADDED
@@ -0,0 +1,53 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ adam_beta1: 0.9
2
+ adam_beta2: 0.999
3
+ adam_epsilon: 1.0e-08
4
+ adam_weight_decay: 0.01
5
+ allow_tf32: false
6
+ alpha: 0.8
7
+ cache_dir: null
8
+ caption_column: text
9
+ center_crop: true
10
+ checkpointing_steps: 6000
11
+ checkpoints_total_limit: null
12
+ dataloader_num_workers: 8
13
+ dataset_config_name: null
14
+ dataset_name: lambdalabs/naruto-blip-captions
15
+ enable_xformers_memory_efficient_attention: false
16
+ epsilon_m: 0.005
17
+ gradient_accumulation_steps: 1
18
+ gradient_checkpointing: false
19
+ hub_model_id: sd15_naruto_text_0.005_mix_0.8
20
+ hub_token: null
21
+ image_column: image
22
+ image_interpolation_mode: lanczos
23
+ learning_rate: 0.0001
24
+ local_rank: -1
25
+ logging_dir: logs
26
+ lr_scheduler: cosine
27
+ lr_warmup_steps: 0
28
+ max_grad_norm: 1.0
29
+ max_train_samples: null
30
+ max_train_steps: 6120
31
+ mixed_precision: fp16
32
+ noise_offset: 0
33
+ num_train_epochs: 20
34
+ num_validation_images: 4
35
+ output_dir: output_models/sd15_naruto_text_0.005_mix_0.8
36
+ prediction_type: null
37
+ pretrained_model_name_or_path: runwayml/stable-diffusion-v1-5
38
+ push_to_hub: true
39
+ random_flip: true
40
+ rank: 4
41
+ report_to: tensorboard
42
+ resolution: 512
43
+ resume_from_checkpoint: null
44
+ revision: null
45
+ scale_lr: false
46
+ seed: 42
47
+ snr_gamma: null
48
+ train_batch_size: 4
49
+ train_data_dir: null
50
+ use_8bit_adam: false
51
+ validation_epochs: 1
52
+ validation_prompt: a car is driving down the road with another car
53
+ variant: null
logs/text2image-fine-tune/events.out.tfevents.1770849359.wmgubws17.wmgds.wmg.warwick.ac.uk.1346513.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ced6399156e8957e8015207be5ffc2d9a7be8c0321f8110f88922845588ca774
3
+ size 376
logs/text2image-fine-tune/events.out.tfevents.1770849377.wmgubws17.wmgds.wmg.warwick.ac.uk.1347184.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f25d11b588ee7c8fc5785dce22dce2decd89799dde1b9c96ec6f1ca3654c86c0
3
+ size 36735625
pytorch_lora_weights.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f2d55ea1c4f8245e0a2eff5ab92fa960af3afe9884aa4415013f1d0144864179
3
+ size 3226184