asrimanth committed on Jul 12, 2023

Commit

57acb59

1 Parent(s): 40d8754

End of training

Browse files

This view is limited to 50 files because it contains too many changes. See raw diff

Files changed (50) hide show

.gitattributes +6 -0
README.md +21 -0
checkpoint-1000/optimizer.bin +3 -0
checkpoint-1000/pytorch_model.bin +3 -0
checkpoint-1000/random_states_0.pkl +3 -0
checkpoint-1000/scaler.pt +3 -0
checkpoint-1000/scheduler.bin +3 -0
checkpoint-1500/optimizer.bin +3 -0
checkpoint-1500/pytorch_model.bin +3 -0
checkpoint-1500/random_states_0.pkl +3 -0
checkpoint-1500/scaler.pt +3 -0
checkpoint-1500/scheduler.bin +3 -0
checkpoint-2000/optimizer.bin +3 -0
checkpoint-2000/pytorch_model.bin +3 -0
checkpoint-2000/random_states_0.pkl +3 -0
checkpoint-2000/scaler.pt +3 -0
checkpoint-2000/scheduler.bin +3 -0
checkpoint-2500/optimizer.bin +3 -0
checkpoint-2500/pytorch_model.bin +3 -0
checkpoint-2500/random_states_0.pkl +3 -0
checkpoint-2500/scaler.pt +3 -0
checkpoint-2500/scheduler.bin +3 -0
checkpoint-3000/optimizer.bin +3 -0
checkpoint-3000/pytorch_model.bin +3 -0
checkpoint-3000/random_states_0.pkl +3 -0
checkpoint-3000/scaler.pt +3 -0
checkpoint-3000/scheduler.bin +3 -0
checkpoint-500/optimizer.bin +3 -0
checkpoint-500/pytorch_model.bin +3 -0
checkpoint-500/random_states_0.pkl +3 -0
checkpoint-500/scaler.pt +3 -0
checkpoint-500/scheduler.bin +3 -0
image_0.png +0 -0
image_1.png +0 -0
image_2.png +0 -0
image_3.png +0 -0
logs/text2image-fine-tune/1688955167.1630535/events.out.tfevents.1688955167.magneton.3115945.1 +3 -0
logs/text2image-fine-tune/1688955167.1711032/hparams.yml +49 -0
logs/text2image-fine-tune/1688962584.3811932/events.out.tfevents.1688962584.magneton.3120424.1 +3 -0
logs/text2image-fine-tune/1688962584.6847372/hparams.yml +49 -0
logs/text2image-fine-tune/events.out.tfevents.1688955166.magneton.3115945.0 +3 -0
logs/text2image-fine-tune/events.out.tfevents.1688962584.magneton.3120424.0 +3 -0
pytorch_lora_weights.bin +3 -0
wandb/debug-internal.log +0 -0
wandb/debug.log +27 -0
wandb/run-20230708_162040-7wojc8os/files/config.yaml +39 -0
wandb/run-20230708_162040-7wojc8os/files/output.log +29 -0
wandb/run-20230708_162040-7wojc8os/files/requirements.txt +165 -0
wandb/run-20230708_162040-7wojc8os/files/wandb-metadata.json +127 -0
wandb/run-20230708_162040-7wojc8os/files/wandb-summary.json +1 -0

.gitattributes CHANGED Viewed

@@ -33,3 +33,9 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
 *.zip filter=lfs diff=lfs merge=lfs -text
 *.zst filter=lfs diff=lfs merge=lfs -text
 *tfevents* filter=lfs diff=lfs merge=lfs -text

 *.zip filter=lfs diff=lfs merge=lfs -text
 *.zst filter=lfs diff=lfs merge=lfs -text
 *tfevents* filter=lfs diff=lfs merge=lfs -text
+wandb/run-20230708_164840-v06ksyvb/run-v06ksyvb.wandb filter=lfs diff=lfs merge=lfs -text
+wandb/run-20230708_224302-qtf3vlop/run-qtf3vlop.wandb filter=lfs diff=lfs merge=lfs -text
+wandb/run-20230710_001721-cfgbywnm/run-cfgbywnm.wandb filter=lfs diff=lfs merge=lfs -text
+wandb/run-20230710_170714-2kdshdih/run-2kdshdih.wandb filter=lfs diff=lfs merge=lfs -text
+wandb/run-20230710_170714-kkjwpam4/run-kkjwpam4.wandb filter=lfs diff=lfs merge=lfs -text
+wandb/run-20230710_170714-ncgsl9n1/run-ncgsl9n1.wandb filter=lfs diff=lfs merge=lfs -text

README.md ADDED Viewed

	@@ -0,0 +1,21 @@

+---
+license: creativeml-openrail-m
+base_model: runwayml/stable-diffusion-v1-5
+tags:
+- stable-diffusion
+- stable-diffusion-diffusers
+- text-to-image
+- diffusers
+- lora
+inference: true
+---
+# LoRA text2image fine-tuning - asrimanth/person-thumbs-up-lora
+These are LoRA adaptation weights for runwayml/stable-diffusion-v1-5. The weights were fine-tuned on a custom dataset. You can find some example images below.
+![img_0](./image_0.png)
+![img_1](./image_1.png)
+![img_2](./image_2.png)
+![img_3](./image_3.png)

checkpoint-1000/optimizer.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:acc770b81b4cd51d8d396ac49ad6237abe1de0f88b98675d99f6dd00c98d602e
+size 6591685

checkpoint-1000/pytorch_model.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:59f1fe3f7ed6197c881c1ea8c0fe33b8c17bd8c3883ea878206f8812572a85c5
+size 3285965

checkpoint-1000/random_states_0.pkl ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:bf626b00f0c0a21c1ee2f5631667c9175d425a61775d2fd75a66283361ef7cec
+size 16719

checkpoint-1000/scaler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:68cff80b680ddf6e7abbef98b5f336b97f9b5963e2209307f639383870e8cc71
+size 557

checkpoint-1000/scheduler.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:61808704787602dc93c00aa68d75b73415f1c6bfacfbeb97c14702c3e19cf9f2
+size 563

checkpoint-1500/optimizer.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:e73f085755d82ce94c7eef162ea81a6be44d9cf83bfb978566e4cbcd44fea671
+size 6591685

checkpoint-1500/pytorch_model.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:6b99d4fd36435243e9f5590704bbb2bc273f02ee1b17121e2c47cb0e21f6743d
+size 3285965

checkpoint-1500/random_states_0.pkl ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:863bba4edd1ca97dc90e081725c55f3be037349b333f06678cdaad3d9501ed3e
+size 16719

checkpoint-1500/scaler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:203a72d6c29f42a0e2964fdddc8d7a98df1eccee78fea9de0fa416613390f5c6
+size 557

checkpoint-1500/scheduler.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:e89f6844bbfca1eeee319b6e2d6f3fd9d9df58879544d455482ad32bb3ad4df6
+size 563

checkpoint-2000/optimizer.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:cd34409bd46e07d33c9329f19b9e01065b2b0b573406a8be0df757bafb8848e4
+size 6591685

checkpoint-2000/pytorch_model.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:990ebd79940a1e4dd99d3b67507594172bd3fde5ea6945c1d8ebc9062ae26070
+size 3285965

checkpoint-2000/random_states_0.pkl ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:5fd21d1d8596fbae8788b9060a2386fe2636e634218aff7b075ff9bbd70231b3
+size 16719

checkpoint-2000/scaler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:dd2de9749828adacdf103bf6e9592702bb7067a2c1df27dd62ab38c1eb8c070f
+size 557

checkpoint-2000/scheduler.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:00f6a413e75a46219e92e544cae3353a4577b60b728f62a720befd9033032acd
+size 563

checkpoint-2500/optimizer.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:c77079603d43b27f512ea17960b3acbf0321fa0b85e027b985677f1cdd421990
+size 6591685

checkpoint-2500/pytorch_model.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:6e09ae9cce63c0ee0d6e5e98d7e1ae9ff414394d3352c45afd14f6f98b6ae6c3
+size 3285965

checkpoint-2500/random_states_0.pkl ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:39f28d64d6912cc34eaaa0bb0cd0819897835a6aae2d96c1c19aa15468bb16c1
+size 16719

checkpoint-2500/scaler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:0fbcebc8f5487b0c117b5dd47f2ea304af3eebf408d297118d9307e1223927e1
+size 557

checkpoint-2500/scheduler.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:df00e6adcececef3aacd6addf17f6c85eae895b25ab91e673e9360b2a7f6ee86
+size 563

checkpoint-3000/optimizer.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:e95e8b7ea8d3aa3348d3e013cea0904c9229e2955666cb78f5a4e90bc7f6401c
+size 6591685

checkpoint-3000/pytorch_model.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:a1541b4e79e7efab51d556a7179c5f74f5965962bb2aa0d29ab8c5b8837a2d02
+size 3285965

checkpoint-3000/random_states_0.pkl ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:d12ebe8df23ebc27557c11a245e66d96279ac2a3ff7c8b15aac109084cee9e94
+size 16719

checkpoint-3000/scaler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:fb1f9398b77268202e8e1465734a63d123b1ef11c27f20f2473677e9883a6869
+size 557

checkpoint-3000/scheduler.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:807d7d063623792ef9b8c66da2304691aed0888f14ad6e70a728375b9c90fe9d
+size 563

checkpoint-500/optimizer.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:88a7bc9b20ad346345b5058e353cca20ea8b834a515dc312027da289b320c6e7
+size 6591685

checkpoint-500/pytorch_model.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:c44be5a37b7d6cc6ac4beba90965c20ccdd2f336aa993dc70152235db222227b
+size 3285965

checkpoint-500/random_states_0.pkl ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:e670e6c021cd2c9f45d7068757a1a37ed11280498d332d84fc9b52b93dce0e7d
+size 16719

checkpoint-500/scaler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:a3f196a54202bb4ba1220e8c59f42f9cda0702d68ea83147d814c2fb2f36b8f2
+size 557

checkpoint-500/scheduler.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:6bc0a22eef87625080f7c833304b0844a5e9a28131b856c035cff1e8f8d56121
+size 563

image_0.png ADDED Viewed

image_1.png ADDED Viewed

image_2.png ADDED Viewed

image_3.png ADDED Viewed

logs/text2image-fine-tune/1688955167.1630535/events.out.tfevents.1688955167.magneton.3115945.1 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:b5f447f4cdd861cff146802771b78a632005903e712beccf0a6b73f15ccd5cdf
+size 2399

logs/text2image-fine-tune/1688955167.1711032/hparams.yml ADDED Viewed

	@@ -0,0 +1,49 @@

+adam_beta1: 0.9
+adam_beta2: 0.999
+adam_epsilon: 1.0e-08
+adam_weight_decay: 0.01
+allow_tf32: false
+cache_dir: /l/vision/v5/sragas/hf_models/
+caption_column: text
+center_crop: true
+checkpointing_steps: 500
+checkpoints_total_limit: null
+dataloader_num_workers: 0
+dataset_config_name: null
+dataset_name: null
+enable_xformers_memory_efficient_attention: false
+gradient_accumulation_steps: 4
+gradient_checkpointing: false
+hub_model_id: sachin-thumbs-up-lora
+hub_token: null
+image_column: image
+learning_rate: 0.0001
+local_rank: 0
+logging_dir: logs
+lr_scheduler: cosine
+lr_warmup_steps: 0
+max_grad_norm: 1.0
+max_train_samples: null
+max_train_steps: 360
+mixed_precision: null
+noise_offset: 0
+num_train_epochs: 60
+num_validation_images: 4
+output_dir: /l/vision/v5/sragas/easel_ai/models/
+prediction_type: null
+pretrained_model_name_or_path: runwayml/stable-diffusion-v1-5
+push_to_hub: true
+random_flip: true
+rank: 4
+report_to: tensorboard
+resolution: 512
+resume_from_checkpoint: null
+revision: null
+scale_lr: false
+seed: 15
+snr_gamma: null
+train_batch_size: 2
+train_data_dir: /l/vision/v5/sragas/easel_ai/thumbs_up_dataset/
+use_8bit_adam: false
+validation_epochs: 1
+validation_prompt: 'A person with #thumbsup'

logs/text2image-fine-tune/1688962584.3811932/events.out.tfevents.1688962584.magneton.3120424.1 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:ef5f855e4dcff4457f8e1694736372661f8ad463d3551cb73d9429b3c1047869
+size 2398

logs/text2image-fine-tune/1688962584.6847372/hparams.yml ADDED Viewed

	@@ -0,0 +1,49 @@

+adam_beta1: 0.9
+adam_beta2: 0.999
+adam_epsilon: 1.0e-08
+adam_weight_decay: 0.01
+allow_tf32: false
+cache_dir: /l/vision/v5/sragas/hf_models/
+caption_column: text
+center_crop: true
+checkpointing_steps: 500
+checkpoints_total_limit: null
+dataloader_num_workers: 0
+dataset_config_name: null
+dataset_name: null
+enable_xformers_memory_efficient_attention: false
+gradient_accumulation_steps: 4
+gradient_checkpointing: false
+hub_model_id: sachin-thumbs-up-lora
+hub_token: null
+image_column: image
+learning_rate: 0.0001
+local_rank: 0
+logging_dir: logs
+lr_scheduler: cosine
+lr_warmup_steps: 0
+max_grad_norm: 1.0
+max_train_samples: null
+max_train_steps: 700
+mixed_precision: null
+noise_offset: 0
+num_train_epochs: 100
+num_validation_images: 4
+output_dir: /l/vision/v5/sragas/easel_ai/models/
+prediction_type: null
+pretrained_model_name_or_path: runwayml/stable-diffusion-v1-5
+push_to_hub: true
+random_flip: true
+rank: 4
+report_to: tensorboard
+resolution: 512
+resume_from_checkpoint: null
+revision: null
+scale_lr: false
+seed: 15
+snr_gamma: null
+train_batch_size: 3
+train_data_dir: /l/vision/v5/sragas/easel_ai/thumbs_up_dataset/
+use_8bit_adam: false
+validation_epochs: 1
+validation_prompt: '<tom_cruise> #thumbsup'

logs/text2image-fine-tune/events.out.tfevents.1688955166.magneton.3115945.0 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:98e366dd41155488121dc6e6b816f564dd5abb7d3b97e7b23c6f5521972aff09
+size 88

logs/text2image-fine-tune/events.out.tfevents.1688962584.magneton.3120424.0 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:91956d6612c16c0d39d3feb1915fdd2a9fc6c1093a4acf6828307527b152dfea
+size 88

pytorch_lora_weights.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:1613e7cca2fa0fc15cc06a4dcdcbfb1568c9a80c32aad18dfe283b7f9c5ea2ca
+size 3287771

wandb/debug-internal.log ADDED Viewed

The diff for this file is too large to render. See raw diff

wandb/debug.log ADDED Viewed

	@@ -0,0 +1,27 @@

+2023-07-10 17:07:15,048 INFO    MainThread:3133504 [wandb_setup.py:_flush():76] Current SDK version is 0.15.4
+2023-07-10 17:07:15,048 INFO    MainThread:3133504 [wandb_setup.py:_flush():76] Configure stats pid to 3133504
+2023-07-10 17:07:15,049 INFO    MainThread:3133504 [wandb_setup.py:_flush():76] Loading settings from /u/sragas/.config/wandb/settings
+2023-07-10 17:07:15,049 INFO    MainThread:3133504 [wandb_setup.py:_flush():76] Loading settings from /nfs/nfs2/home/sragas/demo/wandb/settings
+2023-07-10 17:07:15,049 INFO    MainThread:3133504 [wandb_setup.py:_flush():76] Loading settings from environment variables: {}
+2023-07-10 17:07:15,049 INFO    MainThread:3133504 [wandb_setup.py:_flush():76] Applying setup settings: {'_disable_service': False}
+2023-07-10 17:07:15,049 INFO    MainThread:3133504 [wandb_setup.py:_flush():76] Inferring run settings from compute environment: {'program_relpath': 'train_text_to_image_lora.py', 'program': 'train_text_to_image_lora.py'}
+2023-07-10 17:07:15,049 INFO    MainThread:3133504 [wandb_init.py:_log_setup():507] Logging user logs to /l/vision/v5/sragas/easel_ai/models/wandb/run-20230710_170714-2kdshdih/logs/debug.log
+2023-07-10 17:07:15,049 INFO    MainThread:3133504 [wandb_init.py:_log_setup():508] Logging internal logs to /l/vision/v5/sragas/easel_ai/models/wandb/run-20230710_170714-2kdshdih/logs/debug-internal.log
+2023-07-10 17:07:15,049 INFO    MainThread:3133504 [wandb_init.py:init():547] calling init triggers
+2023-07-10 17:07:15,049 INFO    MainThread:3133504 [wandb_init.py:init():554] wandb.init called with sweep_config: {}
+config: {}
+2023-07-10 17:07:15,050 INFO    MainThread:3133504 [wandb_init.py:init():596] starting backend
+2023-07-10 17:07:15,050 INFO    MainThread:3133504 [wandb_init.py:init():600] setting up manager
+2023-07-10 17:07:15,053 INFO    MainThread:3133504 [backend.py:_multiprocessing_setup():106] multiprocessing start_methods=fork,spawn,forkserver, using: spawn
+2023-07-10 17:07:15,056 INFO    MainThread:3133504 [wandb_init.py:init():606] backend started and connected
+2023-07-10 17:07:15,063 INFO    MainThread:3133504 [wandb_init.py:init():703] updated telemetry
+2023-07-10 17:07:15,064 INFO    MainThread:3133504 [wandb_init.py:init():736] communicating run to backend with 60.0 second timeout
+2023-07-10 17:07:15,246 INFO    MainThread:3133504 [wandb_run.py:_on_init():2176] communicating current version
+2023-07-10 17:07:15,317 INFO    MainThread:3133504 [wandb_run.py:_on_init():2185] got version response upgrade_message: "wandb version 0.15.5 is available!  To upgrade, please run:\n $ pip install wandb --upgrade"
+2023-07-10 17:07:15,317 INFO    MainThread:3133504 [wandb_init.py:init():787] starting run threads in backend
+2023-07-10 17:07:15,502 INFO    MainThread:3133504 [wandb_run.py:_console_start():2155] atexit reg
+2023-07-10 17:07:15,503 INFO    MainThread:3133504 [wandb_run.py:_redirect():2010] redirect: SettingsConsole.WRAP_RAW
+2023-07-10 17:07:15,503 INFO    MainThread:3133504 [wandb_run.py:_redirect():2075] Wrapping output streams.
+2023-07-10 17:07:15,503 INFO    MainThread:3133504 [wandb_run.py:_redirect():2100] Redirects installed.
+2023-07-10 17:07:15,504 INFO    MainThread:3133504 [wandb_init.py:init():828] run started, returning control to user process

wandb/run-20230708_162040-7wojc8os/files/config.yaml ADDED Viewed

	@@ -0,0 +1,39 @@

+wandb_version: 1
+_wandb:
+  desc: null
+  value:
+    python_version: 3.8.10
+    cli_version: 0.15.4
+    framework: huggingface
+    huggingface_version: 4.30.2
+    is_jupyter_run: false
+    is_kaggle_kernel: true
+    start_time: 1688847640.60948
+    t:
+      1:
+      - 1
+      - 11
+      - 41
+      - 49
+      - 51
+      - 55
+      - 71
+      - 83
+      2:
+      - 1
+      - 11
+      - 41
+      - 49
+      - 51
+      - 55
+      - 71
+      - 83
+      3:
+      - 23
+      4: 3.8.10
+      5: 0.15.4
+      6: 4.30.2
+      8:
+      - 2
+      - 5

wandb/run-20230708_162040-7wojc8os/files/output.log ADDED Viewed

	@@ -0,0 +1,29 @@

+07/08/2023 16:20:41 - INFO - __main__ - Distributed environment: MULTI_GPU  Backend: nccl
+Num processes: 3
+Process index: 1
+Local process index: 1
+Device: cuda:1
+Mixed precision type: fp16
+Traceback (most recent call last):
+  File "/nfs/blitzle/home/data/vision5/sragas/easel_venv/lib/python3.8/site-packages/diffusers/utils/hub_utils.py", line 311, in _get_model_file
+    model_file = hf_hub_download(
+  File "/nfs/blitzle/home/data/vision5/sragas/easel_venv/lib/python3.8/site-packages/huggingface_hub/utils/_validators.py", line 118, in _inner_fn
+    return fn(*args, **kwargs)
+  File "/nfs/blitzle/home/data/vision5/sragas/easel_venv/lib/python3.8/site-packages/huggingface_hub/file_download.py", line 1361, in hf_hub_download
+    with temp_file_manager() as temp_file:
+  File "/usr/lib/python3.8/tempfile.py", line 679, in NamedTemporaryFile
+    (fd, name) = _mkstemp_inner(dir, prefix, suffix, flags, output_type)
+  File "/usr/lib/python3.8/tempfile.py", line 389, in _mkstemp_inner
+    fd = _os.open(file, flags, 0o600)
+OSError: [Errno 122] Disk quota exceeded: '/u/sragas/.cache/huggingface/hub/tmpltn5e7d6'
+During handling of the above exception, another exception occurred:
+Traceback (most recent call last):
+  File "train_text_to_image_lora.py", line 951, in <module>
+    main()
+  File "train_text_to_image_lora.py", line 426, in main
+    unet = UNet2DConditionModel.from_pretrained(
+  File "/nfs/blitzle/home/data/vision5/sragas/easel_venv/lib/python3.8/site-packages/diffusers/models/modeling_utils.py", line 576, in from_pretrained
+    model_file = _get_model_file(
+  File "/nfs/blitzle/home/data/vision5/sragas/easel_venv/lib/python3.8/site-packages/diffusers/utils/hub_utils.py", line 356, in _get_model_file
+    raise EnvironmentError(
+OSError: Can't load the model for 'runwayml/stable-diffusion-v1-5'. If you were trying to load it from 'https://huggingface.co/models', make sure you don't have a local directory with the same name. Otherwise, make sure 'runwayml/stable-diffusion-v1-5' is the correct path to a directory containing a file named diffusion_pytorch_model.bin

wandb/run-20230708_162040-7wojc8os/files/requirements.txt ADDED Viewed

	@@ -0,0 +1,165 @@

+absl-py==1.4.0
+accelerate==0.20.3
+aiohttp==3.8.4
+aiosignal==1.3.1
+anyio==3.7.0
+appdirs==1.4.4
+argon2-cffi-bindings==21.2.0
+argon2-cffi==21.3.0
+asttokens==2.2.1
+async-lru==2.0.2
+async-timeout==4.0.2
+attrs==23.1.0
+babel==2.12.1
+backcall==0.2.0
+beautifulsoup4==4.12.2
+bleach==6.0.0
+cachetools==5.3.1
+certifi==2023.5.7
+cffi==1.15.1
+charset-normalizer==3.1.0
+click==8.1.3
+cmake==3.26.4
+comm==0.1.3
+datasets==2.13.1
+debugpy==1.6.7
+decorator==5.1.1
+defusedxml==0.7.1
+diffusers==0.18.0.dev0
+dill==0.3.6
+docker-pycreds==0.4.0
+exceptiongroup==1.1.2
+executing==1.2.0
+fastjsonschema==2.17.1
+filelock==3.12.2
+frozenlist==1.3.3
+fsspec==2023.6.0
+ftfy==6.1.1
+gitdb==4.0.10
+gitpython==3.1.31
+google-auth-oauthlib==1.0.0
+google-auth==2.21.0
+grpcio==1.56.0
+huggingface-hub==0.15.1
+idna==3.4
+importlib-metadata==6.7.0
+importlib-resources==5.12.0
+ipykernel==6.24.0
+ipython==8.12.2
+jedi==0.18.2
+jinja2==3.1.2
+json5==0.9.14
+jsonschema==4.17.3
+jupyter-client==8.3.0
+jupyter-core==5.3.1
+jupyter-events==0.6.3
+jupyter-lsp==2.2.0
+jupyter-server-terminals==0.4.4
+jupyter-server==2.7.0
+jupyterlab-pygments==0.2.2
+jupyterlab-server==2.23.0
+jupyterlab==4.0.2
+lit==16.0.6
+markdown==3.4.3
+markupsafe==2.1.3
+matplotlib-inline==0.1.6
+mistune==3.0.1
+mpmath==1.3.0
+multidict==6.0.4
+multiprocess==0.70.14
+mypy-extensions==1.0.0
+nbclient==0.8.0
+nbconvert==7.6.0
+nbformat==5.9.0
+nest-asyncio==1.5.6
+networkx==3.1
+notebook-shim==0.2.3
+numpy==1.24.4
+nvidia-cublas-cu11==11.10.3.66
+nvidia-cuda-cupti-cu11==11.7.101
+nvidia-cuda-nvrtc-cu11==11.7.99
+nvidia-cuda-runtime-cu11==11.7.99
+nvidia-cudnn-cu11==8.5.0.96
+nvidia-cufft-cu11==10.9.0.58
+nvidia-curand-cu11==10.2.10.91
+nvidia-cusolver-cu11==11.4.0.1
+nvidia-cusparse-cu11==11.7.4.91
+nvidia-nccl-cu11==2.14.3
+nvidia-nvtx-cu11==11.7.91
+oauthlib==3.2.2
+overrides==7.3.1
+packaging==23.1
+pandas==2.0.3
+pandocfilters==1.5.0
+parso==0.8.3
+pathtools==0.1.2
+pexpect==4.8.0
+pickleshare==0.7.5
+pillow==10.0.0
+pip==20.0.2
+pkg-resources==0.0.0
+pkgutil-resolve-name==1.3.10
+platformdirs==3.8.0
+prometheus-client==0.17.0
+prompt-toolkit==3.0.39
+protobuf==4.23.3
+psutil==5.9.5
+ptyprocess==0.7.0
+pure-eval==0.2.2
+pyarrow==12.0.1
+pyasn1-modules==0.3.0
+pyasn1==0.5.0
+pycparser==2.21
+pygments==2.15.1
+pyre-extensions==0.0.29
+pyrsistent==0.19.3
+python-dateutil==2.8.2
+python-json-logger==2.0.7
+pytz==2023.3
+pyyaml==6.0
+pyzmq==25.1.0
+regex==2023.6.3
+requests-oauthlib==1.3.1
+requests==2.31.0
+rfc3339-validator==0.1.4
+rfc3986-validator==0.1.1
+rsa==4.9
+safetensors==0.3.1
+send2trash==1.8.2
+sentry-sdk==1.27.0
+setproctitle==1.3.2
+setuptools==44.0.0
+six==1.16.0
+smmap==5.0.0
+sniffio==1.3.0
+soupsieve==2.4.1
+stack-data==0.6.2
+sympy==1.12
+tensorboard-data-server==0.7.1
+tensorboard==2.13.0
+terminado==0.17.1
+tinycss2==1.2.1
+tokenizers==0.13.3
+tomli==2.0.1
+torch==2.0.1
+torchaudio==2.0.2
+torchvision==0.15.2
+tornado==6.3.2
+tqdm==4.65.0
+traitlets==5.9.0
+transformers==4.30.2
+triton==2.0.0
+typing-extensions==4.7.1
+typing-inspect==0.9.0
+tzdata==2023.3
+urllib3==2.0.3
+wandb==0.15.4
+wcwidth==0.2.6
+webencodings==0.5.1
+websocket-client==1.6.1
+werkzeug==2.3.6
+wheel==0.40.0
+xformers==0.0.20
+xxhash==3.2.0
+yarl==1.9.2
+zipp==3.15.0

wandb/run-20230708_162040-7wojc8os/files/wandb-metadata.json ADDED Viewed

	@@ -0,0 +1,127 @@

+{
+    "os": "Linux-5.15.0-60-generic-x86_64-with-glibc2.29",
+    "python": "3.8.10",
+    "heartbeatAt": "2023-07-08T20:20:41.026887",
+    "startedAt": "2023-07-08T20:20:40.579314",
+    "docker": null,
+    "cuda": null,
+    "args": [
+        "--pretrained_model_name_or_path=runwayml/stable-diffusion-v1-5",
+        "--train_data_dir=/l/vision/v5/sragas/easel_ai/thumbs_up_dataset/",
+        "--resolution=512",
+        "--center_crop",
+        "--random_flip",
+        "--train_batch_size=1",
+        "--gradient_accumulation_steps=4",
+        "--max_train_steps=15000",
+        "--learning_rate=1e-04",
+        "--max_grad_norm=1",
+        "--lr_scheduler=cosine",
+        "--lr_warmup_steps=0",
+        "--output_dir=/l/vision/v5/sragas/easel_ai/models/",
+        "--push_to_hub",
+        "--hub_model_id=thumbs-up-lora",
+        "--report_to=wandb",
+        "--checkpointing_steps=500",
+        "--validation_prompt=A person with #thumbsup",
+        "--seed=1337"
+    ],
+    "state": "running",
+    "program": "train_text_to_image_lora.py",
+    "codePath": "train_text_to_image_lora.py",
+    "host": "magneton",
+    "username": "sragas",
+    "executable": "/nfs/blitzle/home/data/vision5/sragas/easel_venv/bin/python3",
+    "cpu_count": 6,
+    "cpu_count_logical": 12,
+    "cpu_freq": {
+        "current": 1897.8334166666666,
+        "min": 1200.0,
+        "max": 3700.0
+    },
+    "cpu_freq_per_core": [
+        {
+            "current": 1200.0,
+            "min": 1200.0,
+            "max": 3700.0
+        },
+        {
+            "current": 1456.076,
+            "min": 1200.0,
+            "max": 3700.0
+        },
+        {
+            "current": 1300.0,
+            "min": 1200.0,
+            "max": 3700.0
+        },
+        {
+            "current": 2496.8,
+            "min": 1200.0,
+            "max": 3700.0
+        },
+        {
+            "current": 2981.104,
+            "min": 1200.0,
+            "max": 3700.0
+        },
+        {
+            "current": 1200.0,
+            "min": 1200.0,
+            "max": 3700.0
+        },
+        {
+            "current": 1200.0,
+            "min": 1200.0,
+            "max": 3700.0
+        },
+        {
+            "current": 1300.0,
+            "min": 1200.0,
+            "max": 3700.0
+        },
+        {
+            "current": 2200.0,
+            "min": 1200.0,
+            "max": 3700.0
+        },
+        {
+            "current": 1300.0,
+            "min": 1200.0,
+            "max": 3700.0
+        },
+        {
+            "current": 1200.0,
+            "min": 1200.0,
+            "max": 3700.0
+        },
+        {
+            "current": 2435.006,
+            "min": 1200.0,
+            "max": 3700.0
+        }
+    ],
+    "disk": {
+        "total": 467.8895797729492,
+        "used": 42.67890548706055
+    },
+    "gpu": "NVIDIA GeForce GTX TITAN X",
+    "gpu_count": 3,
+    "gpu_devices": [
+        {
+            "name": "NVIDIA GeForce GTX TITAN X",
+            "memory_total": 12884901888
+        },
+        {
+            "name": "NVIDIA TITAN X (Pascal)",
+            "memory_total": 12884901888
+        },
+        {
+            "name": "NVIDIA GeForce GTX TITAN X",
+            "memory_total": 12884901888
+        }
+    ],
+    "memory": {
+        "total": 31.240768432617188
+    }
+}

wandb/run-20230708_162040-7wojc8os/files/wandb-summary.json ADDED Viewed

	@@ -0,0 +1 @@


+{"_wandb": {"runtime": 53}}