zhiyang1 committed on Jul 28

Commit

026e4b9

verified ·

1 Parent(s): e57000a

Upload folder using huggingface_hub

Browse files

Files changed (27) hide show

.gitattributes +2 -0
checkpoint-78000/config.json +79 -0
checkpoint-78000/generation_config.json +6 -0
checkpoint-78000/model-00001-of-00002.safetensors +3 -0
checkpoint-78000/model-00002-of-00002.safetensors +3 -0
checkpoint-78000/model.safetensors.index.json +0 -0
checkpoint-78000/optimizer.pt +3 -0
checkpoint-78000/rng_state_0.pth +3 -0
checkpoint-78000/rng_state_1.pth +3 -0
checkpoint-78000/rng_state_2.pth +3 -0
checkpoint-78000/rng_state_3.pth +3 -0
checkpoint-78000/scheduler.pt +3 -0
checkpoint-78000/trainer_state.json +3 -0
checkpoint-78000/training_args.bin +3 -0
checkpoint-80000/config.json +79 -0
checkpoint-80000/generation_config.json +6 -0
checkpoint-80000/model-00001-of-00002.safetensors +3 -0
checkpoint-80000/model-00002-of-00002.safetensors +3 -0
checkpoint-80000/model.safetensors.index.json +0 -0
checkpoint-80000/optimizer.pt +3 -0
checkpoint-80000/rng_state_0.pth +3 -0
checkpoint-80000/rng_state_1.pth +3 -0
checkpoint-80000/rng_state_2.pth +3 -0
checkpoint-80000/rng_state_3.pth +3 -0
checkpoint-80000/scheduler.pt +3 -0
checkpoint-80000/trainer_state.json +3 -0
checkpoint-80000/training_args.bin +3 -0

.gitattributes CHANGED Viewed

@@ -34,3 +34,5 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
 *.zst filter=lfs diff=lfs merge=lfs -text
 *tfevents* filter=lfs diff=lfs merge=lfs -text
 checkpoint-70000/trainer_state.json filter=lfs diff=lfs merge=lfs -text
+checkpoint-78000/trainer_state.json filter=lfs diff=lfs merge=lfs -text
+checkpoint-80000/trainer_state.json filter=lfs diff=lfs merge=lfs -text

checkpoint-78000/config.json ADDED Viewed

	@@ -0,0 +1,79 @@

+{
+  "ar_steps": 1,
+  "architectures": [
+    "DiffVLMDiffusion"
+  ],
+  "attention_dropout": 0.0,
+  "bos_token_id": 151643,
+  "condition_layer": -1,
+  "eos_token_id": 151645,
+  "hidden_act": "silu",
+  "hidden_size": 1536,
+  "image_token_id": 151655,
+  "img_cross_attention_dim": 2048,
+  "img_diffuser_depth": 1,
+  "img_ffn_dim_multiplier": null,
+  "img_hidden_size": 1536,
+  "img_multiple_of": 256,
+  "img_norm_eps": 1e-05,
+  "img_num_attention_heads": 12,
+  "img_num_kv_heads": 12,
+  "img_qk_norm": true,
+  "in_channels": 32,
+  "initializer_range": 0.02,
+  "inject_img_diffuser": false,
+  "input_size": 32,
+  "intermediate_size": 8960,
+  "layer_group_size": 7,
+  "layerwise_start_idx": 0,
+  "lora_alpha": 16,
+  "lora_bias": "none",
+  "lora_dropout": 0.05,
+  "lora_enable": false,
+  "lora_r": 64,
+  "max_position_embeddings": 32768,
+  "max_window_layers": 28,
+  "model_type": "qwen2_vl",
+  "non_linearity": 1,
+  "norm_elementwise_affine": true,
+  "num_attention_heads": 12,
+  "num_hidden_layers": 28,
+  "num_key_value_heads": 2,
+  "patch_size": 1,
+  "repa_coeff": 0.5,
+  "repa_layers": null,
+  "repa_shared": false,
+  "rms_norm_eps": 1e-06,
+  "rope_scaling": {
+    "mrope_section": [
+      16,
+      24,
+      24
+    ],
+    "rope_type": "default",
+    "type": "default"
+  },
+  "rope_theta": 1000000.0,
+  "sample_size": 128,
+  "sampling_steps": 28,
+  "sliding_window": null,
+  "tie_word_embeddings": true,
+  "torch_dtype": "bfloat16",
+  "transformers_version": "4.47.0",
+  "use_cache": true,
+  "use_repa": false,
+  "use_residual_attn": true,
+  "use_sliding_window": false,
+  "vae_path": "mit-han-lab/dc-ae-f32c32-sana-1.1-diffusers",
+  "video_token_id": 151656,
+  "vision_config": {
+    "hidden_size": 1536,
+    "in_chans": 3,
+    "model_type": "qwen2_vl",
+    "spatial_patch_size": 14
+  },
+  "vision_end_token_id": 151653,
+  "vision_start_token_id": 151652,
+  "vision_token_id": 151654,
+  "vocab_size": 151936
+}

checkpoint-78000/generation_config.json ADDED Viewed

	@@ -0,0 +1,6 @@

+{
+  "_from_model_config": true,
+  "bos_token_id": 151643,
+  "eos_token_id": 151645,
+  "transformers_version": "4.47.0"
+}

checkpoint-78000/model-00001-of-00002.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:d5196c102b31879964e83f95aa8fbe45ca382b048cf06483d52d79e023268ccb
+size 4974360904

checkpoint-78000/model-00002-of-00002.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:335152f50804d331e6351c0fe2d2a0638095e1edcc2617a54dbd66604fd94a6e
+size 3234250886

checkpoint-78000/model.safetensors.index.json ADDED Viewed

The diff for this file is too large to render. See raw diff

checkpoint-78000/optimizer.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:da8b11de6c0fbea109791bf0320e314d2d4fc8ce13d442143ba059a542a9e78c
+size 7455061885

checkpoint-78000/rng_state_0.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:22c71767086ac1e944013284132fbf5547e4bc072a910a39a3d7a2c77e99dc8a
+size 15024

checkpoint-78000/rng_state_1.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:8cc2974f61d3055c1e66e277d85483d5fbdb26c55fb694d0eb46cde49e3d137e
+size 15024

checkpoint-78000/rng_state_2.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:d344ba3023c82e25d86e5f71882dec7a2cc3ecc3a2ea24ec4d4ae0ea2144acc2
+size 15024

checkpoint-78000/rng_state_3.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:2f0985c5abe29b110d77d734e277f7ce281b6856efe8188d730de1289af0bc71
+size 15024

checkpoint-78000/scheduler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:49f6913d40daa41cf0a1e95007c742afdb1dd55d6a83f43e77f4ad354fb93e5f
+size 1064

checkpoint-78000/trainer_state.json ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:1a5ee8121bc2cdabe7d2f5a3901a4f1cf6eeaf9a53b296265e4cc5af32196b9a
+size 11998321

checkpoint-78000/training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:4b98fa098d6fa8464ac0be8cce3448fef80b406b76cab5d70e7613739913f94d
+size 6008

checkpoint-80000/config.json ADDED Viewed

	@@ -0,0 +1,79 @@

+{
+  "ar_steps": 1,
+  "architectures": [
+    "DiffVLMDiffusion"
+  ],
+  "attention_dropout": 0.0,
+  "bos_token_id": 151643,
+  "condition_layer": -1,
+  "eos_token_id": 151645,
+  "hidden_act": "silu",
+  "hidden_size": 1536,
+  "image_token_id": 151655,
+  "img_cross_attention_dim": 2048,
+  "img_diffuser_depth": 1,
+  "img_ffn_dim_multiplier": null,
+  "img_hidden_size": 1536,
+  "img_multiple_of": 256,
+  "img_norm_eps": 1e-05,
+  "img_num_attention_heads": 12,
+  "img_num_kv_heads": 12,
+  "img_qk_norm": true,
+  "in_channels": 32,
+  "initializer_range": 0.02,
+  "inject_img_diffuser": false,
+  "input_size": 32,
+  "intermediate_size": 8960,
+  "layer_group_size": 7,
+  "layerwise_start_idx": 0,
+  "lora_alpha": 16,
+  "lora_bias": "none",
+  "lora_dropout": 0.05,
+  "lora_enable": false,
+  "lora_r": 64,
+  "max_position_embeddings": 32768,
+  "max_window_layers": 28,
+  "model_type": "qwen2_vl",
+  "non_linearity": 1,
+  "norm_elementwise_affine": true,
+  "num_attention_heads": 12,
+  "num_hidden_layers": 28,
+  "num_key_value_heads": 2,
+  "patch_size": 1,
+  "repa_coeff": 0.5,
+  "repa_layers": null,
+  "repa_shared": false,
+  "rms_norm_eps": 1e-06,
+  "rope_scaling": {
+    "mrope_section": [
+      16,
+      24,
+      24
+    ],
+    "rope_type": "default",
+    "type": "default"
+  },
+  "rope_theta": 1000000.0,
+  "sample_size": 128,
+  "sampling_steps": 28,
+  "sliding_window": null,
+  "tie_word_embeddings": true,
+  "torch_dtype": "bfloat16",
+  "transformers_version": "4.47.0",
+  "use_cache": true,
+  "use_repa": false,
+  "use_residual_attn": true,
+  "use_sliding_window": false,
+  "vae_path": "mit-han-lab/dc-ae-f32c32-sana-1.1-diffusers",
+  "video_token_id": 151656,
+  "vision_config": {
+    "hidden_size": 1536,
+    "in_chans": 3,
+    "model_type": "qwen2_vl",
+    "spatial_patch_size": 14
+  },
+  "vision_end_token_id": 151653,
+  "vision_start_token_id": 151652,
+  "vision_token_id": 151654,
+  "vocab_size": 151936
+}

checkpoint-80000/generation_config.json ADDED Viewed

	@@ -0,0 +1,6 @@

+{
+  "_from_model_config": true,
+  "bos_token_id": 151643,
+  "eos_token_id": 151645,
+  "transformers_version": "4.47.0"
+}

checkpoint-80000/model-00001-of-00002.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:729a5ff18d73723b67bdd7de9e35bdaf98947cf51acb72cf4adbdb8809bc6c10
+size 4974360904

checkpoint-80000/model-00002-of-00002.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:5df92bccb48a6f5db54dc283a91dcc393139ad53d8923c1b87546f8e6b9b1f50
+size 3234250886

checkpoint-80000/model.safetensors.index.json ADDED Viewed

The diff for this file is too large to render. See raw diff

checkpoint-80000/optimizer.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:9b817540b0641b0ebade160ec568b21743191b8ddcc8dfbbdf545fe1beb6dfd9
+size 7455061885

checkpoint-80000/rng_state_0.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:2c8a29c991aa9b4eb43c6430c319bf00d11008a67a9233d45379275dd7a34169
+size 15024

checkpoint-80000/rng_state_1.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:5f5cbff43dc5ca6f4fcd1abb9ddba3122dff4e44fcecb8e2c8d10bcb939131cd
+size 15024

checkpoint-80000/rng_state_2.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:51a9893141d5e8b4627f5b72a759ded15f737764d57e38ff95b8c3685c2a2e96
+size 15024

checkpoint-80000/rng_state_3.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:e5d145ad698d7e0e3270e0ee60172edcc6b8b601e0bb577bbbbc924963e8bb8d
+size 15024

checkpoint-80000/scheduler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:f8fd8bd978d36e1ca7ed9dae0bf8bc6b835705726801a0ae5084d053c6cfd261
+size 1064

checkpoint-80000/trainer_state.json ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:32fe84b0d30cedd77aea9437a15cf50dce036b5781c7cf653e7838c800290185
+size 12305225

checkpoint-80000/training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:4b98fa098d6fa8464ac0be8cce3448fef80b406b76cab5d70e7613739913f94d
+size 6008